We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6be6496, commit fb84464 (Copy full SHA for fb84464)
vllm/v1/attention/backends/mla/cutlass_mla.py
@@ -109,12 +109,6 @@ def __init__(
109
"are not implemented for "
110
"CutlassMLAImpl")
111
112
- self._use_old_cutlass_mla = False
113
- force_old_cutlass = os.environ.get("FORCE_OLD_CUTLASS_MLA", None)
114
- if force_old_cutlass:
115
- logger.warning_once("Forcing old cutlass mla kernel")
116
- self._use_old_cutlass_mla = True
117
-
118
# TODO: Currently, num_kv_splits is limited to 16 to avoid hanging
119
# issues. In case the code hangs, use:
120
# FORCE_NUM_KV_SPLITS=1
0 commit comments