Skip to content

Commit c08b543

Browse files
csy1204 and xuebwang-amd
authored and committed
[CI/Build] upgrade compressed-tensors to 0.12.2 to address LGPLv3 (vllm-project#26501)
Signed-off-by: Sangyeon Cho <josang1204@gmail.com>
Signed-off-by: xuebwang-amd <xuebwang@amd.com>
1 parent b99be4b commit c08b543

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

requirements/common.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ pyyaml
3838
six>=1.16.0; python_version > '3.11' # transitive dependency of pandas that needs to be the latest version for python 3.12
3939
setuptools>=77.0.3,<80; python_version > '3.11' # Setuptools is used by triton, we need to ensure a modern version is installed for 3.12+ so that it does not try to import distutils, which was removed in 3.12
4040
einops # Required for Qwen2-VL.
41-
compressed-tensors == 0.11.0 # required for compressed-tensors
41+
compressed-tensors == 0.12.2 # required for compressed-tensors
4242
depyf==0.19.0 # required for profiling and debugging with compilation config
4343
cloudpickle # allows pickling lambda functions in model_executor/models/registry.py
4444
watchfiles # required for http server to monitor the updates of TLS files

vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -310,7 +310,7 @@ def _is_fp4a4_nvfp4(
310310
)
311311
is_float_type = (
312312
weight_quant.type == QuantizationType.FLOAT
313-
and input_quant.type == QuantizationType.FLOAT.value
313+
and input_quant.type == QuantizationType.FLOAT
314314
)
315315
is_4_bits = weight_quant.num_bits == 4 and input_quant.num_bits == 4
316316

vllm/model_executor/layers/quantization/compressed_tensors/compressed_tensors_moe.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -143,7 +143,7 @@ def get_moe_method(
143143
# Prefer to use the MarlinMoE kernel when it is supported.
144144
if not check_moe_marlin_supports_layer(layer, group_size):
145145
if (
146-
weight_quant.strategy in QuantizationStrategy.GROUP
146+
weight_quant.strategy == QuantizationStrategy.GROUP
147147
and weight_quant.actorder
148148
in (ActivationOrdering.GROUP, ActivationOrdering.DYNAMIC)
149149
):

0 commit comments

Comments (0)