We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 43f0ae8, commit c537c76 (Copy full SHA for c537c76)
vllm/model_executor/layers/fused_moe/config.py
@@ -60,9 +60,9 @@ def get_config_quant_dtype(
60
return torch.int8
61
elif ocp_mx_scheme == "w_fp4_a_fp4":
62
return "fp4"
63
- elif ocp_mx_scheme in ["w_fp4_a_fp6_e3m2", "w_fp4_a_fp6_e2m3", "w_fp6_e3m2_a_fp6_e3m2"]:
+ elif ocp_mx_scheme in {"w_fp4_a_fp6_e3m2", "w_fp6_e3m2_a_fp6_e3m2"}:
64
return "fp6_e3m2"
65
- elif ocp_mx_scheme == "w_fp6_e2m3_a_fp6_e2m3":
+ elif ocp_mx_scheme in {"w_fp4_a_fp6_e2m3", "w_fp6_e2m3_a_fp6_e2m3"}:
66
return "fp6_e2m3"
67
return None
68
0 commit comments