Skip to content

Commit c537c76

Browse files
committed
Fix e2m3/e3m2 bug: map the "w_fp4_a_fp6_e2m3" scheme to "fp6_e2m3" instead of "fp6_e3m2"
Signed-off-by: Felix Marty <Felix.Marty@amd.com>
1 parent 43f0ae8 commit c537c76

File tree

1 file changed

+2
-2
lines changed
  • vllm/model_executor/layers/fused_moe

1 file changed

+2
-2
lines changed

vllm/model_executor/layers/fused_moe/config.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -60,9 +60,9 @@ def get_config_quant_dtype(
6060
return torch.int8
6161
elif ocp_mx_scheme == "w_fp4_a_fp4":
6262
return "fp4"
63-
elif ocp_mx_scheme in ["w_fp4_a_fp6_e3m2", "w_fp4_a_fp6_e2m3", "w_fp6_e3m2_a_fp6_e3m2"]:
63+
elif ocp_mx_scheme in {"w_fp4_a_fp6_e3m2", "w_fp6_e3m2_a_fp6_e3m2"}:
6464
return "fp6_e3m2"
65-
elif ocp_mx_scheme == "w_fp6_e2m3_a_fp6_e2m3":
65+
elif ocp_mx_scheme in {"w_fp4_a_fp6_e2m3", "w_fp6_e2m3_a_fp6_e2m3"}:
6666
return "fp6_e2m3"
6767
return None
6868

0 commit comments

Comments
 (0)