We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e1bc323 · commit 6d7e988 · Copy full SHA for 6d7e988
vllm/model_executor/layers/fused_moe/flashinfer_cutlass_moe.py
@@ -110,7 +110,7 @@ def workspace_shapes(
110
"""
111
workspace1 = (curr_M, K)
112
workspace2 = (0, )
113
- output_shape = (M, K * 2 if if self.quant_dtype == "nvfp4" else K)
+ output_shape = (M, K * 2 if self.quant_dtype == "nvfp4" else K)
114
# The workspace is determined by `aq`, since it comes after any
115
# potential communication op and is involved in the expert computation.
116
return (workspace1, workspace2, output_shape)
0 commit comments