We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 9a40c48 commit 2566c79 Copy full SHA for 2566c79
CMakeLists.txt
@@ -215,7 +215,7 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
215
"hopper/instantiations/flash_fwd_hdim64_e4m3*_sm90.cu"
216
"hopper/instantiations/flash_fwd_hdim96_e4m3*_sm90.cu"
217
"hopper/instantiations/flash_fwd_hdim128_e4m3*_sm90.cu"
218
- "hopper/instantiations/flash_fwd_hdim196_e4m3*_sm90.cu"
+ "hopper/instantiations/flash_fwd_hdim192_e4m3*_sm90.cu"
219
"hopper/instantiations/flash_fwd_hdim256_e4m3*_sm90.cu")
220
# Add these for hdim diff cases (192 only)
221
file(GLOB FA3_FP8_GEN_SRCS_
0 commit comments