@@ -185,8 +185,8 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
185185 "hopper/instantiations/flash_fwd_hdim256_bf16*_sm90.cu" )
186186 # Add these for hdim diff cases
187187 file (GLOB FA3_BF16_GEN_SRCS_
188- # "hopper/instantiations/flash_fwd_hdim64_256_bf16*_sm90.cu"
189- # "hopper/instantiations/flash_fwd_hdim64_512_bf16*_sm90.cu"
188+ "hopper/instantiations/flash_fwd_hdim64_256_bf16*_sm90.cu"
189+ "hopper/instantiations/flash_fwd_hdim64_512_bf16*_sm90.cu"
190190 "hopper/instantiations/flash_fwd_hdim192_128_bf16*_sm90.cu" )
191191 list (APPEND FA3_BF16_GEN_SRCS ${FA3_BF16_GEN_SRCS_} )
192192 file (GLOB FA3_BF16_GEN_SRCS_
@@ -202,8 +202,8 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
202202 "hopper/instantiations/flash_fwd_hdim256_fp16*_sm90.cu" )
203203 # Add these for hdim diff cases
204204 file (GLOB FA3_FP16_GEN_SRCS_
205- # "hopper/instantiations/flash_fwd_hdim64_256_fp16*_sm90.cu"
206- # "hopper/instantiations/flash_fwd_hdim64_512_fp16*_sm90.cu"
205+ "hopper/instantiations/flash_fwd_hdim64_256_fp16*_sm90.cu"
206+ "hopper/instantiations/flash_fwd_hdim64_512_fp16*_sm90.cu"
207207 "hopper/instantiations/flash_fwd_hdim192_128_fp16*_sm90.cu" )
208208 list (APPEND FA3_FP16_GEN_SRCS ${FA3_FP16_GEN_SRCS_} )
209209 file (GLOB FA3_FP16_GEN_SRCS_
@@ -272,7 +272,7 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
272272 FLASHATTENTION_VARLEN_ONLY # Custom flag to save on binary size
273273 FLASHATTENTION_DISABLE_CLUSTER # disabled for varlen in any case
274274 # FLASHATTENTION_DISABLE_SM8x
275- FLASHATTENTION_DISABLE_HDIMDIFF64
275+ # FLASHATTENTION_DISABLE_HDIMDIFF64
276276 # FLASHATTENTION_DISABLE_HDIMDIFF192
277277 CUTE_SM90_EXTENDED_MMA_SHAPES_ENABLED
278278 CUTLASS_ENABLE_GDC_FOR_SM90
0 commit comments