Skip to content

Commit ee4d25b

Browse files
Enable HDIMDIFF64 (#84)
* Enable HDIMDIFF64
  Signed-off-by: Matthew Bonanni <mbonanni@redhat.com>
* Add instantiations
  Signed-off-by: Matthew Bonanni <mbonanni@redhat.com>

---------

Signed-off-by: Matthew Bonanni <mbonanni@redhat.com>
1 parent 57b4e68 commit ee4d25b

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

CMakeLists.txt

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -185,8 +185,8 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
185185
"hopper/instantiations/flash_fwd_hdim256_bf16*_sm90.cu")
186186
# Add these for hdim diff cases
187187
file(GLOB FA3_BF16_GEN_SRCS_
188-
# "hopper/instantiations/flash_fwd_hdim64_256_bf16*_sm90.cu"
189-
# "hopper/instantiations/flash_fwd_hdim64_512_bf16*_sm90.cu"
188+
"hopper/instantiations/flash_fwd_hdim64_256_bf16*_sm90.cu"
189+
"hopper/instantiations/flash_fwd_hdim64_512_bf16*_sm90.cu"
190190
"hopper/instantiations/flash_fwd_hdim192_128_bf16*_sm90.cu")
191191
list(APPEND FA3_BF16_GEN_SRCS ${FA3_BF16_GEN_SRCS_})
192192
file(GLOB FA3_BF16_GEN_SRCS_
@@ -202,8 +202,8 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
202202
"hopper/instantiations/flash_fwd_hdim256_fp16*_sm90.cu")
203203
# Add these for hdim diff cases
204204
file(GLOB FA3_FP16_GEN_SRCS_
205-
# "hopper/instantiations/flash_fwd_hdim64_256_fp16*_sm90.cu"
206-
# "hopper/instantiations/flash_fwd_hdim64_512_fp16*_sm90.cu"
205+
"hopper/instantiations/flash_fwd_hdim64_256_fp16*_sm90.cu"
206+
"hopper/instantiations/flash_fwd_hdim64_512_fp16*_sm90.cu"
207207
"hopper/instantiations/flash_fwd_hdim192_128_fp16*_sm90.cu")
208208
list(APPEND FA3_FP16_GEN_SRCS ${FA3_FP16_GEN_SRCS_})
209209
file(GLOB FA3_FP16_GEN_SRCS_
@@ -272,7 +272,7 @@ if (FA3_ENABLED AND ${CMAKE_CUDA_COMPILER_VERSION} GREATER_EQUAL 12.0)
272272
FLASHATTENTION_VARLEN_ONLY # Custom flag to save on binary size
273273
FLASHATTENTION_DISABLE_CLUSTER # disabled for varlen in any case
274274
# FLASHATTENTION_DISABLE_SM8x
275-
FLASHATTENTION_DISABLE_HDIMDIFF64
275+
# FLASHATTENTION_DISABLE_HDIMDIFF64
276276
# FLASHATTENTION_DISABLE_HDIMDIFF192
277277
CUTE_SM90_EXTENDED_MMA_SHAPES_ENABLED
278278
CUTLASS_ENABLE_GDC_FOR_SM90

0 commit comments

Comments
 (0)