We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 48207c9 commit c215c6aCopy full SHA for c215c6a
cmake/external_projects/flashmla.cmake
@@ -37,7 +37,8 @@ cuda_archs_loose_intersection(FLASH_MLA_ARCHS "9.0a" "${CUDA_ARCHS}")
37
if(${CMAKE_CUDA_COMPILER_VERSION} VERSION_GREATER 12.3 AND FLASH_MLA_ARCHS)
38
set(FlashMLA_SOURCES
39
${flashmla_SOURCE_DIR}/csrc/flash_api.cpp
40
- ${flashmla_SOURCE_DIR}/csrc/flash_fwd_mla_bf16_sm90.cu)
+ ${flashmla_SOURCE_DIR}/csrc/flash_fwd_mla_bf16_sm90.cu
41
+ ${flashmla_SOURCE_DIR}/csrc/flash_fwd_mla_fp16_sm90.cu)
42
43
set(FlashMLA_INCLUDES
44
${flashmla_SOURCE_DIR}/csrc/cutlass/include
0 commit comments