@@ -41,6 +41,8 @@ onnxruntime_add_static_library(onnxruntime_mlas
   ${MLAS_SRC_DIR}/sqnbitgemm_q8_block.h
   ${MLAS_SRC_DIR}/flashattn.cpp
   ${MLAS_SRC_DIR}/cast.cpp
+  ${MLAS_SRC_DIR}/rotary_embedding.h
+  ${MLAS_SRC_DIR}/rotary_embedding.cpp
 )

 target_sources(onnxruntime_mlas PRIVATE
@@ -88,8 +90,11 @@ function(setup_mlas_source_for_windows)
     ${MLAS_SRC_DIR}/qnbitgemm_kernel_neon.cpp
     ${MLAS_SRC_DIR}/sqnbitgemm_kernel_neon_fp32.cpp
     ${MLAS_SRC_DIR}/sqnbitgemm_kernel_neon_int8.cpp
-    ${MLAS_SRC_DIR}/fp16_neon_common.cpp
+    ${MLAS_SRC_DIR}/cast_kernel_neon.cpp
     ${MLAS_SRC_DIR}/hqnbitgemm_kernel_neon_fp16.cpp
+    ${MLAS_SRC_DIR}/rotary_embedding_kernel_neon.h
+    ${MLAS_SRC_DIR}/rotary_embedding_kernel_neon.cpp
+    ${MLAS_SRC_DIR}/rotary_embedding_kernel_neon_fp16.cpp
   )

   set(mlas_platform_preprocess_srcs
@@ -367,6 +372,8 @@ else()
     ${MLAS_SRC_DIR}/qnbitgemm_kernel_neon.cpp
     ${MLAS_SRC_DIR}/sqnbitgemm_kernel_neon_fp32.cpp
     ${MLAS_SRC_DIR}/sqnbitgemm_kernel_neon_int8.cpp
+    ${MLAS_SRC_DIR}/rotary_embedding_kernel_neon.h
+    ${MLAS_SRC_DIR}/rotary_embedding_kernel_neon.cpp
   )
   set_source_files_properties(${MLAS_SRC_DIR}/sqnbitgemm_kernel_neon_int8.cpp
     PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+dotprod")
@@ -384,8 +391,9 @@ else()
     ${MLAS_SRC_DIR}/qgemm_kernel_smmla.cpp
     ${MLAS_SRC_DIR}/qgemm_kernel_ummla.cpp
     ${MLAS_SRC_DIR}/sbgemm_kernel_neon.cpp
-    ${MLAS_SRC_DIR}/fp16_neon_common.cpp
+    ${MLAS_SRC_DIR}/cast_kernel_neon.cpp
     ${MLAS_SRC_DIR}/hqnbitgemm_kernel_neon_fp16.cpp
+    ${MLAS_SRC_DIR}/rotary_embedding_kernel_neon_fp16.cpp
   )
   set_source_files_properties(${MLAS_SRC_DIR}/aarch64/HalfGemmKernelNeon.S PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
   set_source_files_properties(${MLAS_SRC_DIR}/aarch64/QgemmS8S8KernelSmmla.S PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+i8mm ")
@@ -395,8 +403,9 @@ else()
   set_source_files_properties(${MLAS_SRC_DIR}/dwconv.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
   set_source_files_properties(${MLAS_SRC_DIR}/pooling_fp16.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
   set_source_files_properties(${MLAS_SRC_DIR}/sbgemm_kernel_neon.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+bf16 ")
-  set_source_files_properties(${MLAS_SRC_DIR}/fp16_neon_common.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
+  set_source_files_properties(${MLAS_SRC_DIR}/cast_kernel_neon.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
   set_source_files_properties(${MLAS_SRC_DIR}/hqnbitgemm_kernel_neon_fp16.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
+  set_source_files_properties(${MLAS_SRC_DIR}/rotary_embedding_kernel_neon_fp16.cpp PROPERTIES COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
 endif()

 if(ONNXRUNTIME_MLAS_MULTI_ARCH)
0 commit comments