File tree Expand file tree Collapse file tree 1 file changed +2
-2
lines changed Expand file tree Collapse file tree 1 file changed +2
-2
lines changed Original file line number Diff line number Diff line change @@ -243,6 +243,7 @@ set(VLLM_EXT_SRC
243243 "csrc/sampler.cu"
244244 "csrc/cuda_view.cu"
245245 "csrc/quantization/gptq/q_gemm.cu"
246+ "csrc/quantization/compressed_tensors/int8_quant_kernels.cu"
246247 "csrc/quantization/fp8/common.cu"
247248 "csrc/quantization/fused_kernels/fused_layernorm_dynamic_per_token_quant.cu"
248249 "csrc/quantization/gguf/gguf_kernel.cu"
@@ -296,8 +297,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA")
296297 "csrc/sparse/cutlass/sparse_scaled_mm_entry.cu"
297298 "csrc/cutlass_extensions/common.cpp"
298299 "csrc/attention/mla/cutlass_mla_entry.cu"
299- "csrc/quantization/fp8/per_token_group_quant.cu"
300- "csrc/quantization/compressed_tensors/int8_quant_kernels.cu" )
300+ "csrc/quantization/fp8/per_token_group_quant.cu" )
301301
302302 set_gencode_flags_for_srcs(
303303 SRCS "${VLLM_EXT_SRC} "
You can’t perform that action at this time.
0 commit comments