diff --git a/setup.py b/setup.py index bd610bc..b7fbdc8 100644 --- a/setup.py +++ b/setup.py @@ -13,7 +13,7 @@ setup( name='quant_cuda', ext_modules=[cpp_extension.CUDAExtension( - 'llmtune.engine.quant.quant_cuda', + 'quant_cuda', [ 'llmtools/engine/inference/cuda/quant_cuda.cpp', 'llmtools/engine/inference/cuda/quant_cuda_kernel.cu'