-
Notifications
You must be signed in to change notification settings - Fork 2
/
setup.py
26 lines (25 loc) · 798 Bytes
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from setuptools import setup
from torch.utils import cpp_extension
# Packaging script body: builds the pure-Python "marlin" package together
# with its compiled "marlin_cuda" extension module.

# C++ binding file and CUDA kernel files compiled into the extension.
_EXTENSION_SOURCES = [
    "marlin/marlin_cuda.cpp",
    "marlin/marlin_cuda_kernel.cu",
    "marlin/marlin_cuda_kernel_nm.cu",
]

# Flags handed to nvcc only (they are filed under the "nvcc" key below).
_NVCC_FLAGS = ["-arch=sm_86", "--ptxas-options=-v", "-lineinfo"]

# The single CUDA extension shipped by this distribution.
_marlin_cuda_extension = cpp_extension.CUDAExtension(
    "marlin_cuda",
    _EXTENSION_SOURCES,
    extra_compile_args={"nvcc": _NVCC_FLAGS},
)

setup(
    # Distribution metadata.
    name="marlin",
    version="0.2.1",
    author="Roberto Lopez Castro",
    author_email="roberto.lopez.castro@udc.es",
    description="Highly optimized FP16x(INT4+2:4 sparsity) CUDA matmul kernel.",
    # Runtime requirements and Python packages to install.
    install_requires=["numpy", "torch"],
    packages=["marlin"],
    # Compiled extension, built through PyTorch's build_ext command class.
    ext_modules=[_marlin_cuda_extension],
    cmdclass={"build_ext": cpp_extension.BuildExtension},
)