mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2025-09-06 12:40:02 +00:00
18 lines
493 B
Python
18 lines
493 B
Python
|
|
from setuptools import setup, Extension
|
|
from torch.utils import cpp_extension
|
|
from torch.utils.cpp_extension import BuildExtension, CUDAExtension
|
|
|
|
# Build script for the KTransformersOps extension (includes the marlin gemm
# source). The extension is compiled from the CUDA/C++ files listed below;
# paths are relative to this setup script.
_kt_ops_sources = [
    "custom_gguf/dequant.cu",
    "binding.cpp",
    "gptq_marlin/gptq_marlin.cu",
    # "gptq_marlin_repack.cu",  # disabled entry, kept for reference
]

# A single CUDA extension module named after the package itself.
_kt_ops_extension = CUDAExtension("KTransformersOps", _kt_ops_sources)

setup(
    name="KTransformersOps",
    ext_modules=[_kt_ops_extension],
    # Route `build_ext` through torch's BuildExtension command class.
    cmdclass={"build_ext": BuildExtension},
)
|
|
|