# Mirror of https://github.com/kvcache-ai/ktransformers.git
# Synced 2025-09-05 20:19:51 +00:00
# 26 lines, no EOL, 729 B, Python
"""Build script for the ``KTransformersOps`` CUDA extension.

Running this file through setuptools compiles the listed C++/CUDA sources
into a single extension module named ``KTransformersOps`` using PyTorch's
``BuildExtension`` command.
"""
from setuptools import setup, Extension
from torch.utils import cpp_extension
from torch.utils.cpp_extension import BuildExtension, CUDAExtension

_EXTENSION_NAME = 'KTransformersOps'

# Translation units compiled into the extension, in the order they are
# handed to the build. 'gptq_marlin_repack.cu' is currently disabled and
# therefore not part of the build.
_SOURCES = [
    'custom_gguf/dequant.cu',
    'binding.cpp',
    'gptq_marlin/gptq_marlin.cu',
]

# Flags for the host C++ compiler.
_CXX_FLAGS = ['-O3']

# Flags for nvcc; '-Xcompiler' forwards the following '-fPIC' to the host
# compiler that nvcc drives.
_NVCC_FLAGS = [
    '-O3',
    '--use_fast_math',
    '-Xcompiler', '-fPIC',
]

_ktransformers_ops = CUDAExtension(
    _EXTENSION_NAME,
    _SOURCES,
    extra_compile_args={
        'cxx': _CXX_FLAGS,
        'nvcc': _NVCC_FLAGS,
    },
)

setup(
    name=_EXTENSION_NAME,
    ext_modules=[_ktransformers_ops],
    cmdclass={'build_ext': BuildExtension},
)