mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 11:54:52 +00:00
Add kernel target.
This commit is contained in:
parent
12191b7e42
commit
c6e702fb2f
@ -23,6 +23,7 @@ setup(
|
||||
"custom_kernels/exllama/cuda_func/q4_matmul.cu",
|
||||
"custom_kernels/exllama/cuda_func/q4_matrix.cu"
|
||||
],
|
||||
sources=["custom_kernels/fused_attention_cuda.cu"],
|
||||
)
|
||||
],
|
||||
cmdclass={"build_ext": BuildExtension},
|
||||
|
Loading…
Reference in New Issue
Block a user