mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-09 02:42:05 +00:00
add attribution
This commit is contained in:
parent
ee7ba48b9a
commit
c858d791e5
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#define _cuda_buffers_cu
|
#define _cuda_buffers_cu
|
||||||
#include "cuda_buffers.cuh"
|
#include "cuda_buffers.cuh"
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _cuda_buffers_cuh
|
#ifndef _cuda_buffers_cuh
|
||||||
#define _cuda_buffers_cuh
|
#define _cuda_buffers_cuh
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _cuda_compat_cuh
|
#ifndef _cuda_compat_cuh
|
||||||
#define _cuda_compat_cuh
|
#define _cuda_compat_cuh
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#include "column_remap.cuh"
|
#include "column_remap.cuh"
|
||||||
#include "../util.cuh"
|
#include "../util.cuh"
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _column_remap_cuh
|
#ifndef _column_remap_cuh
|
||||||
#define _column_remap_cuh
|
#define _column_remap_cuh
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _q4_matmul_cuh
|
#ifndef _q4_matmul_cuh
|
||||||
#define _q4_matmul_cuh
|
#define _q4_matmul_cuh
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#include "q4_matrix.cuh"
|
#include "q4_matrix.cuh"
|
||||||
#include <vector>
|
#include <vector>
|
||||||
#include "../util.cuh"
|
#include "../util.cuh"
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _q4_matrix_cuh
|
#ifndef _q4_matrix_cuh
|
||||||
#define _q4_matrix_cuh
|
#define _q4_matrix_cuh
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#include <torch/extension.h>
|
#include <torch/extension.h>
|
||||||
#include <c10/cuda/CUDAGuard.h>
|
#include <c10/cuda/CUDAGuard.h>
|
||||||
#include <ATen/cuda/CUDAContext.h>
|
#include <ATen/cuda/CUDAContext.h>
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _matrix_cuh
|
#ifndef _matrix_cuh
|
||||||
#define _matrix_cuh
|
#define _matrix_cuh
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _tuning_h
|
#ifndef _tuning_h
|
||||||
#define _tuning_h
|
#define _tuning_h
|
||||||
|
|
||||||
|
@ -1,3 +1,5 @@
|
|||||||
|
// Adapted from turboderp exllama: https://github.com/turboderp/exllama
|
||||||
|
|
||||||
#ifndef _util_cuh
|
#ifndef _util_cuh
|
||||||
#define _util_cuh
|
#define _util_cuh
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user