mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-23 07:52:06 +00:00
18 lines
478 B
Python
18 lines
478 B
Python
|
# Package-level re-exports: the names below are imported from the fp8, gptq
# and marlin submodules so callers can import them from this package directly.
from text_generation_server.layers.marlin.fp8 import GPTQMarlinFP8Linear
from text_generation_server.layers.marlin.gptq import (
    GPTQMarlinLinear,
    GPTQMarlinWeight,
    can_use_gptq_marlin,
    repack_gptq_for_marlin,
)
from text_generation_server.layers.marlin.marlin import MarlinWeightsLoader

# Explicit public API; every entry corresponds to one of the imports above.
__all__ = [
    "GPTQMarlinFP8Linear",
    "GPTQMarlinLinear",
    "GPTQMarlinWeight",
    "MarlinWeightsLoader",
    "can_use_gptq_marlin",
    "repack_gptq_for_marlin",
]
|