# Mirror of https://github.com/huggingface/text-generation-inference.git
# Synced 2025-04-24 00:12:08 +00:00
# 21 lines, 523 B, Python
"""Gather the Marlin layer names in one importable place.

This module defines nothing of its own. It imports names from the ``fp8``,
``gptq`` and ``marlin`` submodules of ``text_generation_server.layers.marlin``
and lists them in ``__all__``.
"""

# NOTE(review): ``List``, ``Tuple`` and ``torch`` are not referenced by the
# code visible in this module. They are kept untouched because other code may
# rely on them being imported here -- confirm before removing.
from typing import List, Tuple

import torch

from text_generation_server.layers.marlin.fp8 import GPTQMarlinFP8Linear
from text_generation_server.layers.marlin.gptq import (
    GPTQMarlinLinear,
    GPTQMarlinWeight,
    can_use_gptq_marlin,
    repack_gptq_for_marlin,
)
from text_generation_server.layers.marlin.marlin import MarlinWeightsLoader

# Names exposed by a star-import of this module; every entry is imported above.
__all__ = [
    "GPTQMarlinFP8Linear",
    "GPTQMarlinLinear",
    "GPTQMarlinWeight",
    "MarlinWeightsLoader",
    "can_use_gptq_marlin",
    "repack_gptq_for_marlin",
]