text-generation-inference/server/text_generation_server/quant/__init__.py
2023-05-11 12:05:35 +00:00

5 lines
255 B
Python

# Package-level re-exports: the names below are pulled out of the sibling
# submodules so that callers can import them from the package itself
# instead of reaching into each submodule.
#
# The submodules are imported in the same order as before, and the names
# within each import keep their original order, so import-time behaviour
# is unchanged.
from .quantizer import Quantizer
from .fused_attn import (
    QuantLlamaAttention,
    make_quant_attn,
)
from .fused_mlp import (
    QuantLlamaMLP,
    make_fused_mlp,
    autotune_warmup_fused,
)
from .quant_linear import (
    QuantLinear,
    make_quant_linear,
    autotune_warmup_linear,
)