from typing import List, Tuple import torch from text_generation_server.layers.marlin.fp8 import GPTQMarlinFP8Linear from text_generation_server.layers.marlin.gptq import ( GPTQMarlinLinear, GPTQMarlinWeight, can_use_gptq_marlin, repack_gptq_for_marlin, ) from text_generation_server.layers.marlin.marlin import MarlinWeightsLoader __all__ = [ "GPTQMarlinFP8Linear", "GPTQMarlinLinear", "GPTQMarlinWeight", "MarlinWeightsLoader", "can_use_gptq_marlin", "repack_gptq_for_marlin", ]