mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-24 00:12:08 +00:00
38 lines
1014 B
Python
38 lines
1014 B
Python
from text_generation_server.layers.tensor_parallel import (
|
|
TensorParallelColumnLinear,
|
|
TensorParallelRowLinear,
|
|
TensorParallelEmbedding,
|
|
)
|
|
from text_generation_server.layers.linear import (
|
|
get_linear,
|
|
FastLinear,
|
|
)
|
|
from text_generation_server.layers.speculative import SpeculativeHead
|
|
|
|
# Just to add the `load` methods.
|
|
from text_generation_server.layers.layernorm import load_layer_norm
|
|
from text_generation_server.layers.conv import load_conv2d
|
|
|
|
from text_generation_server.layers.lora import (
|
|
LoraLinear,
|
|
TensorParallelMultiAdapterLinear,
|
|
TensorParallelAdapterRowLinear,
|
|
)
|
|
|
|
from text_generation_server.layers.moe.fused_moe_rocm import grouped_topk
|
|
|
|
# Public names re-exported by this package. Entries are grouped by the
# submodule they are imported from at the top of this file. Keep this a plain
# list literal so linters and type checkers can resolve the re-exports.
__all__ = [
    # text_generation_server.layers.linear
    "get_linear",
    "FastLinear",
    # text_generation_server.layers.tensor_parallel
    "TensorParallelColumnLinear",
    "TensorParallelRowLinear",
    "TensorParallelEmbedding",
    # text_generation_server.layers.speculative
    "SpeculativeHead",
    # text_generation_server.layers.lora
    "LoraLinear",
    "TensorParallelMultiAdapterLinear",
    "TensorParallelAdapterRowLinear",
    # text_generation_server.layers.layernorm / text_generation_server.layers.conv
    "load_layer_norm",
    "load_conv2d",
    # text_generation_server.layers.moe.fused_moe_rocm
    "grouped_topk",
]
|