2024-05-13 10:44:30 +00:00
|
|
|
from text_generation_server.layers.tensor_parallel import (
|
|
|
|
TensorParallelColumnLinear,
|
|
|
|
TensorParallelRowLinear,
|
|
|
|
TensorParallelEmbedding,
|
|
|
|
)
|
|
|
|
from text_generation_server.layers.linear import (
|
|
|
|
get_linear,
|
|
|
|
FastLinear,
|
|
|
|
)
|
2024-05-14 10:33:18 +00:00
|
|
|
from text_generation_server.layers.speculative import SpeculativeHead
|
2024-05-13 10:44:30 +00:00
|
|
|
|
|
|
|
# Just to add the `load` methods.
|
|
|
|
from text_generation_server.layers.layernorm import load_layer_norm
|
|
|
|
from text_generation_server.layers.conv import load_conv2d
|
2024-06-25 18:46:27 +00:00
|
|
|
|
|
|
|
from text_generation_server.layers.lora import (
|
|
|
|
LoraLinear,
|
|
|
|
TensorParallelMultiAdapterLinear,
|
|
|
|
TensorParallelAdapterRowLinear,
|
|
|
|
)
|
2024-07-26 14:29:09 +00:00
|
|
|
|
|
|
|
# Public names exported by this module. Every entry corresponds to a name
# imported at the top of this file; the order is kept as originally listed.
__all__ = [
    "get_linear",
    "FastLinear",
    "TensorParallelColumnLinear",
    "TensorParallelRowLinear",
    "TensorParallelEmbedding",
    "SpeculativeHead",
    "LoraLinear",
    "TensorParallelMultiAdapterLinear",
    "TensorParallelAdapterRowLinear",
    "load_layer_norm",
    "load_conv2d",
]
|