mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-06-06 17:32:09 +00:00
add FastLinear import (#750)
# What does this PR do?

Fixes #749

## Who can review?

Anyone in the community is free to review the PR once the tests have passed. Feel free to tag members/contributors who may be interested in your PR.

<!-- Your PR will be replied to more quickly if you can figure out the right person to tag with @ @OlivierDehaene OR @Narsil -->

Co-authored-by: p_spozzhang <p_spozzhang@tencent.com>
This commit is contained in:
parent
7766fee9b1
commit
bd3088748e
@@ -28,6 +28,7 @@ from transformers.modeling_outputs import (
|
|||||||
from transformers.modeling_utils import PreTrainedModel
|
from transformers.modeling_utils import PreTrainedModel
|
||||||
from transformers import OPTConfig
|
from transformers import OPTConfig
|
||||||
from text_generation_server.utils.layers import (
|
from text_generation_server.utils.layers import (
|
||||||
|
FastLinear,
|
||||||
TensorParallelColumnLinear,
|
TensorParallelColumnLinear,
|
||||||
TensorParallelEmbedding,
|
TensorParallelEmbedding,
|
||||||
TensorParallelRowLinear,
|
TensorParallelRowLinear,
|
||||||
|
Loading…
Reference in New Issue
Block a user