mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 20:34:54 +00:00
fix: run lint and update docs
This commit is contained in:
parent
1fb9d406e7
commit
1c917c0349
@ -2183,4 +2183,4 @@
|
|||||||
"description": "Hugging Face Text Generation Inference API"
|
"description": "Hugging Face Text Generation Inference API"
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
}
|
}
|
@ -20,6 +20,7 @@ Text Generation Inference enables serving optimized models on specific hardware
|
|||||||
- [Mixtral](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1)
|
- [Mixtral](https://huggingface.co/mistralai/Mixtral-8x22B-Instruct-v0.1)
|
||||||
- [Gpt Bigcode](https://huggingface.co/bigcode/gpt_bigcode-santacoder)
|
- [Gpt Bigcode](https://huggingface.co/bigcode/gpt_bigcode-santacoder)
|
||||||
- [Phi](https://huggingface.co/microsoft/phi-1_5)
|
- [Phi](https://huggingface.co/microsoft/phi-1_5)
|
||||||
|
- [PhiMoe](https://huggingface.co/microsoft/Phi-3.5-MoE-instruct)
|
||||||
- [Baichuan](https://huggingface.co/baichuan-inc/Baichuan2-7B-Chat)
|
- [Baichuan](https://huggingface.co/baichuan-inc/Baichuan2-7B-Chat)
|
||||||
- [Falcon](https://huggingface.co/tiiuae/falcon-7b-instruct)
|
- [Falcon](https://huggingface.co/tiiuae/falcon-7b-instruct)
|
||||||
- [StarCoder 2](https://huggingface.co/bigcode/starcoder2-15b-instruct-v0.1)
|
- [StarCoder 2](https://huggingface.co/bigcode/starcoder2-15b-instruct-v0.1)
|
||||||
|
@ -4,9 +4,7 @@ import pytest
|
|||||||
@pytest.fixture(scope="module")
|
@pytest.fixture(scope="module")
|
||||||
def flash_llama_chat_handle(launcher):
|
def flash_llama_chat_handle(launcher):
|
||||||
with launcher(
|
with launcher(
|
||||||
"microsoft/Phi-3.5-MoE-instruct",
|
"microsoft/Phi-3.5-MoE-instruct", num_shard=4, cuda_graphs=[1, 2]
|
||||||
num_shard=4,
|
|
||||||
cuda_graphs=[1, 2]
|
|
||||||
) as handle:
|
) as handle:
|
||||||
yield handle
|
yield handle
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user