mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
Fix .
This commit is contained in:
parent
fa40801fb6
commit
e672f976fb
@@ -236,6 +236,7 @@ def launcher(event_loop):
|
||||
use_flash_attention: bool = True,
|
||||
disable_grammar_support: bool = False,
|
||||
dtype: Optional[str] = None,
|
||||
revision: Optional[str] = None,
|
||||
):
|
||||
port = random.randint(8000, 10_000)
|
||||
master_port = random.randint(10_000, 20_000)
|
||||
@@ -268,6 +269,9 @@ def launcher(event_loop):
|
||||
if dtype is not None:
|
||||
args.append("--dtype")
|
||||
args.append(dtype)
|
||||
if revision is not None:
|
||||
args.append("--revision")
|
||||
args.append(revision)
|
||||
if trust_remote_code:
|
||||
args.append("--trust-remote-code")
|
||||
|
||||
|
@@ -3,7 +3,9 @@ import pytest
|
||||
|
||||
@pytest.fixture(scope="module")
|
||||
def flash_medusa_handle(launcher):
|
||||
with launcher("FasterDecoding/medusa-vicuna-7b-v1.3", num_shard=2, revision="refs/pr/1") as handle:
|
||||
with launcher(
|
||||
"FasterDecoding/medusa-vicuna-7b-v1.3", num_shard=2, revision="refs/pr/1"
|
||||
) as handle:
|
||||
yield handle
|
||||
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user