mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
Fix .
This commit is contained in:
parent
fa40801fb6
commit
e672f976fb
@ -236,6 +236,7 @@ def launcher(event_loop):
|
|||||||
use_flash_attention: bool = True,
|
use_flash_attention: bool = True,
|
||||||
disable_grammar_support: bool = False,
|
disable_grammar_support: bool = False,
|
||||||
dtype: Optional[str] = None,
|
dtype: Optional[str] = None,
|
||||||
|
revision: Optional[str] = None,
|
||||||
):
|
):
|
||||||
port = random.randint(8000, 10_000)
|
port = random.randint(8000, 10_000)
|
||||||
master_port = random.randint(10_000, 20_000)
|
master_port = random.randint(10_000, 20_000)
|
||||||
@ -268,6 +269,9 @@ def launcher(event_loop):
|
|||||||
if dtype is not None:
|
if dtype is not None:
|
||||||
args.append("--dtype")
|
args.append("--dtype")
|
||||||
args.append(dtype)
|
args.append(dtype)
|
||||||
|
if revision is not None:
|
||||||
|
args.append("--revision")
|
||||||
|
args.append(revision)
|
||||||
if trust_remote_code:
|
if trust_remote_code:
|
||||||
args.append("--trust-remote-code")
|
args.append("--trust-remote-code")
|
||||||
|
|
||||||
|
@ -3,7 +3,9 @@ import pytest
|
|||||||
|
|
||||||
@pytest.fixture(scope="module")
|
@pytest.fixture(scope="module")
|
||||||
def flash_medusa_handle(launcher):
|
def flash_medusa_handle(launcher):
|
||||||
with launcher("FasterDecoding/medusa-vicuna-7b-v1.3", num_shard=2, revision="refs/pr/1") as handle:
|
with launcher(
|
||||||
|
"FasterDecoding/medusa-vicuna-7b-v1.3", num_shard=2, revision="refs/pr/1"
|
||||||
|
) as handle:
|
||||||
yield handle
|
yield handle
|
||||||
|
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user