mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
Forgot docker launcher.
This commit is contained in:
parent
bfec09ecc2
commit
915e5f088c
@@ -306,6 +306,7 @@ def launcher(event_loop):
|
|||||||
use_flash_attention: bool = True,
|
use_flash_attention: bool = True,
|
||||||
disable_grammar_support: bool = False,
|
disable_grammar_support: bool = False,
|
||||||
dtype: Optional[str] = None,
|
dtype: Optional[str] = None,
|
||||||
|
revision: Optional[str] = None,
|
||||||
):
|
):
|
||||||
port = random.randint(8000, 10_000)
|
port = random.randint(8000, 10_000)
|
||||||
|
|
||||||
@@ -321,6 +322,9 @@ def launcher(event_loop):
|
|||||||
if dtype is not None:
|
if dtype is not None:
|
||||||
args.append("--dtype")
|
args.append("--dtype")
|
||||||
args.append(dtype)
|
args.append(dtype)
|
||||||
|
if revision is not None:
|
||||||
|
args.append("--revision")
|
||||||
|
args.append(revision)
|
||||||
if trust_remote_code:
|
if trust_remote_code:
|
||||||
args.append("--trust-remote-code")
|
args.append("--trust-remote-code")
|
||||||
|
|
||||||
|
@@ -154,12 +154,8 @@ def download_weights(
|
|||||||
import json
|
import json
|
||||||
|
|
||||||
medusa_head = hf_hub_download(
|
medusa_head = hf_hub_download(
|
||||||
model_id, revision=revision, filename="medusa_lm_head.pt"
|
model_id, revision=revision, filename="medusa_lm_head.safetensors"
|
||||||
)
|
)
|
||||||
if auto_convert:
|
|
||||||
medusa_sf = Path(medusa_head[: -len(".pt")] + ".safetensors")
|
|
||||||
if not medusa_sf.exists():
|
|
||||||
utils.convert_files([Path(medusa_head)], [medusa_sf], [])
|
|
||||||
medusa_config = hf_hub_download(
|
medusa_config = hf_hub_download(
|
||||||
model_id, revision=revision, filename="config.json"
|
model_id, revision=revision, filename="config.json"
|
||||||
)
|
)
|
||||||
|
Loading…
Reference in New Issue
Block a user