mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
Forgot docker launcher.
This commit is contained in:
parent
bfec09ecc2
commit
915e5f088c
@@ -306,6 +306,7 @@ def launcher(event_loop):
|
||||
use_flash_attention: bool = True,
|
||||
disable_grammar_support: bool = False,
|
||||
dtype: Optional[str] = None,
|
||||
revision: Optional[str] = None,
|
||||
):
|
||||
port = random.randint(8000, 10_000)
|
||||
|
||||
@@ -321,6 +322,9 @@ def launcher(event_loop):
|
||||
if dtype is not None:
|
||||
args.append("--dtype")
|
||||
args.append(dtype)
|
||||
if revision is not None:
|
||||
args.append("--revision")
|
||||
args.append(revision)
|
||||
if trust_remote_code:
|
||||
args.append("--trust-remote-code")
|
||||
|
||||
|
@@ -154,12 +154,8 @@ def download_weights(
|
||||
import json
|
||||
|
||||
medusa_head = hf_hub_download(
|
||||
-model_id, revision=revision, filename="medusa_lm_head.pt"
|
||||
+model_id, revision=revision, filename="medusa_lm_head.safetensors"
|
||||
)
|
||||
-if auto_convert:
|
||||
-medusa_sf = Path(medusa_head[: -len(".pt")] + ".safetensors")
|
||||
-if not medusa_sf.exists():
|
||||
-utils.convert_files([Path(medusa_head)], [medusa_sf], [])
|
||||
medusa_config = hf_hub_download(
|
||||
model_id, revision=revision, filename="config.json"
|
||||
)
|
||||
|
Loading…
Reference in New Issue
Block a user