mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-10 20:04:52 +00:00
Adding the flag to docker launcher.
This commit is contained in:
parent
e3c31c9d92
commit
26a271fad5
3
integration-tests/UNKNOWN.egg-info/PKG-INFO
Normal file
3
integration-tests/UNKNOWN.egg-info/PKG-INFO
Normal file
@ -0,0 +1,3 @@
|
||||
Metadata-Version: 2.1
|
||||
Name: UNKNOWN
|
||||
Version: 0.0.0
|
24
integration-tests/UNKNOWN.egg-info/SOURCES.txt
Normal file
24
integration-tests/UNKNOWN.egg-info/SOURCES.txt
Normal file
@ -0,0 +1,24 @@
|
||||
pyproject.toml
|
||||
UNKNOWN.egg-info/PKG-INFO
|
||||
UNKNOWN.egg-info/SOURCES.txt
|
||||
UNKNOWN.egg-info/dependency_links.txt
|
||||
UNKNOWN.egg-info/top_level.txt
|
||||
models/test_bloom_560m.py
|
||||
models/test_bloom_560m_sharded.py
|
||||
models/test_flash_awq.py
|
||||
models/test_flash_awq_sharded.py
|
||||
models/test_flash_falcon.py
|
||||
models/test_flash_llama.py
|
||||
models/test_flash_llama_gptq.py
|
||||
models/test_flash_mistral.py
|
||||
models/test_flash_neox.py
|
||||
models/test_flash_neox_sharded.py
|
||||
models/test_flash_santacoder.py
|
||||
models/test_flash_starcoder.py
|
||||
models/test_flash_starcoder_gptq.py
|
||||
models/test_idefics.py
|
||||
models/test_mpt.py
|
||||
models/test_mt0_base.py
|
||||
models/test_neox.py
|
||||
models/test_neox_sharded.py
|
||||
models/test_t5_sharded.py
|
1
integration-tests/UNKNOWN.egg-info/dependency_links.txt
Normal file
1
integration-tests/UNKNOWN.egg-info/dependency_links.txt
Normal file
@ -0,0 +1 @@
|
||||
|
1
integration-tests/UNKNOWN.egg-info/top_level.txt
Normal file
1
integration-tests/UNKNOWN.egg-info/top_level.txt
Normal file
@ -0,0 +1 @@
|
||||
models
|
@ -273,6 +273,7 @@ def launcher(event_loop):
|
||||
quantize: Optional[str] = None,
|
||||
trust_remote_code: bool = False,
|
||||
use_flash_attention: bool = True,
|
||||
dtype: Optional[str] = None
|
||||
):
|
||||
port = random.randint(8000, 10_000)
|
||||
|
||||
@ -283,6 +284,9 @@ def launcher(event_loop):
|
||||
if quantize is not None:
|
||||
args.append("--quantize")
|
||||
args.append(quantize)
|
||||
if dtype is not None:
|
||||
args.append("--dtype")
|
||||
args.append(dtype)
|
||||
if trust_remote_code:
|
||||
args.append("--trust-remote-code")
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user