mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-05-23 02:32:09 +00:00
enable multi-card test
This commit is contained in:
parent
29b9c320fc
commit
c3241f4279
2
.github/workflows/build.yaml
vendored
2
.github/workflows/build.yaml
vendored
@ -129,7 +129,7 @@ jobs:
|
|||||||
export label_extension="-gaudi"
|
export label_extension="-gaudi"
|
||||||
export docker_volume="/mnt/cache"
|
export docker_volume="/mnt/cache"
|
||||||
export docker_devices=""
|
export docker_devices=""
|
||||||
export runs_on="itac-bm-emr-gaudi3-dell-1gaudi"
|
export runs_on="itac-bm-emr-gaudi3-dell-8gaudi"
|
||||||
export platform=""
|
export platform=""
|
||||||
export extra_pytest="--gaudi"
|
export extra_pytest="--gaudi"
|
||||||
export target=""
|
export target=""
|
||||||
|
@ -32,6 +32,7 @@ TEST_CONFIGS = {
|
|||||||
"--max-batch-prefill-tokens",
|
"--max-batch-prefill-tokens",
|
||||||
"2048",
|
"2048",
|
||||||
],
|
],
|
||||||
|
"run_by_default": True,
|
||||||
},
|
},
|
||||||
"meta-llama/Llama-3.1-8B-Instruct": {
|
"meta-llama/Llama-3.1-8B-Instruct": {
|
||||||
"model_id": "meta-llama/Llama-3.1-8B-Instruct",
|
"model_id": "meta-llama/Llama-3.1-8B-Instruct",
|
||||||
|
Loading…
Reference in New Issue
Block a user