mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-12 04:44:52 +00:00
On 2 GPUs
This commit is contained in:
parent
ccc4fa24f8
commit
7081b8fb4d
4
.github/workflows/build.yaml
vendored
4
.github/workflows/build.yaml
vendored
@@ -183,7 +183,7 @@ jobs:
|
||||
- name: Set up Python
|
||||
uses: actions/setup-python@v4
|
||||
with:
|
||||
python-version: "3.10"
|
||||
python-version: "3.11"
|
||||
- name: Install
|
||||
run: |
|
||||
make install-integration-tests
|
||||
@@ -197,7 +197,7 @@ jobs:
|
||||
# export EXTRA_PYTEST="${{ needs.build-and-push.outputs.extra_pytest }}"
|
||||
export HF_TOKEN=${{ secrets.HF_TOKEN }}
|
||||
echo $DOCKER_IMAGE
|
||||
python -c 'import docker; client = docker.from_env(); client.containers.run("registry.internal.huggingface.tech/api-inference/community/text-generation-inference:sha-318bbc7-rocm", devices=["/dev/kfd", "/dev/dri"], environment={"MODEL_ID": "gpt2"})'
|
||||
python -c 'import docker; client = docker.from_env(); client.containers.run("registry.internal.huggingface.tech/api-inference/community/text-generation-inference:sha-318bbc7-rocm", devices=["/dev/kfd", "/dev/dri"], environment={"MODEL_ID": "gpt2", "NUM_SHARD": 2})'
|
||||
# which pytest
|
||||
pip freeze
|
||||
# pytest -s -vv integration-tests -k flash_llama_grammar_tools_auto
|
||||
|
Loading…
Reference in New Issue
Block a user