diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml index 09302cc4..99844974 100644 --- a/.github/workflows/build.yaml +++ b/.github/workflows/build.yaml @@ -193,5 +193,7 @@ jobs: export DOCKER_DEVICES=${{ needs.build-and-push.outputs.docker_devices }} export EXTRA_PYTEST="${{ needs.build-and-push.outputs.extra_pytest }}" export HF_TOKEN=${{ secrets.HF_TOKEN }} + export ROCR_VISIBLE_DEVICES=0,1 echo $DOCKER_IMAGE + rocm-smi pytest -s -vv integration-tests ${PYTEST_FLAGS} ${EXTRA_PYTEST} diff --git a/integration-tests/conftest.py b/integration-tests/conftest.py index eb55ebb9..b188e264 100644 --- a/integration-tests/conftest.py +++ b/integration-tests/conftest.py @@ -534,6 +534,10 @@ def launcher(event_loop): yield ContainerLauncherHandle(client, container.name, port) + import time + + time.sleep(600) + if not use_flash_attention: del env["USE_FLASH_ATTENTION"] @@ -589,7 +593,6 @@ def generate_multi(): max_new_tokens: int, seed: Optional[int] = None, ) -> List[Response]: - import numpy as np arange = np.arange(len(prompts))