diff --git a/.github/workflows/nix_integration_tests.yaml b/.github/workflows/nix_integration_tests.yaml index 4da36ec8..e480ba62 100644 --- a/.github/workflows/nix_integration_tests.yaml +++ b/.github/workflows/nix_integration_tests.yaml @@ -38,7 +38,8 @@ jobs: export NCCL_P2P_DISABLE=1 sudo find $NVIDIA . -name 'libcuda.so*' -exec ln -s {} /run/opengl-driver/lib/ \; sudo find $NVIDIA . -name 'libnvidia-ml.so*' -exec ln -s {} /run/opengl-driver/lib/ \; - nix develop .#test --command pytest -svvx integration-tests/ --release + nix develop .#test --command pytest -svvx integration-tests/models/test_bloom_560m.py::test_bloom_560m_all_params --release + # nix develop .#test --command pytest -svvx integration-tests/ --release env: HF_TOKEN: ${{ secrets.HF_TOKEN }} HF_HOME: /mnt/hf_cache/ diff --git a/integration-tests/conftest.py b/integration-tests/conftest.py index 83ba2d71..bcc4342c 100644 --- a/integration-tests/conftest.py +++ b/integration-tests/conftest.py @@ -456,6 +456,12 @@ def launcher(event_loop): args.append("--disable-grammar-support") if num_shard is not None: args.extend(["--num-shard", str(num_shard)]) + else: + try: + os.environ["WORLD_SIZE"] = 1 + del os.environ["NUM_SHARD"] + except Exception: + pass if quantize is not None: args.append("--quantize") args.append(quantize)