mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-29 14:02:12 +00:00
Wtf ?
This commit is contained in:
parent
a34dbb0ca1
commit
5827137a29
3
.github/workflows/nix_integration_tests.yaml
vendored
3
.github/workflows/nix_integration_tests.yaml
vendored
@@ -38,7 +38,8 @@ jobs:
|
|||||||
export NCCL_P2P_DISABLE=1
|
export NCCL_P2P_DISABLE=1
|
||||||
sudo find $NVIDIA . -name 'libcuda.so*' -exec ln -s {} /run/opengl-driver/lib/ \;
|
sudo find $NVIDIA . -name 'libcuda.so*' -exec ln -s {} /run/opengl-driver/lib/ \;
|
||||||
sudo find $NVIDIA . -name 'libnvidia-ml.so*' -exec ln -s {} /run/opengl-driver/lib/ \;
|
sudo find $NVIDIA . -name 'libnvidia-ml.so*' -exec ln -s {} /run/opengl-driver/lib/ \;
|
||||||
nix develop .#test --command pytest -svvx integration-tests/ --release
|
nix develop .#test --command pytest -svvx integration-tests/models/test_bloom_560m.py::test_bloom_560m_all_params --release
|
||||||
|
# nix develop .#test --command pytest -svvx integration-tests/ --release
|
||||||
env:
|
env:
|
||||||
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
HF_TOKEN: ${{ secrets.HF_TOKEN }}
|
||||||
HF_HOME: /mnt/hf_cache/
|
HF_HOME: /mnt/hf_cache/
|
||||||
|
@@ -456,6 +456,12 @@ def launcher(event_loop):
|
|||||||
args.append("--disable-grammar-support")
|
args.append("--disable-grammar-support")
|
||||||
if num_shard is not None:
|
if num_shard is not None:
|
||||||
args.extend(["--num-shard", str(num_shard)])
|
args.extend(["--num-shard", str(num_shard)])
|
||||||
|
else:
|
||||||
|
try:
|
||||||
|
os.environ["WORLD_SIZE"] = 1
|
||||||
|
del os.environ["NUM_SHARD"]
|
||||||
|
except Exception:
|
||||||
|
pass
|
||||||
if quantize is not None:
|
if quantize is not None:
|
||||||
args.append("--quantize")
|
args.append("--quantize")
|
||||||
args.append(quantize)
|
args.append(quantize)
|
||||||
|
Loading…
Reference in New Issue
Block a user