mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-21 23:12:07 +00:00
Disabling the sharding please.
This commit is contained in:
parent
5827137a29
commit
e680a57147
4
.github/workflows/nix_integration_tests.yaml
vendored
4
.github/workflows/nix_integration_tests.yaml
vendored
@ -21,6 +21,10 @@ jobs:
|
|||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
- uses: cachix/install-nix-action@v27
|
- uses: cachix/install-nix-action@v27
|
||||||
|
- name: Setup nix to mounted disk
|
||||||
|
run: |
|
||||||
|
sudo mkdir -p /mnt/hf_cache/nix/
|
||||||
|
sudo ln -s /mnt/hf_cache/nix /nix
|
||||||
- uses: cachix/cachix-action@v14
|
- uses: cachix/cachix-action@v14
|
||||||
with:
|
with:
|
||||||
name: text-generation-inference
|
name: text-generation-inference
|
||||||
|
@ -370,11 +370,7 @@ def launcher(event_loop):
|
|||||||
if num_shard is not None:
|
if num_shard is not None:
|
||||||
args.extend(["--num-shard", str(num_shard)])
|
args.extend(["--num-shard", str(num_shard)])
|
||||||
else:
|
else:
|
||||||
try:
|
args.extend(["--sharded", "false"])
|
||||||
os.environ["WORLD_SIZE"] = 1
|
|
||||||
del os.environ["NUM_SHARD"]
|
|
||||||
except Exception:
|
|
||||||
pass
|
|
||||||
if quantize is not None:
|
if quantize is not None:
|
||||||
args.append("--quantize")
|
args.append("--quantize")
|
||||||
args.append(quantize)
|
args.append(quantize)
|
||||||
@ -457,11 +453,7 @@ def launcher(event_loop):
|
|||||||
if num_shard is not None:
|
if num_shard is not None:
|
||||||
args.extend(["--num-shard", str(num_shard)])
|
args.extend(["--num-shard", str(num_shard)])
|
||||||
else:
|
else:
|
||||||
try:
|
args.extend(["--sharded", "false"])
|
||||||
os.environ["WORLD_SIZE"] = 1
|
|
||||||
del os.environ["NUM_SHARD"]
|
|
||||||
except Exception:
|
|
||||||
pass
|
|
||||||
if quantize is not None:
|
if quantize is not None:
|
||||||
args.append("--quantize")
|
args.append("--quantize")
|
||||||
args.append(quantize)
|
args.append(quantize)
|
||||||
|
Loading…
Reference in New Issue
Block a user