mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-20 06:12:07 +00:00
revert to old version
This commit is contained in:
parent
c3e2b79a9e
commit
c01d9b9d99
@ -8,7 +8,7 @@ environment_variables:
|
|||||||
MODEL_ID: bigscience/bloom
|
MODEL_ID: bigscience/bloom
|
||||||
NUM_SHARD: 8
|
NUM_SHARD: 8
|
||||||
environment:
|
environment:
|
||||||
image: db4c2190dd824d1f950f5d1555fbadf0.azurecr.io/text-generation-inference:sha-941cd42
|
image: db4c2190dd824d1f950f5d1555fbadf0.azurecr.io/text-generation-inference:sha-4e685d9
|
||||||
inference_config:
|
inference_config:
|
||||||
liveness_route:
|
liveness_route:
|
||||||
port: 80
|
port: 80
|
||||||
@ -25,14 +25,14 @@ request_settings:
|
|||||||
max_concurrent_requests_per_instance: 256
|
max_concurrent_requests_per_instance: 256
|
||||||
liveness_probe:
|
liveness_probe:
|
||||||
initial_delay: 200
|
initial_delay: 200
|
||||||
timeout: 20
|
timeout: 60
|
||||||
period: 60
|
period: 60
|
||||||
success_threshold: 1
|
success_threshold: 1
|
||||||
failure_threshold: 5
|
failure_threshold: 2
|
||||||
readiness_probe:
|
readiness_probe:
|
||||||
initial_delay: 200
|
initial_delay: 200
|
||||||
timeout: 20
|
timeout: 60
|
||||||
period: 60
|
period: 60
|
||||||
success_threshold: 1
|
success_threshold: 1
|
||||||
failure_threshold: 5
|
failure_threshold: 2
|
||||||
instance_count: 1
|
instance_count: 1
|
||||||
|
Loading…
Reference in New Issue
Block a user