revert to old version

This commit is contained in:
OlivierDehaene 2023-03-10 14:39:35 +01:00
parent c3e2b79a9e
commit c01d9b9d99

View File

@@ -8,7 +8,7 @@ environment_variables:
MODEL_ID: bigscience/bloom MODEL_ID: bigscience/bloom
NUM_SHARD: 8 NUM_SHARD: 8
environment: environment:
image: db4c2190dd824d1f950f5d1555fbadf0.azurecr.io/text-generation-inference:sha-941cd42 image: db4c2190dd824d1f950f5d1555fbadf0.azurecr.io/text-generation-inference:sha-4e685d9
inference_config: inference_config:
liveness_route: liveness_route:
port: 80 port: 80
@@ -25,14 +25,14 @@ request_settings:
max_concurrent_requests_per_instance: 256 max_concurrent_requests_per_instance: 256
liveness_probe: liveness_probe:
initial_delay: 200 initial_delay: 200
timeout: 20 timeout: 60
period: 60 period: 60
success_threshold: 1 success_threshold: 1
failure_threshold: 5 failure_threshold: 2
readiness_probe: readiness_probe:
initial_delay: 200 initial_delay: 200
timeout: 20 timeout: 60
period: 60 period: 60
success_threshold: 1 success_threshold: 1
failure_threshold: 5 failure_threshold: 2
instance_count: 1 instance_count: 1