# Patch for aml/deployment.yaml (two hunks):
#   1. Changes the text-generation-inference image tag from sha-e520d5b
#      to sha-4e685d9.
#   2. Changes the scoring route path from /generate to /.
# NOTE(review): hunk 2 presumably relies on the new image serving
# generation requests at the root path - confirm before deploying.
# NOTE(review): line breaks and YAML indentation were reconstructed from a
# whitespace-collapsed copy of this patch - verify against the target file.
diff --git a/aml/deployment.yaml b/aml/deployment.yaml
index ad4cf8e4..3b4a9e2e 100644
--- a/aml/deployment.yaml
+++ b/aml/deployment.yaml
@@ -8,7 +8,7 @@ environment_variables:
   MODEL_ID: bigscience/bloom
   NUM_SHARD: 8
 environment:
-  image: db4c2190dd824d1f950f5d1555fbadf0.azurecr.io/text-generation-inference:sha-e520d5b
+  image: db4c2190dd824d1f950f5d1555fbadf0.azurecr.io/text-generation-inference:sha-4e685d9
   inference_config:
     liveness_route:
       port: 80
@@ -18,7 +18,7 @@ environment:
       path: /health
     scoring_route:
       port: 80
-      path: /generate
+      path: /
 instance_type: Standard_ND96amsr_A100_v4
 request_settings:
   request_timeout_ms: 60000