From 2007269fe7eaecc37d96feccd8cbd71bf01ac18c Mon Sep 17 00:00:00 2001
From: "Wang, Yi A"
Date: Sat, 3 May 2025 20:54:58 -0700
Subject: [PATCH] lazy mode

Signed-off-by: Wang, Yi A
---
Notes (review; this section is ignored when the patch is applied):
    - Adds the image-level default `ENV PT_HPU_LAZY_MODE=1` directly after
      the existing `ENV PREFILL_CHUNKING=0` default in Dockerfile_gaudi.
      No other line of the Dockerfile is touched.
    - Presumably this selects the Gaudi PyTorch bridge's lazy execution
      mode (per the subject line) -- TODO confirm against the Intel Gaudi
      runtime documentation for the HABANA_VERSION in use.
    - NOTE(review): the From:/Signed-off-by: lines carry no e-mail address
      in this copy; `git am` may refuse the patch until one is restored.

 Dockerfile_gaudi | 1 +
 1 file changed, 1 insertion(+)

diff --git a/Dockerfile_gaudi b/Dockerfile_gaudi
index 06073fe4..5bb5b606 100644
--- a/Dockerfile_gaudi
+++ b/Dockerfile_gaudi
@@ -60,6 +60,7 @@ FROM vault.habana.ai/gaudi-docker/${HABANA_VERSION}/ubuntu22.04/habanalabs/pytor
 ENV ATTENTION=default
 ENV PREFIX_CACHING=0
 ENV PREFILL_CHUNKING=0
+ENV PT_HPU_LAZY_MODE=1
 
 # Text Generation Inference base env
 ENV HF_HOME=/data \