mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-09 03:14:53 +00:00
lazy mode
Signed-off-by: Wang, Yi A <yi.a.wang@intel.com>
This commit is contained in:
parent
3db50ed9d3
commit
2007269fe7
@ -60,6 +60,7 @@ FROM vault.habana.ai/gaudi-docker/${HABANA_VERSION}/ubuntu22.04/habanalabs/pytor
|
|||||||
ENV ATTENTION=default
|
ENV ATTENTION=default
|
||||||
ENV PREFIX_CACHING=0
|
ENV PREFIX_CACHING=0
|
||||||
ENV PREFILL_CHUNKING=0
|
ENV PREFILL_CHUNKING=0
|
||||||
|
ENV PT_HPU_LAZY_MODE=1
|
||||||
|
|
||||||
# Text Generation Inference base env
|
# Text Generation Inference base env
|
||||||
ENV HF_HOME=/data \
|
ENV HF_HOME=/data \
|
||||||
|
Loading…
Reference in New Issue
Block a user