diff --git a/Dockerfile b/Dockerfile index 91b5b337..a963db2f 100644 --- a/Dockerfile +++ b/Dockerfile @@ -208,7 +208,7 @@ COPY server/Makefile server/Makefile ENV UV_SYSTEM_PYTHON=1 RUN cd server && \ pip install -U pip uv && \ - uv sync --frozen --extra gen --extra attention --extra bnb --extra accelerate --extra compressed-tensors --extra marlin --extra moe --extra quantize --extra peft --extra outlines && \ + uv sync --frozen --extra gen --extra attention --extra bnb --extra accelerate --extra compressed-tensors --extra marlin --extra moe --extra quantize --extra peft --extra outlines --no-install-project && \ . ./.venv/bin/activate && \ make gen-server-raw diff --git a/Dockerfile_amd b/Dockerfile_amd index 79d983a7..f95f3b6d 100644 --- a/Dockerfile_amd +++ b/Dockerfile_amd @@ -320,9 +320,16 @@ COPY server server COPY server/Makefile server/Makefile ENV UV_SYSTEM_PYTHON=1 RUN cd server && \ - make gen-server && \ pip install -U pip uv && \ - uv pip install -r requirements_rocm.txt --no-cache-dir + uv sync --frozen --extra gen --extra accelerate --extra compressed-tensors --extra quantize --extra peft --extra outlines --no-install-project && \ + . ./.venv/bin/activate && \ + make gen-server-raw + +RUN cd server && \ + uv sync --frozen --extra gen --extra accelerate --extra compressed-tensors --extra quantize --extra peft --extra outlines && \ + . ./.venv/bin/activate && \ + pwd && \ + text-generation-server --help # Install benchmarker COPY --from=builder /usr/src/target/release-opt/text-generation-benchmark /usr/local/bin/text-generation-benchmark diff --git a/Dockerfile_intel b/Dockerfile_intel index 0f0d4383..3bd697fd 100644 --- a/Dockerfile_intel +++ b/Dockerfile_intel @@ -215,9 +215,16 @@ COPY server server COPY server/Makefile server/Makefile ENV UV_SYSTEM_PYTHON=1 RUN cd server && \ - make gen-server && \ pip install -U pip uv && \ - uv pip install -e ".[accelerate, compressed-tensors, peft, outlines]" --no-cache-dir + uv sync --frozen --extra gen --extra accelerate --extra compressed-tensors --extra quantize --extra peft --extra outlines --no-install-project && \ + . ./.venv/bin/activate && \ + make gen-server-raw + +RUN cd server && \ + uv sync --frozen --extra gen --extra accelerate --extra compressed-tensors --extra quantize --extra peft --extra outlines && \ + . ./.venv/bin/activate && \ + pwd && \ + text-generation-server --help # Install benchmarker COPY --from=builder /usr/src/target/release-opt/text-generation-benchmark /usr/local/bin/text-generation-benchmark @@ -231,5 +238,8 @@ ENV ATTENTION=flashdecoding-ipex ENV PREFIX_CACHING=1 ENV PREFILL_CHUNKING=1 ENV CUDA_GRAPHS=0 -ENTRYPOINT ["text-generation-launcher"] +COPY ./tgi-entrypoint.sh /tgi-entrypoint.sh +RUN chmod +x /tgi-entrypoint.sh + +ENTRYPOINT ["/tgi-entrypoint.sh"] CMD ["--json-output"]