refactor: remove sagemaker entry-point

The SageMaker image is built differently anyway.
This commit is contained in:
David Corvoysier 2025-02-19 09:00:54 +00:00
parent ae37890eef
commit 88a0948692
2 changed files with 0 additions and 30 deletions

View File

@ -153,14 +153,6 @@ COPY --from=builder /usr/src/target/release/text-generation-launcher /usr/local/
COPY --from=pyserver /pyserver/build/dist dist
RUN pip install dist/text_generation_server*.tar.gz
# AWS Sagemaker compatible image
# Extends the `neuron` stage and replaces its entry point with the SageMaker
# wrapper script.
FROM neuron AS sagemaker
# Set the executable bits while copying instead of in a follow-up
# `RUN chmod +x`, which would add a layer just to change the file mode.
COPY --chmod=0755 backends/neuron/sagemaker-entrypoint.sh entrypoint.sh
# Exec form: the script is started directly, without a `/bin/sh -c` wrapper.
ENTRYPOINT ["./entrypoint.sh"]
# Final image
FROM neuron

View File

@ -1,22 +0,0 @@
#!/bin/bash
# SageMaker entry point.
#
# Re-exports the HF_MODEL_* environment variables under the names MODEL_ID,
# REVISION and TRUST_REMOTE_CODE (presumably the names read by
# text-generation-launcher -- confirm against the launcher), checks that the
# mandatory settings are present, then starts the launcher on port 8080.
# Arguments given to this script are not forwarded to the launcher.

# HF_MODEL_ID is mandatory.
if [[ -z "${HF_MODEL_ID}" ]]; then
  echo "HF_MODEL_ID must be set" >&2
  exit 1
fi
export MODEL_ID="${HF_MODEL_ID}"

# Optional settings: only exported when a non-empty value was provided.
if [[ -n "${HF_MODEL_REVISION}" ]]; then
  export REVISION="${HF_MODEL_REVISION}"
fi

if [[ -n "${HF_MODEL_TRUST_REMOTE_CODE}" ]]; then
  export TRUST_REMOTE_CODE="${HF_MODEL_TRUST_REMOTE_CODE}"
fi

# MAX_BATCH_SIZE is mandatory as well.
if [[ -z "${MAX_BATCH_SIZE}" ]]; then
  echo "MAX_BATCH_SIZE must be set to the model static batch size" >&2
  exit 1
fi

# Replace the shell with the launcher so that it runs as the container's main
# process and receives stop signals directly instead of through a parent bash.
exec text-generation-launcher --port 8080