mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-04-23 07:52:06 +00:00
refactor: remove sagemaker entry-point
The SageMaker image is built differently anyway.
This commit is contained in:
parent
ae37890eef
commit
88a0948692
@@ -153,14 +153,6 @@ COPY --from=builder /usr/src/target/release/text-generation-launcher /usr/local/
|
|||||||
COPY --from=pyserver /pyserver/build/dist dist
|
COPY --from=pyserver /pyserver/build/dist dist
|
||||||
RUN pip install dist/text_generation_server*.tar.gz
|
RUN pip install dist/text_generation_server*.tar.gz
|
||||||
|
|
||||||
# AWS Sagemaker compatible image
|
|
||||||
FROM neuron AS sagemaker
|
|
||||||
|
|
||||||
COPY backends/neuron/sagemaker-entrypoint.sh entrypoint.sh
|
|
||||||
RUN chmod +x entrypoint.sh
|
|
||||||
|
|
||||||
ENTRYPOINT ["./entrypoint.sh"]
|
|
||||||
|
|
||||||
# Final image
|
# Final image
|
||||||
FROM neuron
|
FROM neuron
|
||||||
|
|
||||||
|
@@ -1,22 +0,0 @@
|
|||||||
#!/bin/bash
|
|
||||||
|
|
||||||
if [[ -z "${HF_MODEL_ID}" ]]; then
|
|
||||||
echo "HF_MODEL_ID must be set"
|
|
||||||
exit 1
|
|
||||||
fi
|
|
||||||
export MODEL_ID="${HF_MODEL_ID}"
|
|
||||||
|
|
||||||
if [[ -n "${HF_MODEL_REVISION}" ]]; then
|
|
||||||
export REVISION="${HF_MODEL_REVISION}"
|
|
||||||
fi
|
|
||||||
|
|
||||||
if [[ -n "${HF_MODEL_TRUST_REMOTE_CODE}" ]]; then
|
|
||||||
export TRUST_REMOTE_CODE="${HF_MODEL_TRUST_REMOTE_CODE}"
|
|
||||||
fi
|
|
||||||
|
|
||||||
if [[ -z "${MAX_BATCH_SIZE}" ]]; then
|
|
||||||
echo "MAX_BATCH_SIZE must be set to the model static batch size"
|
|
||||||
exit 1
|
|
||||||
fi
|
|
||||||
|
|
||||||
text-generation-launcher --port 8080
|
|
Loading…
Reference in New Issue
Block a user