text-generation-inference/backends/neuron/sagemaker-entrypoint.sh
2025-02-20 16:14:38 +01:00

23 lines
481 B
Bash

#!/bin/bash
# SageMaker entrypoint for the Neuron backend of text-generation-inference.
#
# Maps the HF_MODEL_* environment variables onto the variable names exported
# for the launcher process, validates the required settings, and then starts
# text-generation-launcher on port 8080.
#
# Environment:
#   HF_MODEL_ID                 (required) exported as MODEL_ID
#   MAX_BATCH_SIZE              (required) must be set to the model static
#                               batch size; only checked here, not modified
#   HF_MODEL_REVISION           (optional) exported as REVISION when non-empty
#   HF_MODEL_TRUST_REMOTE_CODE  (optional) exported as TRUST_REMOTE_CODE when
#                               non-empty
#
# Exit status:
#   1 when a required variable is unset or empty; otherwise the status of
#   text-generation-launcher.
#
# Positional arguments are ignored: the launcher is always started with only
# `--port 8080`.

set -euo pipefail

# Print a message on stderr and abort with status 1.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Validate every required variable before touching the environment.
# `${VAR:-}` keeps `set -u` from aborting before the explicit message is shown.
[[ -n "${HF_MODEL_ID:-}" ]] || die "HF_MODEL_ID must be set"
[[ -n "${MAX_BATCH_SIZE:-}" ]] \
  || die "MAX_BATCH_SIZE must be set to the model static batch size"

export MODEL_ID="${HF_MODEL_ID}"

if [[ -n "${HF_MODEL_REVISION:-}" ]]; then
  export REVISION="${HF_MODEL_REVISION}"
fi

if [[ -n "${HF_MODEL_TRUST_REMOTE_CODE:-}" ]]; then
  export TRUST_REMOTE_CODE="${HF_MODEL_TRUST_REMOTE_CODE}"
fi

# Replace the shell with the launcher so that signals sent to this process
# (e.g. SIGTERM when the container is stopped) reach the launcher directly
# instead of being held by an intermediate bash process.
exec text-generation-launcher --port 8080