mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 04:14:52 +00:00
doc: Update TRTLLM deployment doc. Update TRTLLM CI to allow release builds when tagging TGI.
This commit is contained in:
parent
fb51fc9001
commit
c9067176c3
10
.github/workflows/build.yaml
vendored
10
.github/workflows/build.yaml
vendored
@ -64,7 +64,7 @@ jobs:
|
|||||||
export runs_on="aws-g6-12xl-plus-priv-cache"
|
export runs_on="aws-g6-12xl-plus-priv-cache"
|
||||||
export platform=""
|
export platform=""
|
||||||
export extra_pytest=""
|
export extra_pytest=""
|
||||||
export target="nil"
|
export target=""
|
||||||
;;
|
;;
|
||||||
cuda-trtllm)
|
cuda-trtllm)
|
||||||
export dockerfile="Dockerfile_trtllm"
|
export dockerfile="Dockerfile_trtllm"
|
||||||
@ -79,7 +79,7 @@ jobs:
|
|||||||
export target="nil";
|
export target="nil";
|
||||||
else
|
else
|
||||||
export build_type="dev";
|
export build_type="dev";
|
||||||
export target="runtime-ci";
|
export target="ci-runtime";
|
||||||
fi
|
fi
|
||||||
;;
|
;;
|
||||||
rocm)
|
rocm)
|
||||||
@ -91,7 +91,7 @@ jobs:
|
|||||||
export runs_on="ubuntu-latest"
|
export runs_on="ubuntu-latest"
|
||||||
export platform=""
|
export platform=""
|
||||||
export extra_pytest="-k test_flash_gemma_gptq_load"
|
export extra_pytest="-k test_flash_gemma_gptq_load"
|
||||||
export target="nil"
|
export target=""
|
||||||
;;
|
;;
|
||||||
intel-xpu)
|
intel-xpu)
|
||||||
export dockerfile="Dockerfile_intel"
|
export dockerfile="Dockerfile_intel"
|
||||||
@ -101,7 +101,7 @@ jobs:
|
|||||||
export runs_on="ubuntu-latest"
|
export runs_on="ubuntu-latest"
|
||||||
export platform="xpu"
|
export platform="xpu"
|
||||||
export extra_pytest=""
|
export extra_pytest=""
|
||||||
export target="nil"
|
export target=""
|
||||||
;;
|
;;
|
||||||
intel-cpu)
|
intel-cpu)
|
||||||
export dockerfile="Dockerfile_intel"
|
export dockerfile="Dockerfile_intel"
|
||||||
@ -112,7 +112,7 @@ jobs:
|
|||||||
export runs_on="aws-highmemory-32-plus-priv"
|
export runs_on="aws-highmemory-32-plus-priv"
|
||||||
export platform="cpu"
|
export platform="cpu"
|
||||||
export extra_pytest="-k test_flash_gemma_simple"
|
export extra_pytest="-k test_flash_gemma_simple"
|
||||||
export target="nil"
|
export target=""
|
||||||
;;
|
;;
|
||||||
esac
|
esac
|
||||||
echo $dockerfile
|
echo $dockerfile
|
||||||
|
Loading…
Reference in New Issue
Block a user