mirror of
https://github.com/huggingface/text-generation-inference.git
synced 2025-09-11 12:24:53 +00:00
backend(trtllm): use correct library reference decoder_attention_src
This commit is contained in:
parent
9f6f1e905d
commit
11c9acab42
@ -1,4 +1,4 @@
|
|||||||
ARG cuda_arch_list="75-real;80-real;86-real;89-real;90-real;100-real"
|
ARG cuda_arch_list="75-real;80-real;86-real;89-real;90-real;100-real;120-real"
|
||||||
ARG cuda_base=12.8.0
|
ARG cuda_base=12.8.0
|
||||||
ARG build_type=release
|
ARG build_type=release
|
||||||
ARG ompi_version=4.1.7
|
ARG ompi_version=4.1.7
|
||||||
|
@ -59,7 +59,7 @@ target_link_libraries(tgi_trtllm_backend_impl PRIVATE tensorrt_llm nvinfer_plugi
|
|||||||
|
|
||||||
# This installs all the artifacts in CMAKE_INSTALL_PREFIX under include/ lib/ bin/ to make them easy to link / find again
|
# This installs all the artifacts in CMAKE_INSTALL_PREFIX under include/ lib/ bin/ to make them easy to link / find again
|
||||||
install(TARGETS tgi_trtllm_backend_impl)
|
install(TARGETS tgi_trtllm_backend_impl)
|
||||||
install(TARGETS tensorrt_llm nvinfer_plugin_tensorrt_llm decoder_attention executorWorker)
|
install(TARGETS tensorrt_llm nvinfer_plugin_tensorrt_llm decoder_attention_src executorWorker)
|
||||||
install(FILES ${TRTLLM_NVRTC_WRAPPER_LIBRARY_PATH} TYPE LIB)
|
install(FILES ${TRTLLM_NVRTC_WRAPPER_LIBRARY_PATH} TYPE LIB)
|
||||||
if (NOT ${TGI_TRTLLM_BACKEND_DEBUG})
|
if (NOT ${TGI_TRTLLM_BACKEND_DEBUG})
|
||||||
install(FILES ${TRTLLM_EXECUTOR_STATIC_LIBRARY_PATH} TYPE LIB)
|
install(FILES ${TRTLLM_EXECUTOR_STATIC_LIBRARY_PATH} TYPE LIB)
|
||||||
|
Loading…
Reference in New Issue
Block a user