From d299b52cb5c7e7420c141f1b1ab6b6e6022e3490 Mon Sep 17 00:00:00 2001 From: Morgan Funtowicz Date: Wed, 5 Feb 2025 16:15:31 +0100 Subject: [PATCH] backend(trtllm): link against decoder_attention_{0|1} --- backends/trtllm/CMakeLists.txt | 2 ++ backends/trtllm/build.rs | 5 +++-- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/backends/trtllm/CMakeLists.txt b/backends/trtllm/CMakeLists.txt index 7cd6e85a..5043d23f 100644 --- a/backends/trtllm/CMakeLists.txt +++ b/backends/trtllm/CMakeLists.txt @@ -59,6 +59,8 @@ target_link_libraries(tgi_trtllm_backend_impl PRIVATE tensorrt_llm nvinfer_plugi # This install all the artifacts in CMAKE_INSTALL_PREFIX under include/ lib/ bin/ to make easy to link / find it back install(TARGETS tgi_trtllm_backend_impl) +#install(TARGETS cutlass_src fb_gemm_src fpA_intB_gemm_src gemm_swiglu_sm90_src kernels_src) +install(TARGETS decoder_attention_0 decoder_attention_1) install(TARGETS tensorrt_llm nvinfer_plugin_tensorrt_llm decoder_attention_src executorWorker) install(FILES ${TRTLLM_NVRTC_WRAPPER_LIBRARY_PATH} TYPE LIB) if (NOT ${TGI_TRTLLM_BACKEND_DEBUG}) diff --git a/backends/trtllm/build.rs b/backends/trtllm/build.rs index 4d559fd4..aa613fd6 100644 --- a/backends/trtllm/build.rs +++ b/backends/trtllm/build.rs @@ -25,11 +25,12 @@ const IS_GHA_BUILD: LazyLock = LazyLock::new(|| { // Dependencies const BACKEND_DEPS: &str = "tgi_trtllm_backend_impl"; const CUDA_TRANSITIVE_DEPS: [&str; 4] = ["cuda", "cudart", "cublas", "nvidia-ml"]; -const TENSORRT_LLM_TRANSITIVE_DEPS: [(&str, &str); 4] = [ +const TENSORRT_LLM_TRANSITIVE_DEPS: [(&str, &str); 5] = [ ("dylib", "tensorrt_llm"), ("dylib", "tensorrt_llm_nvrtc_wrapper"), ("dylib", "nvinfer_plugin_tensorrt_llm"), - ("dylib", "decoder_attention"), + ("dylib", "decoder_attention_0"), + ("dylib", "decoder_attention_1"), ]; macro_rules! probe {