chore(trtllm): ensure max throughput scheduling policy is selected

2025-07-30 20:00:16 +00:00 · 2024-10-21 23:40:54 +02:00 · 2024-10-21 23:40:54 +02:00 · 47d8c53dda
commit 47d8c53dda
parent a6ac2741a3
1 changed file with 1 addition and 0 deletions
--- a/backends/trtllm/lib/backend.cpp
+++ b/backends/trtllm/lib/backend.cpp
@@ -53,6 +53,7 @@ tle::ExecutorConfig huggingface::tgi::backends::GetExecutorConfig(const json &co
    // Define some configuration variables
    execConfig.setKvCacheConfig(tle::KvCacheConfig(true));
    execConfig.setEnableChunkedContext(computeCapabilities.isPostAmpere());
+    execConfig.setSchedulerConfig(tle::SchedulerConfig(tle::CapacitySchedulerPolicy::kMAX_UTILIZATION));
    return execConfig;
 }