feat: sort cuda graphs in descending order (#2104)

This commit is contained in:
drbh 2024-06-21 14:28:26 -04:00 committed by yuanwu
parent f0ed8d294f
commit d930724e82

View File

@@ -15,6 +15,13 @@ if cuda_graphs is not None:
else:
cuda_graphs = None
# Publish the configured CUDA graph sizes (or None when unset) under the
# module-level constant. The list is ordered from largest to smallest
# because the descending order reduces the memory used by the graphs.
# `list.sort` works in place, so `cuda_graphs` and `CUDA_GRAPHS` keep
# referring to the same, now sorted, list object.
CUDA_GRAPHS = cuda_graphs
if CUDA_GRAPHS is not None:
    CUDA_GRAPHS.sort(reverse=True)
# This is overridden at model loading.