feat: sort cuda graphs in descending order (#2104)
This commit is contained in:
parent
197c47a302
commit
811a9381b1
|
@ -15,6 +15,13 @@ if cuda_graphs is not None:
|
|||
else:
|
||||
cuda_graphs = None
|
||||
|
||||
|
||||
# Sorting the CUDA graphs in descending order helps reduce their
|
||||
# memory impact, resulting in lower overall memory usage.
|
||||
if cuda_graphs is not None:
|
||||
cuda_graphs.sort(reverse=True)
|
||||
|
||||
|
||||
CUDA_GRAPHS = cuda_graphs
|
||||
|
||||
# This is overridden at model loading.
|
||||
|
|
Loading…
Reference in New Issue