We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6d243ef, commit 21e3943 · Copy full SHA for 21e3943
vllm/v1/worker/gpu_model_runner.py
@@ -232,8 +232,10 @@ def __init__(
232
# The convention is different.
233
# self.cudagraph_batch_sizes sorts in ascending order.
234
# The batch sizes in the config are in descending order.
235
- self.cudagraph_batch_sizes = list(
236
- reversed(self.compilation_config.cudagraph_capture_sizes))
+ if self.compilation_config.cudagraph_capture_sizes and \
+ self.compilation_config.cudagraph_mode != CUDAGraphMode.NONE:
237
+ self.cudagraph_batch_sizes = list(
238
+ reversed(self.compilation_config.cudagraph_capture_sizes))
239
240
# Cache the device properties.
241
self._init_device_properties()
0 commit comments