We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4bc902a, commit 986831f. Copy full SHA for 986831f.
tensorrt_llm/_torch/pyexecutor/model_engine.py
@@ -376,9 +376,8 @@ def __init__(
376
377
# Create config and runner
378
cuda_graph_runner_config = CUDAGraphRunnerConfig(
379
- use_cuda_graph=pytorch_backend_config.use_cuda_graph,
380
- cuda_graph_padding_enabled=pytorch_backend_config.
381
- cuda_graph_padding_enabled,
+ use_cuda_graph=self.cuda_graph_config is not None,
+ cuda_graph_padding_enabled=self._cuda_graph_padding_enabled,
382
cuda_graph_batch_sizes=self._cuda_graph_batch_sizes,
383
max_cuda_graph_batch_size=self._max_cuda_graph_batch_size,
384
max_beam_width=self.max_beam_width,
0 commit comments