We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3889872, commit 373f8fe (Copy full SHA for 373f8fe)
tensorrt_llm/_torch/pyexecutor/py_executor_creator.py
@@ -516,7 +516,7 @@ def drafting_loop_wrapper(model):
516
speculative_config=spec_config,
517
decoding_config=decoding_config,
518
kv_cache_config=kv_cache_config,
519
- disable_flashinfer_sampling=llm_args._disable_flashinfer_sampling,
+ disable_flashinfer_sampling=llm_args.disable_flashinfer_sampling,
520
)
521
logger.info(f"Using Sampler: {type(sampler).__name__}")
522
0 commit comments