We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 23cf72b, commit da074be (Copy full SHA for da074be)
tensorrt_llm/_torch/attention_backend/trtllm.py
@@ -604,6 +604,9 @@ def is_nvfp4_output_kernel_available(
604
is_mla_enable,
605
)
606
607
+ def is_sm_version_trtllm_gen_kernel(self, sm):
608
+ return not (sm < 100 or sm in [120, 121])
609
+
610
611
@dataclass(kw_only=True)
612
class TrtllmAttentionMetadata(AttentionMetadata):
0 commit comments