1 file changed: +4 -0 lines changed
tensorrt_llm/_torch/modules/fused_moe
Original file line number | Diff line number | Diff line change
10 10 from ...model_config import ModelConfig
11 11 from ...utils import AuxStreamType , Fp4QuantizedTensor , ceil_div
12 12 from .fused_moe_cutlass import CutlassFusedMoE
   13 + from .interface import AlltoallMethodType
13 14 from .quantization import MoEWeightLoadingMode , NVFP4CuteDslFusedMoEMethod
14 15 from .routing import BaseMoeRoutingMethod
15 16
@@ -195,6 +196,9 @@ def __init__(
195 196 layer_idx = layer_idx ,
196 197 )
197 198
    199 + def select_alltoall_method_type (self ) -> AlltoallMethodType :
    200 + return AlltoallMethodType .NotEnabled
    201 +
198 202 def _get_quant_method (self ):
199 203 if self .quant_config is not None and self .quant_config .layer_quant_mode .has_any_quant (
200 204 exclude_kv_cache = True ):
You can’t perform that action at this time.
0 commit comments