Skip to content

Commit e63f847

Browse files
committed
disable alltoall
Signed-off-by: Enwei Zhu <[email protected]>
1 parent e13e268 commit e63f847

File tree

1 file changed

+4
-0
lines changed

1 file changed

+4
-0
lines changed

tensorrt_llm/_torch/modules/fused_moe/fused_moe_cute_dsl.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@
1010
from ...model_config import ModelConfig
1111
from ...utils import AuxStreamType, Fp4QuantizedTensor, ceil_div
1212
from .fused_moe_cutlass import CutlassFusedMoE
13+
from .interface import AlltoallMethodType
1314
from .quantization import MoEWeightLoadingMode, NVFP4CuteDslFusedMoEMethod
1415
from .routing import BaseMoeRoutingMethod
1516

@@ -195,6 +196,9 @@ def __init__(
195196
layer_idx=layer_idx,
196197
)
197198

199+
def select_alltoall_method_type(self) -> AlltoallMethodType:
    """Return the all-to-all method type used by this module.

    This implementation performs no runtime selection: it always
    returns ``AlltoallMethodType.NotEnabled``.

    NOTE(review): presumably this overrides the selection logic
    inherited from the parent MoE class so that all-to-all is never
    used for this backend -- confirm against the base class.
    """
    disabled_method = AlltoallMethodType.NotEnabled
    return disabled_method
201+
198202
def _get_quant_method(self):
199203
if self.quant_config is not None and self.quant_config.layer_quant_mode.has_any_quant(
200204
exclude_kv_cache=True):

0 commit comments

Comments
 (0)