Skip to content

Commit 4f38013

Browse files
committed
Update test cases.
1 parent 0993dfb commit 4f38013

File tree

2 files changed

+22
-22
lines changed

2 files changed

+22
-22
lines changed

tests/functional_tests/test_cases/common/moe_perf/baseline.json

Lines changed: 21 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -1,49 +1,49 @@
11
{
22
"deepseek_a2a_tp1ep8_bf16": {
3-
"backward_ms": 10.309884643554687,
4-
"forward_ms": 7.034489583969116,
5-
"max_allocated_bytes": 3626813952,
3+
"backward_ms": 10.153780746459962,
4+
"forward_ms": 6.925553631782532,
5+
"max_allocated_bytes": 3384636928,
66
"max_regression_ratio": 1.02
77
},
88
"deepseek_a2a_tp1ep8_fp8": {
9-
"backward_ms": 10.18668475151062,
10-
"forward_ms": 7.617563199996948,
11-
"max_allocated_bytes": 4837189632,
9+
"backward_ms": 9.97867522239685,
10+
"forward_ms": 7.455871963500977,
11+
"max_allocated_bytes": 4353529856,
1212
"max_regression_ratio": 1.02
1313
},
1414
"deepseek_deepep_tp1ep8_bf16": {
15-
"backward_ms": 8.947673559188843,
16-
"forward_ms": 5.455151987075806,
17-
"max_allocated_bytes": 2730491136,
15+
"backward_ms": 8.82816162109375,
16+
"forward_ms": 5.38592483997345,
17+
"max_allocated_bytes": 2386569728,
1818
"max_regression_ratio": 1.02
1919
},
2020
"deepseek_deepep_tp1ep8_fp8": {
21-
"backward_ms": 8.718684816360474,
22-
"forward_ms": 5.996280002593994,
23-
"max_allocated_bytes": 4130067712,
21+
"backward_ms": 8.520062398910522,
22+
"forward_ms": 5.844604754447937,
23+
"max_allocated_bytes": 3648516096,
2424
"max_regression_ratio": 1.02
2525
},
2626
"mixtral_a2a_tp1ep8_bf16": {
27-
"backward_ms": 7.681614398956299,
28-
"forward_ms": 4.157967972755432,
29-
"max_allocated_bytes": 2856544256,
27+
"backward_ms": 7.58143048286438,
28+
"forward_ms": 4.162228798866272,
29+
"max_allocated_bytes": 2857003008,
3030
"max_regression_ratio": 1.02
3131
},
3232
"mixtral_a2a_tp1ep8_fp8": {
33-
"backward_ms": 6.655782413482666,
34-
"forward_ms": 3.6682991862297056,
33+
"backward_ms": 6.573556804656983,
34+
"forward_ms": 3.6800352215766905,
3535
"max_allocated_bytes": 3062679552,
3636
"max_regression_ratio": 1.02
3737
},
3838
"mixtral_deepep_tp1ep8_bf16": {
39-
"backward_ms": 7.890902400016785,
40-
"forward_ms": 4.512491202354431,
39+
"backward_ms": 7.826888012886047,
40+
"forward_ms": 4.511423969268799,
4141
"max_allocated_bytes": 2856743424,
4242
"max_regression_ratio": 1.02
4343
},
4444
"mixtral_deepep_tp1ep8_fp8": {
45-
"backward_ms": 6.849382376670837,
46-
"forward_ms": 4.020219159126282,
45+
"backward_ms": 6.801019191741943,
46+
"forward_ms": 4.0494159936904905,
4747
"max_allocated_bytes": 3062223360,
4848
"max_regression_ratio": 1.02
4949
}

tests/functional_tests/test_cases/common/moe_perf/test_cases.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -84,7 +84,7 @@ def is_current_platform(self) -> bool:
8484
micro_batch_size=1,
8585
hidden_size=7168,
8686
moe_ffn_hidden_size=2048,
87-
num_experts=64,
87+
num_experts=32,
8888
router_topk=8,
8989
moe_router_load_balancing_type="seq_aux_loss",
9090
moe_router_num_groups=8,

0 commit comments

Comments
 (0)