|
1 | 1 | { |
2 | 2 | "deepseek_a2a_tp1ep8_bf16": { |
3 | | - "backward_ms": 10.309884643554687, |
4 | | - "forward_ms": 7.034489583969116, |
5 | | - "max_allocated_bytes": 3626813952, |
| 3 | + "backward_ms": 10.153780746459962, |
| 4 | + "forward_ms": 6.925553631782532, |
| 5 | + "max_allocated_bytes": 3384636928, |
6 | 6 | "max_regression_ratio": 1.02 |
7 | 7 | }, |
8 | 8 | "deepseek_a2a_tp1ep8_fp8": { |
9 | | - "backward_ms": 10.18668475151062, |
10 | | - "forward_ms": 7.617563199996948, |
11 | | - "max_allocated_bytes": 4837189632, |
| 9 | + "backward_ms": 9.97867522239685, |
| 10 | + "forward_ms": 7.455871963500977, |
| 11 | + "max_allocated_bytes": 4353529856, |
12 | 12 | "max_regression_ratio": 1.02 |
13 | 13 | }, |
14 | 14 | "deepseek_deepep_tp1ep8_bf16": { |
15 | | - "backward_ms": 8.947673559188843, |
16 | | - "forward_ms": 5.455151987075806, |
17 | | - "max_allocated_bytes": 2730491136, |
| 15 | + "backward_ms": 8.82816162109375, |
| 16 | + "forward_ms": 5.38592483997345, |
| 17 | + "max_allocated_bytes": 2386569728, |
18 | 18 | "max_regression_ratio": 1.02 |
19 | 19 | }, |
20 | 20 | "deepseek_deepep_tp1ep8_fp8": { |
21 | | - "backward_ms": 8.718684816360474, |
22 | | - "forward_ms": 5.996280002593994, |
23 | | - "max_allocated_bytes": 4130067712, |
| 21 | + "backward_ms": 8.520062398910522, |
| 22 | + "forward_ms": 5.844604754447937, |
| 23 | + "max_allocated_bytes": 3648516096, |
24 | 24 | "max_regression_ratio": 1.02 |
25 | 25 | }, |
26 | 26 | "mixtral_a2a_tp1ep8_bf16": { |
27 | | - "backward_ms": 7.681614398956299, |
28 | | - "forward_ms": 4.157967972755432, |
29 | | - "max_allocated_bytes": 2856544256, |
| 27 | + "backward_ms": 7.58143048286438, |
| 28 | + "forward_ms": 4.162228798866272, |
| 29 | + "max_allocated_bytes": 2857003008, |
30 | 30 | "max_regression_ratio": 1.02 |
31 | 31 | }, |
32 | 32 | "mixtral_a2a_tp1ep8_fp8": { |
33 | | - "backward_ms": 6.655782413482666, |
34 | | - "forward_ms": 3.6682991862297056, |
| 33 | + "backward_ms": 6.573556804656983, |
| 34 | + "forward_ms": 3.6800352215766905, |
35 | 35 | "max_allocated_bytes": 3062679552, |
36 | 36 | "max_regression_ratio": 1.02 |
37 | 37 | }, |
38 | 38 | "mixtral_deepep_tp1ep8_bf16": { |
39 | | - "backward_ms": 7.890902400016785, |
40 | | - "forward_ms": 4.512491202354431, |
| 39 | + "backward_ms": 7.826888012886047, |
| 40 | + "forward_ms": 4.511423969268799, |
41 | 41 | "max_allocated_bytes": 2856743424, |
42 | 42 | "max_regression_ratio": 1.02 |
43 | 43 | }, |
44 | 44 | "mixtral_deepep_tp1ep8_fp8": { |
45 | | - "backward_ms": 6.849382376670837, |
46 | | - "forward_ms": 4.020219159126282, |
| 45 | + "backward_ms": 6.801019191741943, |
| 46 | + "forward_ms": 4.0494159936904905, |
47 | 47 | "max_allocated_bytes": 3062223360, |
48 | 48 | "max_regression_ratio": 1.02 |
49 | 49 | } |
|
0 commit comments