|
4 | 4 |
|
5 | 5 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
6 | 6 | |---------|---------------|----------------|------------| |
7 | | -| 100000 | 0.069 | 0.460 | 6.67x | |
| 7 | +| 100000 | 0.079 | 0.520 | 6.58x | |
8 | 8 |
|
9 | 9 | #### float256 Subtraction |
10 | 10 |
|
11 | 11 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
12 | 12 | |---------|---------------|----------------|------------| |
13 | | -| 100000 | 0.069 | 0.471 | 6.83x | |
| 13 | +| 100000 | 0.079 | 0.511 | 6.47x | |
14 | 14 |
|
15 | 15 | #### float256 Multiplication |
16 | 16 |
|
17 | 17 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
18 | 18 | |---------|---------------|----------------|------------| |
19 | | -| 100000 | 0.070 | 0.572 | 8.17x | |
| 19 | +| 100000 | 0.079 | 0.577 | 7.30x | |
20 | 20 |
|
21 | 21 | #### float256 Division |
22 | 22 |
|
23 | 23 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
24 | 24 | |---------|---------------|----------------|------------| |
25 | | -| 100000 | 0.096 | 0.664 | 6.92x | |
| 25 | +| 100000 | 0.107 | 0.769 | 7.19x | |
26 | 26 |
|
27 | 27 | #### double256 Addition |
28 | 28 |
|
29 | 29 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
30 | 30 | |---------|---------------|----------------|------------| |
31 | | -| 100000 | 0.071 | 0.240 | 3.38x | |
| 31 | +| 100000 | 0.079 | 0.261 | 3.30x | |
32 | 32 |
|
33 | 33 | #### double256 Subtraction |
34 | 34 |
|
35 | 35 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
36 | 36 | |---------|---------------|----------------|------------| |
37 | | -| 100000 | 0.074 | 0.245 | 3.31x | |
| 37 | +| 100000 | 0.079 | 0.261 | 3.30x | |
38 | 38 |
|
39 | 39 | #### double256 Multiplication |
40 | 40 |
|
41 | 41 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
42 | 42 | |---------|---------------|----------------|------------| |
43 | | -| 100000 | 0.075 | 0.330 | 4.40x | |
| 43 | +| 100000 | 0.081 | 0.388 | 4.79x | |
44 | 44 |
|
45 | 45 | #### double256 Division |
46 | 46 |
|
47 | 47 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
48 | 48 | |---------|---------------|----------------|------------| |
49 | | -| 100000 | 0.118 | 0.467 | 3.96x | |
| 49 | +| 100000 | 0.141 | 0.565 | 4.01x | |
50 | 50 |
|
51 | 51 | #### int128_with_int32_t Addition |
52 | 52 |
|
53 | 53 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
54 | 54 | |---------|---------------|----------------|------------| |
55 | | -| 1000000 | 2.480 | 3.050 | 1.23x | |
| 55 | +| 1000000 | 0.829 | 2.540 | 3.06x | |
56 | 56 |
|
57 | 57 | #### int128_with_int32_t Subtraction |
58 | 58 |
|
59 | 59 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
60 | 60 | |---------|---------------|----------------|------------| |
61 | | -| 1000000 | 2.340 | 3.110 | 1.33x | |
| 61 | +| 1000000 | 0.829 | 2.560 | 3.09x | |
62 | 62 |
|
63 | 63 | #### int128_with_int32_t Multiplication |
64 | 64 |
|
65 | 65 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
66 | 66 | |---------|---------------|----------------|------------| |
67 | | -| 100000 | 0.070 | 0.274 | 3.91x | |
| 67 | +| 100000 | 0.075 | 0.276 | 3.68x | |
68 | 68 |
|
69 | 69 | #### int128_with_int16_t Addition |
70 | 70 |
|
71 | 71 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
72 | 72 | |---------|---------------|----------------|------------| |
73 | | -| 100000 | 0.072 | 0.473 | 6.57x | |
| 73 | +| 100000 | 0.074 | 0.513 | 6.93x | |
74 | 74 |
|
75 | 75 | #### int128_with_int16_t Subtraction |
76 | 76 |
|
77 | 77 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
78 | 78 | |---------|---------------|----------------|------------| |
79 | | -| 100000 | 0.069 | 0.545 | 7.90x | |
| 79 | +| 100000 | 0.076 | 0.511 | 6.72x | |
80 | 80 |
|
81 | 81 | #### int128_with_int16_t Multiplication |
82 | 82 |
|
83 | 83 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
84 | 84 | |---------|---------------|----------------|------------| |
85 | | -| 100000 | 0.073 | 0.559 | 7.66x | |
| 85 | +| 100000 | 0.074 | 0.615 | 8.31x | |
86 | 86 |
|
87 | 87 | #### int128_with_int8_t Addition |
88 | 88 |
|
89 | 89 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
90 | 90 | |---------|---------------|----------------|------------| |
91 | | -| 100000 | 0.061 | 0.975 | 15.98x | |
| 91 | +| 100000 | 0.061 | 1.040 | 17.05x | |
92 | 92 |
|
93 | 93 | #### int128_with_int8_t Subtraction |
94 | 94 |
|
95 | 95 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
96 | 96 | |---------|---------------|----------------|------------| |
97 | | -| 100000 | 0.059 | 1.090 | 18.47x | |
| 97 | +| 100000 | 0.067 | 1.030 | 15.37x | |
98 | 98 |
|
99 | 99 | #### int256_with_int32_t Addition |
100 | 100 |
|
101 | 101 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
102 | 102 | |---------|---------------|----------------|------------| |
103 | | -| 100000 | 0.091 | 0.503 | 5.53x | |
| 103 | +| 100000 | 0.079 | 0.505 | 6.39x | |
104 | 104 |
|
105 | 105 | #### int256_with_int32_t Subtraction |
106 | 106 |
|
107 | 107 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
108 | 108 | |---------|---------------|----------------|------------| |
109 | | -| 100000 | 0.084 | 0.500 | 5.95x | |
| 109 | +| 100000 | 0.079 | 0.508 | 6.43x | |
110 | 110 |
|
111 | 111 | #### int256_with_int32_t Multiplication |
112 | 112 |
|
113 | 113 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
114 | 114 | |---------|---------------|----------------|------------| |
115 | | -| 100000 | 0.080 | 0.532 | 6.65x | |
| 115 | +| 100000 | 0.079 | 0.554 | 7.01x | |
116 | 116 |
|
117 | 117 | #### int256_with_int16_t Addition |
118 | 118 |
|
119 | 119 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
120 | 120 | |---------|---------------|----------------|------------| |
121 | | -| 100000 | 0.074 | 1.060 | 14.32x | |
| 121 | +| 100000 | 0.079 | 1.030 | 13.04x | |
122 | 122 |
|
123 | 123 | #### int256_with_int16_t Subtraction |
124 | 124 |
|
125 | 125 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
126 | 126 | |---------|---------------|----------------|------------| |
127 | | -| 100000 | 0.075 | 0.905 | 12.07x | |
| 127 | +| 100000 | 0.079 | 1.020 | 12.91x | |
128 | 128 |
|
129 | 129 | #### int256_with_int16_t Multiplication |
130 | 130 |
|
131 | 131 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
132 | 132 | |---------|---------------|----------------|------------| |
133 | | -| 100000 | 0.079 | 1.130 | 14.30x | |
| 133 | +| 100000 | 0.079 | 1.160 | 14.68x | |
134 | 134 |
|
135 | 135 | #### int256_with_int8_t Addition |
136 | 136 |
|
137 | 137 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
138 | 138 | |---------|---------------|----------------|------------| |
139 | | -| 100000 | 0.083 | 1.780 | 21.45x | |
| 139 | +| 100000 | 0.079 | 2.060 | 26.08x | |
140 | 140 |
|
141 | 141 | #### int256_with_int8_t Subtraction |
142 | 142 |
|
143 | 143 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
144 | 144 | |---------|---------------|----------------|------------| |
145 | | -| 100000 | 0.070 | 2.150 | 30.71x | |
| 145 | +| 100000 | 0.079 | 2.200 | 27.85x | |
146 | 146 |
|
0 commit comments