|
4 | 4 |
|
5 | 5 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
6 | 6 | |---------|---------------|----------------|------------| |
7 | | -| 100000 | 0.108 | 0.506 | 4.69x | |
| 7 | +| 100000 | 0.106 | 0.508 | 4.79x | |
8 | 8 |
|
9 | 9 | #### float256 Subtraction |
10 | 10 |
|
11 | 11 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
12 | 12 | |---------|---------------|----------------|------------| |
13 | | -| 100000 | 0.108 | 0.506 | 4.69x | |
| 13 | +| 100000 | 0.105 | 0.506 | 4.82x | |
14 | 14 |
|
15 | 15 | #### float256 Multiplication |
16 | 16 |
|
17 | 17 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
18 | 18 | |---------|---------------|----------------|------------| |
19 | | -| 100000 | 0.110 | 0.686 | 6.24x | |
| 19 | +| 100000 | 0.106 | 0.696 | 6.57x | |
20 | 20 |
|
21 | 21 | #### float256 Division |
22 | 22 |
|
23 | 23 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
24 | 24 | |---------|---------------|----------------|------------| |
25 | | -| 100000 | 0.112 | 0.800 | 7.14x | |
| 25 | +| 100000 | 0.110 | 0.778 | 7.07x | |
26 | 26 |
|
27 | 27 | #### double256 Addition |
28 | 28 |
|
29 | 29 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
30 | 30 | |---------|---------------|----------------|------------| |
31 | | -| 100000 | 0.107 | 0.274 | 2.56x | |
| 31 | +| 100000 | 0.106 | 0.260 | 2.45x | |
32 | 32 |
|
33 | 33 | #### double256 Subtraction |
34 | 34 |
|
35 | 35 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
36 | 36 | |---------|---------------|----------------|------------| |
37 | | -| 100000 | 0.108 | 0.279 | 2.58x | |
| 37 | +| 100000 | 0.108 | 0.278 | 2.57x | |
38 | 38 |
|
39 | 39 | #### double256 Multiplication |
40 | 40 |
|
41 | 41 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
42 | 42 | |---------|---------------|----------------|------------| |
43 | | -| 100000 | 0.109 | 0.352 | 3.23x | |
| 43 | +| 100000 | 0.102 | 0.359 | 3.52x | |
44 | 44 |
|
45 | 45 | #### double256 Division |
46 | 46 |
|
47 | 47 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
48 | 48 | |---------|---------------|----------------|------------| |
49 | | -| 100000 | 0.143 | 0.561 | 3.92x | |
| 49 | +| 100000 | 0.143 | 0.563 | 3.94x | |
50 | 50 |
|
51 | 51 | #### int128_with_int32_t Addition |
52 | 52 |
|
53 | 53 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
54 | 54 | |---------|---------------|----------------|------------| |
55 | | -| 1000000 | 1.050 | 2.580 | 2.46x | |
| 55 | +| 1000000 | 1.050 | 2.590 | 2.47x | |
56 | 56 |
|
57 | 57 | #### int128_with_int32_t Subtraction |
58 | 58 |
|
59 | 59 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
60 | 60 | |---------|---------------|----------------|------------| |
61 | | -| 1000000 | 0.997 | 2.590 | 2.60x | |
| 61 | +| 1000000 | 1.040 | 2.580 | 2.48x | |
62 | 62 |
|
63 | 63 | #### int128_with_int32_t Multiplication |
64 | 64 |
|
65 | 65 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
66 | 66 | |---------|---------------|----------------|------------| |
67 | | -| 100000 | 0.076 | 0.253 | 3.33x | |
| 67 | +| 100000 | 0.077 | 0.254 | 3.30x | |
68 | 68 |
|
69 | 69 | #### int128_with_int16_t Addition |
70 | 70 |
|
71 | 71 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
72 | 72 | |---------|---------------|----------------|------------| |
73 | | -| 100000 | 0.075 | 0.517 | 6.89x | |
| 73 | +| 100000 | 0.076 | 0.509 | 6.70x | |
74 | 74 |
|
75 | 75 | #### int128_with_int16_t Subtraction |
76 | 76 |
|
77 | 77 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
78 | 78 | |---------|---------------|----------------|------------| |
79 | | -| 100000 | 0.080 | 0.510 | 6.38x | |
| 79 | +| 100000 | 0.076 | 0.509 | 6.70x | |
80 | 80 |
|
81 | 81 | #### int128_with_int16_t Multiplication |
82 | 82 |
|
83 | 83 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
84 | 84 | |---------|---------------|----------------|------------| |
85 | | -| 100000 | 0.076 | 0.681 | 8.96x | |
| 85 | +| 100000 | 0.076 | 0.679 | 8.93x | |
86 | 86 |
|
87 | 87 | #### int128_with_int8_t Addition |
88 | 88 |
|
|
94 | 94 |
|
95 | 95 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
96 | 96 | |---------|---------------|----------------|------------| |
97 | | -| 100000 | 0.061 | 1.100 | 18.03x | |
| 97 | +| 100000 | 0.062 | 1.100 | 17.74x | |
98 | 98 |
|
99 | 99 | #### int256_with_int32_t Addition |
100 | 100 |
|
101 | 101 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
102 | 102 | |---------|---------------|----------------|------------| |
103 | | -| 100000 | 0.108 | 0.509 | 4.71x | |
| 103 | +| 100000 | 0.108 | 0.510 | 4.72x | |
104 | 104 |
|
105 | 105 | #### int256_with_int32_t Subtraction |
106 | 106 |
|
107 | 107 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
108 | 108 | |---------|---------------|----------------|------------| |
109 | | -| 100000 | 0.109 | 0.504 | 4.62x | |
| 109 | +| 100000 | 0.107 | 0.507 | 4.74x | |
110 | 110 |
|
111 | 111 | #### int256_with_int32_t Multiplication |
112 | 112 |
|
113 | 113 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
114 | 114 | |---------|---------------|----------------|------------| |
115 | | -| 100000 | 0.109 | 0.590 | 5.41x | |
| 115 | +| 100000 | 0.108 | 0.573 | 5.31x | |
116 | 116 |
|
117 | 117 | #### int256_with_int16_t Addition |
118 | 118 |
|
119 | 119 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
120 | 120 | |---------|---------------|----------------|------------| |
121 | | -| 100000 | 0.108 | 1.030 | 9.54x | |
| 121 | +| 100000 | 0.106 | 1.030 | 9.72x | |
122 | 122 |
|
123 | 123 | #### int256_with_int16_t Subtraction |
124 | 124 |
|
125 | 125 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
126 | 126 | |---------|---------------|----------------|------------| |
127 | | -| 100000 | 0.113 | 1.040 | 9.20x | |
| 127 | +| 100000 | 0.108 | 1.090 | 10.09x | |
128 | 128 |
|
129 | 129 | #### int256_with_int16_t Multiplication |
130 | 130 |
|
131 | 131 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
132 | 132 | |---------|---------------|----------------|------------| |
133 | | -| 100000 | 0.108 | 1.400 | 12.96x | |
| 133 | +| 100000 | 0.109 | 1.390 | 12.75x | |
134 | 134 |
|
135 | 135 | #### int256_with_int8_t Addition |
136 | 136 |
|
137 | 137 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
138 | 138 | |---------|---------------|----------------|------------| |
139 | | -| 100000 | 0.107 | 2.190 | 20.47x | |
| 139 | +| 100000 | 0.106 | 2.160 | 20.38x | |
140 | 140 |
|
141 | 141 | #### int256_with_int8_t Subtraction |
142 | 142 |
|
143 | 143 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
144 | 144 | |---------|---------------|----------------|------------| |
145 | | -| 100000 | 0.107 | 2.250 | 21.03x | |
| 145 | +| 100000 | 0.106 | 2.160 | 20.38x | |
146 | 146 |
|
0 commit comments