|
4 | 4 |
|
5 | 5 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
6 | 6 | |---------|---------------|----------------|------------| |
7 | | -| 100000 | 0.080 | 0.525 | 6.56x | |
| 7 | +| 100000 | 0.100 | 0.515 | 5.15x | |
8 | 8 |
|
9 | 9 | #### float256 Subtraction |
10 | 10 |
|
11 | 11 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
12 | 12 | |---------|---------------|----------------|------------| |
13 | | -| 100000 | 0.080 | 0.511 | 6.39x | |
| 13 | +| 100000 | 0.100 | 0.522 | 5.22x | |
14 | 14 |
|
15 | 15 | #### float256 Multiplication |
16 | 16 |
|
17 | 17 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
18 | 18 | |---------|---------------|----------------|------------| |
19 | | -| 100000 | 0.080 | 0.583 | 7.29x | |
| 19 | +| 100000 | 0.104 | 0.583 | 5.61x | |
20 | 20 |
|
21 | 21 | #### float256 Division |
22 | 22 |
|
23 | 23 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
24 | 24 | |---------|---------------|----------------|------------| |
25 | | -| 100000 | 0.111 | 0.770 | 6.94x | |
| 25 | +| 100000 | 0.110 | 0.770 | 7.00x | |
26 | 26 |
|
27 | 27 | #### double256 Addition |
28 | 28 |
|
29 | 29 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
30 | 30 | |---------|---------------|----------------|------------| |
31 | | -| 100000 | 0.080 | 0.283 | 3.54x | |
| 31 | +| 100000 | 0.103 | 0.262 | 2.54x | |
32 | 32 |
|
33 | 33 | #### double256 Subtraction |
34 | 34 |
|
35 | 35 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
36 | 36 | |---------|---------------|----------------|------------| |
37 | | -| 100000 | 0.080 | 0.262 | 3.27x | |
| 37 | +| 100000 | 0.099 | 0.271 | 2.74x | |
38 | 38 |
|
39 | 39 | #### double256 Multiplication |
40 | 40 |
|
41 | 41 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
42 | 42 | |---------|---------------|----------------|------------| |
43 | | -| 100000 | 0.085 | 0.389 | 4.58x | |
| 43 | +| 100000 | 0.102 | 0.335 | 3.28x | |
44 | 44 |
|
45 | 45 | #### double256 Division |
46 | 46 |
|
47 | 47 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
48 | 48 | |---------|---------------|----------------|------------| |
49 | | -| 100000 | 0.142 | 0.568 | 4.00x | |
| 49 | +| 100000 | 0.141 | 0.564 | 4.00x | |
50 | 50 |
|
51 | 51 | #### int128_with_int32_t Addition |
52 | 52 |
|
53 | 53 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
54 | 54 | |---------|---------------|----------------|------------| |
55 | | -| 1000000 | 1.070 | 2.560 | 2.39x | |
| 55 | +| 1000000 | 1.040 | 2.560 | 2.46x | |
56 | 56 |
|
57 | 57 | #### int128_with_int32_t Subtraction |
58 | 58 |
|
59 | 59 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
60 | 60 | |---------|---------------|----------------|------------| |
61 | | -| 1000000 | 1.060 | 2.580 | 2.43x | |
| 61 | +| 1000000 | 1.050 | 2.570 | 2.45x | |
62 | 62 |
|
63 | 63 | #### int128_with_int32_t Multiplication |
64 | 64 |
|
65 | 65 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
66 | 66 | |---------|---------------|----------------|------------| |
67 | | -| 100000 | 0.074 | 0.277 | 3.74x | |
| 67 | +| 100000 | 0.076 | 0.266 | 3.50x | |
68 | 68 |
|
69 | 69 | #### int128_with_int16_t Addition |
70 | 70 |
|
71 | 71 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
72 | 72 | |---------|---------------|----------------|------------| |
73 | | -| 100000 | 0.073 | 0.517 | 7.08x | |
| 73 | +| 100000 | 0.074 | 0.512 | 6.92x | |
74 | 74 |
|
75 | 75 | #### int128_with_int16_t Subtraction |
76 | 76 |
|
77 | 77 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
78 | 78 | |---------|---------------|----------------|------------| |
79 | | -| 100000 | 0.076 | 0.511 | 6.72x | |
| 79 | +| 100000 | 0.075 | 0.516 | 6.88x | |
80 | 80 |
|
81 | 81 | #### int128_with_int16_t Multiplication |
82 | 82 |
|
83 | 83 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
84 | 84 | |---------|---------------|----------------|------------| |
85 | | -| 100000 | 0.073 | 0.616 | 8.44x | |
| 85 | +| 100000 | 0.074 | 0.617 | 8.34x | |
86 | 86 |
|
87 | 87 | #### int128_with_int8_t Addition |
88 | 88 |
|
89 | 89 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
90 | 90 | |---------|---------------|----------------|------------| |
91 | | -| 100000 | 0.062 | 1.030 | 16.61x | |
| 91 | +| 100000 | 0.067 | 1.030 | 15.37x | |
92 | 92 |
|
93 | 93 | #### int128_with_int8_t Subtraction |
94 | 94 |
|
95 | 95 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
96 | 96 | |---------|---------------|----------------|------------| |
97 | | -| 100000 | 0.069 | 1.030 | 14.93x | |
| 97 | +| 100000 | 0.061 | 1.030 | 16.89x | |
98 | 98 |
|
99 | 99 | #### int256_with_int32_t Addition |
100 | 100 |
|
101 | 101 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
102 | 102 | |---------|---------------|----------------|------------| |
103 | | -| 100000 | 0.080 | 0.505 | 6.31x | |
| 103 | +| 100000 | 0.093 | 0.505 | 5.43x | |
104 | 104 |
|
105 | 105 | #### int256_with_int32_t Subtraction |
106 | 106 |
|
107 | 107 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
108 | 108 | |---------|---------------|----------------|------------| |
109 | | -| 100000 | 0.081 | 0.511 | 6.31x | |
| 109 | +| 100000 | 0.100 | 0.507 | 5.07x | |
110 | 110 |
|
111 | 111 | #### int256_with_int32_t Multiplication |
112 | 112 |
|
113 | 113 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
114 | 114 | |---------|---------------|----------------|------------| |
115 | | -| 100000 | 0.080 | 0.553 | 6.91x | |
| 115 | +| 100000 | 0.092 | 0.551 | 5.99x | |
116 | 116 |
|
117 | 117 | #### int256_with_int16_t Addition |
118 | 118 |
|
119 | 119 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
120 | 120 | |---------|---------------|----------------|------------| |
121 | | -| 100000 | 0.080 | 1.030 | 12.88x | |
| 121 | +| 100000 | 0.103 | 1.030 | 10.00x | |
122 | 122 |
|
123 | 123 | #### int256_with_int16_t Subtraction |
124 | 124 |
|
125 | 125 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
126 | 126 | |---------|---------------|----------------|------------| |
127 | | -| 100000 | 0.080 | 1.020 | 12.75x | |
| 127 | +| 100000 | 0.098 | 1.020 | 10.41x | |
128 | 128 |
|
129 | 129 | #### int256_with_int16_t Multiplication |
130 | 130 |
|
131 | 131 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
132 | 132 | |---------|---------------|----------------|------------| |
133 | | -| 100000 | 0.080 | 1.160 | 14.50x | |
| 133 | +| 100000 | 0.098 | 1.160 | 11.84x | |
134 | 134 |
|
135 | 135 | #### int256_with_int8_t Addition |
136 | 136 |
|
137 | 137 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
138 | 138 | |---------|---------------|----------------|------------| |
139 | | -| 100000 | 0.081 | 2.060 | 25.43x | |
| 139 | +| 100000 | 0.098 | 2.210 | 22.55x | |
140 | 140 |
|
141 | 141 | #### int256_with_int8_t Subtraction |
142 | 142 |
|
143 | 143 | | Variant | SIMD Time (ms) | Plain Time (ms) | Speedup (x) | |
144 | 144 | |---------|---------------|----------------|------------| |
145 | | -| 100000 | 0.080 | 2.210 | 27.62x | |
| 145 | +| 100000 | 0.089 | 2.210 | 24.83x | |
146 | 146 |
|
0 commit comments