|
96 | 96 | #ifdef USE_ABS |
97 | 97 | andps %xmm15, %xmm0 |
98 | 98 | #endif |
99 | | - movaps %xmm0, %xmm1 |
100 | | - movaps %xmm0, %xmm2 |
101 | | - movaps %xmm0, %xmm3 /* Generating "seed value" */ |
| 99 | + movups %xmm0, %xmm1 |
| 100 | + movups %xmm0, %xmm2 |
| 101 | + movups %xmm0, %xmm3 /* Generating "seed value" */ |
102 | 102 | cmpq $SIZE, INCX |
103 | 103 | jne .L80 /* Incx != 1 goto L80 */ |
104 | 104 |
|
|
146 | 146 | PREFETCH (PREFETCHSIZE + 0) - PREOFFSET(X) |
147 | 147 | #endif |
148 | 148 |
|
149 | | - movaps 0 * SIZE(X), %xmm4 |
| 149 | + movups 0 * SIZE(X), %xmm4 |
150 | 150 | #ifdef USE_ABS |
151 | 151 | andps %xmm15, %xmm4 |
152 | 152 | #endif |
153 | 153 | MAXPS %xmm4, %xmm0 |
154 | 154 |
|
155 | | - movaps 4 * SIZE(X), %xmm5 |
| 155 | + movups 4 * SIZE(X), %xmm5 |
156 | 156 | #ifdef USE_ABS |
157 | 157 | andps %xmm15, %xmm5 |
158 | 158 | #endif |
159 | 159 | MAXPS %xmm5, %xmm1 |
160 | 160 |
|
161 | | - movaps 8 * SIZE(X), %xmm6 |
| 161 | + movups 8 * SIZE(X), %xmm6 |
162 | 162 | #ifdef USE_ABS |
163 | 163 | andps %xmm15, %xmm6 |
164 | 164 | #endif |
165 | 165 | MAXPS %xmm6, %xmm2 |
166 | 166 |
|
167 | | - movaps 12 * SIZE(X), %xmm7 |
| 167 | + movups 12 * SIZE(X), %xmm7 |
168 | 168 | #ifdef USE_ABS |
169 | 169 | andps %xmm15, %xmm7 |
170 | 170 | #endif |
|
182 | 182 | testq $8, M |
183 | 183 | je .L16 |
184 | 184 |
|
185 | | - movaps 0 * SIZE(X), %xmm4 |
| 185 | + movups 0 * SIZE(X), %xmm4 |
186 | 186 | #ifdef USE_ABS |
187 | 187 | andps %xmm15, %xmm4 |
188 | 188 | #endif |
189 | 189 | MAXPS %xmm4, %xmm0 |
190 | 190 |
|
191 | | - movaps 4 * SIZE(X), %xmm5 |
| 191 | + movups 4 * SIZE(X), %xmm5 |
192 | 192 | #ifdef USE_ABS |
193 | 193 | andps %xmm15, %xmm5 |
194 | 194 | #endif |
|
200 | 200 | testq $4, M |
201 | 201 | je .L17 |
202 | 202 |
|
203 | | - movaps 0 * SIZE(X), %xmm6 |
| 203 | + movups 0 * SIZE(X), %xmm6 |
204 | 204 | #ifdef USE_ABS |
205 | 205 | andps %xmm15, %xmm6 |
206 | 206 | #endif |
|
238 | 238 | MAXPS %xmm1, %xmm0 |
239 | 239 | MAXPS %xmm3, %xmm2 |
240 | 240 | MAXPS %xmm2, %xmm0 |
241 | | - movaps %xmm0, %xmm1 |
| 241 | + movups %xmm0, %xmm1 |
242 | 242 | movhlps %xmm0, %xmm0 |
243 | 243 | MAXPS %xmm1, %xmm0 |
244 | | - movaps %xmm0, %xmm1 |
| 244 | + movups %xmm0, %xmm1 |
245 | 245 | shufps $1, %xmm0, %xmm0 |
246 | 246 | MAXSS %xmm1, %xmm0 |
247 | 247 | shufps $0, %xmm0, %xmm0 |
|
295 | 295 | PREFETCH (PREFETCHSIZE + 0) - PREOFFSET(X) |
296 | 296 | #endif |
297 | 297 |
|
298 | | - movaps 0 * SIZE(X), %xmm1 |
| 298 | + movups 0 * SIZE(X), %xmm1 |
299 | 299 | #ifdef USE_ABS |
300 | 300 | andps %xmm15, %xmm1 |
301 | 301 | #endif |
302 | 302 | cmpeqps %xmm0, %xmm1 |
303 | 303 |
|
304 | | - movaps 4 * SIZE(X), %xmm3 |
| 304 | + movups 4 * SIZE(X), %xmm3 |
305 | 305 | #ifdef USE_ABS |
306 | 306 | andps %xmm15, %xmm3 |
307 | 307 | #endif |
|
536 | 536 | MAXPS %xmm1, %xmm0 |
537 | 537 | MAXPS %xmm3, %xmm2 |
538 | 538 | MAXPS %xmm2, %xmm0 |
539 | | - movaps %xmm0, %xmm1 |
| 539 | + movups %xmm0, %xmm1 |
540 | 540 | movhlps %xmm0, %xmm0 |
541 | 541 | MAXPS %xmm1, %xmm0 |
542 | | - movaps %xmm0, %xmm1 |
| 542 | + movups %xmm0, %xmm1 |
543 | 543 | shufps $1, %xmm0, %xmm0 |
544 | 544 | MAXSS %xmm1, %xmm0 |
545 | 545 | shufps $0, %xmm0, %xmm0 |
|
0 commit comments