Skip to content

Commit 49eca84

Browse files
authored
Merge pull request #5478 from martin-frbg/issue5477
Change all aligned moves in x86_64 MIN/MAX to unaligned
2 parents 7af2225 + b48a089 commit 49eca84

File tree

1 file changed

+16
-16
lines changed

1 file changed

+16
-16
lines changed

kernel/x86_64/iamax_sse.S

Lines changed: 16 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -96,9 +96,9 @@
9696
#ifdef USE_ABS
9797
andps %xmm15, %xmm0
9898
#endif
99-
movaps %xmm0, %xmm1
100-
movaps %xmm0, %xmm2
101-
movaps %xmm0, %xmm3 /* Generating "seed value" */
99+
movups %xmm0, %xmm1
100+
movups %xmm0, %xmm2
101+
movups %xmm0, %xmm3 /* Generating "seed value" */
102102
cmpq $SIZE, INCX
103103
jne .L80 /* Incx != 1 goto L80 */
104104

@@ -146,25 +146,25 @@
146146
PREFETCH (PREFETCHSIZE + 0) - PREOFFSET(X)
147147
#endif
148148

149-
movaps 0 * SIZE(X), %xmm4
149+
movups 0 * SIZE(X), %xmm4
150150
#ifdef USE_ABS
151151
andps %xmm15, %xmm4
152152
#endif
153153
MAXPS %xmm4, %xmm0
154154

155-
movaps 4 * SIZE(X), %xmm5
155+
movups 4 * SIZE(X), %xmm5
156156
#ifdef USE_ABS
157157
andps %xmm15, %xmm5
158158
#endif
159159
MAXPS %xmm5, %xmm1
160160

161-
movaps 8 * SIZE(X), %xmm6
161+
movups 8 * SIZE(X), %xmm6
162162
#ifdef USE_ABS
163163
andps %xmm15, %xmm6
164164
#endif
165165
MAXPS %xmm6, %xmm2
166166

167-
movaps 12 * SIZE(X), %xmm7
167+
movups 12 * SIZE(X), %xmm7
168168
#ifdef USE_ABS
169169
andps %xmm15, %xmm7
170170
#endif
@@ -182,13 +182,13 @@
182182
testq $8, M
183183
je .L16
184184

185-
movaps 0 * SIZE(X), %xmm4
185+
movups 0 * SIZE(X), %xmm4
186186
#ifdef USE_ABS
187187
andps %xmm15, %xmm4
188188
#endif
189189
MAXPS %xmm4, %xmm0
190190

191-
movaps 4 * SIZE(X), %xmm5
191+
movups 4 * SIZE(X), %xmm5
192192
#ifdef USE_ABS
193193
andps %xmm15, %xmm5
194194
#endif
@@ -200,7 +200,7 @@
200200
testq $4, M
201201
je .L17
202202

203-
movaps 0 * SIZE(X), %xmm6
203+
movups 0 * SIZE(X), %xmm6
204204
#ifdef USE_ABS
205205
andps %xmm15, %xmm6
206206
#endif
@@ -238,10 +238,10 @@
238238
MAXPS %xmm1, %xmm0
239239
MAXPS %xmm3, %xmm2
240240
MAXPS %xmm2, %xmm0
241-
movaps %xmm0, %xmm1
241+
movups %xmm0, %xmm1
242242
movhlps %xmm0, %xmm0
243243
MAXPS %xmm1, %xmm0
244-
movaps %xmm0, %xmm1
244+
movups %xmm0, %xmm1
245245
shufps $1, %xmm0, %xmm0
246246
MAXSS %xmm1, %xmm0
247247
shufps $0, %xmm0, %xmm0
@@ -295,13 +295,13 @@
295295
PREFETCH (PREFETCHSIZE + 0) - PREOFFSET(X)
296296
#endif
297297

298-
movaps 0 * SIZE(X), %xmm1
298+
movups 0 * SIZE(X), %xmm1
299299
#ifdef USE_ABS
300300
andps %xmm15, %xmm1
301301
#endif
302302
cmpeqps %xmm0, %xmm1
303303

304-
movaps 4 * SIZE(X), %xmm3
304+
movups 4 * SIZE(X), %xmm3
305305
#ifdef USE_ABS
306306
andps %xmm15, %xmm3
307307
#endif
@@ -536,10 +536,10 @@
536536
MAXPS %xmm1, %xmm0
537537
MAXPS %xmm3, %xmm2
538538
MAXPS %xmm2, %xmm0
539-
movaps %xmm0, %xmm1
539+
movups %xmm0, %xmm1
540540
movhlps %xmm0, %xmm0
541541
MAXPS %xmm1, %xmm0
542-
movaps %xmm0, %xmm1
542+
movups %xmm0, %xmm1
543543
shufps $1, %xmm0, %xmm0
544544
MAXSS %xmm1, %xmm0
545545
shufps $0, %xmm0, %xmm0

0 commit comments

Comments
 (0)