@@ -23,24 +23,24 @@
add $2f-1b, BASE
#endif
- movdqa 0(BASE), %xmm0
- movdqa 1*16(BASE), %xmm1
- movdqa 2*16(BASE), %xmm2
- movdqa 3*16(BASE), %xmm3
- movdqa 4*16(BASE), %xmm4
- movdqa 5*16(BASE), %xmm5
- movdqa 6*16(BASE), %xmm6
- movdqa 7*16(BASE), %xmm7
+ vmovdqa 0(BASE), %ymm0
+ vmovdqa 1*32(BASE), %ymm1
+ vmovdqa 2*32(BASE), %ymm2
+ vmovdqa 3*32(BASE), %ymm3
+ vmovdqa 4*32(BASE), %ymm4
+ vmovdqa 5*32(BASE), %ymm5
+ vmovdqa 6*32(BASE), %ymm6
+ vmovdqa 7*32(BASE), %ymm7
#ifdef __x86_64__
- movdqa 8*16(BASE), %xmm8
- movdqa 9*16(BASE), %xmm9
- movdqa 10*16(BASE), %xmm10
- movdqa 11*16(BASE), %xmm11
- movdqa 12*16(BASE), %xmm12
- movdqa 13*16(BASE), %xmm13
- movdqa 14*16(BASE), %xmm14
- movdqa 15*16(BASE), %xmm15
+ vmovdqa 8*32(BASE), %ymm8
+ vmovdqa 9*32(BASE), %ymm9
+ vmovdqa 10*32(BASE), %ymm10
+ vmovdqa 11*32(BASE), %ymm11
+ vmovdqa 12*32(BASE), %ymm12
+ vmovdqa 13*32(BASE), %ymm13
+ vmovdqa 14*32(BASE), %ymm14
+ vmovdqa 15*32(BASE), %ymm15
#endif
xor %eax, %eax
@@ -75,6 +75,6 @@
2:
.set i, 0
.rept 256
- .byte i
+ .byte i, i, i, i
.set i, i + 1
.endr
This is a hack: to do it properly, we'd have to test whether AVX2 exists
before using the %ymm registers.

Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
---
 test_i386.S | 34 +++++++++++++++++-----------------
 1 file changed, 17 insertions(+), 17 deletions(-)

-- 
2.17.1