| Index: third_party/boringssl/mac-x86/crypto/sha/sha256-586.S
|
| diff --git a/third_party/boringssl/mac-x86/crypto/sha/sha256-586.S b/third_party/boringssl/mac-x86/crypto/sha/sha256-586.S
|
| index f0ba612fabb90014d18c5eb6a1d5cf12d2c9d952..841854f7a9772d16ac1fcbec5c391930be066ef0 100644
|
| --- a/third_party/boringssl/mac-x86/crypto/sha/sha256-586.S
|
| +++ b/third_party/boringssl/mac-x86/crypto/sha/sha256-586.S
|
| @@ -36,11 +36,10 @@ L000pic_point:
|
| jz L003no_xmm
|
| andl $1073741824,%ecx
|
| andl $268435968,%ebx
|
| - testl $536870912,%edx
|
| - jnz L004shaext
|
| orl %ebx,%ecx
|
| andl $1342177280,%ecx
|
| cmpl $1342177280,%ecx
|
| + je L004AVX
|
| testl $512,%ebx
|
| jnz L005SSSE3
|
| L003no_xmm:
|
| @@ -3166,204 +3165,6 @@ L009grand_loop:
|
| popl %ebp
|
| ret
|
| .align 5,0x90
|
| -L004shaext:
|
| - subl $32,%esp
|
| - movdqu (%esi),%xmm1
|
| - leal 128(%ebp),%ebp
|
| - movdqu 16(%esi),%xmm2
|
| - movdqa 128(%ebp),%xmm7
|
| - pshufd $27,%xmm1,%xmm0
|
| - pshufd $177,%xmm1,%xmm1
|
| - pshufd $27,%xmm2,%xmm2
|
| -.byte 102,15,58,15,202,8
|
| - punpcklqdq %xmm0,%xmm2
|
| - jmp L010loop_shaext
|
| -.align 4,0x90
|
| -L010loop_shaext:
|
| - movdqu (%edi),%xmm3
|
| - movdqu 16(%edi),%xmm4
|
| - movdqu 32(%edi),%xmm5
|
| -.byte 102,15,56,0,223
|
| - movdqu 48(%edi),%xmm6
|
| - movdqa %xmm2,16(%esp)
|
| - movdqa -128(%ebp),%xmm0
|
| - paddd %xmm3,%xmm0
|
| -.byte 102,15,56,0,231
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - nop
|
| - movdqa %xmm1,(%esp)
|
| -.byte 15,56,203,202
|
| - movdqa -112(%ebp),%xmm0
|
| - paddd %xmm4,%xmm0
|
| -.byte 102,15,56,0,239
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - leal 64(%edi),%edi
|
| -.byte 15,56,204,220
|
| -.byte 15,56,203,202
|
| - movdqa -96(%ebp),%xmm0
|
| - paddd %xmm5,%xmm0
|
| -.byte 102,15,56,0,247
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm6,%xmm7
|
| -.byte 102,15,58,15,253,4
|
| - nop
|
| - paddd %xmm7,%xmm3
|
| -.byte 15,56,204,229
|
| -.byte 15,56,203,202
|
| - movdqa -80(%ebp),%xmm0
|
| - paddd %xmm6,%xmm0
|
| -.byte 15,56,205,222
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm3,%xmm7
|
| -.byte 102,15,58,15,254,4
|
| - nop
|
| - paddd %xmm7,%xmm4
|
| -.byte 15,56,204,238
|
| -.byte 15,56,203,202
|
| - movdqa -64(%ebp),%xmm0
|
| - paddd %xmm3,%xmm0
|
| -.byte 15,56,205,227
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm4,%xmm7
|
| -.byte 102,15,58,15,251,4
|
| - nop
|
| - paddd %xmm7,%xmm5
|
| -.byte 15,56,204,243
|
| -.byte 15,56,203,202
|
| - movdqa -48(%ebp),%xmm0
|
| - paddd %xmm4,%xmm0
|
| -.byte 15,56,205,236
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm5,%xmm7
|
| -.byte 102,15,58,15,252,4
|
| - nop
|
| - paddd %xmm7,%xmm6
|
| -.byte 15,56,204,220
|
| -.byte 15,56,203,202
|
| - movdqa -32(%ebp),%xmm0
|
| - paddd %xmm5,%xmm0
|
| -.byte 15,56,205,245
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm6,%xmm7
|
| -.byte 102,15,58,15,253,4
|
| - nop
|
| - paddd %xmm7,%xmm3
|
| -.byte 15,56,204,229
|
| -.byte 15,56,203,202
|
| - movdqa -16(%ebp),%xmm0
|
| - paddd %xmm6,%xmm0
|
| -.byte 15,56,205,222
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm3,%xmm7
|
| -.byte 102,15,58,15,254,4
|
| - nop
|
| - paddd %xmm7,%xmm4
|
| -.byte 15,56,204,238
|
| -.byte 15,56,203,202
|
| - movdqa (%ebp),%xmm0
|
| - paddd %xmm3,%xmm0
|
| -.byte 15,56,205,227
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm4,%xmm7
|
| -.byte 102,15,58,15,251,4
|
| - nop
|
| - paddd %xmm7,%xmm5
|
| -.byte 15,56,204,243
|
| -.byte 15,56,203,202
|
| - movdqa 16(%ebp),%xmm0
|
| - paddd %xmm4,%xmm0
|
| -.byte 15,56,205,236
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm5,%xmm7
|
| -.byte 102,15,58,15,252,4
|
| - nop
|
| - paddd %xmm7,%xmm6
|
| -.byte 15,56,204,220
|
| -.byte 15,56,203,202
|
| - movdqa 32(%ebp),%xmm0
|
| - paddd %xmm5,%xmm0
|
| -.byte 15,56,205,245
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm6,%xmm7
|
| -.byte 102,15,58,15,253,4
|
| - nop
|
| - paddd %xmm7,%xmm3
|
| -.byte 15,56,204,229
|
| -.byte 15,56,203,202
|
| - movdqa 48(%ebp),%xmm0
|
| - paddd %xmm6,%xmm0
|
| -.byte 15,56,205,222
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm3,%xmm7
|
| -.byte 102,15,58,15,254,4
|
| - nop
|
| - paddd %xmm7,%xmm4
|
| -.byte 15,56,204,238
|
| -.byte 15,56,203,202
|
| - movdqa 64(%ebp),%xmm0
|
| - paddd %xmm3,%xmm0
|
| -.byte 15,56,205,227
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm4,%xmm7
|
| -.byte 102,15,58,15,251,4
|
| - nop
|
| - paddd %xmm7,%xmm5
|
| -.byte 15,56,204,243
|
| -.byte 15,56,203,202
|
| - movdqa 80(%ebp),%xmm0
|
| - paddd %xmm4,%xmm0
|
| -.byte 15,56,205,236
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - movdqa %xmm5,%xmm7
|
| -.byte 102,15,58,15,252,4
|
| -.byte 15,56,203,202
|
| - paddd %xmm7,%xmm6
|
| - movdqa 96(%ebp),%xmm0
|
| - paddd %xmm5,%xmm0
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| -.byte 15,56,205,245
|
| - movdqa 128(%ebp),%xmm7
|
| -.byte 15,56,203,202
|
| - movdqa 112(%ebp),%xmm0
|
| - paddd %xmm6,%xmm0
|
| - nop
|
| -.byte 15,56,203,209
|
| - pshufd $14,%xmm0,%xmm0
|
| - cmpl %edi,%eax
|
| - nop
|
| -.byte 15,56,203,202
|
| - paddd 16(%esp),%xmm2
|
| - paddd (%esp),%xmm1
|
| - jnz L010loop_shaext
|
| - pshufd $177,%xmm2,%xmm2
|
| - pshufd $27,%xmm1,%xmm7
|
| - pshufd $177,%xmm1,%xmm1
|
| - punpckhqdq %xmm2,%xmm1
|
| -.byte 102,15,58,15,215,8
|
| - movl 44(%esp),%esp
|
| - movdqu %xmm1,(%esi)
|
| - movdqu %xmm2,16(%esi)
|
| - popl %edi
|
| - popl %esi
|
| - popl %ebx
|
| - popl %ebp
|
| - ret
|
| -.align 5,0x90
|
| L005SSSE3:
|
| leal -96(%esp),%esp
|
| movl (%esi),%eax
|
| @@ -3383,9 +3184,9 @@ L005SSSE3:
|
| movl %ecx,24(%esp)
|
| movl %esi,28(%esp)
|
| movdqa 256(%ebp),%xmm7
|
| - jmp L011grand_ssse3
|
| + jmp L010grand_ssse3
|
| .align 4,0x90
|
| -L011grand_ssse3:
|
| +L010grand_ssse3:
|
| movdqu (%edi),%xmm0
|
| movdqu 16(%edi),%xmm1
|
| movdqu 32(%edi),%xmm2
|
| @@ -3408,9 +3209,9 @@ L011grand_ssse3:
|
| paddd %xmm3,%xmm7
|
| movdqa %xmm6,64(%esp)
|
| movdqa %xmm7,80(%esp)
|
| - jmp L012ssse3_00_47
|
| + jmp L011ssse3_00_47
|
| .align 4,0x90
|
| -L012ssse3_00_47:
|
| +L011ssse3_00_47:
|
| addl $64,%ebp
|
| movl %edx,%ecx
|
| movdqa %xmm1,%xmm4
|
| @@ -4053,7 +3854,7 @@ L012ssse3_00_47:
|
| addl %ecx,%eax
|
| movdqa %xmm6,80(%esp)
|
| cmpl $66051,64(%ebp)
|
| - jne L012ssse3_00_47
|
| + jne L011ssse3_00_47
|
| movl %edx,%ecx
|
| rorl $14,%edx
|
| movl 20(%esp),%esi
|
| @@ -4567,8 +4368,1189 @@ L012ssse3_00_47:
|
| movdqa 64(%ebp),%xmm7
|
| subl $192,%ebp
|
| cmpl 104(%esp),%edi
|
| - jb L011grand_ssse3
|
| + jb L010grand_ssse3
|
| + movl 108(%esp),%esp
|
| + popl %edi
|
| + popl %esi
|
| + popl %ebx
|
| + popl %ebp
|
| + ret
|
| +.align 5,0x90
|
| +L004AVX:
|
| + leal -96(%esp),%esp
|
| + vzeroall
|
| + movl (%esi),%eax
|
| + movl 4(%esi),%ebx
|
| + movl 8(%esi),%ecx
|
| + movl 12(%esi),%edi
|
| + movl %ebx,4(%esp)
|
| + xorl %ecx,%ebx
|
| + movl %ecx,8(%esp)
|
| + movl %edi,12(%esp)
|
| + movl 16(%esi),%edx
|
| + movl 20(%esi),%edi
|
| + movl 24(%esi),%ecx
|
| + movl 28(%esi),%esi
|
| + movl %edi,20(%esp)
|
| + movl 100(%esp),%edi
|
| + movl %ecx,24(%esp)
|
| + movl %esi,28(%esp)
|
| + vmovdqa 256(%ebp),%xmm7
|
| + jmp L012grand_avx
|
| +.align 5,0x90
|
| +L012grand_avx:
|
| + vmovdqu (%edi),%xmm0
|
| + vmovdqu 16(%edi),%xmm1
|
| + vmovdqu 32(%edi),%xmm2
|
| + vmovdqu 48(%edi),%xmm3
|
| + addl $64,%edi
|
| + vpshufb %xmm7,%xmm0,%xmm0
|
| + movl %edi,100(%esp)
|
| + vpshufb %xmm7,%xmm1,%xmm1
|
| + vpshufb %xmm7,%xmm2,%xmm2
|
| + vpaddd (%ebp),%xmm0,%xmm4
|
| + vpshufb %xmm7,%xmm3,%xmm3
|
| + vpaddd 16(%ebp),%xmm1,%xmm5
|
| + vpaddd 32(%ebp),%xmm2,%xmm6
|
| + vpaddd 48(%ebp),%xmm3,%xmm7
|
| + vmovdqa %xmm4,32(%esp)
|
| + vmovdqa %xmm5,48(%esp)
|
| + vmovdqa %xmm6,64(%esp)
|
| + vmovdqa %xmm7,80(%esp)
|
| + jmp L013avx_00_47
|
| +.align 4,0x90
|
| +L013avx_00_47:
|
| + addl $64,%ebp
|
| + vpalignr $4,%xmm0,%xmm1,%xmm4
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 20(%esp),%esi
|
| + vpalignr $4,%xmm2,%xmm3,%xmm7
|
| + xorl %ecx,%edx
|
| + movl 24(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $7,%xmm4,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,16(%esp)
|
| + vpaddd %xmm7,%xmm0,%xmm0
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrld $3,%xmm4,%xmm7
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 4(%esp),%edi
|
| + vpslld $14,%xmm4,%xmm5
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,(%esp)
|
| + vpxor %xmm6,%xmm7,%xmm4
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 28(%esp),%edx
|
| + vpshufd $250,%xmm3,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpsrld $11,%xmm6,%xmm6
|
| + addl 32(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + addl %edx,%ebx
|
| + addl 12(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpslld $11,%xmm5,%xmm5
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 16(%esp),%esi
|
| + vpxor %xmm6,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + movl 20(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $10,%xmm7,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,12(%esp)
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl (%esp),%edi
|
| + vpaddd %xmm4,%xmm0,%xmm0
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,28(%esp)
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 24(%esp),%edx
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + addl 36(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + vpshufd $132,%xmm6,%xmm7
|
| + addl %edx,%eax
|
| + addl 8(%esp),%edx
|
| + addl %ecx,%eax
|
| + vpsrldq $8,%xmm7,%xmm7
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 12(%esp),%esi
|
| + vpaddd %xmm7,%xmm0,%xmm0
|
| + xorl %ecx,%edx
|
| + movl 16(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpshufd $80,%xmm0,%xmm7
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,8(%esp)
|
| + vpsrld $10,%xmm7,%xmm6
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 28(%esp),%edi
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,24(%esp)
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 20(%esp),%edx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpshufd $232,%xmm6,%xmm7
|
| + addl 40(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpslldq $8,%xmm7,%xmm7
|
| + addl %edx,%ebx
|
| + addl 4(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpaddd %xmm7,%xmm0,%xmm0
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 8(%esp),%esi
|
| + vpaddd (%ebp),%xmm0,%xmm6
|
| + xorl %ecx,%edx
|
| + movl 12(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,4(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 24(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,20(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 16(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 44(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl (%esp),%edx
|
| + addl %ecx,%eax
|
| + vmovdqa %xmm6,32(%esp)
|
| + vpalignr $4,%xmm1,%xmm2,%xmm4
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 4(%esp),%esi
|
| + vpalignr $4,%xmm3,%xmm0,%xmm7
|
| + xorl %ecx,%edx
|
| + movl 8(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $7,%xmm4,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,(%esp)
|
| + vpaddd %xmm7,%xmm1,%xmm1
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrld $3,%xmm4,%xmm7
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 20(%esp),%edi
|
| + vpslld $14,%xmm4,%xmm5
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,16(%esp)
|
| + vpxor %xmm6,%xmm7,%xmm4
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 12(%esp),%edx
|
| + vpshufd $250,%xmm0,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpsrld $11,%xmm6,%xmm6
|
| + addl 48(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + addl %edx,%ebx
|
| + addl 28(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpslld $11,%xmm5,%xmm5
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl (%esp),%esi
|
| + vpxor %xmm6,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + movl 4(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $10,%xmm7,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,28(%esp)
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 16(%esp),%edi
|
| + vpaddd %xmm4,%xmm1,%xmm1
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,12(%esp)
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 8(%esp),%edx
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + addl 52(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + vpshufd $132,%xmm6,%xmm7
|
| + addl %edx,%eax
|
| + addl 24(%esp),%edx
|
| + addl %ecx,%eax
|
| + vpsrldq $8,%xmm7,%xmm7
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 28(%esp),%esi
|
| + vpaddd %xmm7,%xmm1,%xmm1
|
| + xorl %ecx,%edx
|
| + movl (%esp),%edi
|
| + xorl %edi,%esi
|
| + vpshufd $80,%xmm1,%xmm7
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,24(%esp)
|
| + vpsrld $10,%xmm7,%xmm6
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 12(%esp),%edi
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,8(%esp)
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 4(%esp),%edx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpshufd $232,%xmm6,%xmm7
|
| + addl 56(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpslldq $8,%xmm7,%xmm7
|
| + addl %edx,%ebx
|
| + addl 20(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpaddd %xmm7,%xmm1,%xmm1
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 24(%esp),%esi
|
| + vpaddd 16(%ebp),%xmm1,%xmm6
|
| + xorl %ecx,%edx
|
| + movl 28(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,20(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 8(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,4(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl (%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 60(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 16(%esp),%edx
|
| + addl %ecx,%eax
|
| + vmovdqa %xmm6,48(%esp)
|
| + vpalignr $4,%xmm2,%xmm3,%xmm4
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 20(%esp),%esi
|
| + vpalignr $4,%xmm0,%xmm1,%xmm7
|
| + xorl %ecx,%edx
|
| + movl 24(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $7,%xmm4,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,16(%esp)
|
| + vpaddd %xmm7,%xmm2,%xmm2
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrld $3,%xmm4,%xmm7
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 4(%esp),%edi
|
| + vpslld $14,%xmm4,%xmm5
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,(%esp)
|
| + vpxor %xmm6,%xmm7,%xmm4
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 28(%esp),%edx
|
| + vpshufd $250,%xmm1,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpsrld $11,%xmm6,%xmm6
|
| + addl 64(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + addl %edx,%ebx
|
| + addl 12(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpslld $11,%xmm5,%xmm5
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 16(%esp),%esi
|
| + vpxor %xmm6,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + movl 20(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $10,%xmm7,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,12(%esp)
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl (%esp),%edi
|
| + vpaddd %xmm4,%xmm2,%xmm2
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,28(%esp)
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 24(%esp),%edx
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + addl 68(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + vpshufd $132,%xmm6,%xmm7
|
| + addl %edx,%eax
|
| + addl 8(%esp),%edx
|
| + addl %ecx,%eax
|
| + vpsrldq $8,%xmm7,%xmm7
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 12(%esp),%esi
|
| + vpaddd %xmm7,%xmm2,%xmm2
|
| + xorl %ecx,%edx
|
| + movl 16(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpshufd $80,%xmm2,%xmm7
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,8(%esp)
|
| + vpsrld $10,%xmm7,%xmm6
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 28(%esp),%edi
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,24(%esp)
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 20(%esp),%edx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpshufd $232,%xmm6,%xmm7
|
| + addl 72(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpslldq $8,%xmm7,%xmm7
|
| + addl %edx,%ebx
|
| + addl 4(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpaddd %xmm7,%xmm2,%xmm2
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 8(%esp),%esi
|
| + vpaddd 32(%ebp),%xmm2,%xmm6
|
| + xorl %ecx,%edx
|
| + movl 12(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,4(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 24(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,20(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 16(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 76(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl (%esp),%edx
|
| + addl %ecx,%eax
|
| + vmovdqa %xmm6,64(%esp)
|
| + vpalignr $4,%xmm3,%xmm0,%xmm4
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 4(%esp),%esi
|
| + vpalignr $4,%xmm1,%xmm2,%xmm7
|
| + xorl %ecx,%edx
|
| + movl 8(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $7,%xmm4,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,(%esp)
|
| + vpaddd %xmm7,%xmm3,%xmm3
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrld $3,%xmm4,%xmm7
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 20(%esp),%edi
|
| + vpslld $14,%xmm4,%xmm5
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,16(%esp)
|
| + vpxor %xmm6,%xmm7,%xmm4
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 12(%esp),%edx
|
| + vpshufd $250,%xmm2,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpsrld $11,%xmm6,%xmm6
|
| + addl 80(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + addl %edx,%ebx
|
| + addl 28(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpslld $11,%xmm5,%xmm5
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl (%esp),%esi
|
| + vpxor %xmm6,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + movl 4(%esp),%edi
|
| + xorl %edi,%esi
|
| + vpsrld $10,%xmm7,%xmm6
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,28(%esp)
|
| + vpxor %xmm5,%xmm4,%xmm4
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 16(%esp),%edi
|
| + vpaddd %xmm4,%xmm3,%xmm3
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,12(%esp)
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 8(%esp),%edx
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + addl 84(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + vpshufd $132,%xmm6,%xmm7
|
| + addl %edx,%eax
|
| + addl 24(%esp),%edx
|
| + addl %ecx,%eax
|
| + vpsrldq $8,%xmm7,%xmm7
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 28(%esp),%esi
|
| + vpaddd %xmm7,%xmm3,%xmm3
|
| + xorl %ecx,%edx
|
| + movl (%esp),%edi
|
| + xorl %edi,%esi
|
| + vpshufd $80,%xmm3,%xmm7
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,24(%esp)
|
| + vpsrld $10,%xmm7,%xmm6
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + vpsrlq $17,%xmm7,%xmm5
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 12(%esp),%edi
|
| + vpxor %xmm5,%xmm6,%xmm6
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,8(%esp)
|
| + vpsrlq $19,%xmm7,%xmm7
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 4(%esp),%edx
|
| + vpxor %xmm7,%xmm6,%xmm6
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + vpshufd $232,%xmm6,%xmm7
|
| + addl 88(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + vpslldq $8,%xmm7,%xmm7
|
| + addl %edx,%ebx
|
| + addl 20(%esp),%edx
|
| + addl %ecx,%ebx
|
| + vpaddd %xmm7,%xmm3,%xmm3
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 24(%esp),%esi
|
| + vpaddd 48(%ebp),%xmm3,%xmm6
|
| + xorl %ecx,%edx
|
| + movl 28(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,20(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 8(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,4(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl (%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 92(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 16(%esp),%edx
|
| + addl %ecx,%eax
|
| + vmovdqa %xmm6,80(%esp)
|
| + cmpl $66051,64(%ebp)
|
| + jne L013avx_00_47
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 20(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 24(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,16(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 4(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 28(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 32(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 12(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 16(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 20(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,12(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl (%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,28(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 24(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 36(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 8(%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 12(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 16(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,8(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 28(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,24(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 20(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 40(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 4(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 8(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 12(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,4(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 24(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,20(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 16(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 44(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl (%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 4(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 8(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 20(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,16(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 12(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 48(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 28(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl (%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 4(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,28(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 16(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,12(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 8(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 52(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 24(%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 28(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl (%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,24(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 12(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,8(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 4(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 56(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 20(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 24(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 28(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,20(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 8(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,4(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl (%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 60(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 16(%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 20(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 24(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,16(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 4(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 28(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 64(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 12(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 16(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 20(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,12(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl (%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,28(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 24(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 68(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 8(%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 12(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 16(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,8(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 28(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,24(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 20(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 72(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 4(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 8(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 12(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,4(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 24(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,20(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 16(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 76(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl (%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 4(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 8(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 20(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,16(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 12(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 80(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 28(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl (%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 4(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,28(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 16(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,12(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl 8(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 84(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 24(%esp),%edx
|
| + addl %ecx,%eax
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 28(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl (%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,24(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %eax,%ecx
|
| + addl %edi,%edx
|
| + movl 12(%esp),%edi
|
| + movl %eax,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %eax,8(%esp)
|
| + xorl %eax,%ecx
|
| + xorl %edi,%eax
|
| + addl 4(%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %eax,%ebx
|
| + xorl %esi,%ecx
|
| + addl 88(%esp),%edx
|
| + xorl %edi,%ebx
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%ebx
|
| + addl 20(%esp),%edx
|
| + addl %ecx,%ebx
|
| + movl %edx,%ecx
|
| + shrdl $14,%edx,%edx
|
| + movl 24(%esp),%esi
|
| + xorl %ecx,%edx
|
| + movl 28(%esp),%edi
|
| + xorl %edi,%esi
|
| + shrdl $5,%edx,%edx
|
| + andl %ecx,%esi
|
| + movl %ecx,20(%esp)
|
| + xorl %ecx,%edx
|
| + xorl %esi,%edi
|
| + shrdl $6,%edx,%edx
|
| + movl %ebx,%ecx
|
| + addl %edi,%edx
|
| + movl 8(%esp),%edi
|
| + movl %ebx,%esi
|
| + shrdl $9,%ecx,%ecx
|
| + movl %ebx,4(%esp)
|
| + xorl %ebx,%ecx
|
| + xorl %edi,%ebx
|
| + addl (%esp),%edx
|
| + shrdl $11,%ecx,%ecx
|
| + andl %ebx,%eax
|
| + xorl %esi,%ecx
|
| + addl 92(%esp),%edx
|
| + xorl %edi,%eax
|
| + shrdl $2,%ecx,%ecx
|
| + addl %edx,%eax
|
| + addl 16(%esp),%edx
|
| + addl %ecx,%eax
|
| + movl 96(%esp),%esi
|
| + xorl %edi,%ebx
|
| + movl 12(%esp),%ecx
|
| + addl (%esi),%eax
|
| + addl 4(%esi),%ebx
|
| + addl 8(%esi),%edi
|
| + addl 12(%esi),%ecx
|
| + movl %eax,(%esi)
|
| + movl %ebx,4(%esi)
|
| + movl %edi,8(%esi)
|
| + movl %ecx,12(%esi)
|
| + movl %ebx,4(%esp)
|
| + xorl %edi,%ebx
|
| + movl %edi,8(%esp)
|
| + movl %ecx,12(%esp)
|
| + movl 20(%esp),%edi
|
| + movl 24(%esp),%ecx
|
| + addl 16(%esi),%edx
|
| + addl 20(%esi),%edi
|
| + addl 24(%esi),%ecx
|
| + movl %edx,16(%esi)
|
| + movl %edi,20(%esi)
|
| + movl %edi,20(%esp)
|
| + movl 28(%esp),%edi
|
| + movl %ecx,24(%esi)
|
| + addl 28(%esi),%edi
|
| + movl %ecx,24(%esp)
|
| + movl %edi,28(%esi)
|
| + movl %edi,28(%esp)
|
| + movl 100(%esp),%edi
|
| + vmovdqa 64(%ebp),%xmm7
|
| + subl $192,%ebp
|
| + cmpl 104(%esp),%edi
|
| + jb L012grand_avx
|
| movl 108(%esp),%esp
|
| + vzeroall
|
| popl %edi
|
| popl %esi
|
| popl %ebx
|
|
|