Re-generate assembly sources from the updated openssl submodule.
Signed-off-by: Anderson Toshiyuki Sasaki <ansasaki@redhat.com>
.Loop192:
tbl v6.16b,{v4.16b},v2.16b
ext v5.16b,v0.16b,v3.16b,#12
+
+
+
+
st1 {v4.8b},[x2],#8
+
aese v6.16b,v0.16b
subs w1,w1,#1
ldr w5,[x3,#240]
ldr w8, [x4, #12]
+
+
+
ld1 {v0.4s},[x4]
ld1 {v16.4s,v17.4s},[x3]
.text
+.hidden _gnutls_arm_cpuid_s
.globl sha1_block_data_order
.type sha1_block_data_order,%function
.align 6
.byte 83,72,65,49,32,98,108,111,99,107,32,116,114,97,110,115,102,111,114,109,32,102,111,114,32,65,82,77,118,56,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0
.align 2
.align 2
-.comm _gnutls_arm_cpuid_s,4,4
.section .note.GNU-stack,"",%progbits
.text
+.hidden _gnutls_arm_cpuid_s
.globl sha256_block_data_order
.type sha256_block_data_order,%function
.align 6
add sp,sp,#16*4+16
ret
.size sha256_block_neon,.-sha256_block_neon
-
-.comm _gnutls_arm_cpuid_s,4,4
.section .note.GNU-stack,"",%progbits
.text
+.hidden _gnutls_arm_cpuid_s
.globl sha512_block_data_order
.type sha512_block_data_order,%function
.align 6
ldr x29,[sp],#16
ret
.size sha512_block_armv8,.-sha512_block_armv8
-
-
-.comm _gnutls_arm_cpuid_s,4,4
.section .note.GNU-stack,"",%progbits
Loop192:
tbl v6.16b,{v4.16b},v2.16b
ext v5.16b,v0.16b,v3.16b,#12
+
+
+
+
st1 {v4.8b},[x2],#8
+
aese v6.16b,v0.16b
subs w1,w1,#1
ldr w5,[x3,#240]
ldr w8, [x4, #12]
+
+
+
ld1 {v0.4s},[x4]
ld1 {v16.4s,v17.4s},[x3]
.text
+.private_extern __gnutls_arm_cpuid_s
.globl _sha1_block_data_order
.align 6
.byte 83,72,65,49,32,98,108,111,99,107,32,116,114,97,110,115,102,111,114,109,32,102,111,114,32,65,82,77,118,56,44,32,67,82,89,80,84,79,71,65,77,83,32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115,115,108,46,111,114,103,62,0
.align 2
.align 2
-.comm __gnutls_arm_cpuid_s,4,4
.text
+.private_extern __gnutls_arm_cpuid_s
.globl _sha256_block_data_order
.align 6
ldr x29,[x29]
add sp,sp,#16*4+16
ret
-
-
-.comm __gnutls_arm_cpuid_s,4,4
.text
+.private_extern __gnutls_arm_cpuid_s
.globl _sha512_block_data_order
.align 6
ldr x29,[sp],#16
ret
-
-
-
-.comm __gnutls_arm_cpuid_s,4,4
.def _aesni_ctr32_ghash_6x; .scl 3; .type 32; .endef
.p2align 5
_aesni_ctr32_ghash_6x:
+
vmovdqu 32(%r11),%xmm2
subq $6,%rdx
vpxor %xmm4,%xmm4,%xmm4
.byte 0xf3,0xc3
+
.globl aesni_gcm_decrypt
.def aesni_gcm_decrypt; .scl 2; .type 32; .endef
.p2align 5
.def _aesni_ctr32_6x; .scl 3; .type 32; .endef
.p2align 5
_aesni_ctr32_6x:
+
vmovdqu 0-128(%rcx),%xmm4
vmovdqu 32(%r11),%xmm2
leaq -1(%rbp),%r13
jmp .Loop_ctr32
+
.globl aesni_gcm_encrypt
.def aesni_gcm_encrypt; .scl 2; .type 32; .endef
.p2align 5
movq 40(%rsp),%r8
movq 48(%rsp),%r9
+
leaq -88(%rsp),%rsp
movaps %xmm6,(%rsp)
movaps %xmm7,16(%rsp)
movq 8(%rsp),%rdi
movq 16(%rsp),%rsi
.byte 0xf3,0xc3
+
.LSEH_end_aesni_ccm64_encrypt_blocks:
.globl aesni_ccm64_decrypt_blocks
.def aesni_ccm64_decrypt_blocks; .scl 2; .type 32; .endef
movq 40(%rsp),%r8
movq 48(%rsp),%r9
+
leaq -88(%rsp),%rsp
movaps %xmm6,(%rsp)
movaps %xmm7,16(%rsp)
movq 8(%rsp),%rdi
movq 16(%rsp),%rsi
.byte 0xf3,0xc3
+
.LSEH_end_aesni_ccm64_decrypt_blocks:
.globl aesni_ctr32_encrypt_blocks
.def aesni_ctr32_encrypt_blocks; .scl 2; .type 32; .endef
.def __ocb_encrypt6; .scl 3; .type 32; .endef
.p2align 5
__ocb_encrypt6:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 0xf3,0xc3
+
.def __ocb_encrypt4; .scl 3; .type 32; .endef
.p2align 5
__ocb_encrypt4:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 0xf3,0xc3
+
.def __ocb_encrypt1; .scl 3; .type 32; .endef
.p2align 5
__ocb_encrypt1:
+
pxor %xmm15,%xmm7
pxor %xmm9,%xmm7
pxor %xmm2,%xmm8
.byte 0xf3,0xc3
+
.globl aesni_ocb_decrypt
.def aesni_ocb_decrypt; .scl 2; .type 32; .endef
.p2align 5
.def __ocb_decrypt6; .scl 3; .type 32; .endef
.p2align 5
__ocb_decrypt6:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 0xf3,0xc3
+
.def __ocb_decrypt4; .scl 3; .type 32; .endef
.p2align 5
__ocb_decrypt4:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 0xf3,0xc3
+
.def __ocb_decrypt1; .scl 3; .type 32; .endef
.p2align 5
__ocb_decrypt1:
+
pxor %xmm15,%xmm7
pxor %xmm9,%xmm7
pxor %xmm7,%xmm2
.byte 102,15,56,223,215
.byte 0xf3,0xc3
+
.globl aesni_cbc_encrypt
.def aesni_cbc_encrypt; .scl 2; .type 32; .endef
.p2align 4
addq $8,%rsp
.byte 0xf3,0xc3
-
.LSEH_end_set_encrypt_key:
.p2align 4
.byte 0xf3,0xc3
+
.p2align 6
.Lbswap_mask:
.byte 15,14,13,12,11,10,9,8,7,6,5,4,3,2,1,0
movaps -8-16(%rax),%xmm9
movq %rax,%rsp
.Lepilogue_shaext:
-
movq 8(%rsp),%rdi
movq 16(%rsp),%rsi
.byte 0xf3,0xc3
+
.LSEH_end_sha1_block_data_order_shaext:
.def sha1_block_data_order_ssse3; .scl 3; .type 32; .endef
.p2align 4
movq %r8,%rdx
_shaext_shortcut:
+
leaq -88(%rsp),%rsp
movaps %xmm6,-8-80(%rax)
movaps %xmm7,-8-64(%rax)
movq 8(%rsp),%rdi
movq 16(%rsp),%rsi
.byte 0xf3,0xc3
+
.LSEH_end_sha256_block_data_order_shaext:
.def sha256_block_data_order_ssse3; .scl 3; .type 32; .endef
.p2align 6
leaq 448(%rsp),%rsp
+
+
addl 0(%rdi),%eax
addl 4(%rdi),%ebx
addl 8(%rdi),%ecx
jbe .Loop_avx2
leaq (%rsp),%rbp
+
+
+
.Ldone_avx2:
- leaq (%rbp),%rsp
- movq 88(%rsp),%rsi
+ movq 88(%rbp),%rsi
vzeroupper
- movaps 64+32(%rsp),%xmm6
- movaps 64+48(%rsp),%xmm7
- movaps 64+64(%rsp),%xmm8
- movaps 64+80(%rsp),%xmm9
+ movaps 64+32(%rbp),%xmm6
+ movaps 64+48(%rbp),%xmm7
+ movaps 64+64(%rbp),%xmm8
+ movaps 64+80(%rbp),%xmm9
movq -48(%rsi),%r15
movq -40(%rsi),%r14
leaq 1152(%rsp),%rsp
+
+
addq 0(%rdi),%rax
addq 8(%rdi),%rbx
addq 16(%rdi),%rcx
jbe .Loop_avx2
leaq (%rsp),%rbp
+
+
+
.Ldone_avx2:
- leaq (%rbp),%rsp
- movq 152(%rsp),%rsi
+ movq 152(%rbp),%rsi
vzeroupper
- movaps 128+32(%rsp),%xmm6
- movaps 128+48(%rsp),%xmm7
- movaps 128+64(%rsp),%xmm8
- movaps 128+80(%rsp),%xmm9
- movaps 128+96(%rsp),%xmm10
- movaps 128+112(%rsp),%xmm11
+ movaps 128+32(%rbp),%xmm6
+ movaps 128+48(%rbp),%xmm7
+ movaps 128+64(%rbp),%xmm8
+ movaps 128+80(%rbp),%xmm9
+ movaps 128+96(%rbp),%xmm10
+ movaps 128+112(%rbp),%xmm11
movq -48(%rsi),%r15
movq -40(%rsi),%r14
.type _aesni_ctr32_ghash_6x,@function
.align 32
_aesni_ctr32_ghash_6x:
+.cfi_startproc
vmovdqu 32(%r11),%xmm2
subq $6,%rdx
vpxor %xmm4,%xmm4,%xmm4
vpxor %xmm4,%xmm8,%xmm8
.byte 0xf3,0xc3
+.cfi_endproc
.size _aesni_ctr32_ghash_6x,.-_aesni_ctr32_ghash_6x
.globl aesni_gcm_decrypt
.type aesni_gcm_decrypt,@function
.type _aesni_ctr32_6x,@function
.align 32
_aesni_ctr32_6x:
+.cfi_startproc
vmovdqu 0-128(%rcx),%xmm4
vmovdqu 32(%r11),%xmm2
leaq -1(%rbp),%r13
vpshufb %xmm0,%xmm1,%xmm1
vpxor %xmm4,%xmm14,%xmm14
jmp .Loop_ctr32
+.cfi_endproc
.size _aesni_ctr32_6x,.-_aesni_ctr32_6x
.globl aesni_gcm_encrypt
.type aesni_ccm64_encrypt_blocks,@function
.align 16
aesni_ccm64_encrypt_blocks:
+.cfi_startproc
movl 240(%rcx),%eax
movdqu (%r8),%xmm6
movdqa .Lincrement64(%rip),%xmm9
pxor %xmm8,%xmm8
pxor %xmm6,%xmm6
.byte 0xf3,0xc3
+.cfi_endproc
.size aesni_ccm64_encrypt_blocks,.-aesni_ccm64_encrypt_blocks
.globl aesni_ccm64_decrypt_blocks
.type aesni_ccm64_decrypt_blocks,@function
.align 16
aesni_ccm64_decrypt_blocks:
+.cfi_startproc
movl 240(%rcx),%eax
movups (%r8),%xmm6
movdqu (%r9),%xmm3
pxor %xmm8,%xmm8
pxor %xmm6,%xmm6
.byte 0xf3,0xc3
+.cfi_endproc
.size aesni_ccm64_decrypt_blocks,.-aesni_ccm64_decrypt_blocks
.globl aesni_ctr32_encrypt_blocks
.type aesni_ctr32_encrypt_blocks,@function
.type __ocb_encrypt6,@function
.align 32
__ocb_encrypt6:
+.cfi_startproc
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 102,65,15,56,221,246
.byte 102,65,15,56,221,255
.byte 0xf3,0xc3
+.cfi_endproc
.size __ocb_encrypt6,.-__ocb_encrypt6
.type __ocb_encrypt4,@function
.align 32
__ocb_encrypt4:
+.cfi_startproc
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 102,65,15,56,221,228
.byte 102,65,15,56,221,237
.byte 0xf3,0xc3
+.cfi_endproc
.size __ocb_encrypt4,.-__ocb_encrypt4
.type __ocb_encrypt1,@function
.align 32
__ocb_encrypt1:
+.cfi_startproc
pxor %xmm15,%xmm7
pxor %xmm9,%xmm7
pxor %xmm2,%xmm8
.byte 102,15,56,221,215
.byte 0xf3,0xc3
+.cfi_endproc
.size __ocb_encrypt1,.-__ocb_encrypt1
.globl aesni_ocb_decrypt
.type __ocb_decrypt6,@function
.align 32
__ocb_decrypt6:
+.cfi_startproc
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 102,65,15,56,223,246
.byte 102,65,15,56,223,255
.byte 0xf3,0xc3
+.cfi_endproc
.size __ocb_decrypt6,.-__ocb_decrypt6
.type __ocb_decrypt4,@function
.align 32
__ocb_decrypt4:
+.cfi_startproc
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
.byte 102,65,15,56,223,228
.byte 102,65,15,56,223,237
.byte 0xf3,0xc3
+.cfi_endproc
.size __ocb_decrypt4,.-__ocb_decrypt4
.type __ocb_decrypt1,@function
.align 32
__ocb_decrypt1:
+.cfi_startproc
pxor %xmm15,%xmm7
pxor %xmm9,%xmm7
pxor %xmm7,%xmm2
.byte 102,15,56,223,215
.byte 0xf3,0xc3
+.cfi_endproc
.size __ocb_decrypt1,.-__ocb_decrypt1
.globl aesni_cbc_encrypt
.type aesni_cbc_encrypt,@function
addq $8,%rsp
.cfi_adjust_cfa_offset -8
.byte 0xf3,0xc3
-.cfi_endproc
.LSEH_end_set_encrypt_key:
.align 16
shufps $170,%xmm1,%xmm1
xorps %xmm1,%xmm2
.byte 0xf3,0xc3
+.cfi_endproc
.size aesni_set_encrypt_key,.-aesni_set_encrypt_key
.size __aesni_set_encrypt_key,.-__aesni_set_encrypt_key
.align 64
pshufd $27,%xmm1,%xmm1
movdqu %xmm0,(%rdi)
movd %xmm1,16(%rdi)
-.cfi_endproc
.byte 0xf3,0xc3
+.cfi_endproc
.size sha1_block_data_order_shaext,.-sha1_block_data_order_shaext
.type sha1_block_data_order_ssse3,@function
.align 16
.align 64
sha256_block_data_order_shaext:
_shaext_shortcut:
+.cfi_startproc
leaq K256+128(%rip),%rcx
movdqu (%rdi),%xmm1
movdqu 16(%rdi),%xmm2
movdqu %xmm1,(%rdi)
movdqu %xmm2,16(%rdi)
.byte 0xf3,0xc3
+.cfi_endproc
.size sha256_block_data_order_shaext,.-sha256_block_data_order_shaext
.type sha256_block_data_order_ssse3,@function
.align 64
vmovdqa %ymm4,0(%rsp)
xorl %r14d,%r14d
vmovdqa %ymm5,32(%rsp)
+
+ movq 88(%rsp),%rdi
+.cfi_def_cfa %rdi,8
leaq -64(%rsp),%rsp
+
+
+
+ movq %rdi,-8(%rsp)
+.cfi_escape 0x0f,0x05,0x77,0x78,0x06,0x23,0x08
movl %ebx,%edi
vmovdqa %ymm6,0(%rsp)
xorl %ecx,%edi
.align 16
.Lavx2_00_47:
leaq -64(%rsp),%rsp
+.cfi_escape 0x0f,0x05,0x77,0x38,0x06,0x23,0x08
+
+ pushq 64-8(%rsp)
+.cfi_escape 0x0f,0x05,0x77,0x00,0x06,0x23,0x08
+ leaq 8(%rsp),%rsp
+.cfi_escape 0x0f,0x05,0x77,0x78,0x06,0x23,0x08
vpalignr $4,%ymm0,%ymm1,%ymm4
addl 0+128(%rsp),%r11d
andl %r8d,%r12d
movl %r9d,%r12d
vmovdqa %ymm6,32(%rsp)
leaq -64(%rsp),%rsp
+.cfi_escape 0x0f,0x05,0x77,0x38,0x06,0x23,0x08
+
+ pushq 64-8(%rsp)
+.cfi_escape 0x0f,0x05,0x77,0x00,0x06,0x23,0x08
+ leaq 8(%rsp),%rsp
+.cfi_escape 0x0f,0x05,0x77,0x78,0x06,0x23,0x08
vpalignr $4,%ymm2,%ymm3,%ymm4
addl 0+128(%rsp),%r11d
andl %r8d,%r12d
leaq 448(%rsp),%rsp
+.cfi_escape 0x0f,0x06,0x77,0xd8,0x00,0x06,0x23,0x08
+
addl 0(%rdi),%eax
addl 4(%rdi),%ebx
addl 8(%rdi),%ecx
jbe .Loop_avx2
leaq (%rsp),%rbp
+
+.cfi_escape 0x0f,0x06,0x76,0xd8,0x00,0x06,0x23,0x08
+
.Ldone_avx2:
- leaq (%rbp),%rsp
- movq 88(%rsp),%rsi
+ movq 88(%rbp),%rsi
.cfi_def_cfa %rsi,8
vzeroupper
movq -48(%rsi),%r15
vmovdqa %ymm10,64(%rsp)
vpaddq 64(%rbp),%ymm6,%ymm10
vmovdqa %ymm11,96(%rsp)
+
+ movq 152(%rsp),%rdi
+.cfi_def_cfa %rdi,8
leaq -128(%rsp),%rsp
+
+
+
+ movq %rdi,-8(%rsp)
+.cfi_escape 0x0f,0x05,0x77,0x78,0x06,0x23,0x08
vpaddq 96(%rbp),%ymm7,%ymm11
vmovdqa %ymm8,0(%rsp)
xorq %r14,%r14
.align 16
.Lavx2_00_47:
leaq -128(%rsp),%rsp
+.cfi_escape 0x0f,0x06,0x77,0xf8,0x00,0x06,0x23,0x08
+
+ pushq 128-8(%rsp)
+.cfi_escape 0x0f,0x05,0x77,0x00,0x06,0x23,0x08
+ leaq 8(%rsp),%rsp
+.cfi_escape 0x0f,0x05,0x77,0x78,0x06,0x23,0x08
vpalignr $8,%ymm0,%ymm1,%ymm8
addq 0+256(%rsp),%r11
andq %r8,%r12
movq %r9,%r12
vmovdqa %ymm10,96(%rsp)
leaq -128(%rsp),%rsp
+.cfi_escape 0x0f,0x06,0x77,0xf8,0x00,0x06,0x23,0x08
+
+ pushq 128-8(%rsp)
+.cfi_escape 0x0f,0x05,0x77,0x00,0x06,0x23,0x08
+ leaq 8(%rsp),%rsp
+.cfi_escape 0x0f,0x05,0x77,0x78,0x06,0x23,0x08
vpalignr $8,%ymm4,%ymm5,%ymm8
addq 0+256(%rsp),%r11
andq %r8,%r12
leaq 1152(%rsp),%rsp
+.cfi_escape 0x0f,0x06,0x77,0x98,0x01,0x06,0x23,0x08
+
addq 0(%rdi),%rax
addq 8(%rdi),%rbx
addq 16(%rdi),%rcx
jbe .Loop_avx2
leaq (%rsp),%rbp
+
+.cfi_escape 0x0f,0x06,0x76,0x98,0x01,0x06,0x23,0x08
+
.Ldone_avx2:
- leaq (%rbp),%rsp
- movq 152(%rsp),%rsi
+ movq 152(%rbp),%rsi
.cfi_def_cfa %rsi,8
vzeroupper
movq -48(%rsi),%r15
.p2align 5
_aesni_ctr32_ghash_6x:
+
vmovdqu 32(%r11),%xmm2
subq $6,%rdx
vpxor %xmm4,%xmm4,%xmm4
.byte 0xf3,0xc3
+
.globl _aesni_gcm_decrypt
.p2align 5
.p2align 5
_aesni_ctr32_6x:
+
vmovdqu 0-128(%rcx),%xmm4
vmovdqu 32(%r11),%xmm2
leaq -1(%rbp),%r13
jmp L$oop_ctr32
+
.globl _aesni_gcm_encrypt
.p2align 5
.p2align 4
_aesni_ccm64_encrypt_blocks:
+
movl 240(%rcx),%eax
movdqu (%r8),%xmm6
movdqa L$increment64(%rip),%xmm9
pxor %xmm6,%xmm6
.byte 0xf3,0xc3
+
.globl _aesni_ccm64_decrypt_blocks
.p2align 4
_aesni_ccm64_decrypt_blocks:
+
movl 240(%rcx),%eax
movups (%r8),%xmm6
movdqu (%r9),%xmm3
pxor %xmm6,%xmm6
.byte 0xf3,0xc3
+
.globl _aesni_ctr32_encrypt_blocks
.p2align 4
.p2align 5
__ocb_encrypt6:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
+
.p2align 5
__ocb_encrypt4:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
+
.p2align 5
__ocb_encrypt1:
+
pxor %xmm15,%xmm7
pxor %xmm9,%xmm7
pxor %xmm2,%xmm8
.byte 0xf3,0xc3
+
.globl _aesni_ocb_decrypt
.p2align 5
.p2align 5
__ocb_decrypt6:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
+
.p2align 5
__ocb_decrypt4:
+
pxor %xmm9,%xmm15
movdqu (%rbx,%r12,1),%xmm11
movdqa %xmm10,%xmm12
+
.p2align 5
__ocb_decrypt1:
+
pxor %xmm15,%xmm7
pxor %xmm9,%xmm7
pxor %xmm7,%xmm2
.byte 102,15,56,223,215
.byte 0xf3,0xc3
+
.globl _aesni_cbc_encrypt
.p2align 4
addq $8,%rsp
.byte 0xf3,0xc3
-
L$SEH_end_set_encrypt_key:
.p2align 4
.byte 0xf3,0xc3
+
.p2align 6
L$bswap_mask:
.byte 15,14,13,12,11,10,9,8,7,6,5,4,3,2,1,0
pshufd $27,%xmm1,%xmm1
movdqu %xmm0,(%rdi)
movd %xmm1,16(%rdi)
-
.byte 0xf3,0xc3
+
.p2align 4
sha1_block_data_order_ssse3:
_ssse3_shortcut:
.p2align 6
sha256_block_data_order_shaext:
_shaext_shortcut:
+
leaq K256+128(%rip),%rcx
movdqu (%rdi),%xmm1
movdqu 16(%rdi),%xmm2
.byte 0xf3,0xc3
+
.p2align 6
sha256_block_data_order_ssse3:
vmovdqa %ymm4,0(%rsp)
xorl %r14d,%r14d
vmovdqa %ymm5,32(%rsp)
+
+ movq 88(%rsp),%rdi
+
leaq -64(%rsp),%rsp
+
+
+
+ movq %rdi,-8(%rsp)
+
movl %ebx,%edi
vmovdqa %ymm6,0(%rsp)
xorl %ecx,%edi
.p2align 4
L$avx2_00_47:
leaq -64(%rsp),%rsp
+
+
+ pushq 64-8(%rsp)
+
+ leaq 8(%rsp),%rsp
+
vpalignr $4,%ymm0,%ymm1,%ymm4
addl 0+128(%rsp),%r11d
andl %r8d,%r12d
movl %r9d,%r12d
vmovdqa %ymm6,32(%rsp)
leaq -64(%rsp),%rsp
+
+
+ pushq 64-8(%rsp)
+
+ leaq 8(%rsp),%rsp
+
vpalignr $4,%ymm2,%ymm3,%ymm4
addl 0+128(%rsp),%r11d
andl %r8d,%r12d
leaq 448(%rsp),%rsp
+
+
addl 0(%rdi),%eax
addl 4(%rdi),%ebx
addl 8(%rdi),%ecx
jbe L$oop_avx2
leaq (%rsp),%rbp
+
+
+
L$done_avx2:
- leaq (%rbp),%rsp
- movq 88(%rsp),%rsi
+ movq 88(%rbp),%rsi
vzeroupper
movq -48(%rsi),%r15
vmovdqa %ymm10,64(%rsp)
vpaddq 64(%rbp),%ymm6,%ymm10
vmovdqa %ymm11,96(%rsp)
+
+ movq 152(%rsp),%rdi
+
leaq -128(%rsp),%rsp
+
+
+
+ movq %rdi,-8(%rsp)
+
vpaddq 96(%rbp),%ymm7,%ymm11
vmovdqa %ymm8,0(%rsp)
xorq %r14,%r14
.p2align 4
L$avx2_00_47:
leaq -128(%rsp),%rsp
+
+
+ pushq 128-8(%rsp)
+
+ leaq 8(%rsp),%rsp
+
vpalignr $8,%ymm0,%ymm1,%ymm8
addq 0+256(%rsp),%r11
andq %r8,%r12
movq %r9,%r12
vmovdqa %ymm10,96(%rsp)
leaq -128(%rsp),%rsp
+
+
+ pushq 128-8(%rsp)
+
+ leaq 8(%rsp),%rsp
+
vpalignr $8,%ymm4,%ymm5,%ymm8
addq 0+256(%rsp),%r11
andq %r8,%r12
leaq 1152(%rsp),%rsp
+
+
addq 0(%rdi),%rax
addq 8(%rdi),%rbx
addq 16(%rdi),%rcx
jbe L$oop_avx2
leaq (%rsp),%rbp
+
+
+
L$done_avx2:
- leaq (%rbp),%rsp
- movq 152(%rsp),%rsi
+ movq 152(%rbp),%rsi
vzeroupper
movq -48(%rsi),%r15