L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call acos@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call acos@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call acosh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call acosh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call asin@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call asin@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call asinh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call asinh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
- movsd 64(%rsp, %r14, 8), %xmm1
+ vmovsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm1
call atan2@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 96(%rsp, %r14, 8)
+ vmovsd %xmm0, 96(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
- movsd 128(%rsp, %r14, 8), %xmm1
+ vmovsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 128(%rsp, %r14, 8), %xmm1
call atan2@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 192(%rsp, %r14, 8)
+ vmovsd %xmm0, 192(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call atanh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call atanh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call cbrt@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call cosh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call cosh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call erfc@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call erfc@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call exp10@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call exp10@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call exp2@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call exp2@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call expm1@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call expm1@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
- movsd 64(%rsp, %r14, 8), %xmm1
+ vmovsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm1
call hypot@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 96(%rsp, %r14, 8)
+ vmovsd %xmm0, 96(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
- movsd 128(%rsp, %r14, 8), %xmm1
+ vmovsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 128(%rsp, %r14, 8), %xmm1
call hypot@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 192(%rsp, %r14, 8)
+ vmovsd %xmm0, 192(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call log10@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call log10@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call log1p@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call log1p@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call log2@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call log2@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call sinh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call sinh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call tan@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call tan@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
vpcmpgtd %xmm11, %xmm9, %xmm10
vpcmpgtd %xmm8, %xmm9, %xmm0
vpand %xmm10, %xmm9, %xmm7
- blendvps %xmm0, %xmm8, %xmm7
+ vblendvps %xmm0, %xmm8, %xmm7, %xmm7
/*
* VSHRIMM( I, iIndex, = iIndex, (17 - 4) );
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 32(%rsp, %r14, 8), %xmm0
+ vmovsd 32(%rsp, %r14, 8), %xmm0
call tanh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 64(%rsp, %r14, 8)
+ vmovsd %xmm0, 64(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movsd 64(%rsp, %r14, 8), %xmm0
+ vmovsd 64(%rsp, %r14, 8), %xmm0
call tanh@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movsd %xmm0, 128(%rsp, %r14, 8)
+ vmovsd %xmm0, 128(%rsp, %r14, 8)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call acosf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call acosf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call acoshf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call acoshf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call asinf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call asinf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call asinhf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call asinhf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
- movss 128(%rsp, %r14, 4), %xmm1
+ vmovss 64(%rsp, %r14, 4), %xmm0
+ vmovss 128(%rsp, %r14, 4), %xmm1
call atan2f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 192(%rsp, %r14, 4)
+ vmovss %xmm0, 192(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
- movss 64(%rsp, %r14, 4), %xmm1
+ vmovss 32(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm1
call atan2f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 96(%rsp, %r14, 4)
+ vmovss %xmm0, 96(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
tzcntl %ebx, %ebp
/* Scalar math function call to process special input. */
- movss 64(%rsp, %rbp, 4), %xmm0
+ vmovss 64(%rsp, %rbp, 4), %xmm0
call atanhf@PLT
/* No good way to avoid the store-forwarding fault this will cause on
return. `lfence` avoids the SF fault but at greater cost as it
serializes stack/callee save restoration. */
- movss %xmm0, (%rsp, %rbp, 4)
+ vmovss %xmm0, (%rsp, %rbp, 4)
blsrl %ebx, %ebx
jnz L(SPECIAL_VALUES_LOOP)
tzcntl %ebx, %ebp
/* Scalar math function call to process special input. */
- movss 32(%rsp, %rbp, 4), %xmm0
+ vmovss 32(%rsp, %rbp, 4), %xmm0
call atanhf@PLT
/* No good way to avoid the store-forwarding fault this will cause on
return. `lfence` avoids the SF fault but at greater cost as it
serializes stack/callee save restoration. */
- movss %xmm0, (%rsp, %rbp, 4)
+ vmovss %xmm0, (%rsp, %rbp, 4)
blsrl %ebx, %ebx
jnz L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call cbrtf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call coshf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call coshf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call erfcf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call erfcf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call exp10f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call exp10f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call exp2f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call exp2f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call expm1f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call expm1f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
- movss 128(%rsp, %r14, 4), %xmm1
+ vmovss 64(%rsp, %r14, 4), %xmm0
+ vmovss 128(%rsp, %r14, 4), %xmm1
call hypotf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 192(%rsp, %r14, 4)
+ vmovss %xmm0, 192(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
- movss 64(%rsp, %r14, 4), %xmm1
+ vmovss 32(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm1
call hypotf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 96(%rsp, %r14, 4)
+ vmovss %xmm0, 96(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call log10f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call log10f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call log1pf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call log1pf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call log2f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call log2f@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call sinhf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 32(%rsp, %r14, 4), %xmm0
+ vmovss 32(%rsp, %r14, 4), %xmm0
call sinhf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 64(%rsp, %r14, 4)
+ vmovss %xmm0, 64(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %r12d, %r14d
- movss 64(%rsp, %r14, 4), %xmm0
+ vmovss 64(%rsp, %r14, 4), %xmm0
call tanf@PLT
# LOE rbx r14 r15 r12d r13d xmm0
- movss %xmm0, 128(%rsp, %r14, 4)
+ vmovss %xmm0, 128(%rsp, %r14, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
L(SCALAR_MATH_CALL):
movl %ebx, %r13d
- movss 32(%rsp, %r13, 4), %xmm0
+ vmovss 32(%rsp, %r13, 4), %xmm0
call tanf@PLT
# LOE r13 r14 r15 ebx r12d xmm0
- movss %xmm0, 64(%rsp, %r13, 4)
+ vmovss %xmm0, 64(%rsp, %r13, 4)
/* Process special inputs in loop */
jmp L(SPECIAL_VALUES_LOOP)
tzcntl %ebx, %ebp
/* Scalar math function call to process special input. */
- movss 64(%rsp, %rbp, 4), %xmm0
+ vmovss 64(%rsp, %rbp, 4), %xmm0
call tanhf@PLT
/* No good way to avoid the store-forwarding fault this will cause on
return. `lfence` avoids the SF fault but at greater cost as it
serializes stack/callee save restoration. */
- movss %xmm0, (%rsp, %rbp, 4)
+ vmovss %xmm0, (%rsp, %rbp, 4)
blsrl %ebx, %ebx
jnz L(SPECIAL_VALUES_LOOP)
tzcntl %ebx, %ebp
/* Scalar math function call to process special input. */
- movss 32(%rsp, %rbp, 4), %xmm0
+ vmovss 32(%rsp, %rbp, 4), %xmm0
call tanhf@PLT
/* No good way to avoid the store-forwarding fault this will cause on
return. `lfence` avoids the SF fault but at greater cost as it
serializes stack/callee save restoration. */
- movss %xmm0, (%rsp, %rbp, 4)
+ vmovss %xmm0, (%rsp, %rbp, 4)
blsrl %ebx, %ebx
jnz L(SPECIAL_VALUES_LOOP)
.section SECTION(.text), "ax", @progbits
ENTRY(STRRCHR)
- movd %esi, %xmm7
+ vmovd %esi, %xmm7
movl %edi, %eax
/* Broadcast CHAR to YMM4. */
VPBROADCAST %xmm7, %ymm7