@@ -219,4 +219,15 @@
#define __DECL_SIMD_atan2f32x
#define __DECL_SIMD_atan2f64x
#define __DECL_SIMD_atan2f128x
+
+#define __DECL_SIMD_log10
+#define __DECL_SIMD_log10f
+#define __DECL_SIMD_log10l
+#define __DECL_SIMD_log10f16
+#define __DECL_SIMD_log10f32
+#define __DECL_SIMD_log10f64
+#define __DECL_SIMD_log10f128
+#define __DECL_SIMD_log10f32x
+#define __DECL_SIMD_log10f64x
+#define __DECL_SIMD_log10f128x
#endif
@@ -104,7 +104,7 @@ __MATHCALL (ldexp,, (_Mdouble_ __x, int __exponent));
__MATHCALL_VEC (log,, (_Mdouble_ __x));
/* Base-ten logarithm of X. */
-__MATHCALL (log10,, (_Mdouble_ __x));
+__MATHCALL_VEC (log10,, (_Mdouble_ __x));
/* Break VALUE into integral and fractional parts. */
__MATHCALL (modf,, (_Mdouble_ __x, _Mdouble_ *__iptr)) __nonnull ((2));
@@ -54,6 +54,7 @@ GLIBC_2.35 _ZGVbN2v_cosh F
GLIBC_2.35 _ZGVbN2v_exp10 F
GLIBC_2.35 _ZGVbN2v_exp2 F
GLIBC_2.35 _ZGVbN2v_expm1 F
+GLIBC_2.35 _ZGVbN2v_log10 F
GLIBC_2.35 _ZGVbN2v_sinh F
GLIBC_2.35 _ZGVbN2vv_atan2 F
GLIBC_2.35 _ZGVbN2vv_hypot F
@@ -65,6 +66,7 @@ GLIBC_2.35 _ZGVbN4v_coshf F
GLIBC_2.35 _ZGVbN4v_exp10f F
GLIBC_2.35 _ZGVbN4v_exp2f F
GLIBC_2.35 _ZGVbN4v_expm1f F
+GLIBC_2.35 _ZGVbN4v_log10f F
GLIBC_2.35 _ZGVbN4v_sinhf F
GLIBC_2.35 _ZGVbN4vv_atan2f F
GLIBC_2.35 _ZGVbN4vv_hypotf F
@@ -76,6 +78,7 @@ GLIBC_2.35 _ZGVcN4v_cosh F
GLIBC_2.35 _ZGVcN4v_exp10 F
GLIBC_2.35 _ZGVcN4v_exp2 F
GLIBC_2.35 _ZGVcN4v_expm1 F
+GLIBC_2.35 _ZGVcN4v_log10 F
GLIBC_2.35 _ZGVcN4v_sinh F
GLIBC_2.35 _ZGVcN4vv_atan2 F
GLIBC_2.35 _ZGVcN4vv_hypot F
@@ -87,6 +90,7 @@ GLIBC_2.35 _ZGVcN8v_coshf F
GLIBC_2.35 _ZGVcN8v_exp10f F
GLIBC_2.35 _ZGVcN8v_exp2f F
GLIBC_2.35 _ZGVcN8v_expm1f F
+GLIBC_2.35 _ZGVcN8v_log10f F
GLIBC_2.35 _ZGVcN8v_sinhf F
GLIBC_2.35 _ZGVcN8vv_atan2f F
GLIBC_2.35 _ZGVcN8vv_hypotf F
@@ -98,6 +102,7 @@ GLIBC_2.35 _ZGVdN4v_cosh F
GLIBC_2.35 _ZGVdN4v_exp10 F
GLIBC_2.35 _ZGVdN4v_exp2 F
GLIBC_2.35 _ZGVdN4v_expm1 F
+GLIBC_2.35 _ZGVdN4v_log10 F
GLIBC_2.35 _ZGVdN4v_sinh F
GLIBC_2.35 _ZGVdN4vv_atan2 F
GLIBC_2.35 _ZGVdN4vv_hypot F
@@ -109,6 +114,7 @@ GLIBC_2.35 _ZGVdN8v_coshf F
GLIBC_2.35 _ZGVdN8v_exp10f F
GLIBC_2.35 _ZGVdN8v_exp2f F
GLIBC_2.35 _ZGVdN8v_expm1f F
+GLIBC_2.35 _ZGVdN8v_log10f F
GLIBC_2.35 _ZGVdN8v_sinhf F
GLIBC_2.35 _ZGVdN8vv_atan2f F
GLIBC_2.35 _ZGVdN8vv_hypotf F
@@ -120,6 +126,7 @@ GLIBC_2.35 _ZGVeN16v_coshf F
GLIBC_2.35 _ZGVeN16v_exp10f F
GLIBC_2.35 _ZGVeN16v_exp2f F
GLIBC_2.35 _ZGVeN16v_expm1f F
+GLIBC_2.35 _ZGVeN16v_log10f F
GLIBC_2.35 _ZGVeN16v_sinhf F
GLIBC_2.35 _ZGVeN16vv_atan2f F
GLIBC_2.35 _ZGVeN16vv_hypotf F
@@ -131,6 +138,7 @@ GLIBC_2.35 _ZGVeN8v_cosh F
GLIBC_2.35 _ZGVeN8v_exp10 F
GLIBC_2.35 _ZGVeN8v_exp2 F
GLIBC_2.35 _ZGVeN8v_expm1 F
+GLIBC_2.35 _ZGVeN8v_log10 F
GLIBC_2.35 _ZGVeN8v_sinh F
GLIBC_2.35 _ZGVeN8vv_atan2 F
GLIBC_2.35 _ZGVeN8vv_hypot F
@@ -102,6 +102,10 @@
# define __DECL_SIMD_atan2 __DECL_SIMD_x86_64
# undef __DECL_SIMD_atan2f
# define __DECL_SIMD_atan2f __DECL_SIMD_x86_64
+# undef __DECL_SIMD_log10
+# define __DECL_SIMD_log10 __DECL_SIMD_x86_64
+# undef __DECL_SIMD_log10f
+# define __DECL_SIMD_log10f __DECL_SIMD_x86_64
# endif
#endif
@@ -50,6 +50,8 @@
!GCC$ builtin (cbrtf) attributes simd (notinbranch) if('x86_64')
!GCC$ builtin (atan2) attributes simd (notinbranch) if('x86_64')
!GCC$ builtin (atan2f) attributes simd (notinbranch) if('x86_64')
+!GCC$ builtin (log10) attributes simd (notinbranch) if('x86_64')
+!GCC$ builtin (log10f) attributes simd (notinbranch) if('x86_64')
!GCC$ builtin (cos) attributes simd (notinbranch) if('x32')
!GCC$ builtin (cosf) attributes simd (notinbranch) if('x32')
@@ -85,3 +87,5 @@
!GCC$ builtin (cbrtf) attributes simd (notinbranch) if('x32')
!GCC$ builtin (atan2) attributes simd (notinbranch) if('x32')
!GCC$ builtin (atan2f) attributes simd (notinbranch) if('x32')
+!GCC$ builtin (log10) attributes simd (notinbranch) if('x32')
+!GCC$ builtin (log10f) attributes simd (notinbranch) if('x32')
@@ -35,6 +35,7 @@ libmvec-funcs = \
expm1 \
hypot \
log \
+ log10 \
pow \
sin \
sincos \
@@ -22,6 +22,7 @@ libmvec {
_ZGVbN2v_exp10; _ZGVcN4v_exp10; _ZGVdN4v_exp10; _ZGVeN8v_exp10;
_ZGVbN2v_exp2; _ZGVcN4v_exp2; _ZGVdN4v_exp2; _ZGVeN8v_exp2;
_ZGVbN2v_expm1; _ZGVcN4v_expm1; _ZGVdN4v_expm1; _ZGVeN8v_expm1;
+ _ZGVbN2v_log10; _ZGVcN4v_log10; _ZGVdN4v_log10; _ZGVeN8v_log10;
_ZGVbN2v_sinh; _ZGVcN4v_sinh; _ZGVdN4v_sinh; _ZGVeN8v_sinh;
_ZGVbN2vv_atan2; _ZGVcN4vv_atan2; _ZGVdN4vv_atan2; _ZGVeN8vv_atan2;
_ZGVbN2vv_hypot; _ZGVcN4vv_hypot; _ZGVdN4vv_hypot; _ZGVeN8vv_hypot;
@@ -33,6 +34,7 @@ libmvec {
_ZGVbN4v_exp10f; _ZGVcN8v_exp10f; _ZGVdN8v_exp10f; _ZGVeN16v_exp10f;
_ZGVbN4v_exp2f; _ZGVcN8v_exp2f; _ZGVdN8v_exp2f; _ZGVeN16v_exp2f;
_ZGVbN4v_expm1f; _ZGVcN8v_expm1f; _ZGVdN8v_expm1f; _ZGVeN16v_expm1f;
+ _ZGVbN4v_log10f; _ZGVcN8v_log10f; _ZGVdN8v_log10f; _ZGVeN16v_log10f;
_ZGVbN4v_sinhf; _ZGVcN8v_sinhf; _ZGVdN8v_sinhf; _ZGVeN16v_sinhf;
_ZGVbN4vv_atan2f; _ZGVcN8vv_atan2f; _ZGVdN8vv_atan2f; _ZGVeN16vv_atan2f;
_ZGVbN4vv_hypotf; _ZGVcN8vv_hypotf; _ZGVdN8vv_hypotf; _ZGVeN16vv_hypotf;
@@ -1641,6 +1641,26 @@ float: 2
float128: 1
ldouble: 1
+Function: "log10_vlen16":
+float: 1
+
+Function: "log10_vlen2":
+double: 1
+
+Function: "log10_vlen4":
+double: 1
+float: 1
+
+Function: "log10_vlen4_avx2":
+double: 1
+
+Function: "log10_vlen8":
+double: 1
+float: 1
+
+Function: "log10_vlen8_avx2":
+float: 1
+
Function: "log1p":
double: 1
float: 1
new file mode 100644
@@ -0,0 +1,20 @@
+/* SSE2 version of vectorized log10, vector length is 2.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define _ZGVbN2v_log10 _ZGVbN2v_log10_sse2
+#include "../svml_d_log102_core.S"
new file mode 100644
@@ -0,0 +1,27 @@
+/* Multiple versions of vectorized log10, vector length is 2.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define SYMBOL_NAME _ZGVbN2v_log10
+#include "ifunc-mathvec-sse4_1.h"
+
+libc_ifunc_redirected (REDIRECT_NAME, SYMBOL_NAME, IFUNC_SELECTOR ());
+
+#ifdef SHARED
+__hidden_ver1 (_ZGVbN2v_log10, __GI__ZGVbN2v_log10, __redirect__ZGVbN2v_log10)
+ __attribute__ ((visibility ("hidden")));
+#endif
new file mode 100644
@@ -0,0 +1,1086 @@
+/* Function log10 vectorized with SSE4.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+   <https://www.gnu.org/licenses/>.  */
+
+/*
+ * ALGORITHM DESCRIPTION:
+ *
+ * Get short reciprocal approximation Rcp ~ 1/mantissa(x)
+ * R = Rcp*x - 1.0
+ * log10(x) = k*log10(2.0) - log10(Rcp) + poly_approximation(R)
+ * log10(Rcp) is tabulated
+ *
+ *
+ */
+
+/* Byte offsets of the fields of data table __svml_dlog10_data_internal,
+ * used as displacements from the table symbol in the memory operands below. */
+#define Log_HA_table 0
+#define Log_LA_table 4112
+#define poly_coeff 8224
+#define ExpMask 8304
+#define Two10 8320
+#define MinNorm 8336
+#define MaxNorm 8352
+#define HalfMask 8368
+#define One 8384
+#define Threshold 8400
+#define Bias 8416
+#define Bias1 8432
+#define L2 8448
+
+#include <sysdep.h>
+
+ .text
+ .section .text.sse4,"ax",@progbits
+ENTRY(_ZGVbN2v_log10_sse4)
+        pushq     %rbp
+        cfi_def_cfa_offset(16)
+        movq      %rsp, %rbp
+        cfi_def_cfa(6, 16)
+        cfi_offset(6, -16)
+        andq      $-32, %rsp
+        subq      $64, %rsp
+
+/* exponent bits: xmm5 = x >> 20 per 64-bit lane; its high dwords are converted below */
+        movaps    %xmm0, %xmm5
+
+/* preserve mantissa, set input exponent to 2^(-10) */
+        movups    ExpMask+__svml_dlog10_data_internal(%rip), %xmm1
+        psrlq     $20, %xmm5
+        andps     %xmm0, %xmm1
+        lea       -4222960+__svml_dlog10_data_internal(%rip), %rsi
+        orps      Two10+__svml_dlog10_data_internal(%rip), %xmm1
+
+/* check range: xmm8 = (x < MinNorm), xmm7 = !(x <= MaxNorm) */
+        movaps    %xmm0, %xmm8
+
+/* reciprocal approximation good to at least 11 bits */
+        cvtpd2ps  %xmm1, %xmm2
+        cmpltpd   MinNorm+__svml_dlog10_data_internal(%rip), %xmm8
+        movlhps   %xmm2, %xmm2
+        movaps    %xmm0, %xmm7
+        rcpps     %xmm2, %xmm3
+        cmpnlepd  MaxNorm+__svml_dlog10_data_internal(%rip), %xmm7
+        cvtps2pd  %xmm3, %xmm12
+
+/* round reciprocal to nearest integer, will have 1+9 mantissa bits */
+        movups    .FLT_12(%rip), %xmm4
+        orps      %xmm7, %xmm8
+        addpd     %xmm4, %xmm12
+
+/* combine and get argument value range mask in edx (bit i set: lane i goes to the scalar path) */
+        movmskpd  %xmm8, %edx
+
+/* argument reduction: R = Rcp*m - 1.0, with m (xmm1) split into (m & HalfMask) and the remainder */
+        movups    HalfMask+__svml_dlog10_data_internal(%rip), %xmm9
+        subpd     %xmm4, %xmm12
+        andps     %xmm1, %xmm9
+
+/*
+ * prepare table index: xmm10 = reciprocal bits >> 40, one byte offset per lane
+ * table lookup: offsets are applied to rsi (= Log_LA_table - 0x408000) below
+ */
+        movaps    %xmm12, %xmm10
+        subpd     %xmm9, %xmm1
+        mulpd     %xmm12, %xmm9
+        mulpd     %xmm12, %xmm1
+        subpd     One+__svml_dlog10_data_internal(%rip), %xmm9
+        addpd     %xmm9, %xmm1
+
+/* polynomial in R (xmm1) using the five poly_coeff entries */
+        movups    poly_coeff+__svml_dlog10_data_internal(%rip), %xmm14
+        psrlq     $40, %xmm10
+        mulpd     %xmm1, %xmm14
+        movd      %xmm10, %eax
+        pshufd    $2, %xmm10, %xmm11
+        movaps    %xmm1, %xmm10
+        movups    poly_coeff+32+__svml_dlog10_data_internal(%rip), %xmm15
+        mulpd     %xmm1, %xmm10
+        addpd     poly_coeff+16+__svml_dlog10_data_internal(%rip), %xmm14
+        mulpd     %xmm1, %xmm15
+        mulpd     %xmm10, %xmm14
+        addpd     poly_coeff+48+__svml_dlog10_data_internal(%rip), %xmm15
+        movd      %xmm11, %ecx
+
+/* exponent*log10(2.0), cf. the algorithm description (assumes L2 holds log10(2.0) - TODO confirm) */
+        movups    Threshold+__svml_dlog10_data_internal(%rip), %xmm13
+        addpd     %xmm14, %xmm15
+        cmpltpd   %xmm12, %xmm13
+        mulpd     %xmm15, %xmm10
+        pshufd    $221, %xmm5, %xmm6
+        movups    poly_coeff+64+__svml_dlog10_data_internal(%rip), %xmm11
+
+/* biased exponent in DP format */
+        cvtdq2pd  %xmm6, %xmm3
+        mulpd     %xmm1, %xmm11
+        andps     Bias+__svml_dlog10_data_internal(%rip), %xmm13
+        orps      Bias1+__svml_dlog10_data_internal(%rip), %xmm13
+        subpd     %xmm13, %xmm3
+        addpd     %xmm10, %xmm11
+        mulpd     L2+__svml_dlog10_data_internal(%rip), %xmm3
+        movslq    %eax, %rax
+        movslq    %ecx, %rcx
+        movsd     (%rsi,%rax), %xmm2
+        movhpd    (%rsi,%rcx), %xmm2
+
+/* reconstruction: result (xmm3) = scaled exponent + table value + polynomial */
+        addpd     %xmm11, %xmm2
+        addpd     %xmm2, %xmm3
+        testl     %edx, %edx
+
+/* Go to special inputs processing branch */
+        jne       L(SPECIAL_VALUES_BRANCH)
+                                # LOE rbx r12 r13 r14 r15 edx xmm0 xmm3
+
+/* Restore registers
+ * and exit the function
+ */
+
+L(EXIT):
+        movaps    %xmm3, %xmm0
+        movq      %rbp, %rsp
+        popq      %rbp
+        cfi_def_cfa(7, 8)
+        cfi_restore(6)
+        ret
+        cfi_def_cfa(6, 16)
+        cfi_offset(6, -16)
+
+/* Branch to process
+ * special inputs: spill input (xmm0) and fast-path result (xmm3) to the stack
+ */
+
+L(SPECIAL_VALUES_BRANCH):
+        movups    %xmm0, 32(%rsp)
+        movups    %xmm3, 48(%rsp)
+                                # LOE rbx r12 r13 r14 r15 edx
+
+        xorl      %eax, %eax
+        movq      %r12, 16(%rsp)
+        /*  DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -48; DW_OP_plus)  */
+        .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd0, 0xff, 0xff, 0xff, 0x22
+        movl      %eax, %r12d
+        movq      %r13, 8(%rsp)
+        /*  DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -56; DW_OP_plus)  */
+        .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xc8, 0xff, 0xff, 0xff, 0x22
+        movl      %edx, %r13d
+        movq      %r14, (%rsp)
+        /*  DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -64; DW_OP_plus)  */
+        .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x22
+                                # LOE rbx r15 r12d r13d
+
+/* Range mask
+ * bits check: test bit r12d (lane index) of r13d (range mask)
+ */
+
+L(RANGEMASK_CHECK):
+        btl       %r12d, %r13d
+
+/* Call scalar math function */
+        jc        L(SCALAR_MATH_CALL)
+                                # LOE rbx r15 r12d r13d
+
+/* Special inputs
+ * processing loop: advance the lane index over the 2 lanes
+ */
+
+L(SPECIAL_VALUES_LOOP):
+        incl      %r12d
+        cmpl      $2, %r12d
+
+/* Check bits in range mask */
+        jl        L(RANGEMASK_CHECK)
+                                # LOE rbx r15 r12d r13d
+
+        movq      16(%rsp), %r12
+        cfi_restore(12)
+        movq      8(%rsp), %r13
+        cfi_restore(13)
+        movq      (%rsp), %r14
+        cfi_restore(14)
+        movups    48(%rsp), %xmm3
+
+/* Go to exit */
+        jmp       L(EXIT)
+        /*  DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -48; DW_OP_plus)  */
+        .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xd0, 0xff, 0xff, 0xff, 0x22
+        /*  DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -56; DW_OP_plus)  */
+        .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xc8, 0xff, 0xff, 0xff, 0x22
+        /*  DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -64; DW_OP_plus)  */
+        .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x22
+                                # LOE rbx r12 r13 r14 r15 xmm3
+
+/* Scalar math function call
+ * to process special input: lane r14 of the saved input, result written to the saved result vector
+ */
+
+L(SCALAR_MATH_CALL):
+        movl      %r12d, %r14d
+        movsd     32(%rsp,%r14,8), %xmm0
+        call      log10@PLT
+                                # LOE rbx r14 r15 r12d r13d xmm0
+
+        movsd     %xmm0, 48(%rsp,%r14,8)
+
+/* Process special inputs in loop */
+        jmp       L(SPECIAL_VALUES_LOOP)
+                                # LOE rbx r15 r12d r13d
+END(_ZGVbN2v_log10_sse4)
+
+ .section .rodata, "a"
+ .align 16
+
+#ifdef __svml_dlog10_data_internal_typedef
+typedef unsigned int VUINT32;
+typedef struct {
+ __declspec(align(16)) VUINT32 Log_HA_table[(1<<9)+2][2];
+ __declspec(align(16)) VUINT32 Log_LA_table[(1<<9)+1][2];
+ __declspec(align(16)) VUINT32 poly_coeff[5][2][2];
+ __declspec(align(16)) VUINT32 ExpMask[2][2];
+ __declspec(align(16)) VUINT32 Two10[2][2];
+ __declspec(align(16)) VUINT32 MinNorm[2][2];
+ __declspec(align(16)) VUINT32 MaxNorm[2][2];
+ __declspec(align(16)) VUINT32 HalfMask[2][2];
+ __declspec(align(16)) VUINT32 One[2][2];
+ __declspec(align(16)) VUINT32 Threshold[2][2];
+ __declspec(align(16)) VUINT32 Bias[2][2];
+ __declspec(align(16)) VUINT32 Bias1[2][2];
+ __declspec(align(16)) VUINT32 L2[2][2];
+} __svml_dlog10_data_internal;
+#endif
+__svml_dlog10_data_internal:
+ /* Log_HA_table */
+ .quad 0xc0733a7146f6b080, 0xbe1e707ce619c200
+ .quad 0xc0733a7547771970, 0xbe1e79c6c06d6f51
+ .quad 0xc0733a7945aacb70, 0xbe1e78e225fad29c
+ .quad 0xc0733a7d41946970, 0xbe1e76d607f9693b
+ .quad 0xc0733a813b3691f0, 0xbe1e7704b3e0685b
+ .quad 0xc0733a853293df00, 0xbe1e79c1216a27fa
+ .quad 0xc0733a8927aee660, 0xbe1e76dce5734a81
+ .quad 0xc0733a8d1a8a3920, 0xbe1e782ee2ca4dba
+ .quad 0xc0733a910b286430, 0xbe1e7812d1a0a61f
+ .quad 0xc0733a94f98bf010, 0xbe1e77e1b5ecbc61
+ .quad 0xc0733a98e5b76100, 0xbe1e76635cac1586
+ .quad 0xc0733a9ccfad36f0, 0xbe1e7638f7968f32
+ .quad 0xc0733aa0b76feda0, 0xbe1e7840ee76e365
+ .quad 0xc0733aa49d01fcb0, 0xbe1e79f3fd01907e
+ .quad 0xc0733aa88065d7a0, 0xbe1e77bbb3a9c38a
+ .quad 0xc0733aac619dedb0, 0xbe1e7742719bf41d
+ .quad 0xc0733ab040acaa20, 0xbe1e79bcedaf79cb
+ .quad 0xc0733ab41d947450, 0xbe1e762d63cb7ca0
+ .quad 0xc0733ab7f857af50, 0xbe1e77a07be83403
+ .quad 0xc0733abbd0f8ba80, 0xbe1e7763ff836ad0
+ .quad 0xc0733abfa779f130, 0xbe1e7737720ead39
+ .quad 0xc0733ac37bddaad0, 0xbe1e7776a08e55e7
+ .quad 0xc0733ac74e263af0, 0xbe1e793e3c52dd36
+ .quad 0xc0733acb1e55f160, 0xbe1e788a94695051
+ .quad 0xc0733aceec6f1a10, 0xbe1e76508114a813
+ .quad 0xc0733ad2b873fd20, 0xbe1e76909457d23e
+ .quad 0xc0733ad68266df10, 0xbe1e7664a24f9ca4
+ .quad 0xc0733ada4a4a0090, 0xbe1e7a07b3d44b18
+ .quad 0xc0733ade101f9ee0, 0xbe1e76d87594704d
+ .quad 0xc0733ae1d3e9f340, 0xbe1e79563595a182
+ .quad 0xc0733ae595ab33b0, 0xbe1e771880c3c6ab
+ .quad 0xc0733ae955659250, 0xbe1e78c171f517d4
+ .quad 0xc0733aed131b3df0, 0xbe1e77eac3874666
+ .quad 0xc0733af0cece61b0, 0xbe1e790db479d8f6
+ .quad 0xc0733af488812550, 0xbe1e7965d1aa5c90
+ .quad 0xc0733af84035ad10, 0xbe1e78ceb398ba47
+ .quad 0xc0733afbf5ee19c0, 0xbe1e779cc0dcb5aa
+ .quad 0xc0733affa9ac88c0, 0xbe1e7871053953ed
+ .quad 0xc0733b035b731420, 0xbe1e7a082cffa71a
+ .quad 0xc0733b070b43d2a0, 0xbe1e7904b4382fad
+ .quad 0xc0733b0ab920d790, 0xbe1e79b458d0b4f3
+ .quad 0xc0733b0e650c3310, 0xbe1e79d0ded414c6
+ .quad 0xc0733b120f07f200, 0xbe1e763c357a1943
+ .quad 0xc0733b15b7161dd0, 0xbe1e78b80ba6daaa
+ .quad 0xc0733b195d38bd00, 0xbe1e7998e23b8ffd
+ .quad 0xc0733b1d0171d2c0, 0xbe1e7974aa65ee8c
+ .quad 0xc0733b20a3c35f20, 0xbe1e76ccfde752ab
+ .quad 0xc0733b24442f5ef0, 0xbe1e77b4ff19debb
+ .quad 0xc0733b27e2b7cc10, 0xbe1e7772ee478542
+ .quad 0xc0733b2b7f5e9d30, 0xbe1e781d81b58b44
+ .quad 0xc0733b2f1a25c600, 0xbe1e78350d967565
+ .quad 0xc0733b32b30f3720, 0xbe1e783888e48152
+ .quad 0xc0733b364a1cde30, 0xbe1e78367bf7c111
+ .quad 0xc0733b39df50a5d0, 0xbe1e7959e57ca47d
+ .quad 0xc0733b3d72ac75c0, 0xbe1e777322423222
+ .quad 0xc0733b41043232b0, 0xbe1e767ce42a60aa
+ .quad 0xc0733b4493e3be70, 0xbe1e781d445aea19
+ .quad 0xc0733b4821c2f800, 0xbe1e7922fca18e18
+ .quad 0xc0733b4badd1bb80, 0xbe1e76fed3d40647
+ .quad 0xc0733b4f3811e210, 0xbe1e793948c9eabc
+ .quad 0xc0733b52c0854240, 0xbe1e76e487656b8c
+ .quad 0xc0733b56472daf90, 0xbe1e780ab2f71223
+ .quad 0xc0733b59cc0cfaf0, 0xbe1e77189120b09c
+ .quad 0xc0733b5d4f24f270, 0xbe1e7644a0343a12
+ .quad 0xc0733b60d0776160, 0xbe1e78f2a3e4733d
+ .quad 0xc0733b6450061080, 0xbe1e7913b2f73ae5
+ .quad 0xc0733b67cdd2c5c0, 0xbe1e7882d08393b5
+ .quad 0xc0733b6b49df4470, 0xbe1e765e1b209979
+ .quad 0xc0733b6ec42d4d20, 0xbe1e785c9c4620d4
+ .quad 0xc0733b75b394f240, 0xbe1e78878cd0e956
+ .quad 0xc0733b7c9c178630, 0xbe1e789a4112d90b
+ .quad 0xc0733b837dc2b0f0, 0xbe1e79050b8a1766
+ .quad 0xc0733b8a58a3f220, 0xbe1e7790dffc47aa
+ .quad 0xc0733b912cc8a180, 0xbe1e77174593b06a
+ .quad 0xc0733b97fa3defb0, 0xbe1e7677de2d2ecc
+ .quad 0xc0733b9ec110e6b0, 0xbe1e76cff477ca18
+ .quad 0xc0733ba5814e6a80, 0xbe1e78f8644dec7b
+ .quad 0xc0733bac3b0339d0, 0xbe1e764e1361788d
+ .quad 0xc0733bb2ee3bee30, 0xbe1e78c913e738de
+ .quad 0xc0733bb99b04fd30, 0xbe1e76666f5bddaa
+ .quad 0xc0733bc0416ab850, 0xbe1e77e87cbd8ab6
+ .quad 0xc0733bc6e1794e10, 0xbe1e76f18ba1c966
+ .quad 0xc0733bcd7b3cca10, 0xbe1e777c9461b8db
+ .quad 0xc0733bd40ec115d0, 0xbe1e78b78526ffac
+ .quad 0xc0733bda9c11f920, 0xbe1e7942abecfede
+ .quad 0xc0733be1233b1aa0, 0xbe1e76d8a684fd8c
+ .quad 0xc0733be7a4480010, 0xbe1e79622b539ac9
+ .quad 0xc0733bee1f440f30, 0xbe1e7978e7cc20ea
+ .quad 0xc0733bf4943a8de0, 0xbe1e765c9c9de825
+ .quad 0xc0733bfb0336a290, 0xbe1e775d8b138ee2
+ .quad 0xc0733c016c435500, 0xbe1e78bf33465c2f
+ .quad 0xc0733c07cf6b8e80, 0xbe1e78164f7cc441
+ .quad 0xc0733c0e2cba1a50, 0xbe1e7824e64d0b23
+ .quad 0xc0733c148439a630, 0xbe1e78373ae7dd81
+ .quad 0xc0733c1ad5f4c2c0, 0xbe1e7704513e0afe
+ .quad 0xc0733c2121f5e3d0, 0xbe1e7914aa84200f
+ .quad 0xc0733c2768476110, 0xbe1e76b1cde25cf6
+ .quad 0xc0733c2da8f37600, 0xbe1e796120e3862d
+ .quad 0xc0733c33e40442e0, 0xbe1e78ec836d7e7b
+ .quad 0xc0733c3a1983cca0, 0xbe1e77fb13b7dabb
+ .quad 0xc0733c40497bfd70, 0xbe1e783c6fcb2404
+ .quad 0xc0733c4673f6a530, 0xbe1e7628bb93dce8
+ .quad 0xc0733c4c98fd7990, 0xbe1e7857a47b5001
+ .quad 0xc0733c52b89a16d0, 0xbe1e76708dc2831f
+ .quad 0xc0733c58d2d5ffa0, 0xbe1e77b6038651f1
+ .quad 0xc0733c5ee7ba9de0, 0xbe1e792e855bb5b2
+ .quad 0xc0733c64f75142d0, 0xbe1e776cacd5c105
+ .quad 0xc0733c6b01a32740, 0xbe1e77f8a8011315
+ .quad 0xc0733c7106b96c30, 0xbe1e765cf3efcfde
+ .quad 0xc0733c77069d1ad0, 0xbe1e78d837d2efac
+ .quad 0xc0733c7d01572530, 0xbe1e78b615cf772c
+ .quad 0xc0733c82f6f06640, 0xbe1e7650bbbd7a25
+ .quad 0xc0733c88e771a220, 0xbe1e78bcf3495872
+ .quad 0xc0733c8ed2e386c0, 0xbe1e792266832e84
+ .quad 0xc0733c94b94eabd0, 0xbe1e79c1c3c2ca52
+ .quad 0xc0733c9a9abb9340, 0xbe1e78aa61e5807d
+ .quad 0xc0733ca07732a970, 0xbe1e7620fc4cf156
+ .quad 0xc0733ca64ebc4570, 0xbe1e76b914a832c5
+ .quad 0xc0733cac2160a970, 0xbe1e79227f72020e
+ .quad 0xc0733cb1ef280300, 0xbe1e77ac972cc008
+ .quad 0xc0733cb7b81a6b10, 0xbe1e798089be41f4
+ .quad 0xc0733cbd7c3fe6a0, 0xbe1e77942ae037fe
+ .quad 0xc0733cc33ba06690, 0xbe1e7956ae6463d9
+ .quad 0xc0733cc8f643c850, 0xbe1e7918a50c7942
+ .quad 0xc0733cceac31d5d0, 0xbe1e78308eeab604
+ .quad 0xc0733cd45d7245e0, 0xbe1e76dd4ea88445
+ .quad 0xc0733cda0a0cbc60, 0xbe1e77e7c1aa5909
+ .quad 0xc0733cdfb208caa0, 0xbe1e7804b9d20e54
+ .quad 0xc0733ce5556def70, 0xbe1e78f88e99d49c
+ .quad 0xc0733ceaf4439780, 0xbe1e787d74682d68
+ .quad 0xc0733cf08e911d80, 0xbe1e76edc24fe6e7
+ .quad 0xc0733cf6245dca50, 0xbe1e79b347ec86d2
+ .quad 0xc0733cfbb5b0d580, 0xbe1e797cceb2c39b
+ .quad 0xc0733d0142916530, 0xbe1e783adbdc6aa1
+ .quad 0xc0733d06cb068e70, 0xbe1e76e4c20e3d9e
+ .quad 0xc0733d0c4f175570, 0xbe1e77070bf3cf61
+ .quad 0xc0733d11cecaadc0, 0xbe1e781c43502734
+ .quad 0xc0733d174a277a80, 0xbe1e78b11268ea72
+ .quad 0xc0733d1cc1348e90, 0xbe1e7754b83bfc7d
+ .quad 0xc0733d2233f8acb0, 0xbe1e7756c29bf5e9
+ .quad 0xc0733d27a27a87d0, 0xbe1e7952fc1d9333
+ .quad 0xc0733d2d0cc0c350, 0xbe1e778c76ae6077
+ .quad 0xc0733d3272d1f2e0, 0xbe1e7a1896ba8f43
+ .quad 0xc0733d37d4b49b30, 0xbe1e76dafdf432d8
+ .quad 0xc0733d3d326f3180, 0xbe1e795330184013
+ .quad 0xc0733d428c081c80, 0xbe1e763cc774d30f
+ .quad 0xc0733d47e185b3d0, 0xbe1e77030a779c0a
+ .quad 0xc0733d4d32ee40b0, 0xbe1e7908af2a2d7e
+ .quad 0xc0733d528047fe00, 0xbe1e78c4953b797d
+ .quad 0xc0733d57c9991850, 0xbe1e78b43b096579
+ .quad 0xc0733d5d0ee7ae30, 0xbe1e7824ae0a4804
+ .quad 0xc0733d625039d040, 0xbe1e79d2b2fbb740
+ .quad 0xc0733d678d958190, 0xbe1e7662de59a1a6
+ .quad 0xc0733d6cc700b760, 0xbe1e76b251d59aaa
+ .quad 0xc0733d71fc8159b0, 0xbe1e7a00cfd1f487
+ .quad 0xc0733d772e1d4360, 0xbe1e77f4d246167e
+ .quad 0xc0733d7c5bda4200, 0xbe1e767a4ee8e6fc
+ .quad 0xc0733d8185be1640, 0xbe1e777ccf0a8aed
+ .quad 0xc0733d86abce7420, 0xbe1e767d7e279ada
+ .quad 0xc0733d8bce1102d0, 0xbe1e7a05cef4bb90
+ .quad 0xc0733d90ec8b5d40, 0xbe1e78f75369be5b
+ .quad 0xc0733d96074311d0, 0xbe1e77b9612e8c8a
+ .quad 0xc0733d9b1e3da2b0, 0xbe1e794518b9adeb
+ .quad 0xc0733da031808620, 0xbe1e7810626fb934
+ .quad 0xc0733da541112650, 0xbe1e76d87223fa6d
+ .quad 0xc0733daa4cf4e1a0, 0xbe1e794c5e7ca3b5
+ .quad 0xc0733daf55310af0, 0xbe1e789856ef816f
+ .quad 0xc0733db459cae970, 0xbe1e77d2004effbd
+ .quad 0xc0733db95ac7b8f0, 0xbe1e78467d31eb9c
+ .quad 0xc0733dbe582caa00, 0xbe1e79aaa4e25787
+ .quad 0xc0733dc351fee220, 0xbe1e762de8f107bf
+ .quad 0xc0733dc848437b90, 0xbe1e7670670a63fe
+ .quad 0xc0733dcd3aff85d0, 0xbe1e795ca237c6cc
+ .quad 0xc0733dd22a3805b0, 0xbe1e77e55c53c1d9
+ .quad 0xc0733dd715f1f520, 0xbe1e78a806213ac4
+ .quad 0xc0733ddbfe3243b0, 0xbe1e77743a2bc615
+ .quad 0xc0733de0e2fdd660, 0xbe1e78b8b45b0b7d
+ .quad 0xc0733de5c4598800, 0xbe1e78d635f2f4b9
+ .quad 0xc0733deaa24a2920, 0xbe1e7758c396a11e
+ .quad 0xc0733def7cd48020, 0xbe1e7a17a8cc454c
+ .quad 0xc0733df453fd49a0, 0xbe1e783caa73f616
+ .quad 0xc0733df927c93820, 0xbe1e7932cfa29664
+ .quad 0xc0733dfdf83cf490, 0xbe1e777d265c72a6
+ .quad 0xc0733e02c55d1e10, 0xbe1e7775e7c03c60
+ .quad 0xc0733e078f2e4a40, 0xbe1e79f65d52d232
+ .quad 0xc0733e0c55b50570, 0xbe1e76e7e7464b4e
+ .quad 0xc0733e1118f5d250, 0xbe1e77be81cad877
+ .quad 0xc0733e15d8f52a80, 0xbe1e79dd25b5fb3a
+ .quad 0xc0733e1a95b77e80, 0xbe1e78e45f1418ef
+ .quad 0xc0733e1f4f4135a0, 0xbe1e78eb7289505b
+ .quad 0xc0733e240596ae50, 0xbe1e78a468c07cad
+ .quad 0xc0733e28b8bc3e20, 0xbe1e776b558a4009
+ .quad 0xc0733e2d68b631d0, 0xbe1e77412eb9941e
+ .quad 0xc0733e321588cd80, 0xbe1e76b2853f845e
+ .quad 0xc0733e36bf384cb0, 0xbe1e76aa7184273c
+ .quad 0xc0733e3b65c8e260, 0xbe1e7832027f78fa
+ .quad 0xc0733e40093eb930, 0xbe1e7a1c7da131f5
+ .quad 0xc0733e44a99df380, 0xbe1e76a0bc2ae4bc
+ .quad 0xc0733e4946eaab30, 0xbe1e78dff13b6f5d
+ .quad 0xc0733e4de128f250, 0xbe1e765a226dea2c
+ .quad 0xc0733e52785cd290, 0xbe1e78509b989111
+ .quad 0xc0733e570c8a4de0, 0xbe1e7916a4e9803d
+ .quad 0xc0733e5b9db55e30, 0xbe1e7950c15758cc
+ .quad 0xc0733e602be1f5a0, 0xbe1e7922ba1ad420
+ .quad 0xc0733e64b713fe90, 0xbe1e794cbaabcef6
+ .quad 0xc0733e693f4f5bc0, 0xbe1e7837bf883fed
+ .quad 0xc0733e6dc497e850, 0xbe1e76f198ddbbdf
+ .quad 0xc0733e7246f177d0, 0xbe1e7a18c1067764
+ .quad 0xc0733e76c65fd6a0, 0xbe1e76b845a8fd9d
+ .quad 0xc0733e7b42e6c970, 0xbe1e7714012df506
+ .quad 0xc0733e7fbc8a0de0, 0xbe1e7765612922cd
+ .quad 0xc0733e84334d5a50, 0xbe1e7688f5424a00
+ .quad 0xc0733e88a7345df0, 0xbe1e769d011f6663
+ .quad 0xc0733e8d1842c0e0, 0xbe1e79914acbfaf7
+ .quad 0xc0733e91867c2460, 0xbe1e79a85e189bd7
+ .quad 0xc0733e95f1e422a0, 0xbe1e79ea7c726432
+ .quad 0xc0733e9a5a7e4f10, 0xbe1e768a6fbb8e6e
+ .quad 0xc0733e9ec04e3620, 0xbe1e793c75bcc9fc
+ .quad 0xc0733ea323575dd0, 0xbe1e797f78da13d4
+ .quad 0xc0733ea7839d4550, 0xbe1e78d8c9cda978
+ .quad 0xc0733eabe1236540, 0xbe1e77028d480fff
+ .quad 0xc0733eb03bed2fa0, 0xbe1e7a0d0f74ff7c
+ .quad 0xc0733eb493fe1040, 0xbe1e76732e8a35fb
+ .quad 0xc0733eb8e9596c30, 0xbe1e77220caeabeb
+ .quad 0xc0733ebd3c02a260, 0xbe1e797438b645ef
+ .quad 0xc0733ec18bfd0b80, 0xbe1e79207c5fd6e8
+ .quad 0xc0733ec5d94bf9f0, 0xbe1e781c7df8f946
+ .quad 0xc0733eca23f2b9f0, 0xbe1e76736284e2db
+ .quad 0xc0733ece6bf49190, 0xbe1e7a109cc0c3f5
+ .quad 0xc0733ed2b154c120, 0xbe1e767f14a16d50
+ .quad 0xc0733ed6f4168290, 0xbe1e789cd22acaf0
+ .quad 0xc0733edb343d0a40, 0xbe1e764355ca28ad
+ .quad 0xc0733edf71cb8660, 0xbe1e79e4c7a81c45
+ .quad 0xc0733ee3acc51fb0, 0xbe1e761e26b644c2
+ .quad 0xc0733ee7e52cf8c0, 0xbe1e793e9f8fbdd3
+ .quad 0xc0733eec1b062ed0, 0xbe1e78c432991c20
+ .quad 0xc0733ef04e53d940, 0xbe1e78cdd025f4d8
+ .quad 0xc0733ef47f1909f0, 0xbe1e778310c6446e
+ .quad 0xc0733ef8ad58cd20, 0xbe1e7871af3d6e17
+ .quad 0xc0733efcd91629b0, 0xbe1e77e0e906f697
+ .quad 0xc0733f01025420f0, 0xbe1e7a1ae9b27892
+ .quad 0xc0733f052915af00, 0xbe1e76ac64c88f9d
+ .quad 0xc0733f094d5dca60, 0xbe1e779a815589c4
+ .quad 0xc0733f0d6f2f6480, 0xbe1e788f39a4864c
+ .quad 0xc0733f118e8d6980, 0xbe1e79fc51263525
+ .quad 0xc0733f15ab7ac060, 0xbe1e783501f19e90
+ .quad 0xc0733f19c5fa4ae0, 0xbe1e767e82c327ab
+ .quad 0xc0733f1dde0ee5a0, 0xbe1e7a1785d66123
+ .quad 0xc0733f21f3bb6870, 0xbe1e7936d07203da
+ .quad 0xc0733f260702a5e0, 0xbe1e7a010a7ac699
+ .quad 0xc0733f2a17e76bb0, 0xbe1e7975e4e16312
+ .quad 0xc0733f2e266c82b0, 0xbe1e7654b5422330
+ .quad 0xc0733f323294aeb0, 0xbe1e77f8a4909d35
+ .quad 0xc0733f363c62aee0, 0xbe1e792c8e30d226
+ .quad 0xc0733f3a43d93da0, 0xbe1e76f6ac67a1ff
+ .quad 0xc0733f3e48fb1070, 0xbe1e775c2e97715a
+ .quad 0xc0733f424bcad840, 0xbe1e781cd54ae100
+ /*== Log_LA_table ==*/
+ .align 16
+ .quad 0x0000000000000000
+ .quad 0xbf4bc48a867884b7
+ .quad 0xbf5bbd9e9482af09
+ .quad 0xbf64c9096b94befd
+ .quad 0xbf6bafd47221ed26
+ .quad 0xbf714999e2ad8ea6
+ .quad 0xbf74b99563d2a1bd
+ .quad 0xbf7827de6b310350
+ .quad 0xbf7b9476a4fcd10f
+ .quad 0xbf7eff5fbaf25781
+ .quad 0xbf81344daa2d7553
+ .quad 0xbf82e8158b08d957
+ .quad 0xbf849b0851443684
+ .quad 0xbf864d26cce610dd
+ .quad 0xbf87fe71ccc4e6b0
+ .quad 0xbf89aeea1e897fdf
+ .quad 0xbf8b5e908eb13790
+ .quad 0xbf8d0d65e890405a
+ .quad 0xbf8ebb6af653e2ee
+ .quad 0xbf90345040825bad
+ .quad 0xbf910a83a8446c78
+ .quad 0xbf91e05015d30a71
+ .quad 0xbf92b5b5ec0209d3
+ .quad 0xbf938ab58d173e91
+ .quad 0xbf945f4f5acb8be0
+ .quad 0xbf953383b64bf13f
+ .quad 0xbf960753003a94ef
+ .quad 0xbf96dabd98afcc05
+ .quad 0xbf97adc3df3b1ff8
+ .quad 0xbf98806632e451d0
+ .quad 0xbf9952a4f22c5ae9
+ .quad 0xbf9a24807b0e6b5c
+ .quad 0xbf9af5f92b00e610
+ .quad 0xbf9bc70f5ef65a77
+ .quad 0xbf9c97c3735e7c0a
+ .quad 0xbf9d6815c4271775
+ .quad 0xbf9e3806acbd058f
+ .quad 0xbf9f0796880d1c19
+ .quad 0xbf9fd6c5b0851c4c
+ .quad 0xbfa052ca400a4f9b
+ .quad 0xbfa0ba01a8170000
+ .quad 0xbfa121093ce3a205
+ .quad 0xbfa187e12aad8077
+ .quad 0xbfa1ee899d74a03e
+ .quad 0xbfa25502c0fc314c
+ .quad 0xbfa2bb4cc0cafe8d
+ .quad 0xbfa32167c82bdcda
+ .quad 0xbfa38754022e18e2
+ .quad 0xbfa3ed1199a5e425
+ .quad 0xbfa452a0b92cc0ec
+ .quad 0xbfa4b8018b21ed4f
+ .quad 0xbfa51d3439aacd4a
+ .quad 0xbfa58238eeb353da
+ .quad 0xbfa5e70fd3ee6b34
+ .quad 0xbfa64bb912d65c07
+ .quad 0xbfa6b034d4ad33df
+ .quad 0xbfa71483427d2a99
+ .quad 0xbfa778a4851906f3
+ .quad 0xbfa7dc98c51c8242
+ .quad 0xbfa840602aecab3d
+ .quad 0xbfa8a3fadeb847f4
+ .quad 0xbfa90769087836e4
+ .quad 0xbfa96aaacfefcf3c
+ .quad 0xbfa9cdc05cad4042
+ .quad 0xbfaa30a9d609efea
+ .quad 0xbfaa9367632ad897
+ .quad 0xbfaaf5f92b00e610
+ .quad 0xbfab585f544951a4
+ .quad 0xbfabba9a058dfd84
+ .quad 0xbfac1ca96525cf56
+ .quad 0xbfac7e8d993509f9
+ .quad 0xbface046c7ada68d
+ .quad 0xbfad41d5164facb4
+ .quad 0xbfada338aaa98a0c
+ .quad 0xbfae0471aa1868f5
+ .quad 0xbfae658039c88690
+ .quad 0xbfaec6647eb58808
+ .quad 0xbfaf271e9daacf20
+ .quad 0xbfaf87aebb43ce06
+ .quad 0xbfafe814fbec5a77
+ .quad 0xbfb02428c1f08016
+ .quad 0xbfb054323b97a948
+ .quad 0xbfb08426fcdb1ee7
+ .quad 0xbfb0b40717932b96
+ .quad 0xbfb0e3d29d81165e
+ .quad 0xbfb11389a04f4a2e
+ .quad 0xbfb1432c31917d08
+ .quad 0xbfb172ba62c4d6de
+ .quad 0xbfb1a23445501816
+ .quad 0xbfb1d199ea83bfbe
+ .quad 0xbfb200eb639a3173
+ .quad 0xbfb23028c1b7daed
+ .quad 0xbfb25f5215eb594a
+ .quad 0xbfb28e67712d9dfc
+ .quad 0xbfb2bd68e4621371
+ .quad 0xbfb2ec568056c16f
+ .quad 0xbfb31b3055c47118
+ .quad 0xbfb349f6754ed0b4
+ .quad 0xbfb378a8ef84971e
+ .quad 0xbfb3a747d4dfa6f5
+ .quad 0xbfb3d5d335c53179
+ .quad 0xbfb4044b2285d925
+ .quad 0xbfb432afab5dd3ff
+ .quad 0xbfb46100e0750da1
+ .quad 0xbfb48f3ed1df48fb
+ .quad 0xbfb4bd698f9c41cf
+ .quad 0xbfb4eb812997cde4
+ .quad 0xbfb51985afa9fdfd
+ .quad 0xbfb5477731973e85
+ .quad 0xbfb57555bf1077f5
+ .quad 0xbfb5a32167b32f02
+ .quad 0xbfb5d0da3b09a47e
+ .quad 0xbfb5fe80488af4fd
+ .quad 0xbfb62c139f9b3837
+ .quad 0xbfb659944f8ba02d
+ .quad 0xbfb68702679a980a
+ .quad 0xbfb6b45df6f3e2c9
+ .quad 0xbfb6e1a70cb0b99a
+ .quad 0xbfb70eddb7d7ea07
+ .quad 0xbfb73c02075df3e5
+ .quad 0xbfb769140a2526fd
+ .quad 0xbfb79613cefdc07d
+ .quad 0xbfb7c30164a60836
+ .quad 0xbfb7efdcd9ca6d8f
+ .quad 0xbfb81ca63d05a44a
+ .quad 0xbfb8495d9ce0c10c
+ .quad 0xbfb8760307d355ab
+ .quad 0xbfb8a2968c438d41
+ .quad 0xbfb8cf183886480d
+ .quad 0xbfb8fb881adf3713
+ .quad 0xbfb927e64180f790
+ .quad 0xbfb95432ba8d2e2f
+ .quad 0xbfb9806d9414a209
+ .quad 0xbfb9ac96dc175776
+ .quad 0xbfb9d8aea084aa9c
+ .quad 0xbfba04b4ef3b69d8
+ .quad 0xbfba30a9d609efea
+ .quad 0xbfba5c8d62ae3dec
+ .quad 0xbfba885fa2d6151e
+ .quad 0xbfbab420a41f1076
+ .quad 0xbfbadfd07416be07
+ .quad 0xbfbb0b6f203ab82c
+ .quad 0xbfbb36fcb5f8be8a
+ .quad 0xbfbb627942aecedd
+ .quad 0xbfbb8de4d3ab3d98
+ .quad 0xbfbbb93f762cce4f
+ .quad 0xbfbbe4893762cbf7
+ .quad 0xbfbc0fc2246d20f5
+ .quad 0xbfbc3aea4a5c6eff
+ .quad 0xbfbc6601b63226cb
+ .quad 0xbfbc910874e09f98
+ .quad 0xbfbcbbfe934b2e81
+ .quad 0xbfbce6e41e463da5
+ .quad 0xbfbd11b92297632b
+ .quad 0xbfbd3c7dacf5780b
+ .quad 0xbfbd6731ca08aeb9
+ .quad 0xbfbd91d5866aa99c
+ .quad 0xbfbdbc68eea6915b
+ .quad 0xbfbde6ec0f392b05
+ .quad 0xbfbe115ef490ee07
+ .quad 0xbfbe3bc1ab0e19fe
+ .quad 0xbfbe66143f02cc5d
+ .quad 0xbfbe9056bcb315e8
+ .quad 0xbfbeba893055100b
+ .quad 0xbfbee4aba610f204
+ .quad 0xbfbf0ebe2a0125eb
+ .quad 0xbfbf38c0c8325d86
+ .quad 0xbfbf62b38ca3a706
+ .quad 0xbfbf8c9683468191
+ .quad 0xbfbfb669b7fef1a8
+ .quad 0xbfbfe02d36a3956d
+ .quad 0xbfc004f0857edc5c
+ .quad 0xbfc019c2a064b486
+ .quad 0xbfc02e8cf1dac4b8
+ .quad 0xbfc0434f7fb1f307
+ .quad 0xbfc0580a4fb4a3df
+ .quad 0xbfc06cbd67a6c3b6
+ .quad 0xbfc08168cd45d0a9
+ .quad 0xbfc0960c8648e406
+ .quad 0xbfc0aaa89860bbcf
+ .quad 0xbfc0bf3d0937c41c
+ .quad 0xbfc0d3c9de722078
+ .quad 0xbfc0e84f1dadb526
+ .quad 0xbfc0fccccc823059
+ .quad 0xbfc11142f0811357
+ .quad 0xbfc125b18f35bb8e
+ .quad 0xbfc13a18ae256b99
+ .quad 0xbfc14e7852cf5430
+ .quad 0xbfc162d082ac9d10
+ .quad 0xbfc1772143306dc6
+ .quad 0xbfc18b6a99c7f679
+ .quad 0xbfc19fac8bda7897
+ .quad 0xbfc1b3e71ec94f7b
+ .quad 0xbfc1c81a57eff8fd
+ .quad 0xbfc1dc463ca41df8
+ .quad 0xbfc1f06ad2359abd
+ .quad 0xbfc204881dee8777
+ .quad 0xbfc2189e25134081
+ .quad 0xbfc22cacece26ead
+ .quad 0xbfc240b47a950f79
+ .quad 0xbfc254b4d35e7d3c
+ .quad 0xbfc268adfc6c773e
+ .quad 0xbfc27c9ffae729c1
+ .quad 0xbfc2908ad3f13603
+ .quad 0xbfc2a46e8ca7ba2a
+ .quad 0xbfc2b84b2a225923
+ .quad 0xbfc2cc20b1734279
+ .quad 0xbfc2dfef27a73a18
+ .quad 0xbfc2f3b691c5a001
+ .quad 0xbfc30776f4d077f7
+ .quad 0xbfc31b3055c47118
+ .quad 0xbfc32ee2b998ed6e
+ .quad 0xbfc3428e2540096d
+ .quad 0x3fc331f403985097
+ .quad 0x3fc31e56798a910a
+ .quad 0x3fc30abfd8f333b6
+ .quad 0x3fc2f7301cf4e87b
+ .quad 0x3fc2e3a740b7800f
+ .quad 0x3fc2d0253f67e4cb
+ .quad 0x3fc2bcaa14381386
+ .quad 0x3fc2a935ba5f1479
+ .quad 0x3fc295c82d18f434
+ .quad 0x3fc2826167a6bc9c
+ .quad 0x3fc26f01654e6df6
+ .quad 0x3fc25ba8215af7fc
+ .quad 0x3fc24855971c3307
+ .quad 0x3fc23509c1e6d937
+ .quad 0x3fc221c49d147fb3
+ .quad 0x3fc20e8624038fed
+ .quad 0x3fc1fb4e521740f4
+ .quad 0x3fc1e81d22b790d4
+ .quad 0x3fc1d4f291513e01
+ .quad 0x3fc1c1ce9955c0c6
+ .quad 0x3fc1aeb1363b44c8
+ .quad 0x3fc19b9a637ca295
+ .quad 0x3fc1888a1c995931
+ .quad 0x3fc175805d1587c1
+ .quad 0x3fc1627d2079e731
+ .quad 0x3fc14f806253c3ed
+ .quad 0x3fc13c8a1e34f7a0
+ .quad 0x3fc1299a4fb3e306
+ .quad 0x3fc116b0f26b67bb
+ .quad 0x3fc103ce01fae223
+ .quad 0x3fc0f0f17a062353
+ .quad 0x3fc0de1b56356b04
+ .quad 0x3fc0cb4b9235619a
+ .quad 0x3fc0b88229b71227
+ .quad 0x3fc0a5bf186fe483
+ .quad 0x3fc093025a19976c
+ .quad 0x3fc0804bea723aa9
+ .quad 0x3fc06d9bc53c2941
+ .quad 0x3fc05af1e63e03b4
+ .quad 0x3fc0484e4942aa43
+ .quad 0x3fc035b0ea19373b
+ .quad 0x3fc02319c494f951
+ .quad 0x3fc01088d48d6e03
+ .quad 0x3fbffbfc2bbc7803
+ .quad 0x3fbfd6f308ce5b52
+ .quad 0x3fbfb1f6381856f4
+ .quad 0x3fbf8d05b16a6d47
+ .quad 0x3fbf68216c9cc727
+ .quad 0x3fbf4349618fa91a
+ .quad 0x3fbf1e7d882b689a
+ .quad 0x3fbef9bdd860616b
+ .quad 0x3fbed50a4a26eafc
+ .quad 0x3fbeb062d57f4de8
+ .quad 0x3fbe8bc77271b97a
+ .quad 0x3fbe6738190e394c
+ .quad 0x3fbe42b4c16caaf3
+ .quad 0x3fbe1e3d63acb3ba
+ .quad 0x3fbdf9d1f7f5b674
+ .quad 0x3fbdd5727676c959
+ .quad 0x3fbdb11ed766abf4
+ .quad 0x3fbd8cd71303bd26
+ .quad 0x3fbd689b2193f133
+ .quad 0x3fbd446afb64c7e5
+ .quad 0x3fbd204698cb42bd
+ .quad 0x3fbcfc2df223db2d
+ .quad 0x3fbcd820ffd278f3
+ .quad 0x3fbcb41fba42686d
+ .quad 0x3fbc902a19e65111
+ .quad 0x3fbc6c4017382bea
+ .quad 0x3fbc4861aab93a23
+ .quad 0x3fbc248eccf1fba6
+ .quad 0x3fbc00c7767225cb
+ .quad 0x3fbbdd0b9fd09a10
+ .quad 0x3fbbb95b41ab5ce6
+ .quad 0x3fbb95b654a78c87
+ .quad 0x3fbb721cd17157e3
+ .quad 0x3fbb4e8eb0bbf58f
+ .quad 0x3fbb2b0beb419ad0
+ .quad 0x3fbb079479c372ad
+ .quad 0x3fbae4285509950b
+ .quad 0x3fbac0c775e2fde6
+ .quad 0x3fba9d71d5258484
+ .quad 0x3fba7a276badd2c8
+ .quad 0x3fba56e8325f5c87
+ .quad 0x3fba33b4222456f1
+ .quad 0x3fba108b33edb005
+ .quad 0x3fb9ed6d60b30612
+ .quad 0x3fb9ca5aa1729f45
+ .quad 0x3fb9a752ef316149
+ .quad 0x3fb9845642fac8f0
+ .quad 0x3fb9616495e0e1e8
+ .quad 0x3fb93e7de0fc3e80
+ .quad 0x3fb91ba21d6bef77
+ .quad 0x3fb8f8d144557bdf
+ .quad 0x3fb8d60b4ee4d901
+ .quad 0x3fb8b350364c6257
+ .quad 0x3fb8909ff3c4d191
+ .quad 0x3fb86dfa808d36a0
+ .quad 0x3fb84b5fd5eaefd8
+ .quad 0x3fb828cfed29a215
+ .quad 0x3fb8064abf9b30f1
+ .quad 0x3fb7e3d04697b704
+ .quad 0x3fb7c1607b7d7e32
+ .quad 0x3fb79efb57b0f803
+ .quad 0x3fb77ca0d49cb608
+ .quad 0x3fb75a50ebb1624a
+ .quad 0x3fb7380b9665b7c8
+ .quad 0x3fb715d0ce367afc
+ .quad 0x3fb6f3a08ca67270
+ .quad 0x3fb6d17acb3e5f5e
+ .quad 0x3fb6af5f838cf654
+ .quad 0x3fb68d4eaf26d7ee
+ .quad 0x3fb66b4847a68997
+ .quad 0x3fb6494c46ac6e4d
+ .quad 0x3fb6275aa5debf81
+ .quad 0x3fb605735ee985f1
+ .quad 0x3fb5e3966b7e9295
+ .quad 0x3fb5c1c3c5557799
+ .quad 0x3fb59ffb662b815c
+ .quad 0x3fb57e3d47c3af7b
+ .quad 0x3fb55c8963e6adeb
+ .quad 0x3fb53adfb462ce16
+ .quad 0x3fb51940330c000b
+ .quad 0x3fb4f7aad9bbcbaf
+ .quad 0x3fb4d61fa2514a00
+ .quad 0x3fb4b49e86b11e5f
+ .quad 0x3fb4932780c56fe2
+ .quad 0x3fb471ba8a7de2b7
+ .quad 0x3fb450579dcf9186
+ .quad 0x3fb42efeb4b506e9
+ .quad 0x3fb40dafc92e36e2
+ .quad 0x3fb3ec6ad5407868
+ .quad 0x3fb3cb2fd2f67ef1
+ .quad 0x3fb3a9febc60540a
+ .quad 0x3fb388d78b9350ff
+ .quad 0x3fb367ba3aaa1883
+ .quad 0x3fb346a6c3c49066
+ .quad 0x3fb3259d2107db54
+ .quad 0x3fb3049d4c9e52a0
+ .quad 0x3fb2e3a740b7800f
+ .quad 0x3fb2c2baf78817b7
+ .quad 0x3fb2a1d86b49f1e2
+ .quad 0x3fb280ff963c04fc
+ .quad 0x3fb2603072a25f82
+ .quad 0x3fb23f6afac6220a
+ .quad 0x3fb21eaf28f57941
+ .quad 0x3fb1fdfcf7839804
+ .quad 0x3fb1dd5460c8b16f
+ .quad 0x3fb1bcb55f21f307
+ .quad 0x3fb19c1fecf17ee0
+ .quad 0x3fb17b94049e65d0
+ .quad 0x3fb15b11a094a1aa
+ .quad 0x3fb13a98bb450f81
+ .quad 0x3fb11a294f2569f6
+ .quad 0x3fb0f9c356b04389
+ .quad 0x3fb0d966cc6500fa
+ .quad 0x3fb0b913aac7d3a7
+ .quad 0x3fb098c9ec61b3ff
+ .quad 0x3fb078898bc05bf4
+ .quad 0x3fb0585283764178
+ .quad 0x3fb03824ce1a9101
+ .quad 0x3fb0180066492817
+ .quad 0x3fafefca8d451fd6
+ .quad 0x3fafafa6d397efdb
+ .quad 0x3faf6f9594de60f0
+ .quad 0x3faf2f96c6754aee
+ .quad 0x3faeefaa5dc2b239
+ .quad 0x3faeafd05035bd3b
+ .quad 0x3fae70089346a9e6
+ .quad 0x3fae30531c76c34a
+ .quad 0x3fadf0afe1505738
+ .quad 0x3fadb11ed766abf4
+ .quad 0x3fad719ff455f5f7
+ .quad 0x3fad32332dc34dbd
+ .quad 0x3facf2d8795ca5a5
+ .quad 0x3facb38fccd8bfdb
+ .quad 0x3fac74591df72456
+ .quad 0x3fac3534628016dd
+ .quad 0x3fabf62190448d22
+ .quad 0x3fabb7209d1e24e5
+ .quad 0x3fab78317eef1a29
+ .quad 0x3fab39542ba23d73
+ .quad 0x3faafa88992aea19
+ .quad 0x3faabbcebd84fca0
+ .quad 0x3faa7d268eb4c924
+ .quad 0x3faa3e9002c711d2
+ .quad 0x3faa000b0fd0fd6b
+ .quad 0x3fa9c197abf00dd7
+ .quad 0x3fa98335cd4a16c3
+ .quad 0x3fa944e56a0d3450
+ .quad 0x3fa906a6786fc1cb
+ .quad 0x3fa8c878eeb05074
+ .quad 0x3fa88a5cc3159e53
+ .quad 0x3fa84c51ebee8d15
+ .quad 0x3fa80e585f9218fc
+ .quad 0x3fa7d070145f4fd7
+ .quad 0x3fa7929900bd4809
+ .quad 0x3fa754d31b1b179c
+ .quad 0x3fa7171e59efcb5f
+ .quad 0x3fa6d97ab3ba5e10
+ .quad 0x3fa69be81f01af99
+ .quad 0x3fa65e6692547c4e
+ .quad 0x3fa620f604495440
+ .quad 0x3fa5e3966b7e9295
+ .quad 0x3fa5a647be9a54f6
+ .quad 0x3fa56909f44a72fe
+ .quad 0x3fa52bdd034475b8
+ .quad 0x3fa4eec0e2458f30
+ .quad 0x3fa4b1b588129203
+ .quad 0x3fa474baeb77e904
+ .quad 0x3fa437d103498eec
+ .quad 0x3fa3faf7c663060e
+ .quad 0x3fa3be2f2ba7501f
+ .quad 0x3fa381772a00e604
+ .quad 0x3fa344cfb861afae
+ .quad 0x3fa30838cdc2fbfd
+ .quad 0x3fa2cbb2612578b4
+ .quad 0x3fa28f3c69912a74
+ .quad 0x3fa252d6de1564c1
+ .quad 0x3fa21681b5c8c213
+ .quad 0x3fa1da3ce7c91bf8
+ .quad 0x3fa19e086b3b8333
+ .quad 0x3fa161e4374c37f4
+ .quad 0x3fa125d0432ea20e
+ .quad 0x3fa0e9cc861d4944
+ .quad 0x3fa0add8f759cd95
+ .quad 0x3fa071f58e2cdf9b
+ .quad 0x3fa0362241e638ec
+ .quad 0x3f9ff4be13b92920
+ .quad 0x3f9f7d57badb4ee8
+ .quad 0x3f9f061167fc31e8
+ .quad 0x3f9e8eeb09f2f6cb
+ .quad 0x3f9e17e48fa48962
+ .quad 0x3f9da0fde8038de9
+ .quad 0x3f9d2a3702105259
+ .quad 0x3f9cb38fccd8bfdb
+ .quad 0x3f9c3d0837784c41
+ .quad 0x3f9bc6a03117eb97
+ .quad 0x3f9b5057a8ee01ce
+ .quad 0x3f9ada2e8e3e546f
+ .quad 0x3f9a6424d059fc68
+ .quad 0x3f99ee3a5e9f57e8
+ .quad 0x3f99786f2879fc53
+ .quad 0x3f9902c31d62a843
+ .quad 0x3f988d362cdf359e
+ .quad 0x3f9817c846828bbd
+ .quad 0x3f97a27959ec91aa
+ .quad 0x3f972d4956ca2067
+ .quad 0x3f96b8382cd4f551
+ .quad 0x3f964345cbd3a491
+ .quad 0x3f95ce7223998b98
+ .quad 0x3f9559bd2406c3ba
+ .quad 0x3f94e526bd0814d1
+ .quad 0x3f9470aede96e7f2
+ .quad 0x3f93fc5578b93a38
+ .quad 0x3f93881a7b818f9e
+ .quad 0x3f9313fdd70ee5e8
+ .quad 0x3f929fff7b8ca79d
+ .quad 0x3f922c1f59329f1b
+ .quad 0x3f91b85d6044e9ae
+ .quad 0x3f9144b98113eac0
+ .quad 0x3f90d133abfc3f1b
+ .quad 0x3f905dcbd166b033
+ .quad 0x3f8fd503c3904f1d
+ .quad 0x3f8eeeab9b43445d
+ .quad 0x3f8e088f0b004827
+ .quad 0x3f8d22adf3f9579d
+ .quad 0x3f8c3d0837784c41
+ .quad 0x3f8b579db6dec358
+ .quad 0x3f8a726e53a6056e
+ .quad 0x3f898d79ef5eedf0
+ .quad 0x3f88a8c06bb1d2f4
+ .quad 0x3f87c441aa5e6d15
+ .quad 0x3f86dffd8d3bbf70
+ .quad 0x3f85fbf3f637ffc5
+ .quad 0x3f851824c7587eb0
+ .quad 0x3f84348fe2b99002
+ .quad 0x3f8351352a8e733f
+ .quad 0x3f826e1481213c2e
+ .quad 0x3f818b2dc8d2bb91
+ .quad 0x3f80a880e41a67f6
+ .quad 0x3f7f8c1b6b0c8d4e
+ .quad 0x3f7dc7a83f75a96d
+ .quad 0x3f7c03a80ae5e054
+ .quad 0x3f7a401a92ff827e
+ .quad 0x3f787cff9d9147a5
+ .quad 0x3f76ba56f09621bc
+ .quad 0x3f74f8205235102d
+ .quad 0x3f73365b88c0f347
+ .quad 0x3f7175085ab85ff0
+ .quad 0x3f6f684d1d8ae702
+ .quad 0x3f6be76bd77b4fc3
+ .quad 0x3f68676c71434fb9
+ .quad 0x3f64e84e793a474a
+ .quad 0x3f616a117e0d4b30
+ .quad 0x3f5bd96a1d7d9cbc
+ .quad 0x3f54e071754c98ba
+ .quad 0x3f4bd27045bfd025
+ .quad 0x3f3bcef518e29612
+ .quad 0x8000000000000000
+ /*== poly_coeff[5] ==*/
+ .align 16
+ .quad 0x3fb63C65231FBD16, 0x3fb63C65231FBD16 /* coeff5 */
+ .quad 0xbfbBCB7D4EFBE80B, 0xbfbBCB7D4EFBE80B /* coeff4 */
+ .quad 0x3fc287A7636F341E, 0x3fc287A7636F341E /* coeff3 */
+ .quad 0xbfcBCB7B1526DE36, 0xbfcBCB7B1526DE36 /* coeff2 */
+ .quad 0x3fdBCB7B1526E50E, 0x3fdBCB7B1526E50E /* coeff1 */
+ /*== ExpMask ==*/
+ .align 16
+ .quad 0x000fffffffffffff, 0x000fffffffffffff
+ /*== Two10 ==*/
+ .align 16
+ .quad 0x3f50000000000000, 0x3f50000000000000
+ /*== MinNorm ==*/
+ .align 16
+ .quad 0x0010000000000000, 0x0010000000000000
+ /*== MaxNorm ==*/
+ .align 16
+ .quad 0x7fefffffffffffff, 0x7fefffffffffffff
+ /*== HalfMask ==*/
+ .align 16
+ .quad 0xfffffffffc000000, 0xfffffffffc000000
+ /*== One ==*/
+ .align 16
+ .quad 0x3ff0000000000000, 0x3ff0000000000000
+ /*== Threshold ==*/
+ .align 16
+ .quad 0x4086a00000000000, 0x4086a00000000000
+ /*== Bias ==*/
+ .align 16
+ .quad 0x408ff80000000000, 0x408ff80000000000
+ /*== Bias1 ==*/
+ .align 16
+ .quad 0x408ff00000000000, 0x408ff00000000000
+ /*== L2 ==*/
+ .align 16
+ .quad 0x3fd34413509f79ff, 0x3fd34413509f79ff
+ .align 16
+ .type __svml_dlog10_data_internal,@object
+ .size __svml_dlog10_data_internal,.-__svml_dlog10_data_internal
+ .space 48, 0x00
+ .align 16
+/* .FLT_12: 16 bytes holding the 64-bit pattern 0x4338000000000000 twice (low dword first); read as an IEEE-754 double that is 1.5 * 2^52.  Its user is not visible in this part of the file. */
+.FLT_12:
+ .long 0x00000000,0x43380000,0x00000000,0x43380000
+ .type .FLT_12,@object
+ .size .FLT_12,16
new file mode 100644
@@ -0,0 +1,20 @@
+/* SSE version of vectorized log10, vector length is 4.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+/* Rename _ZGVdN4v_log10 to _ZGVdN4v_log10_sse_wrapper for the file included below, so whatever it defines under the first name is emitted under the second (presumably the function entry point -- confirm in the included file). */
+#define _ZGVdN4v_log10 _ZGVdN4v_log10_sse_wrapper
+#include "../svml_d_log104_core.S"
new file mode 100644
@@ -0,0 +1,27 @@
+/* Multiple versions of vectorized log10, vector length is 4.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define SYMBOL_NAME _ZGVdN4v_log10
+#include "ifunc-mathvec-avx2.h"
+/* Define SYMBOL_NAME through libc_ifunc_redirected; REDIRECT_NAME and IFUNC_SELECTOR are not defined in this file (presumably they come from the header above -- confirm). */
+libc_ifunc_redirected (REDIRECT_NAME, SYMBOL_NAME, IFUNC_SELECTOR ());
+/* For SHARED builds only: declare the __GI_ alias of the symbol with hidden visibility. */
+#ifdef SHARED
+__hidden_ver1 (_ZGVdN4v_log10, __GI__ZGVdN4v_log10, __redirect__ZGVdN4v_log10)
+ __attribute__ ((visibility ("hidden")));
+#endif
new file mode 100644
@@ -0,0 +1,1071 @@
+/* Function log10 vectorized with AVX2.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+/*
+ * ALGORITHM DESCRIPTION:
+ *
+ * Get short reciprocal approximation Rcp ~ 1/mantissa(x)
+ * R = Rcp*x - 1.0
+ * log10(x) = k*log10(2.0) - log10(Rcp) + poly_approximation(R)
+ * log10(Rcp) is tabulated
+ *
+ *
+ */
+
+/* Byte offsets of the fields of the data table __svml_dlog10_data_internal.  Every offset is a multiple of 32;
+   poly_coeff spans 160 bytes (8256..8415) and each field from ExpMask onwards is 32 bytes after the previous one.  */
+#define Log_HA_table 0
+#define Log_LA_table 4128
+#define poly_coeff 8256
+#define ExpMask 8416
+#define Two10 8448
+#define MinNorm 8480
+#define MaxNorm 8512
+#define HalfMask 8544
+#define One 8576
+#define Threshold 8608
+#define Bias 8640
+#define Bias1 8672
+#define L2 8704
+
+#include <sysdep.h>
+/* _ZGVdN4v_log10_avx2: log10 of the four doubles in %ymm0, result returned in %ymm0.  Lanes flagged by the range check are recomputed one at a time with the scalar log10.  */
+ .text
+ .section .text.avx2,"ax",@progbits
+ENTRY(_ZGVdN4v_log10_avx2)
+ pushq %rbp
+ cfi_def_cfa_offset(16)
+ movq %rsp, %rbp
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+ andq $-32, %rsp
+ subq $96, %rsp
+ lea -4222944+__svml_dlog10_data_internal(%rip), %r8
+ vmovapd %ymm0, %ymm3
+/* %r8 = table address - 4222944; 0x408000 (top 24 bits of the double 512.0) - 4222944 = 4128 = Log_LA_table, so the lookup further down presumably lands in Log_LA_table.  %ymm3 keeps the input x.  */
+/* preserve mantissa, set input exponent to 2^(-10) */
+ vandpd ExpMask+__svml_dlog10_data_internal(%rip), %ymm3, %ymm4
+ vorpd Two10+__svml_dlog10_data_internal(%rip), %ymm4, %ymm2
+
+/* reciprocal approximation good to at least 11 bits */
+ vcvtpd2ps %ymm2, %xmm5
+
+/* exponent bits: after the shift, sign+exponent of x sit in the low bits of the high dword of each qword */
+ vpsrlq $20, %ymm3, %ymm7
+ vmovupd One+__svml_dlog10_data_internal(%rip), %ymm14
+ vrcpps %xmm5, %xmm6
+
+/* check range: flag lanes with x < MinNorm, or with not (x <= MaxNorm) (unordered compare, so NaN is flagged too) */
+ vcmplt_oqpd MinNorm+__svml_dlog10_data_internal(%rip), %ymm3, %ymm11
+ vcmpnle_uqpd MaxNorm+__svml_dlog10_data_internal(%rip), %ymm3, %ymm12
+ vcvtps2pd %xmm6, %ymm9
+
+/* round reciprocal to nearest integer, will have 1+9 mantissa bits */
+ vroundpd $0, %ymm9, %ymm1
+
+/* load Threshold; it is compared with the rounded reciprocal below to build the mask applied to Bias */
+ vmovupd Threshold+__svml_dlog10_data_internal(%rip), %ymm9
+
+/*
+ * prepare table index: each qword of the rounded reciprocal shifted right by 40;
+ * the low dword of each qword is later added to %r8 to load one table entry per lane
+ */
+ vpsrlq $40, %ymm1, %ymm15
+
+/* argument reduction: R = Rcp * (mantissa with exponent 2^(-10)) - One; then mask = (Threshold < Rcp) */
+ vfmsub213pd %ymm14, %ymm1, %ymm2
+ vcmplt_oqpd %ymm1, %ymm9, %ymm1
+ vorpd %ymm12, %ymm11, %ymm13
+ vmovupd poly_coeff+64+__svml_dlog10_data_internal(%rip), %ymm12
+ vfmadd213pd poly_coeff+96+__svml_dlog10_data_internal(%rip), %ymm2, %ymm12
+
+/* combine and get argument value range mask (one bit per lane in %eax); %ymm13 is then reused for R*R */
+ vmovmskpd %ymm13, %eax
+ vmulpd %ymm2, %ymm2, %ymm13
+ vextractf128 $1, %ymm7, %xmm8
+ vshufps $221, %xmm8, %xmm7, %xmm10
+
+/* biased exponent in DP format; subtract ((mask & Bias) | Bias1) and multiply by L2 */
+ vcvtdq2pd %xmm10, %ymm0
+ vandpd Bias+__svml_dlog10_data_internal(%rip), %ymm1, %ymm10
+ vorpd Bias1+__svml_dlog10_data_internal(%rip), %ymm10, %ymm11
+ vsubpd %ymm11, %ymm0, %ymm0
+ vmulpd L2+__svml_dlog10_data_internal(%rip), %ymm0, %ymm1
+
+/* polynomial: ((p[0]*R + p[1])*R^2 + (p[2]*R + p[3]))*R^2 + p[4]*R, p[i] being the vector at poly_coeff + 32*i */
+ vmovupd poly_coeff+__svml_dlog10_data_internal(%rip), %ymm0
+ vfmadd213pd poly_coeff+32+__svml_dlog10_data_internal(%rip), %ymm2, %ymm0
+ vmulpd poly_coeff+128+__svml_dlog10_data_internal(%rip), %ymm2, %ymm2
+ vfmadd213pd %ymm12, %ymm13, %ymm0
+ vfmadd213pd %ymm2, %ymm13, %ymm0
+ vextractf128 $1, %ymm15, %xmm6
+ vmovd %xmm15, %edx
+ vmovd %xmm6, %esi
+ movslq %edx, %rdx
+ vpextrd $2, %xmm15, %ecx
+ movslq %esi, %rsi
+ vpextrd $2, %xmm6, %edi
+ movslq %ecx, %rcx
+ movslq %edi, %rdi
+ vmovsd (%r8,%rdx), %xmm4
+ vmovsd (%r8,%rsi), %xmm7
+ vmovhpd (%r8,%rcx), %xmm4, %xmm5
+ vmovhpd (%r8,%rdi), %xmm7, %xmm8
+ vinsertf128 $1, %xmm8, %ymm5, %ymm14
+
+/* reconstruction: (polynomial + table value) + exponent term */
+ vaddpd %ymm0, %ymm14, %ymm2
+ vaddpd %ymm2, %ymm1, %ymm0
+ testl %eax, %eax
+
+/* Go to special inputs processing branch if any range-mask bit is set */
+ jne L(SPECIAL_VALUES_BRANCH)
+ # LOE rbx r12 r13 r14 r15 eax ymm0 ymm3
+
+/* Restore registers
+ * and exit the function
+ */
+
+L(EXIT):
+ movq %rbp, %rsp
+ popq %rbp
+ cfi_def_cfa(7, 8)
+ cfi_restore(6)
+ ret
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+
+/* Branch to process special inputs:
+ * spill the inputs to 32(%rsp) and the vector result to 64(%rsp)
+ */
+
+L(SPECIAL_VALUES_BRANCH):
+ vmovupd %ymm3, 32(%rsp)
+ vmovupd %ymm0, 64(%rsp)
+ # LOE rbx r12 r13 r14 r15 eax ymm0
+/* lane index starts at 0; %r12-%r14 are saved at 16/8/0(%rsp), then %r12d takes the lane index and %r13d the range mask */
+ xorl %edx, %edx
+ # LOE rbx r12 r13 r14 r15 eax edx
+
+ vzeroupper
+ movq %r12, 16(%rsp)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -80; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xb0, 0xff, 0xff, 0xff, 0x22
+ movl %edx, %r12d
+ movq %r13, 8(%rsp)
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -88; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa8, 0xff, 0xff, 0xff, 0x22
+ movl %eax, %r13d
+ movq %r14, (%rsp)
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -96; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa0, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r15 r12d r13d
+
+/* Range mask bits check:
+ * test bit number %r12d (lane index) of the range mask in %r13d
+ */
+
+L(RANGEMASK_CHECK):
+ btl %r12d, %r13d
+
+/* Call scalar math function if the bit for this lane is set */
+ jc L(SCALAR_MATH_CALL)
+ # LOE rbx r15 r12d r13d
+
+/* Special inputs processing loop:
+ * advance to the next lane, 4 lanes in total
+ */
+
+L(SPECIAL_VALUES_LOOP):
+ incl %r12d
+ cmpl $4, %r12d
+
+/* Check bits in range mask */
+ jl L(RANGEMASK_CHECK)
+ # LOE rbx r15 r12d r13d
+/* all lanes visited: restore %r12-%r14 and reload the result vector from 64(%rsp) */
+ movq 16(%rsp), %r12
+ cfi_restore(12)
+ movq 8(%rsp), %r13
+ cfi_restore(13)
+ movq (%rsp), %r14
+ cfi_restore(14)
+ vmovupd 64(%rsp), %ymm0
+
+/* Go to exit */
+ jmp L(EXIT)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -80; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xb0, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -88; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa8, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -96; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa0, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r12 r13 r14 r15 ymm0
+
+/* Scalar math function call to process special input:
+ * load lane %r12d of the saved input, call log10,
+ * and overwrite the same lane of the saved result */
+
+L(SCALAR_MATH_CALL):
+ movl %r12d, %r14d
+ movsd 32(%rsp,%r14,8), %xmm0
+ call log10@PLT
+ # LOE rbx r14 r15 r12d r13d xmm0
+
+ movsd %xmm0, 64(%rsp,%r14,8)
+
+/* Process special inputs in loop */
+ jmp L(SPECIAL_VALUES_LOOP)
+ # LOE rbx r15 r12d r13d
+END(_ZGVdN4v_log10_avx2)
+
+ .section .rodata, "a"
+ .align 32
+/* C-style description of the table layout (each field 32-byte aligned); it is only kept by the preprocessor when __svml_dlog10_data_internal_typedef is defined. */
+#ifdef __svml_dlog10_data_internal_typedef
+typedef unsigned int VUINT32;
+typedef struct {
+ __declspec(align(32)) VUINT32 Log_HA_table[(1<<9)+2][2];
+ __declspec(align(32)) VUINT32 Log_LA_table[(1<<9)+1][2];
+ __declspec(align(32)) VUINT32 poly_coeff[5][4][2];
+ __declspec(align(32)) VUINT32 ExpMask[4][2];
+ __declspec(align(32)) VUINT32 Two10[4][2];
+ __declspec(align(32)) VUINT32 MinNorm[4][2];
+ __declspec(align(32)) VUINT32 MaxNorm[4][2];
+ __declspec(align(32)) VUINT32 HalfMask[4][2];
+ __declspec(align(32)) VUINT32 One[4][2];
+ __declspec(align(32)) VUINT32 Threshold[4][2];
+ __declspec(align(32)) VUINT32 Bias[4][2];
+ __declspec(align(32)) VUINT32 Bias1[4][2];
+ __declspec(align(32)) VUINT32 L2[4][2];
+} __svml_dlog10_data_internal;
+#endif
+__svml_dlog10_data_internal:
+ /* Log_HA_table */
+ .quad 0xc0733a7146f6b080, 0xbe1e707ce619c200
+ .quad 0xc0733a7547771970, 0xbe1e79c6c06d6f51
+ .quad 0xc0733a7945aacb70, 0xbe1e78e225fad29c
+ .quad 0xc0733a7d41946970, 0xbe1e76d607f9693b
+ .quad 0xc0733a813b3691f0, 0xbe1e7704b3e0685b
+ .quad 0xc0733a853293df00, 0xbe1e79c1216a27fa
+ .quad 0xc0733a8927aee660, 0xbe1e76dce5734a81
+ .quad 0xc0733a8d1a8a3920, 0xbe1e782ee2ca4dba
+ .quad 0xc0733a910b286430, 0xbe1e7812d1a0a61f
+ .quad 0xc0733a94f98bf010, 0xbe1e77e1b5ecbc61
+ .quad 0xc0733a98e5b76100, 0xbe1e76635cac1586
+ .quad 0xc0733a9ccfad36f0, 0xbe1e7638f7968f32
+ .quad 0xc0733aa0b76feda0, 0xbe1e7840ee76e365
+ .quad 0xc0733aa49d01fcb0, 0xbe1e79f3fd01907e
+ .quad 0xc0733aa88065d7a0, 0xbe1e77bbb3a9c38a
+ .quad 0xc0733aac619dedb0, 0xbe1e7742719bf41d
+ .quad 0xc0733ab040acaa20, 0xbe1e79bcedaf79cb
+ .quad 0xc0733ab41d947450, 0xbe1e762d63cb7ca0
+ .quad 0xc0733ab7f857af50, 0xbe1e77a07be83403
+ .quad 0xc0733abbd0f8ba80, 0xbe1e7763ff836ad0
+ .quad 0xc0733abfa779f130, 0xbe1e7737720ead39
+ .quad 0xc0733ac37bddaad0, 0xbe1e7776a08e55e7
+ .quad 0xc0733ac74e263af0, 0xbe1e793e3c52dd36
+ .quad 0xc0733acb1e55f160, 0xbe1e788a94695051
+ .quad 0xc0733aceec6f1a10, 0xbe1e76508114a813
+ .quad 0xc0733ad2b873fd20, 0xbe1e76909457d23e
+ .quad 0xc0733ad68266df10, 0xbe1e7664a24f9ca4
+ .quad 0xc0733ada4a4a0090, 0xbe1e7a07b3d44b18
+ .quad 0xc0733ade101f9ee0, 0xbe1e76d87594704d
+ .quad 0xc0733ae1d3e9f340, 0xbe1e79563595a182
+ .quad 0xc0733ae595ab33b0, 0xbe1e771880c3c6ab
+ .quad 0xc0733ae955659250, 0xbe1e78c171f517d4
+ .quad 0xc0733aed131b3df0, 0xbe1e77eac3874666
+ .quad 0xc0733af0cece61b0, 0xbe1e790db479d8f6
+ .quad 0xc0733af488812550, 0xbe1e7965d1aa5c90
+ .quad 0xc0733af84035ad10, 0xbe1e78ceb398ba47
+ .quad 0xc0733afbf5ee19c0, 0xbe1e779cc0dcb5aa
+ .quad 0xc0733affa9ac88c0, 0xbe1e7871053953ed
+ .quad 0xc0733b035b731420, 0xbe1e7a082cffa71a
+ .quad 0xc0733b070b43d2a0, 0xbe1e7904b4382fad
+ .quad 0xc0733b0ab920d790, 0xbe1e79b458d0b4f3
+ .quad 0xc0733b0e650c3310, 0xbe1e79d0ded414c6
+ .quad 0xc0733b120f07f200, 0xbe1e763c357a1943
+ .quad 0xc0733b15b7161dd0, 0xbe1e78b80ba6daaa
+ .quad 0xc0733b195d38bd00, 0xbe1e7998e23b8ffd
+ .quad 0xc0733b1d0171d2c0, 0xbe1e7974aa65ee8c
+ .quad 0xc0733b20a3c35f20, 0xbe1e76ccfde752ab
+ .quad 0xc0733b24442f5ef0, 0xbe1e77b4ff19debb
+ .quad 0xc0733b27e2b7cc10, 0xbe1e7772ee478542
+ .quad 0xc0733b2b7f5e9d30, 0xbe1e781d81b58b44
+ .quad 0xc0733b2f1a25c600, 0xbe1e78350d967565
+ .quad 0xc0733b32b30f3720, 0xbe1e783888e48152
+ .quad 0xc0733b364a1cde30, 0xbe1e78367bf7c111
+ .quad 0xc0733b39df50a5d0, 0xbe1e7959e57ca47d
+ .quad 0xc0733b3d72ac75c0, 0xbe1e777322423222
+ .quad 0xc0733b41043232b0, 0xbe1e767ce42a60aa
+ .quad 0xc0733b4493e3be70, 0xbe1e781d445aea19
+ .quad 0xc0733b4821c2f800, 0xbe1e7922fca18e18
+ .quad 0xc0733b4badd1bb80, 0xbe1e76fed3d40647
+ .quad 0xc0733b4f3811e210, 0xbe1e793948c9eabc
+ .quad 0xc0733b52c0854240, 0xbe1e76e487656b8c
+ .quad 0xc0733b56472daf90, 0xbe1e780ab2f71223
+ .quad 0xc0733b59cc0cfaf0, 0xbe1e77189120b09c
+ .quad 0xc0733b5d4f24f270, 0xbe1e7644a0343a12
+ .quad 0xc0733b60d0776160, 0xbe1e78f2a3e4733d
+ .quad 0xc0733b6450061080, 0xbe1e7913b2f73ae5
+ .quad 0xc0733b67cdd2c5c0, 0xbe1e7882d08393b5
+ .quad 0xc0733b6b49df4470, 0xbe1e765e1b209979
+ .quad 0xc0733b6ec42d4d20, 0xbe1e785c9c4620d4
+ .quad 0xc0733b75b394f240, 0xbe1e78878cd0e956
+ .quad 0xc0733b7c9c178630, 0xbe1e789a4112d90b
+ .quad 0xc0733b837dc2b0f0, 0xbe1e79050b8a1766
+ .quad 0xc0733b8a58a3f220, 0xbe1e7790dffc47aa
+ .quad 0xc0733b912cc8a180, 0xbe1e77174593b06a
+ .quad 0xc0733b97fa3defb0, 0xbe1e7677de2d2ecc
+ .quad 0xc0733b9ec110e6b0, 0xbe1e76cff477ca18
+ .quad 0xc0733ba5814e6a80, 0xbe1e78f8644dec7b
+ .quad 0xc0733bac3b0339d0, 0xbe1e764e1361788d
+ .quad 0xc0733bb2ee3bee30, 0xbe1e78c913e738de
+ .quad 0xc0733bb99b04fd30, 0xbe1e76666f5bddaa
+ .quad 0xc0733bc0416ab850, 0xbe1e77e87cbd8ab6
+ .quad 0xc0733bc6e1794e10, 0xbe1e76f18ba1c966
+ .quad 0xc0733bcd7b3cca10, 0xbe1e777c9461b8db
+ .quad 0xc0733bd40ec115d0, 0xbe1e78b78526ffac
+ .quad 0xc0733bda9c11f920, 0xbe1e7942abecfede
+ .quad 0xc0733be1233b1aa0, 0xbe1e76d8a684fd8c
+ .quad 0xc0733be7a4480010, 0xbe1e79622b539ac9
+ .quad 0xc0733bee1f440f30, 0xbe1e7978e7cc20ea
+ .quad 0xc0733bf4943a8de0, 0xbe1e765c9c9de825
+ .quad 0xc0733bfb0336a290, 0xbe1e775d8b138ee2
+ .quad 0xc0733c016c435500, 0xbe1e78bf33465c2f
+ .quad 0xc0733c07cf6b8e80, 0xbe1e78164f7cc441
+ .quad 0xc0733c0e2cba1a50, 0xbe1e7824e64d0b23
+ .quad 0xc0733c148439a630, 0xbe1e78373ae7dd81
+ .quad 0xc0733c1ad5f4c2c0, 0xbe1e7704513e0afe
+ .quad 0xc0733c2121f5e3d0, 0xbe1e7914aa84200f
+ .quad 0xc0733c2768476110, 0xbe1e76b1cde25cf6
+ .quad 0xc0733c2da8f37600, 0xbe1e796120e3862d
+ .quad 0xc0733c33e40442e0, 0xbe1e78ec836d7e7b
+ .quad 0xc0733c3a1983cca0, 0xbe1e77fb13b7dabb
+ .quad 0xc0733c40497bfd70, 0xbe1e783c6fcb2404
+ .quad 0xc0733c4673f6a530, 0xbe1e7628bb93dce8
+ .quad 0xc0733c4c98fd7990, 0xbe1e7857a47b5001
+ .quad 0xc0733c52b89a16d0, 0xbe1e76708dc2831f
+ .quad 0xc0733c58d2d5ffa0, 0xbe1e77b6038651f1
+ .quad 0xc0733c5ee7ba9de0, 0xbe1e792e855bb5b2
+ .quad 0xc0733c64f75142d0, 0xbe1e776cacd5c105
+ .quad 0xc0733c6b01a32740, 0xbe1e77f8a8011315
+ .quad 0xc0733c7106b96c30, 0xbe1e765cf3efcfde
+ .quad 0xc0733c77069d1ad0, 0xbe1e78d837d2efac
+ .quad 0xc0733c7d01572530, 0xbe1e78b615cf772c
+ .quad 0xc0733c82f6f06640, 0xbe1e7650bbbd7a25
+ .quad 0xc0733c88e771a220, 0xbe1e78bcf3495872
+ .quad 0xc0733c8ed2e386c0, 0xbe1e792266832e84
+ .quad 0xc0733c94b94eabd0, 0xbe1e79c1c3c2ca52
+ .quad 0xc0733c9a9abb9340, 0xbe1e78aa61e5807d
+ .quad 0xc0733ca07732a970, 0xbe1e7620fc4cf156
+ .quad 0xc0733ca64ebc4570, 0xbe1e76b914a832c5
+ .quad 0xc0733cac2160a970, 0xbe1e79227f72020e
+ .quad 0xc0733cb1ef280300, 0xbe1e77ac972cc008
+ .quad 0xc0733cb7b81a6b10, 0xbe1e798089be41f4
+ .quad 0xc0733cbd7c3fe6a0, 0xbe1e77942ae037fe
+ .quad 0xc0733cc33ba06690, 0xbe1e7956ae6463d9
+ .quad 0xc0733cc8f643c850, 0xbe1e7918a50c7942
+ .quad 0xc0733cceac31d5d0, 0xbe1e78308eeab604
+ .quad 0xc0733cd45d7245e0, 0xbe1e76dd4ea88445
+ .quad 0xc0733cda0a0cbc60, 0xbe1e77e7c1aa5909
+ .quad 0xc0733cdfb208caa0, 0xbe1e7804b9d20e54
+ .quad 0xc0733ce5556def70, 0xbe1e78f88e99d49c
+ .quad 0xc0733ceaf4439780, 0xbe1e787d74682d68
+ .quad 0xc0733cf08e911d80, 0xbe1e76edc24fe6e7
+ .quad 0xc0733cf6245dca50, 0xbe1e79b347ec86d2
+ .quad 0xc0733cfbb5b0d580, 0xbe1e797cceb2c39b
+ .quad 0xc0733d0142916530, 0xbe1e783adbdc6aa1
+ .quad 0xc0733d06cb068e70, 0xbe1e76e4c20e3d9e
+ .quad 0xc0733d0c4f175570, 0xbe1e77070bf3cf61
+ .quad 0xc0733d11cecaadc0, 0xbe1e781c43502734
+ .quad 0xc0733d174a277a80, 0xbe1e78b11268ea72
+ .quad 0xc0733d1cc1348e90, 0xbe1e7754b83bfc7d
+ .quad 0xc0733d2233f8acb0, 0xbe1e7756c29bf5e9
+ .quad 0xc0733d27a27a87d0, 0xbe1e7952fc1d9333
+ .quad 0xc0733d2d0cc0c350, 0xbe1e778c76ae6077
+ .quad 0xc0733d3272d1f2e0, 0xbe1e7a1896ba8f43
+ .quad 0xc0733d37d4b49b30, 0xbe1e76dafdf432d8
+ .quad 0xc0733d3d326f3180, 0xbe1e795330184013
+ .quad 0xc0733d428c081c80, 0xbe1e763cc774d30f
+ .quad 0xc0733d47e185b3d0, 0xbe1e77030a779c0a
+ .quad 0xc0733d4d32ee40b0, 0xbe1e7908af2a2d7e
+ .quad 0xc0733d528047fe00, 0xbe1e78c4953b797d
+ .quad 0xc0733d57c9991850, 0xbe1e78b43b096579
+ .quad 0xc0733d5d0ee7ae30, 0xbe1e7824ae0a4804
+ .quad 0xc0733d625039d040, 0xbe1e79d2b2fbb740
+ .quad 0xc0733d678d958190, 0xbe1e7662de59a1a6
+ .quad 0xc0733d6cc700b760, 0xbe1e76b251d59aaa
+ .quad 0xc0733d71fc8159b0, 0xbe1e7a00cfd1f487
+ .quad 0xc0733d772e1d4360, 0xbe1e77f4d246167e
+ .quad 0xc0733d7c5bda4200, 0xbe1e767a4ee8e6fc
+ .quad 0xc0733d8185be1640, 0xbe1e777ccf0a8aed
+ .quad 0xc0733d86abce7420, 0xbe1e767d7e279ada
+ .quad 0xc0733d8bce1102d0, 0xbe1e7a05cef4bb90
+ .quad 0xc0733d90ec8b5d40, 0xbe1e78f75369be5b
+ .quad 0xc0733d96074311d0, 0xbe1e77b9612e8c8a
+ .quad 0xc0733d9b1e3da2b0, 0xbe1e794518b9adeb
+ .quad 0xc0733da031808620, 0xbe1e7810626fb934
+ .quad 0xc0733da541112650, 0xbe1e76d87223fa6d
+ .quad 0xc0733daa4cf4e1a0, 0xbe1e794c5e7ca3b5
+ .quad 0xc0733daf55310af0, 0xbe1e789856ef816f
+ .quad 0xc0733db459cae970, 0xbe1e77d2004effbd
+ .quad 0xc0733db95ac7b8f0, 0xbe1e78467d31eb9c
+ .quad 0xc0733dbe582caa00, 0xbe1e79aaa4e25787
+ .quad 0xc0733dc351fee220, 0xbe1e762de8f107bf
+ .quad 0xc0733dc848437b90, 0xbe1e7670670a63fe
+ .quad 0xc0733dcd3aff85d0, 0xbe1e795ca237c6cc
+ .quad 0xc0733dd22a3805b0, 0xbe1e77e55c53c1d9
+ .quad 0xc0733dd715f1f520, 0xbe1e78a806213ac4
+ .quad 0xc0733ddbfe3243b0, 0xbe1e77743a2bc615
+ .quad 0xc0733de0e2fdd660, 0xbe1e78b8b45b0b7d
+ .quad 0xc0733de5c4598800, 0xbe1e78d635f2f4b9
+ .quad 0xc0733deaa24a2920, 0xbe1e7758c396a11e
+ .quad 0xc0733def7cd48020, 0xbe1e7a17a8cc454c
+ .quad 0xc0733df453fd49a0, 0xbe1e783caa73f616
+ .quad 0xc0733df927c93820, 0xbe1e7932cfa29664
+ .quad 0xc0733dfdf83cf490, 0xbe1e777d265c72a6
+ .quad 0xc0733e02c55d1e10, 0xbe1e7775e7c03c60
+ .quad 0xc0733e078f2e4a40, 0xbe1e79f65d52d232
+ .quad 0xc0733e0c55b50570, 0xbe1e76e7e7464b4e
+ .quad 0xc0733e1118f5d250, 0xbe1e77be81cad877
+ .quad 0xc0733e15d8f52a80, 0xbe1e79dd25b5fb3a
+ .quad 0xc0733e1a95b77e80, 0xbe1e78e45f1418ef
+ .quad 0xc0733e1f4f4135a0, 0xbe1e78eb7289505b
+ .quad 0xc0733e240596ae50, 0xbe1e78a468c07cad
+ .quad 0xc0733e28b8bc3e20, 0xbe1e776b558a4009
+ .quad 0xc0733e2d68b631d0, 0xbe1e77412eb9941e
+ .quad 0xc0733e321588cd80, 0xbe1e76b2853f845e
+ .quad 0xc0733e36bf384cb0, 0xbe1e76aa7184273c
+ .quad 0xc0733e3b65c8e260, 0xbe1e7832027f78fa
+ .quad 0xc0733e40093eb930, 0xbe1e7a1c7da131f5
+ .quad 0xc0733e44a99df380, 0xbe1e76a0bc2ae4bc
+ .quad 0xc0733e4946eaab30, 0xbe1e78dff13b6f5d
+ .quad 0xc0733e4de128f250, 0xbe1e765a226dea2c
+ .quad 0xc0733e52785cd290, 0xbe1e78509b989111
+ .quad 0xc0733e570c8a4de0, 0xbe1e7916a4e9803d
+ .quad 0xc0733e5b9db55e30, 0xbe1e7950c15758cc
+ .quad 0xc0733e602be1f5a0, 0xbe1e7922ba1ad420
+ .quad 0xc0733e64b713fe90, 0xbe1e794cbaabcef6
+ .quad 0xc0733e693f4f5bc0, 0xbe1e7837bf883fed
+ .quad 0xc0733e6dc497e850, 0xbe1e76f198ddbbdf
+ .quad 0xc0733e7246f177d0, 0xbe1e7a18c1067764
+ .quad 0xc0733e76c65fd6a0, 0xbe1e76b845a8fd9d
+ .quad 0xc0733e7b42e6c970, 0xbe1e7714012df506
+ .quad 0xc0733e7fbc8a0de0, 0xbe1e7765612922cd
+ .quad 0xc0733e84334d5a50, 0xbe1e7688f5424a00
+ .quad 0xc0733e88a7345df0, 0xbe1e769d011f6663
+ .quad 0xc0733e8d1842c0e0, 0xbe1e79914acbfaf7
+ .quad 0xc0733e91867c2460, 0xbe1e79a85e189bd7
+ .quad 0xc0733e95f1e422a0, 0xbe1e79ea7c726432
+ .quad 0xc0733e9a5a7e4f10, 0xbe1e768a6fbb8e6e
+ .quad 0xc0733e9ec04e3620, 0xbe1e793c75bcc9fc
+ .quad 0xc0733ea323575dd0, 0xbe1e797f78da13d4
+ .quad 0xc0733ea7839d4550, 0xbe1e78d8c9cda978
+ .quad 0xc0733eabe1236540, 0xbe1e77028d480fff
+ .quad 0xc0733eb03bed2fa0, 0xbe1e7a0d0f74ff7c
+ .quad 0xc0733eb493fe1040, 0xbe1e76732e8a35fb
+ .quad 0xc0733eb8e9596c30, 0xbe1e77220caeabeb
+ .quad 0xc0733ebd3c02a260, 0xbe1e797438b645ef
+ .quad 0xc0733ec18bfd0b80, 0xbe1e79207c5fd6e8
+ .quad 0xc0733ec5d94bf9f0, 0xbe1e781c7df8f946
+ .quad 0xc0733eca23f2b9f0, 0xbe1e76736284e2db
+ .quad 0xc0733ece6bf49190, 0xbe1e7a109cc0c3f5
+ .quad 0xc0733ed2b154c120, 0xbe1e767f14a16d50
+ .quad 0xc0733ed6f4168290, 0xbe1e789cd22acaf0
+ .quad 0xc0733edb343d0a40, 0xbe1e764355ca28ad
+ .quad 0xc0733edf71cb8660, 0xbe1e79e4c7a81c45
+ .quad 0xc0733ee3acc51fb0, 0xbe1e761e26b644c2
+ .quad 0xc0733ee7e52cf8c0, 0xbe1e793e9f8fbdd3
+ .quad 0xc0733eec1b062ed0, 0xbe1e78c432991c20
+ .quad 0xc0733ef04e53d940, 0xbe1e78cdd025f4d8
+ .quad 0xc0733ef47f1909f0, 0xbe1e778310c6446e
+ .quad 0xc0733ef8ad58cd20, 0xbe1e7871af3d6e17
+ .quad 0xc0733efcd91629b0, 0xbe1e77e0e906f697
+ .quad 0xc0733f01025420f0, 0xbe1e7a1ae9b27892
+ .quad 0xc0733f052915af00, 0xbe1e76ac64c88f9d
+ .quad 0xc0733f094d5dca60, 0xbe1e779a815589c4
+ .quad 0xc0733f0d6f2f6480, 0xbe1e788f39a4864c
+ .quad 0xc0733f118e8d6980, 0xbe1e79fc51263525
+ .quad 0xc0733f15ab7ac060, 0xbe1e783501f19e90
+ .quad 0xc0733f19c5fa4ae0, 0xbe1e767e82c327ab
+ .quad 0xc0733f1dde0ee5a0, 0xbe1e7a1785d66123
+ .quad 0xc0733f21f3bb6870, 0xbe1e7936d07203da
+ .quad 0xc0733f260702a5e0, 0xbe1e7a010a7ac699
+ .quad 0xc0733f2a17e76bb0, 0xbe1e7975e4e16312
+ .quad 0xc0733f2e266c82b0, 0xbe1e7654b5422330
+ .quad 0xc0733f323294aeb0, 0xbe1e77f8a4909d35
+ .quad 0xc0733f363c62aee0, 0xbe1e792c8e30d226
+ .quad 0xc0733f3a43d93da0, 0xbe1e76f6ac67a1ff
+ .quad 0xc0733f3e48fb1070, 0xbe1e775c2e97715a
+ .quad 0xc0733f424bcad840, 0xbe1e781cd54ae100
+ /*== Log_LA_table ==*/
+ .align 32
+ .quad 0x0000000000000000
+ .quad 0xbf4bc48a867884b7
+ .quad 0xbf5bbd9e9482af09
+ .quad 0xbf64c9096b94befd
+ .quad 0xbf6bafd47221ed26
+ .quad 0xbf714999e2ad8ea6
+ .quad 0xbf74b99563d2a1bd
+ .quad 0xbf7827de6b310350
+ .quad 0xbf7b9476a4fcd10f
+ .quad 0xbf7eff5fbaf25781
+ .quad 0xbf81344daa2d7553
+ .quad 0xbf82e8158b08d957
+ .quad 0xbf849b0851443684
+ .quad 0xbf864d26cce610dd
+ .quad 0xbf87fe71ccc4e6b0
+ .quad 0xbf89aeea1e897fdf
+ .quad 0xbf8b5e908eb13790
+ .quad 0xbf8d0d65e890405a
+ .quad 0xbf8ebb6af653e2ee
+ .quad 0xbf90345040825bad
+ .quad 0xbf910a83a8446c78
+ .quad 0xbf91e05015d30a71
+ .quad 0xbf92b5b5ec0209d3
+ .quad 0xbf938ab58d173e91
+ .quad 0xbf945f4f5acb8be0
+ .quad 0xbf953383b64bf13f
+ .quad 0xbf960753003a94ef
+ .quad 0xbf96dabd98afcc05
+ .quad 0xbf97adc3df3b1ff8
+ .quad 0xbf98806632e451d0
+ .quad 0xbf9952a4f22c5ae9
+ .quad 0xbf9a24807b0e6b5c
+ .quad 0xbf9af5f92b00e610
+ .quad 0xbf9bc70f5ef65a77
+ .quad 0xbf9c97c3735e7c0a
+ .quad 0xbf9d6815c4271775
+ .quad 0xbf9e3806acbd058f
+ .quad 0xbf9f0796880d1c19
+ .quad 0xbf9fd6c5b0851c4c
+ .quad 0xbfa052ca400a4f9b
+ .quad 0xbfa0ba01a8170000
+ .quad 0xbfa121093ce3a205
+ .quad 0xbfa187e12aad8077
+ .quad 0xbfa1ee899d74a03e
+ .quad 0xbfa25502c0fc314c
+ .quad 0xbfa2bb4cc0cafe8d
+ .quad 0xbfa32167c82bdcda
+ .quad 0xbfa38754022e18e2
+ .quad 0xbfa3ed1199a5e425
+ .quad 0xbfa452a0b92cc0ec
+ .quad 0xbfa4b8018b21ed4f
+ .quad 0xbfa51d3439aacd4a
+ .quad 0xbfa58238eeb353da
+ .quad 0xbfa5e70fd3ee6b34
+ .quad 0xbfa64bb912d65c07
+ .quad 0xbfa6b034d4ad33df
+ .quad 0xbfa71483427d2a99
+ .quad 0xbfa778a4851906f3
+ .quad 0xbfa7dc98c51c8242
+ .quad 0xbfa840602aecab3d
+ .quad 0xbfa8a3fadeb847f4
+ .quad 0xbfa90769087836e4
+ .quad 0xbfa96aaacfefcf3c
+ .quad 0xbfa9cdc05cad4042
+ .quad 0xbfaa30a9d609efea
+ .quad 0xbfaa9367632ad897
+ .quad 0xbfaaf5f92b00e610
+ .quad 0xbfab585f544951a4
+ .quad 0xbfabba9a058dfd84
+ .quad 0xbfac1ca96525cf56
+ .quad 0xbfac7e8d993509f9
+ .quad 0xbface046c7ada68d
+ .quad 0xbfad41d5164facb4
+ .quad 0xbfada338aaa98a0c
+ .quad 0xbfae0471aa1868f5
+ .quad 0xbfae658039c88690
+ .quad 0xbfaec6647eb58808
+ .quad 0xbfaf271e9daacf20
+ .quad 0xbfaf87aebb43ce06
+ .quad 0xbfafe814fbec5a77
+ .quad 0xbfb02428c1f08016
+ .quad 0xbfb054323b97a948
+ .quad 0xbfb08426fcdb1ee7
+ .quad 0xbfb0b40717932b96
+ .quad 0xbfb0e3d29d81165e
+ .quad 0xbfb11389a04f4a2e
+ .quad 0xbfb1432c31917d08
+ .quad 0xbfb172ba62c4d6de
+ .quad 0xbfb1a23445501816
+ .quad 0xbfb1d199ea83bfbe
+ .quad 0xbfb200eb639a3173
+ .quad 0xbfb23028c1b7daed
+ .quad 0xbfb25f5215eb594a
+ .quad 0xbfb28e67712d9dfc
+ .quad 0xbfb2bd68e4621371
+ .quad 0xbfb2ec568056c16f
+ .quad 0xbfb31b3055c47118
+ .quad 0xbfb349f6754ed0b4
+ .quad 0xbfb378a8ef84971e
+ .quad 0xbfb3a747d4dfa6f5
+ .quad 0xbfb3d5d335c53179
+ .quad 0xbfb4044b2285d925
+ .quad 0xbfb432afab5dd3ff
+ .quad 0xbfb46100e0750da1
+ .quad 0xbfb48f3ed1df48fb
+ .quad 0xbfb4bd698f9c41cf
+ .quad 0xbfb4eb812997cde4
+ .quad 0xbfb51985afa9fdfd
+ .quad 0xbfb5477731973e85
+ .quad 0xbfb57555bf1077f5
+ .quad 0xbfb5a32167b32f02
+ .quad 0xbfb5d0da3b09a47e
+ .quad 0xbfb5fe80488af4fd
+ .quad 0xbfb62c139f9b3837
+ .quad 0xbfb659944f8ba02d
+ .quad 0xbfb68702679a980a
+ .quad 0xbfb6b45df6f3e2c9
+ .quad 0xbfb6e1a70cb0b99a
+ .quad 0xbfb70eddb7d7ea07
+ .quad 0xbfb73c02075df3e5
+ .quad 0xbfb769140a2526fd
+ .quad 0xbfb79613cefdc07d
+ .quad 0xbfb7c30164a60836
+ .quad 0xbfb7efdcd9ca6d8f
+ .quad 0xbfb81ca63d05a44a
+ .quad 0xbfb8495d9ce0c10c
+ .quad 0xbfb8760307d355ab
+ .quad 0xbfb8a2968c438d41
+ .quad 0xbfb8cf183886480d
+ .quad 0xbfb8fb881adf3713
+ .quad 0xbfb927e64180f790
+ .quad 0xbfb95432ba8d2e2f
+ .quad 0xbfb9806d9414a209
+ .quad 0xbfb9ac96dc175776
+ .quad 0xbfb9d8aea084aa9c
+ .quad 0xbfba04b4ef3b69d8
+ .quad 0xbfba30a9d609efea
+ .quad 0xbfba5c8d62ae3dec
+ .quad 0xbfba885fa2d6151e
+ .quad 0xbfbab420a41f1076
+ .quad 0xbfbadfd07416be07
+ .quad 0xbfbb0b6f203ab82c
+ .quad 0xbfbb36fcb5f8be8a
+ .quad 0xbfbb627942aecedd
+ .quad 0xbfbb8de4d3ab3d98
+ .quad 0xbfbbb93f762cce4f
+ .quad 0xbfbbe4893762cbf7
+ .quad 0xbfbc0fc2246d20f5
+ .quad 0xbfbc3aea4a5c6eff
+ .quad 0xbfbc6601b63226cb
+ .quad 0xbfbc910874e09f98
+ .quad 0xbfbcbbfe934b2e81
+ .quad 0xbfbce6e41e463da5
+ .quad 0xbfbd11b92297632b
+ .quad 0xbfbd3c7dacf5780b
+ .quad 0xbfbd6731ca08aeb9
+ .quad 0xbfbd91d5866aa99c
+ .quad 0xbfbdbc68eea6915b
+ .quad 0xbfbde6ec0f392b05
+ .quad 0xbfbe115ef490ee07
+ .quad 0xbfbe3bc1ab0e19fe
+ .quad 0xbfbe66143f02cc5d
+ .quad 0xbfbe9056bcb315e8
+ .quad 0xbfbeba893055100b
+ .quad 0xbfbee4aba610f204
+ .quad 0xbfbf0ebe2a0125eb
+ .quad 0xbfbf38c0c8325d86
+ .quad 0xbfbf62b38ca3a706
+ .quad 0xbfbf8c9683468191
+ .quad 0xbfbfb669b7fef1a8
+ .quad 0xbfbfe02d36a3956d
+ .quad 0xbfc004f0857edc5c
+ .quad 0xbfc019c2a064b486
+ .quad 0xbfc02e8cf1dac4b8
+ .quad 0xbfc0434f7fb1f307
+ .quad 0xbfc0580a4fb4a3df
+ .quad 0xbfc06cbd67a6c3b6
+ .quad 0xbfc08168cd45d0a9
+ .quad 0xbfc0960c8648e406
+ .quad 0xbfc0aaa89860bbcf
+ .quad 0xbfc0bf3d0937c41c
+ .quad 0xbfc0d3c9de722078
+ .quad 0xbfc0e84f1dadb526
+ .quad 0xbfc0fccccc823059
+ .quad 0xbfc11142f0811357
+ .quad 0xbfc125b18f35bb8e
+ .quad 0xbfc13a18ae256b99
+ .quad 0xbfc14e7852cf5430
+ .quad 0xbfc162d082ac9d10
+ .quad 0xbfc1772143306dc6
+ .quad 0xbfc18b6a99c7f679
+ .quad 0xbfc19fac8bda7897
+ .quad 0xbfc1b3e71ec94f7b
+ .quad 0xbfc1c81a57eff8fd
+ .quad 0xbfc1dc463ca41df8
+ .quad 0xbfc1f06ad2359abd
+ .quad 0xbfc204881dee8777
+ .quad 0xbfc2189e25134081
+ .quad 0xbfc22cacece26ead
+ .quad 0xbfc240b47a950f79
+ .quad 0xbfc254b4d35e7d3c
+ .quad 0xbfc268adfc6c773e
+ .quad 0xbfc27c9ffae729c1
+ .quad 0xbfc2908ad3f13603
+ .quad 0xbfc2a46e8ca7ba2a
+ .quad 0xbfc2b84b2a225923
+ .quad 0xbfc2cc20b1734279
+ .quad 0xbfc2dfef27a73a18
+ .quad 0xbfc2f3b691c5a001
+ .quad 0xbfc30776f4d077f7
+ .quad 0xbfc31b3055c47118
+ .quad 0xbfc32ee2b998ed6e
+ .quad 0xbfc3428e2540096d
+ .quad 0x3fc331f403985097
+ .quad 0x3fc31e56798a910a
+ .quad 0x3fc30abfd8f333b6
+ .quad 0x3fc2f7301cf4e87b
+ .quad 0x3fc2e3a740b7800f
+ .quad 0x3fc2d0253f67e4cb
+ .quad 0x3fc2bcaa14381386
+ .quad 0x3fc2a935ba5f1479
+ .quad 0x3fc295c82d18f434
+ .quad 0x3fc2826167a6bc9c
+ .quad 0x3fc26f01654e6df6
+ .quad 0x3fc25ba8215af7fc
+ .quad 0x3fc24855971c3307
+ .quad 0x3fc23509c1e6d937
+ .quad 0x3fc221c49d147fb3
+ .quad 0x3fc20e8624038fed
+ .quad 0x3fc1fb4e521740f4
+ .quad 0x3fc1e81d22b790d4
+ .quad 0x3fc1d4f291513e01
+ .quad 0x3fc1c1ce9955c0c6
+ .quad 0x3fc1aeb1363b44c8
+ .quad 0x3fc19b9a637ca295
+ .quad 0x3fc1888a1c995931
+ .quad 0x3fc175805d1587c1
+ .quad 0x3fc1627d2079e731
+ .quad 0x3fc14f806253c3ed
+ .quad 0x3fc13c8a1e34f7a0
+ .quad 0x3fc1299a4fb3e306
+ .quad 0x3fc116b0f26b67bb
+ .quad 0x3fc103ce01fae223
+ .quad 0x3fc0f0f17a062353
+ .quad 0x3fc0de1b56356b04
+ .quad 0x3fc0cb4b9235619a
+ .quad 0x3fc0b88229b71227
+ .quad 0x3fc0a5bf186fe483
+ .quad 0x3fc093025a19976c
+ .quad 0x3fc0804bea723aa9
+ .quad 0x3fc06d9bc53c2941
+ .quad 0x3fc05af1e63e03b4
+ .quad 0x3fc0484e4942aa43
+ .quad 0x3fc035b0ea19373b
+ .quad 0x3fc02319c494f951
+ .quad 0x3fc01088d48d6e03
+ .quad 0x3fbffbfc2bbc7803
+ .quad 0x3fbfd6f308ce5b52
+ .quad 0x3fbfb1f6381856f4
+ .quad 0x3fbf8d05b16a6d47
+ .quad 0x3fbf68216c9cc727
+ .quad 0x3fbf4349618fa91a
+ .quad 0x3fbf1e7d882b689a
+ .quad 0x3fbef9bdd860616b
+ .quad 0x3fbed50a4a26eafc
+ .quad 0x3fbeb062d57f4de8
+ .quad 0x3fbe8bc77271b97a
+ .quad 0x3fbe6738190e394c
+ .quad 0x3fbe42b4c16caaf3
+ .quad 0x3fbe1e3d63acb3ba
+ .quad 0x3fbdf9d1f7f5b674
+ .quad 0x3fbdd5727676c959
+ .quad 0x3fbdb11ed766abf4
+ .quad 0x3fbd8cd71303bd26
+ .quad 0x3fbd689b2193f133
+ .quad 0x3fbd446afb64c7e5
+ .quad 0x3fbd204698cb42bd
+ .quad 0x3fbcfc2df223db2d
+ .quad 0x3fbcd820ffd278f3
+ .quad 0x3fbcb41fba42686d
+ .quad 0x3fbc902a19e65111
+ .quad 0x3fbc6c4017382bea
+ .quad 0x3fbc4861aab93a23
+ .quad 0x3fbc248eccf1fba6
+ .quad 0x3fbc00c7767225cb
+ .quad 0x3fbbdd0b9fd09a10
+ .quad 0x3fbbb95b41ab5ce6
+ .quad 0x3fbb95b654a78c87
+ .quad 0x3fbb721cd17157e3
+ .quad 0x3fbb4e8eb0bbf58f
+ .quad 0x3fbb2b0beb419ad0
+ .quad 0x3fbb079479c372ad
+ .quad 0x3fbae4285509950b
+ .quad 0x3fbac0c775e2fde6
+ .quad 0x3fba9d71d5258484
+ .quad 0x3fba7a276badd2c8
+ .quad 0x3fba56e8325f5c87
+ .quad 0x3fba33b4222456f1
+ .quad 0x3fba108b33edb005
+ .quad 0x3fb9ed6d60b30612
+ .quad 0x3fb9ca5aa1729f45
+ .quad 0x3fb9a752ef316149
+ .quad 0x3fb9845642fac8f0
+ .quad 0x3fb9616495e0e1e8
+ .quad 0x3fb93e7de0fc3e80
+ .quad 0x3fb91ba21d6bef77
+ .quad 0x3fb8f8d144557bdf
+ .quad 0x3fb8d60b4ee4d901
+ .quad 0x3fb8b350364c6257
+ .quad 0x3fb8909ff3c4d191
+ .quad 0x3fb86dfa808d36a0
+ .quad 0x3fb84b5fd5eaefd8
+ .quad 0x3fb828cfed29a215
+ .quad 0x3fb8064abf9b30f1
+ .quad 0x3fb7e3d04697b704
+ .quad 0x3fb7c1607b7d7e32
+ .quad 0x3fb79efb57b0f803
+ .quad 0x3fb77ca0d49cb608
+ .quad 0x3fb75a50ebb1624a
+ .quad 0x3fb7380b9665b7c8
+ .quad 0x3fb715d0ce367afc
+ .quad 0x3fb6f3a08ca67270
+ .quad 0x3fb6d17acb3e5f5e
+ .quad 0x3fb6af5f838cf654
+ .quad 0x3fb68d4eaf26d7ee
+ .quad 0x3fb66b4847a68997
+ .quad 0x3fb6494c46ac6e4d
+ .quad 0x3fb6275aa5debf81
+ .quad 0x3fb605735ee985f1
+ .quad 0x3fb5e3966b7e9295
+ .quad 0x3fb5c1c3c5557799
+ .quad 0x3fb59ffb662b815c
+ .quad 0x3fb57e3d47c3af7b
+ .quad 0x3fb55c8963e6adeb
+ .quad 0x3fb53adfb462ce16
+ .quad 0x3fb51940330c000b
+ .quad 0x3fb4f7aad9bbcbaf
+ .quad 0x3fb4d61fa2514a00
+ .quad 0x3fb4b49e86b11e5f
+ .quad 0x3fb4932780c56fe2
+ .quad 0x3fb471ba8a7de2b7
+ .quad 0x3fb450579dcf9186
+ .quad 0x3fb42efeb4b506e9
+ .quad 0x3fb40dafc92e36e2
+ .quad 0x3fb3ec6ad5407868
+ .quad 0x3fb3cb2fd2f67ef1
+ .quad 0x3fb3a9febc60540a
+ .quad 0x3fb388d78b9350ff
+ .quad 0x3fb367ba3aaa1883
+ .quad 0x3fb346a6c3c49066
+ .quad 0x3fb3259d2107db54
+ .quad 0x3fb3049d4c9e52a0
+ .quad 0x3fb2e3a740b7800f
+ .quad 0x3fb2c2baf78817b7
+ .quad 0x3fb2a1d86b49f1e2
+ .quad 0x3fb280ff963c04fc
+ .quad 0x3fb2603072a25f82
+ .quad 0x3fb23f6afac6220a
+ .quad 0x3fb21eaf28f57941
+ .quad 0x3fb1fdfcf7839804
+ .quad 0x3fb1dd5460c8b16f
+ .quad 0x3fb1bcb55f21f307
+ .quad 0x3fb19c1fecf17ee0
+ .quad 0x3fb17b94049e65d0
+ .quad 0x3fb15b11a094a1aa
+ .quad 0x3fb13a98bb450f81
+ .quad 0x3fb11a294f2569f6
+ .quad 0x3fb0f9c356b04389
+ .quad 0x3fb0d966cc6500fa
+ .quad 0x3fb0b913aac7d3a7
+ .quad 0x3fb098c9ec61b3ff
+ .quad 0x3fb078898bc05bf4
+ .quad 0x3fb0585283764178
+ .quad 0x3fb03824ce1a9101
+ .quad 0x3fb0180066492817
+ .quad 0x3fafefca8d451fd6
+ .quad 0x3fafafa6d397efdb
+ .quad 0x3faf6f9594de60f0
+ .quad 0x3faf2f96c6754aee
+ .quad 0x3faeefaa5dc2b239
+ .quad 0x3faeafd05035bd3b
+ .quad 0x3fae70089346a9e6
+ .quad 0x3fae30531c76c34a
+ .quad 0x3fadf0afe1505738
+ .quad 0x3fadb11ed766abf4
+ .quad 0x3fad719ff455f5f7
+ .quad 0x3fad32332dc34dbd
+ .quad 0x3facf2d8795ca5a5
+ .quad 0x3facb38fccd8bfdb
+ .quad 0x3fac74591df72456
+ .quad 0x3fac3534628016dd
+ .quad 0x3fabf62190448d22
+ .quad 0x3fabb7209d1e24e5
+ .quad 0x3fab78317eef1a29
+ .quad 0x3fab39542ba23d73
+ .quad 0x3faafa88992aea19
+ .quad 0x3faabbcebd84fca0
+ .quad 0x3faa7d268eb4c924
+ .quad 0x3faa3e9002c711d2
+ .quad 0x3faa000b0fd0fd6b
+ .quad 0x3fa9c197abf00dd7
+ .quad 0x3fa98335cd4a16c3
+ .quad 0x3fa944e56a0d3450
+ .quad 0x3fa906a6786fc1cb
+ .quad 0x3fa8c878eeb05074
+ .quad 0x3fa88a5cc3159e53
+ .quad 0x3fa84c51ebee8d15
+ .quad 0x3fa80e585f9218fc
+ .quad 0x3fa7d070145f4fd7
+ .quad 0x3fa7929900bd4809
+ .quad 0x3fa754d31b1b179c
+ .quad 0x3fa7171e59efcb5f
+ .quad 0x3fa6d97ab3ba5e10
+ .quad 0x3fa69be81f01af99
+ .quad 0x3fa65e6692547c4e
+ .quad 0x3fa620f604495440
+ .quad 0x3fa5e3966b7e9295
+ .quad 0x3fa5a647be9a54f6
+ .quad 0x3fa56909f44a72fe
+ .quad 0x3fa52bdd034475b8
+ .quad 0x3fa4eec0e2458f30
+ .quad 0x3fa4b1b588129203
+ .quad 0x3fa474baeb77e904
+ .quad 0x3fa437d103498eec
+ .quad 0x3fa3faf7c663060e
+ .quad 0x3fa3be2f2ba7501f
+ .quad 0x3fa381772a00e604
+ .quad 0x3fa344cfb861afae
+ .quad 0x3fa30838cdc2fbfd
+ .quad 0x3fa2cbb2612578b4
+ .quad 0x3fa28f3c69912a74
+ .quad 0x3fa252d6de1564c1
+ .quad 0x3fa21681b5c8c213
+ .quad 0x3fa1da3ce7c91bf8
+ .quad 0x3fa19e086b3b8333
+ .quad 0x3fa161e4374c37f4
+ .quad 0x3fa125d0432ea20e
+ .quad 0x3fa0e9cc861d4944
+ .quad 0x3fa0add8f759cd95
+ .quad 0x3fa071f58e2cdf9b
+ .quad 0x3fa0362241e638ec
+ .quad 0x3f9ff4be13b92920
+ .quad 0x3f9f7d57badb4ee8
+ .quad 0x3f9f061167fc31e8
+ .quad 0x3f9e8eeb09f2f6cb
+ .quad 0x3f9e17e48fa48962
+ .quad 0x3f9da0fde8038de9
+ .quad 0x3f9d2a3702105259
+ .quad 0x3f9cb38fccd8bfdb
+ .quad 0x3f9c3d0837784c41
+ .quad 0x3f9bc6a03117eb97
+ .quad 0x3f9b5057a8ee01ce
+ .quad 0x3f9ada2e8e3e546f
+ .quad 0x3f9a6424d059fc68
+ .quad 0x3f99ee3a5e9f57e8
+ .quad 0x3f99786f2879fc53
+ .quad 0x3f9902c31d62a843
+ .quad 0x3f988d362cdf359e
+ .quad 0x3f9817c846828bbd
+ .quad 0x3f97a27959ec91aa
+ .quad 0x3f972d4956ca2067
+ .quad 0x3f96b8382cd4f551
+ .quad 0x3f964345cbd3a491
+ .quad 0x3f95ce7223998b98
+ .quad 0x3f9559bd2406c3ba
+ .quad 0x3f94e526bd0814d1
+ .quad 0x3f9470aede96e7f2
+ .quad 0x3f93fc5578b93a38
+ .quad 0x3f93881a7b818f9e
+ .quad 0x3f9313fdd70ee5e8
+ .quad 0x3f929fff7b8ca79d
+ .quad 0x3f922c1f59329f1b
+ .quad 0x3f91b85d6044e9ae
+ .quad 0x3f9144b98113eac0
+ .quad 0x3f90d133abfc3f1b
+ .quad 0x3f905dcbd166b033
+ .quad 0x3f8fd503c3904f1d
+ .quad 0x3f8eeeab9b43445d
+ .quad 0x3f8e088f0b004827
+ .quad 0x3f8d22adf3f9579d
+ .quad 0x3f8c3d0837784c41
+ .quad 0x3f8b579db6dec358
+ .quad 0x3f8a726e53a6056e
+ .quad 0x3f898d79ef5eedf0
+ .quad 0x3f88a8c06bb1d2f4
+ .quad 0x3f87c441aa5e6d15
+ .quad 0x3f86dffd8d3bbf70
+ .quad 0x3f85fbf3f637ffc5
+ .quad 0x3f851824c7587eb0
+ .quad 0x3f84348fe2b99002
+ .quad 0x3f8351352a8e733f
+ .quad 0x3f826e1481213c2e
+ .quad 0x3f818b2dc8d2bb91
+ .quad 0x3f80a880e41a67f6
+ .quad 0x3f7f8c1b6b0c8d4e
+ .quad 0x3f7dc7a83f75a96d
+ .quad 0x3f7c03a80ae5e054
+ .quad 0x3f7a401a92ff827e
+ .quad 0x3f787cff9d9147a5
+ .quad 0x3f76ba56f09621bc
+ .quad 0x3f74f8205235102d
+ .quad 0x3f73365b88c0f347
+ .quad 0x3f7175085ab85ff0
+ .quad 0x3f6f684d1d8ae702
+ .quad 0x3f6be76bd77b4fc3
+ .quad 0x3f68676c71434fb9
+ .quad 0x3f64e84e793a474a
+ .quad 0x3f616a117e0d4b30
+ .quad 0x3f5bd96a1d7d9cbc
+ .quad 0x3f54e071754c98ba
+ .quad 0x3f4bd27045bfd025
+ .quad 0x3f3bcef518e29612
+ .quad 0x8000000000000000
+ /*== poly_coeff[5] ==*/
+ .align 32
+ .quad 0x3fb63C65231FBD16, 0x3fb63C65231FBD16, 0x3fb63C65231FBD16, 0x3fb63C65231FBD16 /* coeff5 */
+ .quad 0xbfbBCB7D4EFBE80B, 0xbfbBCB7D4EFBE80B, 0xbfbBCB7D4EFBE80B, 0xbfbBCB7D4EFBE80B /* coeff4 */
+ .quad 0x3fc287A7636F341E, 0x3fc287A7636F341E, 0x3fc287A7636F341E, 0x3fc287A7636F341E /* coeff3 */
+ .quad 0xbfcBCB7B1526DE36, 0xbfcBCB7B1526DE36, 0xbfcBCB7B1526DE36, 0xbfcBCB7B1526DE36 /* coeff2 */
+ .quad 0x3fdBCB7B1526E50E, 0x3fdBCB7B1526E50E, 0x3fdBCB7B1526E50E, 0x3fdBCB7B1526E50E /* coeff1 */
+ /*== ExpMask ==*/
+ .align 32
+ .quad 0x000fffffffffffff, 0x000fffffffffffff, 0x000fffffffffffff, 0x000fffffffffffff
+ /*== Two10 ==*/
+ .align 32
+ .quad 0x3f50000000000000, 0x3f50000000000000, 0x3f50000000000000, 0x3f50000000000000
+ /*== MinNorm ==*/
+ .align 32
+ .quad 0x0010000000000000, 0x0010000000000000, 0x0010000000000000, 0x0010000000000000
+ /*== MaxNorm ==*/
+ .align 32
+ .quad 0x7fefffffffffffff, 0x7fefffffffffffff, 0x7fefffffffffffff, 0x7fefffffffffffff
+ /*== HalfMask ==*/
+ .align 32
+ .quad 0xfffffffffc000000, 0xfffffffffc000000, 0xfffffffffc000000, 0xfffffffffc000000
+ /*== One ==*/
+ .align 32
+ .quad 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000
+ /*== Threshold ==*/
+ .align 32
+ .quad 0x4086a00000000000, 0x4086a00000000000, 0x4086a00000000000, 0x4086a00000000000
+ /*== Bias ==*/
+ .align 32
+ .quad 0x408ff80000000000, 0x408ff80000000000, 0x408ff80000000000, 0x408ff80000000000
+ /*== Bias1 ==*/
+ .align 32
+ .quad 0x408ff00000000000, 0x408ff00000000000, 0x408ff00000000000, 0x408ff00000000000
+ /*== L2 ==*/
+ .align 32
+ .quad 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff
+ .align 32
+ .type __svml_dlog10_data_internal,@object
+ .size __svml_dlog10_data_internal,.-__svml_dlog10_data_internal
new file mode 100644
@@ -0,0 +1,20 @@
+/* AVX2 version of vectorized log10, vector length is 8.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define _ZGVeN8v_log10 _ZGVeN8v_log10_avx2_wrapper /* renames that symbol in the file included below */
+#include "../svml_d_log108_core.S"
new file mode 100644
@@ -0,0 +1,27 @@
+/* Multiple versions of vectorized log10, vector length is 8.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define SYMBOL_NAME _ZGVeN8v_log10
+#include "ifunc-mathvec-avx512-skx.h"
+/* IFUNC entry point; REDIRECT_NAME and IFUNC_SELECTOR presumably come from the header above. */
+libc_ifunc_redirected (REDIRECT_NAME, SYMBOL_NAME, IFUNC_SELECTOR ());
+
+#ifdef SHARED
+__hidden_ver1 (_ZGVeN8v_log10, __GI__ZGVeN8v_log10, __redirect__ZGVeN8v_log10)
+ __attribute__ ((visibility ("hidden")));
+#endif /* SHARED */
new file mode 100644
@@ -0,0 +1,299 @@
+/* Function log10 vectorized with AVX-512.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+/*
+ * ALGORITHM DESCRIPTION:
+ *
+ * Get short reciprocal approximation Rcp ~ 1/mantissa(x)
+ * R = Rcp*x - 1.0
+ * log10(x) = k*log10(2.0) - log10(Rcp) + poly_approximation(R)
+ * log10(Rcp) is tabulated
+ *
+ *
+ */
+
+/* Byte offsets into __svml_dlog10_data_internal_avx512; keep them in
+ sync with the field order and .align 64 layout of that table. */
+#define Log_tbl 0
+#define One 128
+#define C075 192
+#define poly_coeff9 256
+#define poly_coeff8 320
+#define poly_coeff7 384
+#define poly_coeff6 448
+#define poly_coeff5 512
+#define poly_coeff4 576
+#define poly_coeff3 640
+#define poly_coeff2 704
+#define poly_coeff1 768
+#define L2 832
+
+#include <sysdep.h>
+
+ .text
+ .section .text.evex512,"ax",@progbits
+ENTRY(_ZGVeN8v_log10_skx)
+ pushq %rbp
+ cfi_def_cfa_offset(16)
+ movq %rsp, %rbp
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+ andq $-64, %rsp
+ subq $192, %rsp
+ vmovaps %zmm0, %zmm7
+ vgetmantpd $8, {sae}, %zmm7, %zmm6
+ vmovups One+__svml_dlog10_data_internal_avx512(%rip), %zmm3
+ vmovups poly_coeff5+__svml_dlog10_data_internal_avx512(%rip), %zmm12
+ vmovups poly_coeff3+__svml_dlog10_data_internal_avx512(%rip), %zmm13
+
+/* Start polynomial evaluation */
+ vmovups poly_coeff9+__svml_dlog10_data_internal_avx512(%rip), %zmm10
+ vmovups poly_coeff8+__svml_dlog10_data_internal_avx512(%rip), %zmm1
+ vmovups poly_coeff7+__svml_dlog10_data_internal_avx512(%rip), %zmm11
+ vmovups poly_coeff6+__svml_dlog10_data_internal_avx512(%rip), %zmm14
+
+/* Prepare exponent correction: DblRcp<0.75? */
+ vmovups C075+__svml_dlog10_data_internal_avx512(%rip), %zmm2
+
+/* Table lookup */
+ vmovups __svml_dlog10_data_internal_avx512(%rip), %zmm5
+
+/* GetExp(x) */
+ vgetexppd {sae}, %zmm7, %zmm0
+
+/* DblRcp ~ 1/Mantissa */
+ vrcp14pd %zmm6, %zmm8
+
+/* Special inputs: x is +-0, +-Inf or negative finite (fpclass imm8 = 94) */
+ vfpclasspd $94, %zmm7, %k0
+
+/* round DblRcp to 4 fractional bits (RN mode, no Precision exception) */
+ vrndscalepd $88, {sae}, %zmm8, %zmm4
+ vmovups poly_coeff4+__svml_dlog10_data_internal_avx512(%rip), %zmm8
+ kmovw %k0, %edx
+
+/* Reduced argument: R = DblRcp*Mantissa - 1 */
+ vfmsub213pd {rn-sae}, %zmm3, %zmm4, %zmm6
+ vcmppd $17, {sae}, %zmm2, %zmm4, %k1
+ vfmadd231pd {rn-sae}, %zmm6, %zmm12, %zmm8
+ vmovups poly_coeff2+__svml_dlog10_data_internal_avx512(%rip), %zmm12
+ vfmadd231pd {rn-sae}, %zmm6, %zmm10, %zmm1
+ vfmadd231pd {rn-sae}, %zmm6, %zmm11, %zmm14
+ vmovups poly_coeff1+__svml_dlog10_data_internal_avx512(%rip), %zmm2
+
+/* R^2 */
+ vmulpd {rn-sae}, %zmm6, %zmm6, %zmm15
+ vfmadd231pd {rn-sae}, %zmm6, %zmm13, %zmm12
+
+/* Prepare table index */
+ vpsrlq $48, %zmm4, %zmm9
+
+/* add 1 to Expon if DblRcp<0.75 */
+ vaddpd {rn-sae}, %zmm3, %zmm0, %zmm0{%k1}
+ vmulpd {rn-sae}, %zmm15, %zmm15, %zmm13
+ vfmadd213pd {rn-sae}, %zmm14, %zmm15, %zmm1
+ vfmadd213pd {rn-sae}, %zmm12, %zmm15, %zmm8
+ vpermt2pd Log_tbl+64+__svml_dlog10_data_internal_avx512(%rip), %zmm9, %zmm5
+
+/* polynomial */
+ vfmadd213pd {rn-sae}, %zmm8, %zmm13, %zmm1
+ vfmadd213pd {rn-sae}, %zmm2, %zmm6, %zmm1
+ vfmadd213pd {rn-sae}, %zmm5, %zmm1, %zmm6
+ vmovups L2+__svml_dlog10_data_internal_avx512(%rip), %zmm1
+ vfmadd213pd {rn-sae}, %zmm6, %zmm1, %zmm0
+ testl %edx, %edx
+
+/* Go to special inputs processing branch */
+ jne L(SPECIAL_VALUES_BRANCH)
+ # LOE rbx r12 r13 r14 r15 edx zmm0 zmm7
+
+/* Restore registers
+ * and exit the function
+ */
+
+L(EXIT):
+ movq %rbp, %rsp
+ popq %rbp
+ cfi_def_cfa(7, 8)
+ cfi_restore(6)
+ ret
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+
+/* Special inputs: spill x to 64(%rsp) and the
+ * vector result to 128(%rsp), then patch lanes
+ */
+
+L(SPECIAL_VALUES_BRANCH):
+ vmovups %zmm7, 64(%rsp)
+ vmovups %zmm0, 128(%rsp)
+ # LOE rbx r12 r13 r14 r15 edx zmm0
+
+ xorl %eax, %eax
+ # LOE rbx r12 r13 r14 r15 eax edx
+
+ vzeroupper
+ movq %r12, 16(%rsp)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -176; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x50, 0xff, 0xff, 0xff, 0x22
+ movl %eax, %r12d
+ movq %r13, 8(%rsp)
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -184; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x48, 0xff, 0xff, 0xff, 0x22
+ movl %edx, %r13d
+ movq %r14, (%rsp)
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -192; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x40, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r15 r12d r13d
+
+/* Test bit r12d (lane index)
+ * of the special-lane mask in r13d
+ */
+
+L(RANGEMASK_CHECK):
+ btl %r12d, %r13d
+
+/* Call scalar math function */
+ jc L(SCALAR_MATH_CALL)
+ # LOE rbx r15 r12d r13d
+
+/* Special inputs
+ * processing loop
+ */
+
+L(SPECIAL_VALUES_LOOP):
+ incl %r12d
+ cmpl $8, %r12d
+
+/* Check bits in range mask */
+ jl L(RANGEMASK_CHECK)
+ # LOE rbx r15 r12d r13d
+
+ movq 16(%rsp), %r12
+ cfi_restore(12)
+ movq 8(%rsp), %r13
+ cfi_restore(13)
+ movq (%rsp), %r14
+ cfi_restore(14)
+ vmovups 128(%rsp), %zmm0
+
+/* Go to exit */
+ jmp L(EXIT)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -176; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x50, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -184; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x48, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -192; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x40, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r12 r13 r14 r15 zmm0
+
+/* Scalar math function call
+ * to process special input
+ */
+
+L(SCALAR_MATH_CALL):
+ movl %r12d, %r14d
+ movsd 64(%rsp,%r14,8), %xmm0
+ call log10@PLT
+ # LOE rbx r14 r15 r12d r13d xmm0
+
+ movsd %xmm0, 128(%rsp,%r14,8)
+
+/* Process special inputs in loop */
+ jmp L(SPECIAL_VALUES_LOOP)
+ # LOE rbx r15 r12d r13d
+END(_ZGVeN8v_log10_skx)
+
+ .section .rodata, "a"
+ .align 64
+
+#ifdef __svml_dlog10_data_internal_avx512_typedef
+typedef unsigned int VUINT32;
+typedef struct {
+ __declspec(align(64)) VUINT32 Log_tbl[16][2];
+ __declspec(align(64)) VUINT32 One[8][2];
+ __declspec(align(64)) VUINT32 C075[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff9[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff8[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff7[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff6[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff5[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff4[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff3[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff2[8][2];
+ __declspec(align(64)) VUINT32 poly_coeff1[8][2];
+ __declspec(align(64)) VUINT32 L2[8][2];
+ } __svml_dlog10_data_internal_avx512;
+#endif
+__svml_dlog10_data_internal_avx512:
+ /*== Log_tbl ==*/
+ .quad 0x0000000000000000
+ .quad 0xbf9af5f92b00e610
+ .quad 0xbfaa30a9d609efea
+ .quad 0xbfb31b3055c47118
+ .quad 0xbfb8cf183886480d
+ .quad 0xbfbe3bc1ab0e19fe
+ .quad 0xbfc1b3e71ec94f7b
+ .quad 0xbfc42c7e7fe3fc02
+ .quad 0x3fbffbfc2bbc7803
+ .quad 0x3fbb721cd17157e3
+ .quad 0x3fb715d0ce367afc
+ .quad 0x3fb2e3a740b7800f
+ .quad 0x3fadb11ed766abf4
+ .quad 0x3fa5e3966b7e9295
+ .quad 0x3f9cb38fccd8bfdb
+ .quad 0x3f8c3d0837784c41
+ /*== One ==*/
+ .align 64
+ .quad 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000, 0x3ff0000000000000
+ /*== C075 (0.75) ==*/
+ .align 64
+ .quad 0x3fe8000000000000, 0x3fe8000000000000, 0x3fe8000000000000, 0x3fe8000000000000, 0x3fe8000000000000, 0x3fe8000000000000, 0x3fe8000000000000, 0x3fe8000000000000
+ /*== poly_coeff9 ==*/
+ .align 64
+ .quad 0x3fa8c2d828480370, 0x3fa8c2d828480370, 0x3fa8c2d828480370, 0x3fa8c2d828480370, 0x3fa8c2d828480370, 0x3fa8c2d828480370, 0x3fa8c2d828480370, 0x3fa8c2d828480370
+ /*== poly_coeff8 ==*/
+ .align 64
+ .quad 0xbfabd80d96029814, 0xbfabd80d96029814, 0xbfabd80d96029814, 0xbfabd80d96029814, 0xbfabd80d96029814, 0xbfabd80d96029814, 0xbfabd80d96029814, 0xbfabd80d96029814
+ /*== poly_coeff7 ==*/
+ .align 64
+ .quad 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2, 0x3fafc3f6f38b58a2
+ /*== poly_coeff6 ==*/
+ .align 64
+ .quad 0xbfb287a63464dc80, 0xbfb287a63464dc80, 0xbfb287a63464dc80, 0xbfb287a63464dc80, 0xbfb287a63464dc80, 0xbfb287a63464dc80, 0xbfb287a63464dc80, 0xbfb287a63464dc80
+ /*== poly_coeff5 ==*/
+ .align 64
+ .quad 0x3fb63c62777f27d9, 0x3fb63c62777f27d9, 0x3fb63c62777f27d9, 0x3fb63c62777f27d9, 0x3fb63c62777f27d9, 0x3fb63c62777f27d9, 0x3fb63c62777f27d9, 0x3fb63c62777f27d9
+ /*== poly_coeff4 ==*/
+ .align 64
+ .quad 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3, 0xbfbbcb7b153c06a3
+ /*== poly_coeff3 ==*/
+ .align 64
+ .quad 0x3fc287a7636f428c, 0x3fc287a7636f428c, 0x3fc287a7636f428c, 0x3fc287a7636f428c, 0x3fc287a7636f428c, 0x3fc287a7636f428c, 0x3fc287a7636f428c, 0x3fc287a7636f428c
+ /*== poly_coeff2 ==*/
+ .align 64
+ .quad 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db, 0xbfcbcb7b1526e4db
+ /*== poly_coeff1 ==*/
+ .align 64
+ .quad 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e, 0x3fdbcb7b1526e50e
+ /*== L2 ==*/
+ .align 64
+ .quad 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff, 0x3fd34413509f79ff
+ .align 64
+ .type __svml_dlog10_data_internal_avx512,@object
+ .size __svml_dlog10_data_internal_avx512,.-__svml_dlog10_data_internal_avx512
new file mode 100644
@@ -0,0 +1,20 @@
+/* AVX2 version of vectorized log10f, vector length is 16.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define _ZGVeN16v_log10f _ZGVeN16v_log10f_avx2_wrapper /* renames that symbol in the file included below */
+#include "../svml_s_log10f16_core.S"
new file mode 100644
@@ -0,0 +1,28 @@
+/* Multiple versions of vectorized log10f, vector length is 16.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define SYMBOL_NAME _ZGVeN16v_log10f
+#include "ifunc-mathvec-avx512-skx.h"
+/* IFUNC entry point; REDIRECT_NAME and IFUNC_SELECTOR presumably come from the header above. */
+libc_ifunc_redirected (REDIRECT_NAME, SYMBOL_NAME, IFUNC_SELECTOR ());
+
+#ifdef SHARED
+__hidden_ver1 (_ZGVeN16v_log10f, __GI__ZGVeN16v_log10f,
+ __redirect__ZGVeN16v_log10f)
+ __attribute__ ((visibility ("hidden")));
+#endif /* SHARED */
new file mode 100644
@@ -0,0 +1,238 @@
+/* Function log10f vectorized with AVX-512.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ https://www.gnu.org/licenses/. */
+
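+/*
+ * ALGORITHM DESCRIPTION:
+ *
+ * Get short reciprocal approximation Rcp ~ 1/mantissa(x)
+ * R = Rcp*x - 1.0
+ * log10(x) = k*log10(2.0) - log10(Rcp) + poly_approximation(R)
+ * log10(Rcp) is tabulated
+ *
+ * NOTE(review): the code in this file performs no Rcp multiply; it forms R = mantissa(x) - 1.0 and
+ * selects per-interval polynomial coefficients with vpermps, indexed by mantissa bits.
+ */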
+
+/* Offsets for data table __svml_slog10_data_internal_avx512
+ */
+#define One 0
+#define coeff4 64
+#define coeff3 128
+#define coeff2 192
+#define coeff1 256
+#define L2 320
+
+#include <sysdep.h>
+
+ .text
+ .section .text.evex512,"ax",@progbits
+ENTRY(_ZGVeN16v_log10f_skx)
+ pushq %rbp
+ cfi_def_cfa_offset(16)
+ movq %rsp, %rbp
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+ andq $-64, %rsp /* 64-byte aligned frame; the special path below uses 0..16(%rsp) for r14/r13/r12, 64(%rsp) for the input and 128(%rsp) for the result */
+ subq $192, %rsp
+ vgetmantps $11, {sae}, %zmm0, %zmm3 /* zmm3 = normalized mantissa of x */
+ vmovups __svml_slog10_data_internal_avx512(%rip), %zmm1 /* zmm1 = One (table offset 0) */
+ vgetexpps {sae}, %zmm0, %zmm5 /* zmm5 = exponent of x */
+ vmovups L2+__svml_slog10_data_internal_avx512(%rip), %zmm10 /* zmm10 = L2 constant */
+ vpsrld $19, %zmm3, %zmm7 /* zmm7 = coefficient table index taken from the mantissa bits */
+ vgetexpps {sae}, %zmm3, %zmm6 /* zmm6 = exponent of the normalized mantissa */
+ vsubps {rn-sae}, %zmm1, %zmm3, %zmm11 /* zmm11 = R = mantissa - One */
+ vpermps coeff4+__svml_slog10_data_internal_avx512(%rip), %zmm7, %zmm1 /* zmm1 = coeff4[index] */
+ vpermps coeff3+__svml_slog10_data_internal_avx512(%rip), %zmm7, %zmm2 /* zmm2 = coeff3[index] */
+ vsubps {rn-sae}, %zmm6, %zmm5, %zmm9 /* zmm9 = k = exponent(x) - exponent(mantissa) */
+ vpermps coeff2+__svml_slog10_data_internal_avx512(%rip), %zmm7, %zmm4 /* zmm4 = coeff2[index] */
+ vpermps coeff1+__svml_slog10_data_internal_avx512(%rip), %zmm7, %zmm8 /* zmm8 = coeff1[index] */
+
+/* Special-input mask: vfpclassps imm 94 (0x5e) flags +/-0, +/-Inf and negative finite lanes (x <= 0 or infinite) */
+ vfpclassps $94, %zmm0, %k0
+ vfmadd213ps {rn-sae}, %zmm2, %zmm11, %zmm1 /* zmm1 = coeff4*R + coeff3 */
+ vmulps {rn-sae}, %zmm10, %zmm9, %zmm12 /* zmm12 = k * L2 */
+ vfmadd213ps {rn-sae}, %zmm4, %zmm11, %zmm1 /* zmm1 = zmm1*R + coeff2 */
+ kmovw %k0, %edx /* edx = 16-bit mask of lanes needing the scalar fallback */
+ vfmadd213ps {rn-sae}, %zmm8, %zmm11, %zmm1 /* zmm1 = zmm1*R + coeff1 */
+ vfmadd213ps {rn-sae}, %zmm12, %zmm11, %zmm1 /* zmm1 = zmm1*R + k*L2: the fast-path result */
+ testl %edx, %edx
+
+/* Go to special inputs processing branch */
+ jne L(SPECIAL_VALUES_BRANCH)
+ # LOE rbx r12 r13 r14 r15 edx zmm0 zmm1
+
+/* Restore registers
+ * and exit the function
+ */
+
+L(EXIT):
+ vmovaps %zmm1, %zmm0
+ movq %rbp, %rsp
+ popq %rbp
+ cfi_def_cfa(7, 8)
+ cfi_restore(6)
+ ret
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+
+/* Branch to process
+ * special inputs
+ */
+
+L(SPECIAL_VALUES_BRANCH):
+ vmovups %zmm0, 64(%rsp) /* spill the input vector */
+ vmovups %zmm1, 128(%rsp) /* spill the fast-path result; flagged lanes are overwritten below */
+ # LOE rbx r12 r13 r14 r15 edx zmm1
+
+ xorl %eax, %eax
+ # LOE rbx r12 r13 r14 r15 eax edx
+
+ vzeroupper
+ movq %r12, 16(%rsp)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -176; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x50, 0xff, 0xff, 0xff, 0x22
+ movl %eax, %r12d /* r12d = lane index, starting at 0 */
+ movq %r13, 8(%rsp)
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -184; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x48, 0xff, 0xff, 0xff, 0x22
+ movl %edx, %r13d /* r13d = special-lane mask */
+ movq %r14, (%rsp)
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -192; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x40, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r15 r12d r13d
+
+/* Range mask
+ * bits check
+ */
+
+L(RANGEMASK_CHECK):
+ btl %r12d, %r13d /* CF = mask bit for the current lane */
+
+/* Call scalar math function */
+ jc L(SCALAR_MATH_CALL)
+ # LOE rbx r15 r12d r13d
+
+/* Special inputs
+ * processing loop
+ */
+
+L(SPECIAL_VALUES_LOOP):
+ incl %r12d
+ cmpl $16, %r12d /* 16 float lanes per zmm register */
+
+/* Check bits in range mask */
+ jl L(RANGEMASK_CHECK)
+ # LOE rbx r15 r12d r13d
+
+ movq 16(%rsp), %r12
+ cfi_restore(12)
+ movq 8(%rsp), %r13
+ cfi_restore(13)
+ movq (%rsp), %r14
+ cfi_restore(14)
+ vmovups 128(%rsp), %zmm1 /* reload the result with the scalar fix-ups merged in */
+
+/* Go to exit */
+ jmp L(EXIT)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -176; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x50, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -184; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x48, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -64; DW_OP_and; DW_OP_const4s: -192; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xc0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0x40, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r12 r13 r14 r15 zmm1
+
+/* Scalar math function call
+ * to process special input
+ */
+
+L(SCALAR_MATH_CALL):
+ movl %r12d, %r14d
+ movss 64(%rsp,%r14,4), %xmm0 /* load the flagged input lane */
+ call log10f@PLT
+ # LOE rbx r14 r15 r12d r13d xmm0
+
+ movss %xmm0, 128(%rsp,%r14,4) /* overwrite that lane of the spilled result */
+
+/* Process special inputs in loop */
+ jmp L(SPECIAL_VALUES_LOOP)
+ # LOE rbx r15 r12d r13d
+END(_ZGVeN16v_log10f_skx)
+
+ .section .rodata, "a"
+ .align 64
+
+#ifdef __svml_slog10_data_internal_avx512_typedef
+typedef unsigned int VUINT32;
+typedef struct {
+ __declspec(align(64)) VUINT32 One[16][1];
+ __declspec(align(64)) VUINT32 coeff4[16][1];
+ __declspec(align(64)) VUINT32 coeff3[16][1];
+ __declspec(align(64)) VUINT32 coeff2[16][1];
+ __declspec(align(64)) VUINT32 coeff1[16][1];
+ __declspec(align(64)) VUINT32 L2[16][1];
+ } __svml_slog10_data_internal_avx512;
+#endif /* __svml_slog10_data_internal_avx512_typedef -- NOTE(review): appears to be layout documentation only; the typedef is C, not assembler input.  */
+__svml_slog10_data_internal_avx512:
+ /*== One: SP 1.0 in all 16 lanes ==*/
+ .long 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000
+ /*== coeff4: 16 entries, one per table index ==*/
+ .align 64
+ .long 0xbdc9ae9b, 0xbda6fcf4
+ .long 0xbd8bac76, 0xbd6bca30
+ .long 0xbd48a99b, 0xbd2c0a9f
+ .long 0xbd1480db, 0xbd00faf2
+ .long 0xbe823aa9, 0xbe656348
+ .long 0xbe4afbb9, 0xbe346895
+ .long 0xbe20ffff, 0xbe103a0b
+ .long 0xbe01a91c, 0xbde9e84e
+ /*== coeff3: 16 entries, one per table index ==*/
+ .align 64
+ .long 0x3e13d888, 0x3e10a87c
+ .long 0x3e0b95c3, 0x3e057f0b
+ .long 0x3dfde038, 0x3df080d9
+ .long 0x3de34c1e, 0x3dd68333
+ .long 0x3dac6e8e, 0x3dd54a51
+ .long 0x3df30f40, 0x3e04235d
+ .long 0x3e0b7033, 0x3e102c90
+ .long 0x3e12ebad, 0x3e141ff8
+ /*== coeff2: 16 entries, one per table index ==*/
+ .align 64
+ .long 0xbe5e5a9b, 0xbe5e2677
+ .long 0xbe5d83f5, 0xbe5c6016
+ .long 0xbe5abd0b, 0xbe58a6fd
+ .long 0xbe562e02, 0xbe5362f8
+ .long 0xbe68e27c, 0xbe646747
+ .long 0xbe619a73, 0xbe5ff05a
+ .long 0xbe5f0570, 0xbe5e92d0
+ .long 0xbe5e662b, 0xbe5e5c08
+ /*== coeff1: 16 entries, one per table index ==*/
+ .align 64
+ .long 0x3ede5bd8, 0x3ede5b45
+ .long 0x3ede57d8, 0x3ede4eb1
+ .long 0x3ede3d37, 0x3ede2166
+ .long 0x3eddf9d9, 0x3eddc5bb
+ .long 0x3ede08ed, 0x3ede32e7
+ .long 0x3ede4967, 0x3ede5490
+ .long 0x3ede597f, 0x3ede5b50
+ .long 0x3ede5bca, 0x3ede5bd9
+ /*== L2: SP value ~= log10(2), multiplied by the exponent k ==*/
+ .align 64
+ .long 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b
+ .align 64
+ .type __svml_slog10_data_internal_avx512,@object
+ .size __svml_slog10_data_internal_avx512,.-__svml_slog10_data_internal_avx512
new file mode 100644
@@ -0,0 +1,20 @@
+/* SSE2 version of vectorized log10f, vector length is 4.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define _ZGVbN4v_log10f _ZGVbN4v_log10f_sse2 /* Every later use of _ZGVbN4v_log10f, including in the file included below, expands to the _sse2 name.  */
+#include "../svml_s_log10f4_core.S"
new file mode 100644
@@ -0,0 +1,28 @@
+/* Multiple versions of vectorized log10f, vector length is 4.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define SYMBOL_NAME _ZGVbN4v_log10f /* Symbol name handed to libc_ifunc_redirected below.  */
+#include "ifunc-mathvec-sse4_1.h" /* NOTE(review): presumably provides REDIRECT_NAME and IFUNC_SELECTOR used below -- confirm in the header.  */
+
+libc_ifunc_redirected (REDIRECT_NAME, SYMBOL_NAME, IFUNC_SELECTOR ());
+
+#ifdef SHARED
+__hidden_ver1 (_ZGVbN4v_log10f, __GI__ZGVbN4v_log10f,
+ __redirect__ZGVbN4v_log10f)
+ __attribute__ ((visibility ("hidden")));
+#endif /* SHARED */
new file mode 100644
@@ -0,0 +1,243 @@
+/* Function log10f vectorized with SSE4.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ https://www.gnu.org/licenses/. */
+
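+/*
+ * ALGORITHM DESCRIPTION:
+ *
+ * Get short reciprocal approximation Rcp ~ 1/mantissa(x)
+ * R = Rcp*x - 1.0
+ * log10(x) = k*log10(2.0) - log10(Rcp) + poly_approximation(R)
+ * log10(Rcp) is tabulated
+ *
+ * NOTE(review): the code in this file uses no Rcp or table lookup; it re-biases x by iBrkValue to split
+ * off the exponent k, sets R = reduced mantissa - 1.0 and evaluates the sPoly polynomial in R.
+ */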
+
+/* Offsets for data table __svml_slog10_data_internal
+ */
+#define MinNorm 0
+#define MaxNorm 16
+#define L2H 32
+#define L2L 48
+#define iBrkValue 64
+#define iOffExpoMask 80
+#define One 96
+#define sPoly 112
+#define L2 256
+
+#include <sysdep.h>
+
+ .text
+ .section .text.sse4,"ax",@progbits
+ENTRY(_ZGVbN4v_log10f_sse4)
+ subq $72, %rsp /* frame: 0..16(%rsp) hold r14/r13/r12, 32(%rsp) the input, 48(%rsp) the result (special path only) */
+ cfi_def_cfa_offset(80)
+ movaps %xmm0, %xmm1
+
+/* reduction: compute r,n */
+ movdqu iBrkValue+__svml_slog10_data_internal(%rip), %xmm2
+ movaps %xmm0, %xmm4
+ movdqu iOffExpoMask+__svml_slog10_data_internal(%rip), %xmm10
+ psubd %xmm2, %xmm1 /* integer subtract: x bits - iBrkValue */
+ pand %xmm1, %xmm10 /* keep the significand field of the difference */
+ psrad $23, %xmm1 /* xmm1 = integer exponent n */
+ paddd %xmm2, %xmm10 /* xmm10 = reduced argument bits (significand + iBrkValue) */
+ movaps %xmm0, %xmm3
+ movups sPoly+__svml_slog10_data_internal(%rip), %xmm5
+ movups sPoly+32+__svml_slog10_data_internal(%rip), %xmm6
+ movups sPoly+64+__svml_slog10_data_internal(%rip), %xmm7
+ movups sPoly+96+__svml_slog10_data_internal(%rip), %xmm9
+ cvtdq2ps %xmm1, %xmm12 /* xmm12 = (float) n */
+ cmpltps MinNorm+__svml_slog10_data_internal(%rip), %xmm4 /* xmm4 = lanes with x < MinNorm */
+ cmpnleps MaxNorm+__svml_slog10_data_internal(%rip), %xmm3 /* xmm3 = lanes where x <= MaxNorm does not hold */
+ subps One+__svml_slog10_data_internal(%rip), %xmm10 /* xmm10 = r = reduced argument - One */
+ mulps %xmm10, %xmm5
+ movaps %xmm10, %xmm8
+ mulps %xmm10, %xmm6
+ mulps %xmm10, %xmm8 /* xmm8 = r*r */
+ addps sPoly+16+__svml_slog10_data_internal(%rip), %xmm5
+ mulps %xmm10, %xmm7
+ addps sPoly+48+__svml_slog10_data_internal(%rip), %xmm6
+ mulps %xmm10, %xmm9
+ mulps %xmm8, %xmm5
+ addps sPoly+80+__svml_slog10_data_internal(%rip), %xmm7
+ addps sPoly+112+__svml_slog10_data_internal(%rip), %xmm9
+ addps %xmm5, %xmm6
+ mulps %xmm8, %xmm6
+ orps %xmm3, %xmm4 /* xmm4 = union of the two out-of-range masks */
+
+/* combine and get argument value range mask */
+ movmskps %xmm4, %edx /* edx = 4-bit mask of lanes needing the scalar fallback */
+ movups L2L+__svml_slog10_data_internal(%rip), %xmm1
+ addps %xmm6, %xmm7
+ mulps %xmm12, %xmm1 /* xmm1 = n * L2L */
+ mulps %xmm7, %xmm8
+ movups L2H+__svml_slog10_data_internal(%rip), %xmm11
+ addps %xmm8, %xmm9
+ mulps %xmm11, %xmm12 /* xmm12 = n * L2H */
+ mulps %xmm10, %xmm9
+ addps sPoly+128+__svml_slog10_data_internal(%rip), %xmm9
+ mulps %xmm9, %xmm10 /* xmm10 = r * poly(r) */
+ addps %xmm10, %xmm1
+ addps %xmm12, %xmm1 /* xmm1 = n*L2H + (n*L2L + r*poly(r)): the fast-path result */
+ testl %edx, %edx
+
+/* Go to special inputs processing branch */
+ jne L(SPECIAL_VALUES_BRANCH)
+ # LOE rbx rbp r12 r13 r14 r15 edx xmm0 xmm1
+
+/* Restore registers
+ * and exit the function
+ */
+
+L(EXIT):
+ movaps %xmm1, %xmm0
+ addq $72, %rsp
+ cfi_def_cfa_offset(8)
+ ret
+ cfi_def_cfa_offset(80)
+
+/* Branch to process
+ * special inputs
+ */
+
+L(SPECIAL_VALUES_BRANCH):
+ movups %xmm0, 32(%rsp) /* spill the input vector */
+ movups %xmm1, 48(%rsp) /* spill the fast-path result; flagged lanes are overwritten below */
+ # LOE rbx rbp r12 r13 r14 r15 edx
+
+ xorl %eax, %eax
+ movq %r12, 16(%rsp)
+ cfi_offset(12, -64)
+ movl %eax, %r12d /* r12d = lane index, starting at 0 */
+ movq %r13, 8(%rsp)
+ cfi_offset(13, -72)
+ movl %edx, %r13d /* r13d = special-lane mask */
+ movq %r14, (%rsp)
+ cfi_offset(14, -80)
+ # LOE rbx rbp r15 r12d r13d
+
+/* Range mask
+ * bits check
+ */
+
+L(RANGEMASK_CHECK):
+ btl %r12d, %r13d /* CF = mask bit for the current lane */
+
+/* Call scalar math function */
+ jc L(SCALAR_MATH_CALL)
+ # LOE rbx rbp r15 r12d r13d
+
+/* Special inputs
+ * processing loop
+ */
+
+L(SPECIAL_VALUES_LOOP):
+ incl %r12d
+ cmpl $4, %r12d /* 4 float lanes per xmm register */
+
+/* Check bits in range mask */
+ jl L(RANGEMASK_CHECK)
+ # LOE rbx rbp r15 r12d r13d
+
+ movq 16(%rsp), %r12
+ cfi_restore(12)
+ movq 8(%rsp), %r13
+ cfi_restore(13)
+ movq (%rsp), %r14
+ cfi_restore(14)
+ movups 48(%rsp), %xmm1 /* reload the result with the scalar fix-ups merged in */
+
+/* Go to exit */
+ jmp L(EXIT)
+ cfi_offset(12, -64)
+ cfi_offset(13, -72)
+ cfi_offset(14, -80)
+ # LOE rbx rbp r12 r13 r14 r15 xmm1
+
+/* Scalar math function call
+ * to process special input
+ */
+
+L(SCALAR_MATH_CALL):
+ movl %r12d, %r14d
+ movss 32(%rsp,%r14,4), %xmm0 /* load the flagged input lane */
+ call log10f@PLT
+ # LOE rbx rbp r14 r15 r12d r13d xmm0
+
+ movss %xmm0, 48(%rsp,%r14,4) /* overwrite that lane of the spilled result */
+
+/* Process special inputs in loop */
+ jmp L(SPECIAL_VALUES_LOOP)
+ # LOE rbx rbp r15 r12d r13d
+END(_ZGVbN4v_log10f_sse4)
+
+ .section .rodata, "a"
+ .align 16
+
+#ifdef __svml_slog10_data_internal_typedef
+typedef unsigned int VUINT32;
+typedef struct {
+ __declspec(align(16)) VUINT32 MinNorm[4][1];
+ __declspec(align(16)) VUINT32 MaxNorm[4][1];
+ __declspec(align(16)) VUINT32 L2H[4][1];
+ __declspec(align(16)) VUINT32 L2L[4][1];
+ __declspec(align(16)) VUINT32 iBrkValue[4][1];
+ __declspec(align(16)) VUINT32 iOffExpoMask[4][1];
+ __declspec(align(16)) VUINT32 One[4][1];
+ __declspec(align(16)) VUINT32 sPoly[9][4][1];
+ __declspec(align(16)) VUINT32 L2[4][1];
+} __svml_slog10_data_internal;
+#endif /* __svml_slog10_data_internal_typedef -- NOTE(review): appears to be layout documentation only; the typedef is C, not assembler input.  */
+__svml_slog10_data_internal:
+ /*== MinNorm = smallest normal SP value; inputs below it take the scalar path ==*/
+ .long 0x00800000, 0x00800000, 0x00800000, 0x00800000
+ /*== MaxNorm = largest finite SP value; inputs not <= it take the scalar path ==*/
+ .align 16
+ .long 0x7f7fffff, 0x7f7fffff, 0x7f7fffff, 0x7f7fffff
+ /*== L2H (L2H + L2L ~= log10(2)) ==*/
+ .align 16
+ .long 0x3e9a2100, 0x3e9a2100, 0x3e9a2100, 0x3e9a2100
+ /*== L2L ==*/
+ .align 16
+ .long 0xb64AF600, 0xb64AF600, 0xb64AF600, 0xb64AF600
+ /*== iBrkValue = SP 2/3 ==*/
+ .align 16
+ .long 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab
+ /*== iOffExpoMask = SP significand mask ==*/
+ .align 16
+ .long 0x007fffff, 0x007fffff, 0x007fffff, 0x007fffff
+ /*== One = SP 1.0 ==*/
+ .align 16
+ .long 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000
+ /*== sPoly[9]: one 16-byte row per coefficient, coeff9 first ==*/
+ .align 16
+ .long 0x3d8063B4, 0x3d8063B4, 0x3d8063B4, 0x3d8063B4 /* coeff9 */
+ .long 0xbd890073, 0xbd890073, 0xbd890073, 0xbd890073 /* coeff8 */
+ .long 0x3d775317, 0x3d775317, 0x3d775317, 0x3d775317 /* coeff7 */
+ .long 0xbd91FB27, 0xbd91FB27, 0xbd91FB27, 0xbd91FB27 /* coeff6 */
+ .long 0x3dB20B96, 0x3dB20B96, 0x3dB20B96, 0x3dB20B96 /* coeff5 */
+ .long 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20 /* coeff4 */
+ .long 0x3e143CE5, 0x3e143CE5, 0x3e143CE5, 0x3e143CE5 /* coeff3 */
+ .long 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5 /* coeff2 */
+ .long 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9 /* coeff1 */
+ /*== L2 (not referenced by the code in this file, which uses L2H/L2L) ==*/
+ .align 16
+ .long 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b
+ .align 16
+ .type __svml_slog10_data_internal,@object
+ .size __svml_slog10_data_internal,.-__svml_slog10_data_internal
new file mode 100644
@@ -0,0 +1,20 @@
+/* SSE version of vectorized log10f, vector length is 8.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define _ZGVdN8v_log10f _ZGVdN8v_log10f_sse_wrapper /* Every later use of _ZGVdN8v_log10f, including in the file included below, expands to the _sse_wrapper name.  */
+#include "../svml_s_log10f8_core.S"
new file mode 100644
@@ -0,0 +1,28 @@
+/* Multiple versions of vectorized log10f, vector length is 8.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#define SYMBOL_NAME _ZGVdN8v_log10f /* Symbol name handed to libc_ifunc_redirected below.  */
+#include "ifunc-mathvec-avx2.h" /* NOTE(review): presumably provides REDIRECT_NAME and IFUNC_SELECTOR used below -- confirm in the header.  */
+
+libc_ifunc_redirected (REDIRECT_NAME, SYMBOL_NAME, IFUNC_SELECTOR ());
+
+#ifdef SHARED
+__hidden_ver1 (_ZGVdN8v_log10f, __GI__ZGVdN8v_log10f,
+ __redirect__ZGVdN8v_log10f)
+ __attribute__ ((visibility ("hidden")));
+#endif /* SHARED */
new file mode 100644
@@ -0,0 +1,243 @@
+/* Function log10f vectorized with AVX2.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ https://www.gnu.org/licenses/. */
+
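+/*
+ * ALGORITHM DESCRIPTION:
+ *
+ * Get short reciprocal approximation Rcp ~ 1/mantissa(x)
+ * R = Rcp*x - 1.0
+ * log10(x) = k*log10(2.0) - log10(Rcp) + poly_approximation(R)
+ * log10(Rcp) is tabulated
+ *
+ * NOTE(review): the code in this file uses no Rcp or table lookup; it re-biases x by iBrkValue to split
+ * off the exponent k, sets R = reduced mantissa - 1.0 and evaluates the sPoly polynomial in R.
+ */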
+
+/* Offsets for data table __svml_slog10_data_internal
+ */
+#define MinNorm 0
+#define MaxNorm 32
+#define L2H 64
+#define L2L 96
+#define iBrkValue 128
+#define iOffExpoMask 160
+#define One 192
+#define sPoly 224
+#define L2 512
+
+#include <sysdep.h>
+
+ .text
+ .section .text.avx2,"ax",@progbits
+ENTRY(_ZGVdN8v_log10f_avx2)
+ pushq %rbp
+ cfi_def_cfa_offset(16)
+ movq %rsp, %rbp
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+ andq $-32, %rsp /* 32-byte aligned frame; the special path below uses 0..16(%rsp) for r14/r13/r12, 32(%rsp) for the input and 64(%rsp) for the result */
+ subq $96, %rsp
+
+/* reduction: compute r,n */
+ vmovups iBrkValue+__svml_slog10_data_internal(%rip), %ymm4
+ vmovups sPoly+__svml_slog10_data_internal(%rip), %ymm15
+ vmovups sPoly+64+__svml_slog10_data_internal(%rip), %ymm9
+ vmovups sPoly+128+__svml_slog10_data_internal(%rip), %ymm10
+ vmovups sPoly+192+__svml_slog10_data_internal(%rip), %ymm12
+ vpsubd %ymm4, %ymm0, %ymm1 /* integer subtract: x bits - iBrkValue */
+ vcmplt_oqps MinNorm+__svml_slog10_data_internal(%rip), %ymm0, %ymm5 /* ymm5 = lanes with x < MinNorm */
+ vcmpnle_uqps MaxNorm+__svml_slog10_data_internal(%rip), %ymm0, %ymm6 /* ymm6 = lanes where x <= MaxNorm does not hold */
+ vpand iOffExpoMask+__svml_slog10_data_internal(%rip), %ymm1, %ymm3 /* keep the significand field of the difference */
+ vpsrad $23, %ymm1, %ymm2 /* ymm2 = integer exponent n */
+ vpaddd %ymm4, %ymm3, %ymm8 /* ymm8 = reduced argument bits (significand + iBrkValue) */
+ vcvtdq2ps %ymm2, %ymm1 /* ymm1 = (float) n */
+ vsubps One+__svml_slog10_data_internal(%rip), %ymm8, %ymm13 /* ymm13 = r = reduced argument - One */
+ vmulps L2L+__svml_slog10_data_internal(%rip), %ymm1, %ymm14 /* ymm14 = n * L2L */
+ vfmadd213ps sPoly+32+__svml_slog10_data_internal(%rip), %ymm13, %ymm15
+ vfmadd213ps sPoly+96+__svml_slog10_data_internal(%rip), %ymm13, %ymm9
+ vmulps %ymm13, %ymm13, %ymm11 /* ymm11 = r*r */
+ vfmadd213ps sPoly+160+__svml_slog10_data_internal(%rip), %ymm13, %ymm10
+ vfmadd213ps sPoly+224+__svml_slog10_data_internal(%rip), %ymm13, %ymm12
+ vfmadd213ps %ymm9, %ymm11, %ymm15
+ vfmadd213ps %ymm10, %ymm11, %ymm15
+ vfmadd213ps %ymm12, %ymm11, %ymm15
+ vfmadd213ps sPoly+256+__svml_slog10_data_internal(%rip), %ymm13, %ymm15 /* ymm15 = poly(r) */
+ vfmadd213ps %ymm14, %ymm13, %ymm15 /* ymm15 = r*poly(r) + n*L2L */
+ vorps %ymm6, %ymm5, %ymm7 /* ymm7 = union of the two out-of-range masks */
+
+/* combine and get argument value range mask */
+ vmovmskps %ymm7, %edx /* edx = 8-bit mask of lanes needing the scalar fallback */
+ vfmadd132ps L2H+__svml_slog10_data_internal(%rip), %ymm15, %ymm1 /* ymm1 = n*L2H + ymm15: the fast-path result */
+ testl %edx, %edx
+
+/* Go to special inputs processing branch */
+ jne L(SPECIAL_VALUES_BRANCH)
+ # LOE rbx r12 r13 r14 r15 edx ymm0 ymm1
+
+/* Restore registers
+ * and exit the function
+ */
+
+L(EXIT):
+ vmovaps %ymm1, %ymm0
+ movq %rbp, %rsp
+ popq %rbp
+ cfi_def_cfa(7, 8)
+ cfi_restore(6)
+ ret
+ cfi_def_cfa(6, 16)
+ cfi_offset(6, -16)
+
+/* Branch to process
+ * special inputs
+ */
+
+L(SPECIAL_VALUES_BRANCH):
+ vmovups %ymm0, 32(%rsp) /* spill the input vector */
+ vmovups %ymm1, 64(%rsp) /* spill the fast-path result; flagged lanes are overwritten below */
+ # LOE rbx r12 r13 r14 r15 edx ymm1
+
+ xorl %eax, %eax
+ # LOE rbx r12 r13 r14 r15 eax edx
+
+ vzeroupper
+ movq %r12, 16(%rsp)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -80; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xb0, 0xff, 0xff, 0xff, 0x22
+ movl %eax, %r12d /* r12d = lane index, starting at 0 */
+ movq %r13, 8(%rsp)
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -88; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa8, 0xff, 0xff, 0xff, 0x22
+ movl %edx, %r13d /* r13d = special-lane mask */
+ movq %r14, (%rsp)
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -96; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa0, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r15 r12d r13d
+
+/* Range mask
+ * bits check
+ */
+
+L(RANGEMASK_CHECK):
+ btl %r12d, %r13d /* CF = mask bit for the current lane */
+
+/* Call scalar math function */
+ jc L(SCALAR_MATH_CALL)
+ # LOE rbx r15 r12d r13d
+
+/* Special inputs
+ * processing loop
+ */
+
+L(SPECIAL_VALUES_LOOP):
+ incl %r12d
+ cmpl $8, %r12d /* 8 float lanes per ymm register */
+
+/* Check bits in range mask */
+ jl L(RANGEMASK_CHECK)
+ # LOE rbx r15 r12d r13d
+
+ movq 16(%rsp), %r12
+ cfi_restore(12)
+ movq 8(%rsp), %r13
+ cfi_restore(13)
+ movq (%rsp), %r14
+ cfi_restore(14)
+ vmovups 64(%rsp), %ymm1 /* reload the result with the scalar fix-ups merged in */
+
+/* Go to exit */
+ jmp L(EXIT)
+ /* DW_CFA_expression: r12 (r12) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -80; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0c, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xb0, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r13 (r13) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -88; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0d, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa8, 0xff, 0xff, 0xff, 0x22
+ /* DW_CFA_expression: r14 (r14) (DW_OP_lit8; DW_OP_minus; DW_OP_const4s: -32; DW_OP_and; DW_OP_const4s: -96; DW_OP_plus) */
+ .cfi_escape 0x10, 0x0e, 0x0e, 0x38, 0x1c, 0x0d, 0xe0, 0xff, 0xff, 0xff, 0x1a, 0x0d, 0xa0, 0xff, 0xff, 0xff, 0x22
+ # LOE rbx r12 r13 r14 r15 ymm1
+
+/* Scalar math function call
+ * to process special input
+ */
+
+L(SCALAR_MATH_CALL):
+ movl %r12d, %r14d
+ movss 32(%rsp,%r14,4), %xmm0 /* load the flagged input lane */
+ call log10f@PLT
+ # LOE rbx r14 r15 r12d r13d xmm0
+
+ movss %xmm0, 64(%rsp,%r14,4) /* overwrite that lane of the spilled result */
+
+/* Process special inputs in loop */
+ jmp L(SPECIAL_VALUES_LOOP)
+ # LOE rbx r15 r12d r13d
+END(_ZGVdN8v_log10f_avx2)
+
+ .section .rodata, "a"
+ .align 32
+
+#ifdef __svml_slog10_data_internal_typedef
+typedef unsigned int VUINT32;
+typedef struct {
+ __declspec(align(32)) VUINT32 MinNorm[8][1];
+ __declspec(align(32)) VUINT32 MaxNorm[8][1];
+ __declspec(align(32)) VUINT32 L2H[8][1];
+ __declspec(align(32)) VUINT32 L2L[8][1];
+ __declspec(align(32)) VUINT32 iBrkValue[8][1];
+ __declspec(align(32)) VUINT32 iOffExpoMask[8][1];
+ __declspec(align(32)) VUINT32 One[8][1];
+ __declspec(align(32)) VUINT32 sPoly[9][8][1];
+ __declspec(align(32)) VUINT32 L2[8][1];
+} __svml_slog10_data_internal;
+#endif /* __svml_slog10_data_internal_typedef -- NOTE(review): appears to be layout documentation only; the typedef is C, not assembler input.  */
+__svml_slog10_data_internal:
+ /*== MinNorm = smallest normal SP value; inputs below it take the scalar path ==*/
+ .long 0x00800000, 0x00800000, 0x00800000, 0x00800000, 0x00800000, 0x00800000, 0x00800000, 0x00800000
+ /*== MaxNorm = largest finite SP value; inputs not <= it take the scalar path ==*/
+ .align 32
+ .long 0x7f7fffff, 0x7f7fffff, 0x7f7fffff, 0x7f7fffff, 0x7f7fffff, 0x7f7fffff, 0x7f7fffff, 0x7f7fffff
+ /*== L2H (L2H + L2L ~= log10(2)) ==*/
+ .align 32
+ .long 0x3e9a2100, 0x3e9a2100, 0x3e9a2100, 0x3e9a2100, 0x3e9a2100, 0x3e9a2100, 0x3e9a2100, 0x3e9a2100
+ /*== L2L ==*/
+ .align 32
+ .long 0xb64AF600, 0xb64AF600, 0xb64AF600, 0xb64AF600, 0xb64AF600, 0xb64AF600, 0xb64AF600, 0xb64AF600
+ /*== iBrkValue = SP 2/3 ==*/
+ .align 32
+ .long 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab, 0x3f2aaaab
+ /*== iOffExpoMask = SP significand mask ==*/
+ .align 32
+ .long 0x007fffff, 0x007fffff, 0x007fffff, 0x007fffff, 0x007fffff, 0x007fffff, 0x007fffff, 0x007fffff
+ /*== One = SP 1.0 ==*/
+ .align 32
+ .long 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000, 0x3f800000
+ /*== sPoly[9]: one 32-byte row per coefficient, coeff9 first ==*/
+ .align 32
+ .long 0x3d8063B4, 0x3d8063B4, 0x3d8063B4, 0x3d8063B4, 0x3d8063B4, 0x3d8063B4, 0x3d8063B4, 0x3d8063B4 /* coeff9 */
+ .long 0xbd890073, 0xbd890073, 0xbd890073, 0xbd890073, 0xbd890073, 0xbd890073, 0xbd890073, 0xbd890073 /* coeff8 */
+ .long 0x3d775317, 0x3d775317, 0x3d775317, 0x3d775317, 0x3d775317, 0x3d775317, 0x3d775317, 0x3d775317 /* coeff7 */
+ .long 0xbd91FB27, 0xbd91FB27, 0xbd91FB27, 0xbd91FB27, 0xbd91FB27, 0xbd91FB27, 0xbd91FB27, 0xbd91FB27 /* coeff6 */
+ .long 0x3dB20B96, 0x3dB20B96, 0x3dB20B96, 0x3dB20B96, 0x3dB20B96, 0x3dB20B96, 0x3dB20B96, 0x3dB20B96 /* coeff5 */
+ .long 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20, 0xbdDE6E20 /* coeff4 */
+ .long 0x3e143CE5, 0x3e143CE5, 0x3e143CE5, 0x3e143CE5, 0x3e143CE5, 0x3e143CE5, 0x3e143CE5, 0x3e143CE5 /* coeff3 */
+ .long 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5, 0xbe5E5BC5 /* coeff2 */
+ .long 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9, 0x3eDE5BD9 /* coeff1 */
+ /*== L2 (not referenced by the code in this file, which uses L2H/L2L) ==*/
+ .align 32
+ .long 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b, 0x3e9a209b
+ .align 32
+ .type __svml_slog10_data_internal,@object
+ .size __svml_slog10_data_internal,.-__svml_slog10_data_internal
new file mode 100644
@@ -0,0 +1,29 @@
+/* Function log10 vectorized with SSE2, wrapper version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_d_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVbN2v_log10)
+WRAPPER_IMPL_SSE2 log10 /* body comes from the wrapper macro, given the scalar log10; NOTE(review): macro presumably defined in svml_d_wrapper_impl.h -- confirm */
+END (_ZGVbN2v_log10)
+
+#ifndef USE_MULTIARCH
+ libmvec_hidden_def (_ZGVbN2v_log10)
+#endif /* !USE_MULTIARCH */
new file mode 100644
@@ -0,0 +1,29 @@
+/* Function log10 vectorized with AVX2, wrapper version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_d_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVdN4v_log10)
+WRAPPER_IMPL_AVX _ZGVbN2v_log10 /* body comes from the wrapper macro, given the 2-lane _ZGVbN2v_log10; NOTE(review): macro presumably defined in svml_d_wrapper_impl.h -- confirm */
+END (_ZGVdN4v_log10)
+
+#ifndef USE_MULTIARCH
+ libmvec_hidden_def (_ZGVdN4v_log10)
+#endif /* !USE_MULTIARCH */
new file mode 100644
@@ -0,0 +1,25 @@
+/* Function log10 vectorized in AVX ISA as wrapper to SSE4 ISA version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_d_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVcN4v_log10)
+WRAPPER_IMPL_AVX _ZGVbN2v_log10 /* body comes from the wrapper macro, given the 2-lane _ZGVbN2v_log10; NOTE(review): macro presumably defined in svml_d_wrapper_impl.h -- confirm */
+END (_ZGVcN4v_log10)
new file mode 100644
@@ -0,0 +1,25 @@
+/* Function log10 vectorized with AVX-512, wrapper to AVX2.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_d_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVeN8v_log10)
+WRAPPER_IMPL_AVX512 _ZGVdN4v_log10 /* body comes from the wrapper macro, given the 4-lane _ZGVdN4v_log10; NOTE(review): macro presumably defined in svml_d_wrapper_impl.h -- confirm */
+END (_ZGVeN8v_log10)
new file mode 100644
@@ -0,0 +1,25 @@
+/* Function log10f vectorized with AVX-512. Wrapper to AVX2 version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_s_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVeN16v_log10f) /* AVX-512 variant of log10f.  */
+WRAPPER_IMPL_AVX512 _ZGVdN8v_log10f /* Body comes from the wrapper macro, given the AVX2 variant as callee.  */
+END (_ZGVeN16v_log10f)
new file mode 100644
@@ -0,0 +1,29 @@
+/* Function log10f vectorized with SSE2, wrapper version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_s_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVbN4v_log10f) /* SSE2 wrapper variant of log10f.  */
+WRAPPER_IMPL_SSE2 log10f /* Callee is the unmangled log10f; presumably the scalar routine -- confirm in svml_s_wrapper_impl.h.  */
+END (_ZGVbN4v_log10f)
+
+#ifndef USE_MULTIARCH /* Hidden definition is emitted only when USE_MULTIARCH is undefined.  */
+ libmvec_hidden_def (_ZGVbN4v_log10f) /* NOTE(review): multiarch builds presumably provide this elsewhere -- confirm.  */
+#endif /* !USE_MULTIARCH */
new file mode 100644
@@ -0,0 +1,29 @@
+/* Function log10f vectorized with AVX2, wrapper version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_s_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVdN8v_log10f) /* AVX2 wrapper variant of log10f.  */
+WRAPPER_IMPL_AVX _ZGVbN4v_log10f /* Body comes from the wrapper macro, given _ZGVbN4v_log10f as callee.  */
+END (_ZGVdN8v_log10f)
+
+#ifndef USE_MULTIARCH /* Hidden definition is emitted only when USE_MULTIARCH is undefined.  */
+ libmvec_hidden_def (_ZGVdN8v_log10f) /* NOTE(review): multiarch builds presumably provide this elsewhere -- confirm.  */
+#endif /* !USE_MULTIARCH */
new file mode 100644
@@ -0,0 +1,25 @@
+/* Function log10f vectorized in AVX ISA as wrapper to SSE4 ISA version.
+ Copyright (C) 2021 Free Software Foundation, Inc.
+ This file is part of the GNU C Library.
+
+ The GNU C Library is free software; you can redistribute it and/or
+ modify it under the terms of the GNU Lesser General Public
+ License as published by the Free Software Foundation; either
+ version 2.1 of the License, or (at your option) any later version.
+
+ The GNU C Library is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ Lesser General Public License for more details.
+
+ You should have received a copy of the GNU Lesser General Public
+ License along with the GNU C Library; if not, see
+ <https://www.gnu.org/licenses/>. */
+
+#include <sysdep.h>
+#include "svml_s_wrapper_impl.h"
+
+ .text
+ENTRY (_ZGVcN8v_log10f) /* AVX variant of log10f.  */
+WRAPPER_IMPL_AVX _ZGVbN4v_log10f /* Body comes from the wrapper macro, given the SSE4 variant as callee.  */
+END (_ZGVcN8v_log10f)
new file mode 100644
@@ -0,0 +1 @@
+#include "test-double-libmvec-log10.c"
new file mode 100644
@@ -0,0 +1 @@
+#include "test-double-libmvec-log10.c"
new file mode 100644
@@ -0,0 +1 @@
+#include "test-double-libmvec-log10.c"
new file mode 100644
@@ -0,0 +1,3 @@
+#define LIBMVEC_TYPE double /* Type setting for the header included below.  */
+#define LIBMVEC_FUNC log10 /* Function-name setting for the header included below.  */
+#include "test-vector-abi-arg1.h" /* Presumably the shared one-argument ABI test body -- confirm.  */
@@ -38,6 +38,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1), _ZGVbN2v_expm1)
VECTOR_WRAPPER (WRAPPER_NAME (sinh), _ZGVbN2v_sinh)
VECTOR_WRAPPER (WRAPPER_NAME (cbrt), _ZGVbN2v_cbrt)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2), _ZGVbN2vv_atan2)
+VECTOR_WRAPPER (WRAPPER_NAME (log10), _ZGVbN2v_log10) /* Pairs the log10 wrapper name with _ZGVbN2v_log10.  */
#define VEC_INT_TYPE __m128i
@@ -41,6 +41,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1), _ZGVdN4v_expm1)
VECTOR_WRAPPER (WRAPPER_NAME (sinh), _ZGVdN4v_sinh)
VECTOR_WRAPPER (WRAPPER_NAME (cbrt), _ZGVdN4v_cbrt)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2), _ZGVdN4vv_atan2)
+VECTOR_WRAPPER (WRAPPER_NAME (log10), _ZGVdN4v_log10) /* Pairs the log10 wrapper name with _ZGVdN4v_log10.  */
#ifndef __ILP32__
# define VEC_INT_TYPE __m256i
@@ -38,6 +38,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1), _ZGVcN4v_expm1)
VECTOR_WRAPPER (WRAPPER_NAME (sinh), _ZGVcN4v_sinh)
VECTOR_WRAPPER (WRAPPER_NAME (cbrt), _ZGVcN4v_cbrt)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2), _ZGVcN4vv_atan2)
+VECTOR_WRAPPER (WRAPPER_NAME (log10), _ZGVcN4v_log10) /* Pairs the log10 wrapper name with _ZGVcN4v_log10.  */
#define VEC_INT_TYPE __m128i
@@ -38,6 +38,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1), _ZGVeN8v_expm1)
VECTOR_WRAPPER (WRAPPER_NAME (sinh), _ZGVeN8v_sinh)
VECTOR_WRAPPER (WRAPPER_NAME (cbrt), _ZGVeN8v_cbrt)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2), _ZGVeN8vv_atan2)
+VECTOR_WRAPPER (WRAPPER_NAME (log10), _ZGVeN8v_log10) /* Pairs the log10 wrapper name with _ZGVeN8v_log10.  */
#ifndef __ILP32__
# define VEC_INT_TYPE __m512i
new file mode 100644
@@ -0,0 +1 @@
+#include "test-float-libmvec-log10f.c"
new file mode 100644
@@ -0,0 +1 @@
+#include "test-float-libmvec-log10f.c"
new file mode 100644
@@ -0,0 +1 @@
+#include "test-float-libmvec-log10f.c"
new file mode 100644
@@ -0,0 +1,3 @@
+#define LIBMVEC_TYPE float /* Type setting for the header included below.  */
+#define LIBMVEC_FUNC log10f /* Function-name setting for the header included below.  */
+#include "test-vector-abi-arg1.h" /* Presumably the shared one-argument ABI test body -- confirm.  */
@@ -38,6 +38,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1f), _ZGVeN16v_expm1f)
VECTOR_WRAPPER (WRAPPER_NAME (sinhf), _ZGVeN16v_sinhf)
VECTOR_WRAPPER (WRAPPER_NAME (cbrtf), _ZGVeN16v_cbrtf)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2f), _ZGVeN16vv_atan2f)
+VECTOR_WRAPPER (WRAPPER_NAME (log10f), _ZGVeN16v_log10f) /* Pairs the log10f wrapper name with _ZGVeN16v_log10f.  */
#define VEC_INT_TYPE __m512i
@@ -38,6 +38,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1f), _ZGVbN4v_expm1f)
VECTOR_WRAPPER (WRAPPER_NAME (sinhf), _ZGVbN4v_sinhf)
VECTOR_WRAPPER (WRAPPER_NAME (cbrtf), _ZGVbN4v_cbrtf)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2f), _ZGVbN4vv_atan2f)
+VECTOR_WRAPPER (WRAPPER_NAME (log10f), _ZGVbN4v_log10f) /* Pairs the log10f wrapper name with _ZGVbN4v_log10f.  */
#define VEC_INT_TYPE __m128i
@@ -41,6 +41,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1f), _ZGVdN8v_expm1f)
VECTOR_WRAPPER (WRAPPER_NAME (sinhf), _ZGVdN8v_sinhf)
VECTOR_WRAPPER (WRAPPER_NAME (cbrtf), _ZGVdN8v_cbrtf)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2f), _ZGVdN8vv_atan2f)
+VECTOR_WRAPPER (WRAPPER_NAME (log10f), _ZGVdN8v_log10f) /* Pairs the log10f wrapper name with _ZGVdN8v_log10f.  */
/* Redefinition of wrapper to be compatible with _ZGVdN8vvv_sincosf. */
#undef VECTOR_WRAPPER_fFF
@@ -38,6 +38,7 @@ VECTOR_WRAPPER (WRAPPER_NAME (expm1f), _ZGVcN8v_expm1f)
VECTOR_WRAPPER (WRAPPER_NAME (sinhf), _ZGVcN8v_sinhf)
VECTOR_WRAPPER (WRAPPER_NAME (cbrtf), _ZGVcN8v_cbrtf)
VECTOR_WRAPPER_ff (WRAPPER_NAME (atan2f), _ZGVcN8vv_atan2f)
+VECTOR_WRAPPER (WRAPPER_NAME (log10f), _ZGVcN8v_log10f) /* Pairs the log10f wrapper name with _ZGVcN8v_log10f.  */
#define VEC_INT_TYPE __m128i