[thirdparty/glibc.git] / sysdeps / ieee754 / ldbl-128ibm / e_gammal_r.c

/* Implementation of gamma function according to ISO C.
   Copyright (C) 1997-2021 Free Software Foundation, Inc.
   This file is part of the GNU C Library.
   Contributed by Ulrich Drepper <drepper@cygnus.com>, 1997 and
		  Jakub Jelinek <jj@ultra.linux.cz>, 1999.

   The GNU C Library is free software; you can redistribute it and/or
   modify it under the terms of the GNU Lesser General Public
   License as published by the Free Software Foundation; either
   version 2.1 of the License, or (at your option) any later version.

   The GNU C Library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
   Lesser General Public License for more details.

   You should have received a copy of the GNU Lesser General Public
   License along with the GNU C Library; if not, see
   <https://www.gnu.org/licenses/>.  */

#include <math.h>
#include <math_private.h>
#include <fenv_private.h>
#include <math-underflow.h>
#include <float.h>
#include <libm-alias-finite.h>

/* Coefficients B_2k / 2k(2k-1) of x^-(2k-1) inside exp in Stirling's
   approximation to gamma function.

   Entry I of the table is the coefficient for k = I + 1, so the 13
   entries cover k = 1 .. 13.  As exact rationals they are, in order:
     1/12, -1/360, 1/1260, -1/1680, 1/1188, -691/360360, 1/156,
     -3617/122400, 43867/244188, -174611/125400, 854513/63756,
     -236364091/1506960, 8553103/3900.
   gammal_positive evaluates the series by Horner's rule in 1/x^2,
   starting from the last entry, and then divides once more by x.  */

static const long double gamma_coeff[] =
  {
    0x1.555555555555555555555555558p-4L,
    -0xb.60b60b60b60b60b60b60b60b6p-12L,
    0x3.4034034034034034034034034p-12L,
    -0x2.7027027027027027027027027p-12L,
    0x3.72a3c5631fe46ae1d4e700dca9p-12L,
    -0x7.daac36664f1f207daac36664f2p-12L,
    0x1.a41a41a41a41a41a41a41a41a4p-8L,
    -0x7.90a1b2c3d4e5f708192a3b4c5ep-8L,
    0x2.dfd2c703c0cfff430edfd2c704p-4L,
    -0x1.6476701181f39edbdb9ce625988p+0L,
    0xd.672219167002d3a7a9c886459cp+0L,
    -0x9.cd9292e6660d55b3f712eb9e08p+4L,
    0x8.911a740da740da740da740da74p+8L,
  };

/* Number of entries in gamma_coeff.  */
#define NCOEFF (sizeof (gamma_coeff) / sizeof (gamma_coeff[0]))

/* Return gamma (X), for positive X less than 191, in the form R *
   2^(*EXP2_ADJ), where R is the return value and *EXP2_ADJ is set to
   avoid overflow or underflow in intermediate calculations.

   Four ranges of X are handled separately:
   - X < 0.5: exp (lgamma (X + 1)) / X;
   - 0.5 <= X <= 1.5: exp (lgamma (X));
   - 1.5 < X < 11.5: X is shifted down by the integer
     N = ceil (X - 1.5) so that X - N lies in (0.5, 1.5], and
     exp (lgamma (X - N)) is multiplied by the value returned by
     __gamma_productl;
   - X >= 11.5: Stirling's approximation, after shifting X up by an
     integer to at least 23 when it is smaller than that.
   *EXP2_ADJ is 0 in the first three cases; only the Stirling case
   factors out a power of 2.  */

static long double
gammal_positive (long double x, int *exp2_adj)
{
  /* Receives the sign output of __ieee754_lgammal_r; it is never read
     in this function.  */
  int local_signgam;
  if (x < 0.5L)
    {
      /* Evaluate lgamma at X + 1 and divide the exponential by X.  */
      *exp2_adj = 0;
      return __ieee754_expl (__ieee754_lgammal_r (x + 1, &local_signgam)) / x;
    }
  else if (x <= 1.5L)
    {
      /* Plain exp (lgamma (X)); no scaling is needed.  */
      *exp2_adj = 0;
      return __ieee754_expl (__ieee754_lgammal_r (x, &local_signgam));
    }
  else if (x < 11.5L)
    {
      /* Adjust into the range for using exp (lgamma).  */
      *exp2_adj = 0;
      long double n = ceill (x - 1.5L);
      long double x_adj = x - n;
      long double eps;
      /* NOTE(review): __gamma_productl is defined elsewhere; presumably
	 PROD * (1 + EPS) is the product X_ADJ * (X_ADJ + 1) * ... *
	 (X_ADJ + N - 1), i.e. gamma (X) / gamma (X_ADJ) -- confirm
	 against its definition.  */
      long double prod = __gamma_productl (x_adj, 0, n, &eps);
      return (__ieee754_expl (__ieee754_lgammal_r (x_adj, &local_signgam))
	      * prod * (1.0L + eps));
    }
  else
    {
      /* Defaults for X >= 23, where no shift is applied: no product
	 (PROD = 1) and no error terms.  */
      long double eps = 0;
      long double x_eps = 0;
      long double x_adj = x;
      long double prod = 1;
      if (x < 23.0L)
	{
	  /* Adjust into the range for applying Stirling's
	     approximation.  */
	  long double n = ceill (23.0L - x);
	  x_adj = x + n;
	  /* X_EPS is the part of X that was lost when X + N was rounded
	     to X_ADJ.  */
	  x_eps = (x - (x_adj - n));
	  prod = __gamma_productl (x_adj - n, x_eps, n, &eps);
	}
      /* The result is now gamma (X_ADJ + X_EPS) / (PROD * (1 + EPS)).
	 Compute gamma (X_ADJ + X_EPS) using Stirling's approximation,
	 starting by computing pow (X_ADJ, X_ADJ) with a power of 2
	 factored out.  */
      /* EXP_ADJ accumulates small corrections to the logarithm of the
	 result; they are applied at the very end as a factor
	 exp (EXP_ADJ) via expm1.  Start with -EPS for the 1 / (1 + EPS)
	 factor.  */
      long double exp_adj = -eps;
      long double x_adj_int = roundl (x_adj);
      long double x_adj_frac = x_adj - x_adj_int;
      int x_adj_log2;
      long double x_adj_mant = __frexpl (x_adj, &x_adj_log2);
      /* Assuming __frexpl behaves like frexpl (mantissa in [0.5, 1)),
	 this moves the mantissa into [sqrt (1/2), sqrt (2)).  */
      if (x_adj_mant < M_SQRT1_2l)
	{
	  x_adj_log2--;
	  x_adj_mant *= 2.0L;
	}
      /* X_ADJ^X_ADJ = MANT^X_ADJ * 2^(LOG2 * INT) * 2^(LOG2 * FRAC).
	 The integer power of 2 is handed back to the caller through
	 *EXP2_ADJ; the other two factors are computed below.  */
      *exp2_adj = x_adj_log2 * (int) x_adj_int;
      /* Leading Stirling term without the 2^(*EXP2_ADJ) factor:
	 X_ADJ^X_ADJ * exp (-X_ADJ) * sqrt (2 * pi / X_ADJ), divided by
	 PROD to undo the upward shift.  */
      long double ret = (__ieee754_powl (x_adj_mant, x_adj)
			 * __ieee754_exp2l (x_adj_log2 * x_adj_frac)
			 * __ieee754_expl (-x_adj)
			 * sqrtl (2 * M_PIl / x_adj)
			 / prod);
      /* Correction for evaluating at X_ADJ rather than X_ADJ + X_EPS
	 (presumably a first-order term, using d/dx lgamma (x) ~ log (x)
	 -- TODO confirm).  */
      exp_adj += x_eps * __ieee754_logl (x_adj);
      /* Horner evaluation in 1 / X_ADJ^2 of the gamma_coeff series,
	 from the last coefficient down to the first; the final division
	 by X_ADJ turns it into sum of gamma_coeff[k-1] / X_ADJ^(2k-1).  */
      long double bsum = gamma_coeff[NCOEFF - 1];
      long double x_adj2 = x_adj * x_adj;
      for (size_t i = 1; i <= NCOEFF - 1; i++)
	bsum = bsum / x_adj2 + gamma_coeff[NCOEFF - 1 - i];
      exp_adj += bsum / x_adj;
      /* RET * exp (EXP_ADJ), written with expm1 so that the small
	 correction is added to RET rather than multiplied in.  */
      return ret + ret * __expm1l (exp_adj);
    }
}

/* Compute gamma (X) for the IBM long double format.

   *SIGNGAMP is set to 0 for every input except non-integer
   X < -0x1p-110; for those it is set to -1 when trunc (X) is even and
   to 1 otherwise, and the value computed is
   pi / (-X * sin (pi * D) * gamma (-X)), where D is the distance from
   X to the nearest integer.

   Special cases: X == 0 gives 1 / X; negative integers and -Inf give
   NaN; +Inf and NaN give X + X; X >= 172 overflows; X <= -191
   underflows.  Results that came out infinite or zero are recomputed
   at the end as an explicit overflowing or underflowing product.  */
long double
__ieee754_gammal_r (long double x, int *signgamp)
{
  /* Classify X from the bit pattern of its high double.  */
  double x_high = ldbl_high (x);
  int64_t high_bits;
  EXTRACT_WORDS64 (high_bits, x_high);

  /* Every path except the general negative one reports 0 here.  */
  *signgamp = 0;

  /* Return value for x == 0 is Inf with divide by zero exception.  */
  if ((high_bits & 0x7fffffffffffffffLL) == 0)
    return 1.0 / x;

  /* Return value for integer x < 0 is NaN with invalid exception.  */
  if (high_bits < 0
      && (uint64_t) high_bits < 0xfff0000000000000ULL
      && rintl (x) == x)
    return (x - x) / (x - x);

  /* x == -Inf.  According to ISO this is NaN.  */
  if (high_bits == 0xfff0000000000000ULL)
    return x - x;

  /* Positive infinity (return positive infinity) or NaN (return
     NaN).  */
  if ((high_bits & 0x7ff0000000000000ULL) == 0x7ff0000000000000ULL)
    return x + x;

  /* Overflow.  */
  if (x >= 172.0L)
    return LDBL_MAX * LDBL_MAX;

  long double result;
  {
    /* Everything in this block is computed in round-to-nearest.  */
    SET_RESTORE_ROUNDL (FE_TONEAREST);
    if (x > 0.0L)
      {
	int scale;
	result = gammal_positive (x, &scale);
	result = __scalbnl (result, scale);
      }
    else if (x >= -0x1p-110L)
      /* Tiny negative X: the result is just 1 / X.  */
      result = 1.0L / x;
    else
      {
	long double x_trunc = truncl (x);
	if (x_trunc == 2.0L * truncl (x_trunc / 2.0L))
	  *signgamp = -1;
	else
	  *signgamp = 1;

	if (x <= -191.0L)
	  /* Underflow.  */
	  result = LDBL_MIN * LDBL_MIN;
	else
	  {
	    /* Distance from X to the nearest integer, in [0, 0.5].  */
	    long double dist = x_trunc - x;
	    if (dist > 0.5L)
	      dist = 1.0L - dist;

	    /* sin (pi * DIST); for DIST above 0.25 the cosine of the
	       complementary angle is used instead.  */
	    long double sin_pi_dist;
	    if (dist <= 0.25L)
	      sin_pi_dist = __sinl (M_PIl * dist);
	    else
	      sin_pi_dist = __cosl (M_PIl * (0.5L - dist));

	    int scale;
	    result = M_PIl / (-x * sin_pi_dist
			      * gammal_positive (-x, &scale));
	    result = __scalbnl (result, -scale);
	    math_check_force_underflow_nonneg (result);
	  }
      }
  }

  /* Redo overflow and underflow as explicit products, after the block
     above has ended; the negations follow the sign reported in
     *SIGNGAMP.  */
  if (isinf (result) && x != 0)
    {
      long double huge = copysignl (LDBL_MAX, result);
      if (*signgamp < 0)
	return -(-huge * LDBL_MAX);
      return huge * LDBL_MAX;
    }
  if (result == 0)
    {
      long double tiny = copysignl (LDBL_MIN, result);
      if (*signgamp < 0)
	return -(-tiny * LDBL_MIN);
      return tiny * LDBL_MIN;
    }
  return result;
}
/* Alias declaration tying __ieee754_gammal_r to the name __gammal_r.
   NOTE(review): libm_alias_finite is not defined in this file
   (presumably it comes from <libm-alias-finite.h>, included above);
   confirm there which symbol name and version it actually creates.  */
libm_alias_finite (__ieee754_gammal_r, __gammal_r)
Commit	Line	Data
f964490f	1	/* Implementation of gamma function according to ISO C.
2b778ceb	2	Copyright (C) 1997-2021 Free Software Foundation, Inc.
f964490f RM	3	This file is part of the GNU C Library.
f964490f RM	4	Contributed by Ulrich Drepper <drepper@cygnus.com>, 1997 and
0ac5ae23	5	Jakub Jelinek <jj@ultra.linux.cz, 1999.
f964490f RM	6
	7	The GNU C Library is free software; you can redistribute it and/or
	8	modify it under the terms of the GNU Lesser General Public
	9	License as published by the Free Software Foundation; either
	10	version 2.1 of the License, or (at your option) any later version.
	11
	12	The GNU C Library is distributed in the hope that it will be useful,
	13	but WITHOUT ANY WARRANTY; without even the implied warranty of
	14	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	15	Lesser General Public License for more details.
	16
	17	You should have received a copy of the GNU Lesser General Public
59ba27a6	18	License along with the GNU C Library; if not, see
5a82c748	19	<https://www.gnu.org/licenses/>. */
f964490f RM	20
	21	#include <math.h>
	22	#include <math_private.h>
70e2ba33	23	#include <fenv_private.h>
8f5b00d3	24	#include <math-underflow.h>
d8cd06db	25	#include <float.h>
220622dd	26	#include <libm-alias-finite.h>
f964490f	27
d8cd06db JM	28	/* Coefficients B_2k / 2k(2k-1) of x^-(2k-1) inside exp in Stirling's
	29	approximation to gamma function. */
	30
	31	static const long double gamma_coeff[] =
	32	{
	33	0x1.555555555555555555555555558p-4L,
	34	-0xb.60b60b60b60b60b60b60b60b6p-12L,
	35	0x3.4034034034034034034034034p-12L,
	36	-0x2.7027027027027027027027027p-12L,
	37	0x3.72a3c5631fe46ae1d4e700dca9p-12L,
	38	-0x7.daac36664f1f207daac36664f2p-12L,
	39	0x1.a41a41a41a41a41a41a41a41a4p-8L,
	40	-0x7.90a1b2c3d4e5f708192a3b4c5ep-8L,
	41	0x2.dfd2c703c0cfff430edfd2c704p-4L,
	42	-0x1.6476701181f39edbdb9ce625988p+0L,
	43	0xd.672219167002d3a7a9c886459cp+0L,
	44	-0x9.cd9292e6660d55b3f712eb9e08p+4L,
	45	0x8.911a740da740da740da740da74p+8L,
	46	};
	47
	48	#define NCOEFF (sizeof (gamma_coeff) / sizeof (gamma_coeff[0]))
	49
	50	/* Return gamma (X), for positive X less than 191, in the form R *
	51	2^(*EXP2_ADJ), where R is the return value and *EXP2_ADJ is set to
	52	avoid overflow or underflow in intermediate calculations. */
	53
	54	static long double
	55	gammal_positive (long double x, int *exp2_adj)
	56	{
	57	int local_signgam;
	58	if (x < 0.5L)
	59	{
	60	*exp2_adj = 0;
	61	return __ieee754_expl (__ieee754_lgammal_r (x + 1, &local_signgam)) / x;
	62	}
	63	else if (x <= 1.5L)
	64	{
	65	*exp2_adj = 0;
	66	return __ieee754_expl (__ieee754_lgammal_r (x, &local_signgam));
	67	}
	68	else if (x < 11.5L)
	69	{
	70	/* Adjust into the range for using exp (lgamma). */
	71	*exp2_adj = 0;
71223ef9	72	long double n = ceill (x - 1.5L);
d8cd06db JM	73	long double x_adj = x - n;
	74	long double eps;
	75	long double prod = __gamma_productl (x_adj, 0, n, &eps);
	76	return (__ieee754_expl (__ieee754_lgammal_r (x_adj, &local_signgam))
	77	* prod * (1.0L + eps));
	78	}
	79	else
	80	{
	81	long double eps = 0;
	82	long double x_eps = 0;
	83	long double x_adj = x;
	84	long double prod = 1;
	85	if (x < 23.0L)
	86	{
	87	/* Adjust into the range for applying Stirling's
	88	approximation. */
71223ef9	89	long double n = ceill (23.0L - x);
d8cd06db JM	90	x_adj = x + n;
	91	x_eps = (x - (x_adj - n));
	92	prod = __gamma_productl (x_adj - n, x_eps, n, &eps);
	93	}
	94	/* The result is now gamma (X_ADJ + X_EPS) / (PROD * (1 + EPS)).
	95	Compute gamma (X_ADJ + X_EPS) using Stirling's approximation,
	96	starting by computing pow (X_ADJ, X_ADJ) with a power of 2
	97	factored out. */
	98	long double exp_adj = -eps;
9755bc46	99	long double x_adj_int = roundl (x_adj);
d8cd06db JM	100	long double x_adj_frac = x_adj - x_adj_int;
	101	int x_adj_log2;
	102	long double x_adj_mant = __frexpl (x_adj, &x_adj_log2);
	103	if (x_adj_mant < M_SQRT1_2l)
	104	{
	105	x_adj_log2--;
	106	x_adj_mant *= 2.0L;
	107	}
	108	*exp2_adj = x_adj_log2 * (int) x_adj_int;
	109	long double ret = (__ieee754_powl (x_adj_mant, x_adj)
	110	* __ieee754_exp2l (x_adj_log2 * x_adj_frac)
	111	* __ieee754_expl (-x_adj)
f67a8147	112	* sqrtl (2 * M_PIl / x_adj)
d8cd06db	113	/ prod);
e02920bc	114	exp_adj += x_eps * __ieee754_logl (x_adj);
d8cd06db JM	115	long double bsum = gamma_coeff[NCOEFF - 1];
	116	long double x_adj2 = x_adj * x_adj;
	117	for (size_t i = 1; i <= NCOEFF - 1; i++)
	118	bsum = bsum / x_adj2 + gamma_coeff[NCOEFF - 1 - i];
	119	exp_adj += bsum / x_adj;
	120	return ret + ret * __expm1l (exp_adj);
	121	}
	122	}
f964490f RM	123
	124	long double
	125	__ieee754_gammal_r (long double x, int *signgamp)
	126	{
f964490f	127	int64_t hx;
765714ca	128	double xhi;
e02920bc	129	long double ret;
f964490f	130
765714ca AM	131	xhi = ldbl_high (x);
765714ca AM	132	EXTRACT_WORDS64 (hx, xhi);
f964490f	133
765714ca	134	if ((hx & 0x7fffffffffffffffLL) == 0)
f964490f RM	135	{
	136	/* Return value for x == 0 is Inf with divide by zero exception. */
	137	*signgamp = 0;
	138	return 1.0 / x;
	139	}
f29b6f17	140	if (hx < 0 && (uint64_t) hx < 0xfff0000000000000ULL && rintl (x) == x)
f964490f RM	141	{
	142	/* Return value for integer x < 0 is NaN with invalid exception. */
	143	*signgamp = 0;
	144	return (x - x) / (x - x);
	145	}
	146	if (hx == 0xfff0000000000000ULL)
	147	{
	148	/* x == -Inf. According to ISO this is NaN. */
	149	*signgamp = 0;
	150	return x - x;
	151	}
d8cd06db JM	152	if ((hx & 0x7ff0000000000000ULL) == 0x7ff0000000000000ULL)
	153	{
	154	/* Positive infinity (return positive infinity) or NaN (return
	155	NaN). */
	156	*signgamp = 0;
	157	return x + x;
	158	}
f964490f	159
d8cd06db JM	160	if (x >= 172.0L)
	161	{
	162	/* Overflow. */
	163	*signgamp = 0;
	164	return LDBL_MAX * LDBL_MAX;
	165	}
e02920bc	166	else
d8cd06db	167	{
e02920bc JM	168	SET_RESTORE_ROUNDL (FE_TONEAREST);
	169	if (x > 0.0L)
	170	{
	171	*signgamp = 0;
	172	int exp2_adj;
	173	ret = gammal_positive (x, &exp2_adj);
	174	ret = __scalbnl (ret, exp2_adj);
	175	}
	176	else if (x >= -0x1p-110L)
	177	{
	178	*signgamp = 0;
	179	ret = 1.0L / x;
	180	}
	181	else
	182	{
7abf97be JM	183	long double tx = truncl (x);
7abf97be JM	184	*signgamp = (tx == 2.0L * truncl (tx / 2.0L)) ? -1 : 1;
e02920bc JM	185	if (x <= -191.0L)
	186	/* Underflow. */
	187	ret = LDBL_MIN * LDBL_MIN;
	188	else
	189	{
	190	long double frac = tx - x;
	191	if (frac > 0.5L)
	192	frac = 1.0L - frac;
	193	long double sinpix = (frac <= 0.25L
	194	? __sinl (M_PIl * frac)
	195	: __cosl (M_PIl * (0.5L - frac)));
	196	int exp2_adj;
	197	ret = M_PIl / (-x * sinpix
	198	* gammal_positive (-x, &exp2_adj));
	199	ret = __scalbnl (ret, -exp2_adj);
d96164c3	200	math_check_force_underflow_nonneg (ret);
e02920bc JM	201	}
e02920bc JM	202	}
d8cd06db	203	}
e02920bc	204	if (isinf (ret) && x != 0)
d8cd06db	205	{
e02920bc	206	if (*signgamp < 0)
81dca813	207	return -(-copysignl (LDBL_MAX, ret) * LDBL_MAX);
e02920bc	208	else
81dca813	209	return copysignl (LDBL_MAX, ret) * LDBL_MAX;
d8cd06db	210	}
e02920bc	211	else if (ret == 0)
d8cd06db	212	{
e02920bc	213	if (*signgamp < 0)
81dca813	214	return -(-copysignl (LDBL_MIN, ret) * LDBL_MIN);
e02920bc	215	else
81dca813	216	return copysignl (LDBL_MIN, ret) * LDBL_MIN;
d8cd06db	217	}
e02920bc JM	218	else
e02920bc JM	219	return ret;
f964490f	220	}
220622dd	221	libm_alias_finite (__ieee754_gammal_r, __gammal_r)