[thirdparty/glibc.git] / sysdeps / ieee754 / dbl-64 / mpexp.c

/*
 * IBM Accurate Mathematical Library
 * written by International Business Machines Corp.
 * Copyright (C) 2001-2018 Free Software Foundation, Inc.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU  Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program; if not, see <http://www.gnu.org/licenses/>.
 */
/*************************************************************************/
/*   MODULE_NAME:mpexp.c                                                 */
/*                                                                       */
/*   FUNCTIONS: mpexp                                                    */
/*                                                                       */
/*   FILES NEEDED: mpa.h endian.h mpexp.h                                */
/*                 mpa.c                                                 */
/*                                                                       */
/* Multi-Precision exponential function subroutine                       */
/*   (  for p >= 4, 2**(-55) <= abs(x) <= 1024     ).                    */
/*************************************************************************/

#include "endian.h"
#include "mpa.h"
#include <assert.h>

#ifndef SECTION
# define SECTION
#endif

/* Multi-Precision exponential function subroutine (for p >= 4,
   2**(-55) <= abs(x) <= 1024).  */
void
SECTION
__mpexp (mp_no *x, mp_no *y, int p)
{
  int i, j, k, m, m1, m2, n;
  mantissa_t b;
  static const int np[33] =
    {
      0, 0, 0, 0, 3, 3, 4, 4, 5, 4, 4, 5, 5, 5, 6, 6, 6, 6, 6, 6,
      6, 6, 6, 6, 7, 7, 7, 7, 8, 8, 8, 8, 8
    };

  static const int m1p[33] =
    {
      0, 0, 0, 0,
      17, 23, 23, 28,
      27, 38, 42, 39,
      43, 47, 43, 47,
      50, 54, 57, 60,
      64, 67, 71, 74,
      68, 71, 74, 77,
      70, 73, 76, 78,
      81
    };
  static const int m1np[7][18] =
    {
      {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
      {0, 0, 0, 0, 36, 48, 60, 72, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
      {0, 0, 0, 0, 24, 32, 40, 48, 56, 64, 72, 0, 0, 0, 0, 0, 0, 0},
      {0, 0, 0, 0, 17, 23, 29, 35, 41, 47, 53, 59, 65, 0, 0, 0, 0, 0},
      {0, 0, 0, 0, 0, 0, 23, 28, 33, 38, 42, 47, 52, 57, 62, 66, 0, 0},
      {0, 0, 0, 0, 0, 0, 0, 0, 27, 0, 0, 39, 43, 47, 51, 55, 59, 63},
      {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 43, 47, 50, 54}
    };
  mp_no mps, mpk, mpt1, mpt2;

  /* Choose m,n and compute a=2**(-m).  */
  n = np[p];
  m1 = m1p[p];
  b = X[1];
  m2 = 24 * EX;
  for (; b < HALFRAD; m2--)
    b *= 2;
  if (b == HALFRAD)
    {
      for (i = 2; i <= p; i++)
	{
	  if (X[i] != 0)
	    break;
	}
      if (i == p + 1)
	m2--;
    }

  m = m1 + m2;
  if (__glibc_unlikely (m <= 0))
    {
      /* The m1np array which is used to determine if we can reduce the
	 polynomial expansion iterations, has only 18 elements.  Besides,
	 numbers smaller than those required by p >= 18 should not come here
	 at all since the fast phase of exp returns 1.0 for anything less
	 than 2^-55.  */
      assert (p < 18);
      m = 0;
      for (i = n - 1; i > 0; i--, n--)
	if (m1np[i][p] + m2 > 0)
	  break;
    }

  /* Compute s=x*2**(-m). Put result in mps.  This is the range-reduced input
     that we will use to compute e^s.  For the final result, simply raise it
     to 2^m.  */
  __pow_mp (-m, &mpt1, p);
  __mul (x, &mpt1, &mps, p);

  /* Compute the Taylor series for e^s:

         1 + x/1! + x^2/2! + x^3/3! ...

     for N iterations.  We compute this as:

         e^x = 1 + (x * n!/1! + x^2 * n!/2! + x^3 * n!/3!) / n!
             = 1 + (x * (n!/1! + x * (n!/2! + x * (n!/3! + x ...)))) / n!

     k! is computed on the fly as KF and at the end of the polynomial loop, KF
     is n!, which can be used directly.  */
  __cpy (&mps, &mpt2, p);

  double kf = 1.0;

  /* Evaluate the rest.  The result will be in mpt2.  */
  for (k = n - 1; k > 0; k--)
    {
      /* n! / k! = n * (n - 1) ... * (n - k + 1) */
      kf *= k + 1;

      __dbl_mp (kf, &mpk, p);
      __add (&mpt2, &mpk, &mpt1, p);
      __mul (&mps, &mpt1, &mpt2, p);
    }
  __dbl_mp (kf, &mpk, p);
  __dvd (&mpt2, &mpk, &mpt1, p);
  __add (&__mpone, &mpt1, &mpt2, p);

  /* Raise polynomial value to the power of 2**m. Put result in y.  */
  for (k = 0, j = 0; k < m;)
    {
      __sqr (&mpt2, &mpt1, p);
      k++;
      if (k == m)
	{
	  j = 1;
	  break;
	}
      __sqr (&mpt1, &mpt2, p);
      k++;
    }
  if (j)
    __cpy (&mpt1, y, p);
  else
    __cpy (&mpt2, y, p);
  return;
}
Commit	Line	Data
e4d82761 UD	1	/*
e4d82761 UD	2	* IBM Accurate Mathematical Library
aeb25823	3	* written by International Business Machines Corp.
688903eb	4	* Copyright (C) 2001-2018 Free Software Foundation, Inc.
e4d82761 UD	5	*
	6	* This program is free software; you can redistribute it and/or modify
	7	* it under the terms of the GNU Lesser General Public License as published by
cc7375ce	8	* the Free Software Foundation; either version 2.1 of the License, or
e4d82761	9	* (at your option) any later version.
50944bca	10	*
e4d82761 UD	11	* This program is distributed in the hope that it will be useful,
	12	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	13	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
c6c6dd48	14	* GNU Lesser General Public License for more details.
e4d82761 UD	15	*
e4d82761 UD	16	* You should have received a copy of the GNU Lesser General Public License
59ba27a6	17	* along with this program; if not, see <http://www.gnu.org/licenses/>.
e4d82761 UD	18	*/
	19	/*************************************************************************/
	20	/* MODULE_NAME:mpexp.c */
	21	/* */
	22	/* FUNCTIONS: mpexp */
	23	/* */
	24	/* FILES NEEDED: mpa.h endian.h mpexp.h */
	25	/* mpa.c */
	26	/* */
	27	/* Multi-Precision exponential function subroutine */
	28	/* ( for p >= 4, 2*(-55) <= abs(x) <= 1024 ). /
	29	/*************************************************************************/
	30
	31	#include "endian.h"
	32	#include "mpa.h"
4d55b4e5	33	#include <assert.h>
e4d82761	34
31d3cc00 UD	35	#ifndef SECTION
	36	# define SECTION
	37	#endif
	38
7490eb81 SP	39	/* Multi-Precision exponential function subroutine (for p >= 4,
7490eb81 SP	40	2*(-55) <= abs(x) <= 1024). /
31d3cc00 UD	41	void
31d3cc00 UD	42	SECTION
7490eb81 SP	43	__mpexp (mp_no x, mp_no y, int p)
	44	{
	45	int i, j, k, m, m1, m2, n;
e7906a47	46	mantissa_t b;
7490eb81 SP	47	static const int np[33] =
	48	{
	49	0, 0, 0, 0, 3, 3, 4, 4, 5, 4, 4, 5, 5, 5, 6, 6, 6, 6, 6, 6,
	50	6, 6, 6, 6, 7, 7, 7, 7, 8, 8, 8, 8, 8
	51	};
4e92d59e	52
7490eb81	53	static const int m1p[33] =
751b85f7 SP	54	{
	55	0, 0, 0, 0,
	56	17, 23, 23, 28,
	57	27, 38, 42, 39,
	58	43, 47, 43, 47,
	59	50, 54, 57, 60,
	60	64, 67, 71, 74,
	61	68, 71, 74, 77,
	62	70, 73, 76, 78,
	63	81
	64	};
7490eb81 SP	65	static const int m1np[7][18] =
	66	{
	67	{0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
	68	{0, 0, 0, 0, 36, 48, 60, 72, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0},
	69	{0, 0, 0, 0, 24, 32, 40, 48, 56, 64, 72, 0, 0, 0, 0, 0, 0, 0},
	70	{0, 0, 0, 0, 17, 23, 29, 35, 41, 47, 53, 59, 65, 0, 0, 0, 0, 0},
	71	{0, 0, 0, 0, 0, 0, 23, 28, 33, 38, 42, 47, 52, 57, 62, 66, 0, 0},
	72	{0, 0, 0, 0, 0, 0, 0, 0, 27, 0, 0, 39, 43, 47, 51, 55, 59, 63},
	73	{0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 43, 47, 50, 54}
	74	};
4e92d59e	75	mp_no mps, mpk, mpt1, mpt2;
e4d82761	76
7490eb81 SP	77	/* Choose m,n and compute a=2*(-m). /
	78	n = np[p];
	79	m1 = m1p[p];
d3b9ea61	80	b = X[1];
7490eb81	81	m2 = 24 * EX;
d3b9ea61	82	for (; b < HALFRAD; m2--)
e7906a47	83	b *= 2;
d3b9ea61	84	if (b == HALFRAD)
7490eb81 SP	85	{
	86	for (i = 2; i <= p; i++)
	87	{
a64d7e0e	88	if (X[i] != 0)
7490eb81 SP	89	break;
	90	}
	91	if (i == p + 1)
caa99d06	92	m2--;
7490eb81	93	}
4d55b4e5 SP	94
	95	m = m1 + m2;
	96	if (__glibc_unlikely (m <= 0))
	97	{
	98	/* The m1np array which is used to determine if we can reduce the
	99	polynomial expansion iterations, has only 18 elements. Besides,
	100	numbers smaller than those required by p >= 18 should not come here
	101	at all since the fast phase of exp returns 1.0 for anything less
	102	than 2^-55. */
	103	assert (p < 18);
	104	m = 0;
4d55b4e5 SP	105	for (i = n - 1; i > 0; i--, n--)
	106	if (m1np[i][p] + m2 > 0)
	107	break;
	108	}
e4d82761	109
4e92d59e SP	110	/* Compute s=x2*(-m). Put result in mps. This is the range-reduced input
	111	that we will use to compute e^s. For the final result, simply raise it
	112	to 2^m. */
caa99d06	113	__pow_mp (-m, &mpt1, p);
7490eb81	114	__mul (x, &mpt1, &mps, p);
e4d82761	115
4e92d59e SP	116	/* Compute the Taylor series for e^s:
	117
	118	1 + x/1! + x^2/2! + x^3/3! ...
	119
	120	for N iterations. We compute this as:
	121
	122	e^x = 1 + (x * n!/1! + x^2 * n!/2! + x^3 * n!/3!) / n!
	123	= 1 + (x * (n!/1! + x * (n!/2! + x * (n!/3! + x ...)))) / n!
	124
c2af38aa SP	125	k! is computed on the fly as KF and at the end of the polynomial loop, KF
c2af38aa SP	126	is n!, which can be used directly. */
4e92d59e SP	127	__cpy (&mps, &mpt2, p);
	128
	129	double kf = 1.0;
	130
	131	/* Evaluate the rest. The result will be in mpt2. */
	132	for (k = n - 1; k > 0; k--)
7490eb81	133	{
4e92d59e SP	134	/* n! / k! = n * (n - 1) ... * (n - k + 1) */
	135	kf *= k + 1;
	136
	137	__dbl_mp (kf, &mpk, p);
	138	__add (&mpt2, &mpk, &mpt1, p);
	139	__mul (&mps, &mpt1, &mpt2, p);
7490eb81	140	}
c2af38aa	141	__dbl_mp (kf, &mpk, p);
4e92d59e	142	__dvd (&mpt2, &mpk, &mpt1, p);
107a5bf0	143	__add (&__mpone, &mpt1, &mpt2, p);
e4d82761	144
7490eb81 SP	145	/* Raise polynomial value to the power of 2*m. Put result in y. /
	146	for (k = 0, j = 0; k < m;)
	147	{
d6752ccd	148	__sqr (&mpt2, &mpt1, p);
7490eb81 SP	149	k++;
	150	if (k == m)
	151	{
	152	j = 1;
	153	break;
	154	}
d6752ccd	155	__sqr (&mpt1, &mpt2, p);
7490eb81 SP	156	k++;
	157	}
	158	if (j)
	159	__cpy (&mpt1, y, p);
	160	else
	161	__cpy (&mpt2, y, p);
e4d82761 UD	162	return;
e4d82761 UD	163	}