[thirdparty/glibc.git] / sysdeps / ieee754 / dbl-64 / mpsqrt.c

/*
 * IBM Accurate Mathematical Library
 * written by International Business Machines Corp.
 * Copyright (C) 2001-2019 Free Software Foundation, Inc.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public License
 * along with this program; if not, see <http://www.gnu.org/licenses/>.
 */
/****************************************************************************/
/*  MODULE_NAME:mpsqrt.c                                                    */
/*                                                                          */
/*  FUNCTION:mpsqrt                                                         */
/*           fastiroot                                                      */
/*                                                                          */
/* FILES NEEDED:endian.h mpa.h mpsqrt.h                                     */
/*              mpa.c                                                       */
/* Multi-Precision square root function subroutine for precision p >= 4.    */
/* The relative error is bounded by 3.501*r**(1-p), where r=2**24.          */
/*                                                                          */
/****************************************************************************/
#include "endian.h"
#include "mpa.h"

#ifndef SECTION
# define SECTION
#endif

#include "mpsqrt.h"

/****************************************************************************/
/* Multi-Precision square root function subroutine for precision p >= 4.    */
/* The relative error is bounded by 3.501*r**(1-p), where r=2**24.          */
/* Routine receives two pointers to  Multi Precision numbers:               */
/* x (left argument) and y (next argument). Routine also receives precision */
/* p as integer. Routine computes sqrt(*x) and stores result in *y          */
/****************************************************************************/

static double fastiroot (double);

void
SECTION
__mpsqrt (mp_no *x, mp_no *y, int p)
{
  /* Constants of the refinement step; by their names they stand for
     1/2 and 3/2 in mp_no form.  */
  static const mp_no mphalf = {0, {1.0, HALFRAD}};
  static const mp_no mp3halfs = {1, {1.0, 1.0, HALFRAD}};
  mp_no xnorm, half_xn, est, work1, work2;
  double seed;
  int half_exp, left;

  /* Work on a copy of *x whose exponent field is reduced by the even
     amount 2 * half_exp; half_exp is added back onto the result below.
     EX and EY come from outside this block -- presumably the exponent
     fields of *x and *y (confirm against mpa.h).  */
  half_exp = EX / 2;
  __cpy (x, &xnorm, p);
  xnorm.e -= 2 * half_exp;

  /* Starting estimate: fastiroot applied to the double value of the
     scaled copy, converted back to multi-precision.  */
  __mp_dbl (&xnorm, &seed, p);
  __dbl_mp (fastiroot (seed), &est, p);

  /* half_xn = xnorm * mphalf, reused by every refinement step.  */
  __mul (&xnorm, &mphalf, &half_xn, p);

  /* Each pass performs est <- est * (mp3halfs - half_xn * est^2).  The
     number of passes is read from the __mpsqrt_mp table, indexed by p.  */
  for (left = __mpsqrt_mp[p]; left > 0; left--)
    {
      __sqr (&est, &work1, p);
      __mul (&work1, &half_xn, &work2, p);
      __sub (&mp3halfs, &work2, &work1, p);
      __mul (&est, &work1, &work2, p);
      __cpy (&work2, &est, p);
    }

  /* Multiply the scaled input by the refined estimate, then restore the
     exponent that was split off at the start.  */
  __mul (&xnorm, &est, y, p);
  EY += half_exp;
}

/***********************************************************/
/* Return a double precision estimate of 1/sqrt(x).        */
/* The stated relative error bound is 2**-51.              */
/***********************************************************/
static double
SECTION
fastiroot (double x)
{
  static const double c0 = 0.99674, c1 = -0.53380;
  static const double c2 = 0.45472, c3 = -0.21553;
  union
  {
    int i[2];
    double d;
  } w;
  double y, z, t;
  int hi_x, n;

  /* Rewrite the high word of x: bits 30-31 are cleared, bits 21-29 are
     set, and bits 0-20 are kept.  y is the double with that high word.  */
  w.d = x;
  hi_x = w.i[HIGH_HALF];
  w.i[HIGH_HALF] = (hi_x & 0x3FFFFFFF) | 0x3FE00000;
  y = w.d;

  /* Half of the change just applied to the high word; it is subtracted
     from the high word of the estimate for y further down.  */
  n = (hi_x - w.i[HIGH_HALF]) >> 1;

  /* Cubic in (y - 1) followed by two refinement steps on y; the trailing
     comments are the original per-step error annotations.  */
  z = y - 1.0;
  z = ((c3 * z + c2) * z + c1) * z + c0;	/* 2**-7         */
  z = z * (1.5 - 0.5 * y * z * z);		/* 2**-14        */
  w.d = z * (1.5 - 0.5 * y * z * z);		/* 2**-28        */

  /* Adjust the high word by n, then apply one last refinement step
     against the original x.  */
  w.i[HIGH_HALF] -= n;
  t = x * w.d;
  return w.d * (1.5 - 0.5 * w.d * t);
}
Commit	Line	Data
e4d82761 UD	1	/*
e4d82761 UD	2	* IBM Accurate Mathematical Library
aeb25823	3	* written by International Business Machines Corp.
04277e02	4	* Copyright (C) 2001-2019 Free Software Foundation, Inc.
e4d82761 UD	5	*
	6	* This program is free software; you can redistribute it and/or modify
	7	* it under the terms of the GNU Lesser General Public License as published by
cc7375ce	8	* the Free Software Foundation; either version 2.1 of the License, or
e4d82761	9	* (at your option) any later version.
50944bca	10	*
e4d82761 UD	11	* This program is distributed in the hope that it will be useful,
	12	* but WITHOUT ANY WARRANTY; without even the implied warranty of
	13	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
c6c6dd48	14	* GNU Lesser General Public License for more details.
e4d82761 UD	15	*
e4d82761 UD	16	* You should have received a copy of the GNU Lesser General Public License
59ba27a6	17	* along with this program; if not, see <http://www.gnu.org/licenses/>.
e4d82761 UD	18	*/
	19	/****************************************************************************/
	20	/* MODULE_NAME:mpsqrt.c */
	21	/* */
	22	/* FUNCTION:mpsqrt */
	23	/* fastiroot */
	24	/* */
	25	/* FILES NEEDED:endian.h mpa.h mpsqrt.h */
	26	/* mpa.c */
	27	/* Multi-Precision square root function subroutine for precision p >= 4. */
	28	/* The relative error is bounded by 3.501*r**(1-p), where r=2**24. */
	29	/* */
	30	/****************************************************************************/
	31	#include "endian.h"
	32	#include "mpa.h"
	33
31d3cc00 UD	34	#ifndef SECTION
	35	# define SECTION
	36	#endif
	37
	38	#include "mpsqrt.h"
	39
e4d82761 UD	40	/****************************************************************************/
	41	/* Multi-Precision square root function subroutine for precision p >= 4. */
	42	/* The relative error is bounded by 3.501*r**(1-p), where r=2**24. */
	43	/* Routine receives two pointers to Multi Precision numbers: */
	44	/* x (left argument) and y (next argument). Routine also receives precision */
	45	/* p as integer. Routine computes sqrt(*x) and stores result in *y */
	46	/****************************************************************************/
	47
09c14ed2	48	static double fastiroot (double);
e4d82761	49
31d3cc00 UD	50	void
31d3cc00 UD	51	SECTION
09c14ed2 SP	52	__mpsqrt (mp_no *x, mp_no *y, int p)
	53	{
	54	int i, m, ey;
	55	double dx, dy;
b33d4ce4 SP	56	static const mp_no mphalf = {0, {1.0, HALFRAD}};
b33d4ce4 SP	57	static const mp_no mp3halfs = {1, {1.0, 1.0, HALFRAD}};
09c14ed2	58	mp_no mpxn, mpz, mpu, mpt1, mpt2;
e4d82761	59
09c14ed2 SP	60	ey = EX / 2;
	61	__cpy (x, &mpxn, p);
	62	mpxn.e -= (ey + ey);
	63	__mp_dbl (&mpxn, &dx, p);
	64	dy = fastiroot (dx);
	65	__dbl_mp (dy, &mpu, p);
	66	__mul (&mpxn, &mphalf, &mpz, p);
e4d82761	67
09c14ed2 SP	68	m = __mpsqrt_mp[p];
	69	for (i = 0; i < m; i++)
	70	{
	71	__sqr (&mpu, &mpt1, p);
	72	__mul (&mpt1, &mpz, &mpt2, p);
	73	__sub (&mp3halfs, &mpt2, &mpt1, p);
	74	__mul (&mpu, &mpt1, &mpt2, p);
	75	__cpy (&mpt2, &mpu, p);
	76	}
	77	__mul (&mpxn, &mpu, y, p);
	78	EY += ey;
e4d82761 UD	79	}
	80
	81	/***********************************************************/
	82	/* Compute a double precision approximation for 1/sqrt(x) */
	83	/* with the relative error bounded by 2**-51. */
	84	/***********************************************************/
31d3cc00 UD	85	static double
31d3cc00 UD	86	SECTION
09c14ed2 SP	87	fastiroot (double x)
	88	{
	89	union
	90	{
	91	int i[2];
	92	double d;
	93	} p, q;
	94	double y, z, t;
bb3f4825	95	int n;
09c14ed2 SP	96	static const double c0 = 0.99674, c1 = -0.53380;
09c14ed2 SP	97	static const double c2 = 0.45472, c3 = -0.21553;
50944bca	98
e4d82761	99	p.d = x;
09c14ed2	100	p.i[HIGH_HALF] = (p.i[HIGH_HALF] & 0x3FFFFFFF) | 0x3FE00000;
e4d82761 UD	101	q.d = x;
e4d82761 UD	102	y = p.d;
09c14ed2 SP	103	z = y - 1.0;
	104	n = (q.i[HIGH_HALF] - p.i[HIGH_HALF]) >> 1;
	105	z = ((c3 * z + c2) * z + c1) * z + c0; /* 2**-7 */
	106	z = z * (1.5 - 0.5 * y * z * z); /* 2**-14 */
	107	p.d = z * (1.5 - 0.5 * y * z * z); /* 2**-28 */
e4d82761	108	p.i[HIGH_HALF] -= n;
09c14ed2 SP	109	t = x * p.d;
09c14ed2 SP	110	return p.d * (1.5 - 0.5 * p.d * t);
e4d82761	111	}