Blame sysdeps/ieee754/dbl-64/mpsqrt.c

Packit 6c4009
/*
Packit 6c4009
 * IBM Accurate Mathematical Library
Packit 6c4009
 * written by International Business Machines Corp.
Packit 6c4009
 * Copyright (C) 2001-2018 Free Software Foundation, Inc.
Packit 6c4009
 *
Packit 6c4009
 * This program is free software; you can redistribute it and/or modify
Packit 6c4009
 * it under the terms of the GNU Lesser General Public License as published by
Packit 6c4009
 * the Free Software Foundation; either version 2.1 of the License, or
Packit 6c4009
 * (at your option) any later version.
Packit 6c4009
 *
Packit 6c4009
 * This program is distributed in the hope that it will be useful,
Packit 6c4009
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 6c4009
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
Packit 6c4009
 * GNU Lesser General Public License for more details.
Packit 6c4009
 *
Packit 6c4009
 * You should have received a copy of the GNU Lesser General Public License
Packit 6c4009
 * along with this program; if not, see <http://www.gnu.org/licenses/>.
Packit 6c4009
 */
Packit 6c4009
/****************************************************************************/
Packit 6c4009
/*  MODULE_NAME:mpsqrt.c                                                    */
Packit 6c4009
/*                                                                          */
Packit 6c4009
/*  FUNCTION:mpsqrt                                                         */
Packit 6c4009
/*           fastiroot                                                      */
Packit 6c4009
/*                                                                          */
Packit 6c4009
/* FILES NEEDED:endian.h mpa.h mpsqrt.h                                     */
Packit 6c4009
/*              mpa.c                                                       */
Packit 6c4009
/* Multi-Precision square root function subroutine for precision p >= 4.    */
Packit 6c4009
/* The relative error is bounded by 3.501*r**(1-p), where r=2**24.          */
Packit 6c4009
/*                                                                          */
Packit 6c4009
/****************************************************************************/
Packit 6c4009
#include "endian.h"
Packit 6c4009
#include "mpa.h"
Packit 6c4009
Packit 6c4009
#ifndef SECTION
Packit 6c4009
# define SECTION
Packit 6c4009
#endif
Packit 6c4009
Packit 6c4009
#include "mpsqrt.h"
Packit 6c4009
Packit 6c4009
/****************************************************************************/
/* Multi-Precision square root function subroutine for precision p >= 4.    */
/* The relative error is bounded by 3.501*r**(1-p), where r=2**24.          */
/* The routine receives two pointers to multi-precision numbers, x (the     */
/* input) and y (the output), and the precision p as an integer.  It        */
/* computes sqrt(*x) and stores the result in *y.                           */
/****************************************************************************/
Packit 6c4009
Packit 6c4009
/* Forward declaration of the file-local 1/sqrt(x) helper that __mpsqrt
   calls to obtain its starting approximation; the definition appears
   later in this file.  */
static double fastiroot (double);
Packit 6c4009
Packit 6c4009
void
Packit 6c4009
SECTION
Packit 6c4009
__mpsqrt (mp_no *x, mp_no *y, int p)
Packit 6c4009
{
Packit 6c4009
  int i, m, ey;
Packit 6c4009
  double dx, dy;
Packit 6c4009
  static const mp_no mphalf = {0, {1.0, HALFRAD}};
Packit 6c4009
  static const mp_no mp3halfs = {1, {1.0, 1.0, HALFRAD}};
Packit 6c4009
  mp_no mpxn, mpz, mpu, mpt1, mpt2;
Packit 6c4009
Packit 6c4009
  ey = EX / 2;
Packit 6c4009
  __cpy (x, &mpxn, p);
Packit 6c4009
  mpxn.e -= (ey + ey);
Packit 6c4009
  __mp_dbl (&mpxn, &dx, p);
Packit 6c4009
  dy = fastiroot (dx);
Packit 6c4009
  __dbl_mp (dy, &mpu, p);
Packit 6c4009
  __mul (&mpxn, &mphalf, &mpz, p);
Packit 6c4009
Packit 6c4009
  m = __mpsqrt_mp[p];
Packit 6c4009
  for (i = 0; i < m; i++)
Packit 6c4009
    {
Packit 6c4009
      __sqr (&mpu, &mpt1, p);
Packit 6c4009
      __mul (&mpt1, &mpz, &mpt2, p);
Packit 6c4009
      __sub (&mp3halfs, &mpt2, &mpt1, p);
Packit 6c4009
      __mul (&mpu, &mpt1, &mpt2, p);
Packit 6c4009
      __cpy (&mpt2, &mpu, p);
Packit 6c4009
    }
Packit 6c4009
  __mul (&mpxn, &mpu, y, p);
Packit 6c4009
  EY += ey;
Packit 6c4009
}
Packit 6c4009
Packit 6c4009
/***********************************************************/
Packit 6c4009
/* Compute a double precision approximation for 1/sqrt(x)  */
Packit 6c4009
/* with the relative error bounded by 2**-51.              */
Packit 6c4009
/***********************************************************/
Packit 6c4009
static double
Packit 6c4009
SECTION
Packit 6c4009
fastiroot (double x)
Packit 6c4009
{
Packit 6c4009
  union
Packit 6c4009
  {
Packit 6c4009
    int i[2];
Packit 6c4009
    double d;
Packit 6c4009
  } p, q;
Packit 6c4009
  double y, z, t;
Packit 6c4009
  int n;
Packit 6c4009
  static const double c0 = 0.99674, c1 = -0.53380;
Packit 6c4009
  static const double c2 = 0.45472, c3 = -0.21553;
Packit 6c4009
Packit 6c4009
  p.d = x;
Packit 6c4009
  p.i[HIGH_HALF] = (p.i[HIGH_HALF] & 0x3FFFFFFF) | 0x3FE00000;
Packit 6c4009
  q.d = x;
Packit 6c4009
  y = p.d;
Packit 6c4009
  z = y - 1.0;
Packit 6c4009
  n = (q.i[HIGH_HALF] - p.i[HIGH_HALF]) >> 1;
Packit 6c4009
  z = ((c3 * z + c2) * z + c1) * z + c0;	/* 2**-7         */
Packit 6c4009
  z = z * (1.5 - 0.5 * y * z * z);		/* 2**-14        */
Packit 6c4009
  p.d = z * (1.5 - 0.5 * y * z * z);		/* 2**-28        */
Packit 6c4009
  p.i[HIGH_HALF] -= n;
Packit 6c4009
  t = x * p.d;
Packit 6c4009
  return p.d * (1.5 - 0.5 * p.d * t);
Packit 6c4009
}