Tree - source-git/mpfr - CentOS Git server

source-git / mpfr

Blame src/root.c

Blob History Raw

Packit	fbef6a	`/* mpfr_root -- kth root.`
Packit	fbef6a
Packit	fbef6a	`Copyright 2005-2017 Free Software Foundation, Inc.`
Packit	fbef6a	`Contributed by the AriC and Caramba projects, INRIA.`
Packit	fbef6a
Packit	fbef6a	`This file is part of the GNU MPFR Library.`
Packit	fbef6a
Packit	fbef6a	`The GNU MPFR Library is free software; you can redistribute it and/or modify`
Packit	fbef6a	`it under the terms of the GNU Lesser General Public License as published by`
Packit	fbef6a	`the Free Software Foundation; either version 3 of the License, or (at your`
Packit	fbef6a	`option) any later version.`
Packit	fbef6a
Packit	fbef6a	`The GNU MPFR Library is distributed in the hope that it will be useful, but`
Packit	fbef6a	`WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY`
Packit	fbef6a	`or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public`
Packit	fbef6a	`License for more details.`
Packit	fbef6a
Packit	fbef6a	`You should have received a copy of the GNU Lesser General Public License`
Packit	fbef6a	`along with the GNU MPFR Library; see the file COPYING.LESSER. If not, see`
Packit	fbef6a	`http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,`
Packit	fbef6a	`51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */`
Packit	fbef6a
Packit	fbef6a	`#define MPFR_NEED_LONGLONG_H`
Packit	fbef6a	`#include "mpfr-impl.h"`
Packit	fbef6a
Packit	fbef6a	`/* The computation of y = x^(1/k) is done as follows, except for large`
Packit	fbef6a	`values of k, for which this would be inefficient or yield internal`
Packit	fbef6a	`integer overflows:`
Packit	fbef6a
Packit	fbef6a	`Let x = sign * m * 2^(k*e) where m is an integer`
Packit	fbef6a
Packit	fbef6a	`with 2^(k(n-1)) <= m < 2^(kn) where n = PREC(y)`
Packit	fbef6a
Packit	fbef6a	`and m = s^k + t where 0 <= t and m < (s+1)^k`
Packit	fbef6a
Packit	fbef6a	`we want that s has n bits i.e. s >= 2^(n-1), or m >= 2^(k*(n-1))`
Packit	fbef6a	`i.e. m must have at least k*(n-1)+1 bits`
Packit	fbef6a
Packit	fbef6a	`then, not taking into account the sign, the result will be`
Packit	fbef6a	`x^(1/k) = s * 2^e or (s+1) * 2^e according to the rounding mode.`
Packit	fbef6a	`*/`
Packit	fbef6a
Packit	fbef6a	`static int`
Packit	fbef6a	`mpfr_root_aux (mpfr_ptr y, mpfr_srcptr x, unsigned long k,`
Packit	fbef6a	`mpfr_rnd_t rnd_mode);`
Packit	fbef6a
Packit	fbef6a	`int`
Packit	fbef6a	`mpfr_root (mpfr_ptr y, mpfr_srcptr x, unsigned long k, mpfr_rnd_t rnd_mode)`
Packit	fbef6a	`{`
Packit	fbef6a	`mpz_t m;`
Packit	fbef6a	`mpfr_exp_t e, r, sh, f;`
Packit	fbef6a	`mpfr_prec_t n, size_m, tmp;`
Packit	fbef6a	`int inexact, negative;`
Packit	fbef6a	`MPFR_SAVE_EXPO_DECL (expo);`
Packit	fbef6a
Packit	fbef6a	`MPFR_LOG_FUNC`
Packit	fbef6a	`(("x[%Pu]=%.*Rg k=%lu rnd=%d",`
Packit	fbef6a	`mpfr_get_prec (x), mpfr_log_prec, x, k, rnd_mode),`
Packit	fbef6a	`("y[%Pu]=%.*Rg inexact=%d",`
Packit	fbef6a	`mpfr_get_prec (y), mpfr_log_prec, y, inexact));`
Packit	fbef6a
Packit	fbef6a	`if (MPFR_UNLIKELY (k <= 1))`
Packit	fbef6a	`{`
Packit	fbef6a	`if (k == 0)`
Packit	fbef6a	`{`
Packit	fbef6a	`MPFR_SET_NAN (y);`
Packit	fbef6a	`MPFR_RET_NAN;`
Packit	fbef6a	`}`
Packit	fbef6a	`else /* y = x^(1/1) = x */`
Packit	fbef6a	`return mpfr_set (y, x, rnd_mode);`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`/* Singular values */`
Packit	fbef6a	`if (MPFR_UNLIKELY (MPFR_IS_SINGULAR (x)))`
Packit	fbef6a	`{`
Packit	fbef6a	`if (MPFR_IS_NAN (x))`
Packit	fbef6a	`{`
Packit	fbef6a	`MPFR_SET_NAN (y); /* NaN^(1/k) = NaN */`
Packit	fbef6a	`MPFR_RET_NAN;`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`if (MPFR_IS_INF (x)) /* +Inf^(1/k) = +Inf`
Packit	fbef6a	`-Inf^(1/k) = -Inf if k odd`
Packit	fbef6a	`-Inf^(1/k) = NaN if k even */`
Packit	fbef6a	`{`
Packit	fbef6a	`if (MPFR_IS_NEG(x) && (k % 2 == 0))`
Packit	fbef6a	`{`
Packit	fbef6a	`MPFR_SET_NAN (y);`
Packit	fbef6a	`MPFR_RET_NAN;`
Packit	fbef6a	`}`
Packit	fbef6a	`MPFR_SET_INF (y);`
Packit	fbef6a	`}`
Packit	fbef6a	`else /* x is necessarily 0: (+0)^(1/k) = +0`
Packit	fbef6a	`(-0)^(1/k) = -0 */`
Packit	fbef6a	`{`
Packit	fbef6a	`MPFR_ASSERTD (MPFR_IS_ZERO (x));`
Packit	fbef6a	`MPFR_SET_ZERO (y);`
Packit	fbef6a	`}`
Packit	fbef6a	`MPFR_SET_SAME_SIGN (y, x);`
Packit	fbef6a	`MPFR_RET (0);`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`/* Returns NAN for x < 0 and k even */`
Packit	fbef6a	`if (MPFR_UNLIKELY (MPFR_IS_NEG (x) && (k % 2 == 0)))`
Packit	fbef6a	`{`
Packit	fbef6a	`MPFR_SET_NAN (y);`
Packit	fbef6a	`MPFR_RET_NAN;`
Packit	fbef6a	`}`
Packit	fbef6a
Packit Service	f62a41	`/* Special case \|x\| = 1. Note that if x = -1, then k is odd`
Packit Service	f62a41	`(NaN results have already been filtered), so that y = -1. */`
Packit Service	f62a41	`if (mpfr_cmpabs (x, __gmpfr_one) == 0)`
Packit Service	f62a41	`return mpfr_set (y, x, rnd_mode);`
Packit Service	f62a41
Packit	fbef6a	`/* General case */`
Packit	fbef6a
Packit	fbef6a	`/* For large k, use exp(log(x)/k). The threshold of 100 seems to be quite`
Packit	fbef6a	`good when the precision goes to infinity. */`
Packit	fbef6a	`if (k > 100)`
Packit	fbef6a	`return mpfr_root_aux (y, x, k, rnd_mode);`
Packit	fbef6a
Packit	fbef6a	`MPFR_SAVE_EXPO_MARK (expo);`
Packit	fbef6a	`mpz_init (m);`
Packit	fbef6a
Packit	fbef6a	`e = mpfr_get_z_2exp (m, x); /* x = m * 2^e */`
Packit	fbef6a	`if ((negative = MPFR_IS_NEG(x)))`
Packit	fbef6a	`mpz_neg (m, m);`
Packit	fbef6a	`r = e % (mpfr_exp_t) k;`
Packit	fbef6a	`if (r < 0)`
Packit	fbef6a	`r += k; /* now r = e (mod k) with 0 <= r < k */`
Packit	fbef6a	`MPFR_ASSERTD (0 <= r && r < k);`
Packit	fbef6a	`/* x = (m2^r) 2^(e-r) where e-r is a multiple of k */`
Packit	fbef6a
Packit	fbef6a	`MPFR_MPZ_SIZEINBASE2 (size_m, m);`
Packit	fbef6a	`/* for rounding to nearest, we want the round bit to be in the root */`
Packit	fbef6a	`n = MPFR_PREC (y) + (rnd_mode == MPFR_RNDN);`
Packit	fbef6a
Packit	fbef6a	`/* we now multiply m by 2^sh so that root(m,k) will give`
Packit	fbef6a	`exactly n bits: we want k(n-1)+1 <= size_m + sh <= kn`
Packit	fbef6a	`i.e. sh = kf + r with f = max(floor((kn-size_m-r)/k),0) */`
Packit	fbef6a	`if ((mpfr_exp_t) size_m + r >= k * (mpfr_exp_t) n)`
Packit	fbef6a	`f = 0; /* we already have too many bits */`
Packit	fbef6a	`else`
Packit	fbef6a	`f = (k * (mpfr_exp_t) n - (mpfr_exp_t) size_m - r) / k;`
Packit	fbef6a	`sh = k * f + r;`
Packit	fbef6a	`mpz_mul_2exp (m, m, sh);`
Packit	fbef6a	`e = e - sh;`
Packit	fbef6a
Packit	fbef6a	`/* invariant: x = m2^e, with e divisible by k /`
Packit	fbef6a
Packit	fbef6a	`/* we reuse the variable m to store the kth root, since it is not needed`
Packit	fbef6a	`any more: we just need to know if the root is exact */`
Packit	fbef6a	`inexact = mpz_root (m, m, k) == 0;`
Packit	fbef6a
Packit	fbef6a	`MPFR_MPZ_SIZEINBASE2 (tmp, m);`
Packit	fbef6a	`sh = tmp - n;`
Packit	fbef6a	`if (sh > 0) /* we have to flush to 0 the last sh bits from m */`
Packit	fbef6a	`{`
Packit	fbef6a	`inexact = inexact \|\| ((mpfr_exp_t) mpz_scan1 (m, 0) < sh);`
Packit	fbef6a	`mpz_fdiv_q_2exp (m, m, sh);`
Packit	fbef6a	`e += k * sh;`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`if (inexact)`
Packit	fbef6a	`{`
Packit	fbef6a	`if (negative)`
Packit	fbef6a	`rnd_mode = MPFR_INVERT_RND (rnd_mode);`
Packit	fbef6a	`if (rnd_mode == MPFR_RNDU \|\| rnd_mode == MPFR_RNDA`
Packit	fbef6a	`\|\| (rnd_mode == MPFR_RNDN && mpz_tstbit (m, 0)))`
Packit	fbef6a	`inexact = 1, mpz_add_ui (m, m, 1);`
Packit	fbef6a	`else`
Packit	fbef6a	`inexact = -1;`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`/* either inexact is not zero, and the conversion is exact, i.e. inexact`
Packit	fbef6a	`is not changed; or inexact=0, and inexact is set only when`
Packit	fbef6a	`rnd_mode=MPFR_RNDN and bit (n+1) from m is 1 */`
Packit	fbef6a	`inexact += mpfr_set_z (y, m, MPFR_RNDN);`
Packit	fbef6a	`MPFR_SET_EXP (y, MPFR_GET_EXP (y) + e / (mpfr_exp_t) k);`
Packit	fbef6a
Packit	fbef6a	`if (negative)`
Packit	fbef6a	`{`
Packit	fbef6a	`MPFR_CHANGE_SIGN (y);`
Packit	fbef6a	`inexact = -inexact;`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`mpz_clear (m);`
Packit	fbef6a	`MPFR_SAVE_EXPO_FREE (expo);`
Packit	fbef6a	`return mpfr_check_range (y, inexact, rnd_mode);`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`/* Compute y <- x^(1/k) using exp(log(x)/k).`
Packit	fbef6a	`Assume all special cases have been eliminated before.`
Packit	fbef6a	`In the extended exponent range, overflows/underflows are not possible.`
Packit	fbef6a	`Assume x > 0, or x < 0 and k odd.`
Packit Service	f62a41	`Also assume \|x\| <> 1 because log(1) = 0, which does not have an exponent`
Packit Service	f62a41	`and would yield a failure in the error bound computation. A priori, this`
Packit Service	f62a41	`constraint is quite artificial because if \|x\| is close enough to 1, then`
Packit Service	f62a41	`the exponent of log\|x\| does not need to be used (in the code, err would`
Packit Service	f62a41	`be 1 in such a domain). So this constraint \|x\| <> 1 could be avoided in`
Packit Service	f62a41	`the code. However, this is an exact case easy to detect, so that such a`
Packit Service	f62a41	`change would be useless. Values very close to 1 are not an issue, since`
Packit Service	f62a41	`an underflow is not possible before the MPFR_GET_EXP.`
Packit	fbef6a	`*/`
Packit	fbef6a	`static int`
Packit	fbef6a	`mpfr_root_aux (mpfr_ptr y, mpfr_srcptr x, unsigned long k, mpfr_rnd_t rnd_mode)`
Packit	fbef6a	`{`
Packit	fbef6a	`int inexact, exact_root = 0;`
Packit	fbef6a	`mpfr_prec_t w; /* working precision */`
Packit	fbef6a	`mpfr_t absx, t;`
Packit	fbef6a	`MPFR_GROUP_DECL(group);`
Packit	fbef6a	`MPFR_TMP_DECL(marker);`
Packit	fbef6a	`MPFR_ZIV_DECL(loop);`
Packit	fbef6a	`MPFR_SAVE_EXPO_DECL (expo);`
Packit	fbef6a
Packit	fbef6a	`MPFR_TMP_INIT_ABS (absx, x);`
Packit	fbef6a
Packit	fbef6a	`MPFR_TMP_MARK(marker);`
Packit	fbef6a	`w = MPFR_PREC(y) + 10;`
Packit	fbef6a	`/* Take some guard bits to prepare for the 'expt' lost bits below.`
Packit	fbef6a	`If \|x\| < 2^k, then log\|x\| < k, thus taking log2(k) bits should be fine. */`
Packit	fbef6a	`if (MPFR_GET_EXP(x) > 0)`
Packit	fbef6a	`w += MPFR_INT_CEIL_LOG2 (MPFR_GET_EXP(x));`
Packit	fbef6a	`MPFR_GROUP_INIT_1(group, w, t);`
Packit	fbef6a	`MPFR_SAVE_EXPO_MARK (expo);`
Packit	fbef6a	`MPFR_ZIV_INIT (loop, w);`
Packit	fbef6a	`for (;;)`
Packit	fbef6a	`{`
Packit	fbef6a	`mpfr_exp_t expt;`
Packit	fbef6a	`unsigned int err;`
Packit	fbef6a
Packit	fbef6a	`mpfr_log (t, absx, MPFR_RNDN);`
Packit	fbef6a	`/* t = log\|x\| * (1 + theta) with \|theta\| <= 2^(-w) */`
Packit	fbef6a	`mpfr_div_ui (t, t, k, MPFR_RNDN);`
Packit Service	f62a41	`/* No possible underflow in mpfr_log and mpfr_div_ui. */`
Packit Service	f62a41	`expt = MPFR_GET_EXP (t); /* assumes t <> 0 */`
Packit	fbef6a	`/* t = log\|x\|/k * (1 + theta) + eps with \|theta\| <= 2^(-w)`
Packit	fbef6a	`and \|eps\| <= 1/2 ulp(t), thus the total error is bounded`
Packit	fbef6a	`by 1.5 * 2^(expt - w) */`
Packit	fbef6a	`mpfr_exp (t, t, MPFR_RNDN);`
Packit	fbef6a	`/* t = \|x\|^(1/k) * exp(tau) * (1 + theta1) with`
Packit	fbef6a	`\|tau\| <= 1.5 * 2^(expt - w) and \|theta1\| <= 2^(-w).`
Packit	fbef6a	`For \|tau\| <= 0.5 we have \|exp(tau)-1\| < 4/3*tau, thus`
Packit	fbef6a	`for w >= expt + 2 we have:`
Packit	fbef6a	`t = \|x\|^(1/k) * (1 + 2^(expt+2)theta2) (1 + theta1) with`
Packit	fbef6a	`\|theta1\|, \|theta2\| <= 2^(-w).`
Packit	fbef6a	`If expt+2 > 0, as long as w >= 1, we have:`
Packit	fbef6a	`t = \|x\|^(1/k) * (1 + 2^(expt+3)*theta3) with \|theta3\| < 2^(-w).`
Packit	fbef6a	`For expt+2 = 0, we have:`
Packit	fbef6a	`t = \|x\|^(1/k) * (1 + 2^2*theta3) with \|theta3\| < 2^(-w).`
Packit	fbef6a	`Finally for expt+2 < 0 we have:`
Packit	fbef6a	`t = \|x\|^(1/k) * (1 + 2*theta3) with \|theta3\| < 2^(-w).`
Packit	fbef6a	`*/`
Packit	fbef6a	`err = (expt + 2 > 0) ? expt + 3`
Packit	fbef6a	`: (expt + 2 == 0) ? 2 : 1;`
Packit	fbef6a	`/* now t = \|x\|^(1/k) * (1 + 2^(err-w)) thus the error is at most`
Packit	fbef6a	`2^(EXP(t) - w + err) */`
Packit	fbef6a	`if (MPFR_LIKELY (MPFR_CAN_ROUND(t, w - err, MPFR_PREC(y), rnd_mode)))`
Packit	fbef6a	`break;`
Packit	fbef6a
Packit	fbef6a	`/* If we fail to round correctly, check for an exact result or a`
Packit	fbef6a	`midpoint result with MPFR_RNDN (regarded as hard-to-round in`
Packit	fbef6a	`all precisions in order to determine the ternary value). */`
Packit	fbef6a	`{`
Packit	fbef6a	`mpfr_t z, zk;`
Packit	fbef6a
Packit	fbef6a	`mpfr_init2 (z, MPFR_PREC(y) + (rnd_mode == MPFR_RNDN));`
Packit	fbef6a	`mpfr_init2 (zk, MPFR_PREC(x));`
Packit	fbef6a	`mpfr_set (z, t, MPFR_RNDN);`
Packit	fbef6a	`inexact = mpfr_pow_ui (zk, z, k, MPFR_RNDN);`
Packit	fbef6a	`exact_root = !inexact && mpfr_equal_p (zk, absx);`
Packit	fbef6a	`if (exact_root) /* z is the exact root, thus round z directly */`
Packit	fbef6a	`inexact = mpfr_set4 (y, z, rnd_mode, MPFR_SIGN (x));`
Packit	fbef6a	`mpfr_clear (zk);`
Packit	fbef6a	`mpfr_clear (z);`
Packit	fbef6a	`if (exact_root)`
Packit	fbef6a	`break;`
Packit	fbef6a	`}`
Packit	fbef6a
Packit	fbef6a	`MPFR_ZIV_NEXT (loop, w);`
Packit	fbef6a	`MPFR_GROUP_REPREC_1(group, w, t);`
Packit	fbef6a	`}`
Packit	fbef6a	`MPFR_ZIV_FREE (loop);`
Packit	fbef6a
Packit	fbef6a	`if (!exact_root)`
Packit	fbef6a	`inexact = mpfr_set4 (y, t, rnd_mode, MPFR_SIGN (x));`
Packit	fbef6a
Packit	fbef6a	`MPFR_GROUP_CLEAR(group);`
Packit	fbef6a	`MPFR_TMP_FREE(marker);`
Packit	fbef6a	`MPFR_SAVE_EXPO_FREE (expo);`
Packit	fbef6a
Packit	fbef6a	`return mpfr_check_range (y, inexact, rnd_mode);`
Packit	fbef6a	`}`

source-git / mpfr

Source Code

Blame src/root.c