mpfr/src/sqr.c

/* mpfr_sqr -- Floating square

Copyright 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013 Free Software Foundation, Inc.
Contributed by the AriC and Caramel projects, INRIA.

This file is part of the GNU MPFR Library.

The GNU MPFR Library is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License as published by
the Free Software Foundation; either version 3 of the License, or (at your
option) any later version.

The GNU MPFR Library is distributed in the hope that it will be useful, but
WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Lesser General Public
License for more details.

You should have received a copy of the GNU Lesser General Public License
along with the GNU MPFR Library; see the file COPYING.LESSER.  If not, see
http://www.gnu.org/licenses/ or write to the Free Software Foundation, Inc.,
51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA. */
268835Sbr
268977Sbr#include "mpfr-impl.h"
277644Sbr
277644Sbrint
277644Sbrmpfr_sqr (mpfr_ptr a, mpfr_srcptr b, mpfr_rnd_t rnd_mode)
257483Sian{
292571Sgonzo  int cc, inexact;
292571Sgonzo  mpfr_exp_t ax;
292571Sgonzo  mp_limb_t *tmp;
292574Sgonzo  mp_limb_t b1;
292574Sgonzo  mpfr_prec_t bq;
257483Sian  mp_size_t bn, tn;
257483Sian  MPFR_TMP_DECL(marker);
257483Sian
314510Sian  MPFR_LOG_FUNC
257483Sian    (("x[%Pu]=%.*Rg rnd=%d", mpfr_get_prec (b), mpfr_log_prec, b, rnd_mode),
257483Sian     ("y[%Pu]=%.*Rg inexact=%d",
257483Sian      mpfr_get_prec (a), mpfr_log_prec, a, inexact));
257483Sian
257483Sian  /* deal with special cases */
257483Sian  if (MPFR_UNLIKELY(MPFR_IS_SINGULAR(b)))
257483Sian    {
257483Sian      if (MPFR_IS_NAN(b))
257483Sian        {
257483Sian          MPFR_SET_NAN(a);
257483Sian          MPFR_RET_NAN;
257483Sian        }
257483Sian      MPFR_SET_POS (a);
257483Sian      if (MPFR_IS_INF(b))
257483Sian        MPFR_SET_INF(a);
257483Sian      else
257483Sian        ( MPFR_ASSERTD(MPFR_IS_ZERO(b)), MPFR_SET_ZERO(a) );
257483Sian      MPFR_RET(0);
257483Sian    }
277644Sbr  ax = 2 * MPFR_GET_EXP (b);
277644Sbr  bq = MPFR_PREC(b);
277644Sbr
277644Sbr  MPFR_ASSERTN (2 * (mpfr_uprec_t) bq <= MPFR_PREC_MAX);
277644Sbr
277644Sbr  bn = MPFR_LIMB_SIZE (b); /* number of limbs of b */
277644Sbr  tn = MPFR_PREC2LIMBS (2 * bq); /* number of limbs of square,
277644Sbr                                    2*bn or 2*bn-1 */
277644Sbr
277644Sbr  if (MPFR_UNLIKELY(bn > MPFR_SQR_THRESHOLD))
277644Sbr    return mpfr_mul (a, b, b, rnd_mode);
277644Sbr
277644Sbr  MPFR_TMP_MARK(marker);
277644Sbr  tmp = MPFR_TMP_LIMBS_ALLOC (2 * bn);
277644Sbr
277644Sbr  /* Multiplies the mantissa in temporary allocated space */
  mpn_sqr_n (tmp, MPFR_MANT(b), bn);
  b1 = tmp[2 * bn - 1];

  /* now tmp[0]..tmp[2*bn-1] contains the product of both mantissa,
     with tmp[2*bn-1]>=2^(GMP_NUMB_BITS-2) */
  b1 >>= GMP_NUMB_BITS - 1; /* msb from the product */

  /* if the mantissas of b and c are uniformly distributed in ]1/2, 1],
     then their product is in ]1/4, 1/2] with probability 2*ln(2)-1 ~ 0.386
     and in [1/2, 1] with probability 2-2*ln(2) ~ 0.614 */
  tmp += 2 * bn - tn; /* +0 or +1 */
  if (MPFR_UNLIKELY(b1 == 0))
    mpn_lshift (tmp, tmp, tn, 1); /* tn <= k, so no stack corruption */

  cc = mpfr_round_raw (MPFR_MANT (a), tmp, 2 * bq, 0,
                       MPFR_PREC (a), rnd_mode, &inexact);
  /* cc = 1 ==> result is a power of two */
  if (MPFR_UNLIKELY(cc))
    MPFR_MANT(a)[MPFR_LIMB_SIZE(a)-1] = MPFR_LIMB_HIGHBIT;

  MPFR_TMP_FREE(marker);
  {
    mpfr_exp_t ax2 = ax + (mpfr_exp_t) (b1 - 1 + cc);
    if (MPFR_UNLIKELY( ax2 > __gmpfr_emax))
      return mpfr_overflow (a, rnd_mode, MPFR_SIGN_POS);
    if (MPFR_UNLIKELY( ax2 < __gmpfr_emin))
      {
        /* In the rounding to the nearest mode, if the exponent of the exact
           result (i.e. before rounding, i.e. without taking cc into account)
           is < __gmpfr_emin - 1 or the exact result is a power of 2 (i.e. if
           both arguments are powers of 2), then round to zero. */
        if (rnd_mode == MPFR_RNDN &&
            (ax + (mpfr_exp_t) b1 < __gmpfr_emin || mpfr_powerof2_raw (b)))
          rnd_mode = MPFR_RNDZ;
        return mpfr_underflow (a, rnd_mode, MPFR_SIGN_POS);
      }
    MPFR_SET_EXP (a, ax2);
    MPFR_SET_POS (a);
  }
  MPFR_RET (inexact);
}