config/rs6000/darwin-ldouble.c

75295Sdes/* 128-bit long double support routines for Darwin.
75295Sdes   Copyright (C) 1993, 2003, 2004 Free Software Foundation, Inc.
75295Sdes
75295SdesThis file is part of GCC.
75295Sdes
75295SdesGCC is free software; you can redistribute it and/or modify it under
75295Sdesthe terms of the GNU General Public License as published by the Free
75295SdesSoftware Foundation; either version 2, or (at your option) any later
75295Sdesversion.
75295Sdes
75295SdesIn addition to the permissions in the GNU General Public License, the
75295SdesFree Software Foundation gives you unlimited permission to link the
75295Sdescompiled version of this file into combinations with other programs,
75295Sdesand to distribute those combinations without any restriction coming
75295Sdesfrom the use of this file.  (The General Public License restrictions
75295Sdesdo apply in other respects; for example, they cover modification of
75295Sdesthe file, and distribution when not linked into a combine
75295Sdesexecutable.)
75295Sdes
75295SdesGCC is distributed in the hope that it will be useful, but WITHOUT ANY
75295SdesWARRANTY; without even the implied warranty of MERCHANTABILITY or
75295SdesFITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
75295Sdesfor more details.
75295Sdes
75295SdesYou should have received a copy of the GNU General Public License
75295Sdesalong with GCC; see the file COPYING.  If not, write to the Free
75295SdesSoftware Foundation, 59 Temple Place - Suite 330, Boston, MA
75295Sdes02111-1307, USA.  */
75295Sdes
/* Implementations of floating-point long double basic arithmetic
   functions called by the IBM C compiler when generating code for
   PowerPC platforms.  In particular, the following functions are
   implemented: _xlqadd, _xlqsub, _xlqmul, and _xlqdiv.  Double-double
   algorithms are based on the paper "Doubled-Precision IEEE Standard
   754 Floating-Point Arithmetic" by W. Kahan, February 26, 1987.  An
   alternative published reference is "Software for Doubled-Precision
   Floating-Point Computations", by Seppo Linnainmaa, ACM TOMS vol 7
   no 3, September 1981, pages 272-283.  */
75295Sdes
75295Sdes/* Each long double is made up of two IEEE doubles.  The value of the
75295Sdes   long double is the sum of the values of the two parts.  The most
75295Sdes   significant part is required to be the value of the long double
75295Sdes   rounded to the nearest double, as specified by IEEE.  For Inf
77998Sdes   values, the least significant part is required to be one of +0.0 or
75295Sdes   -0.0.  No other requirements are made; so, for example, 1.0 may be
75295Sdes   represented as (1.0, +0.0) or (1.0, -0.0), and the low part of a
84246Sdes   NaN is don't-care.
84246Sdes
75295Sdes   This code currently assumes big-endian.  */
75295Sdes
75295Sdes#if !_SOFT_FLOAT && (defined (__MACH__) || defined (__powerpc64__))
75295Sdes
/* Overlay used to assemble a long double from its two double halves.
   The routines below store the leading (most significant) double in
   dval[0] and the trailing correction in dval[1].  */
typedef union
{
  long double ldval;
  double dval[2];
} longDblUnion;

/* Positive infinity, produced by dividing by zero at compile time.  */
static const double FPKINF = 1.0 / 0.0;

/* Use the compiler builtin for absolute value rather than a library
   call.  */
#define fabs(val) __builtin_fabs(val)

/* Branch-prediction hint: EXPR is expected to be false.  */
#define unlikely(expr) __builtin_expect ((expr), 0)

/* Conceptually each routine takes two long doubles, but each operand
   is passed as its two component doubles (high part, low part)
   because GCC currently generates poor code when a union is used to
   split a long double into a pair of doubles.  */

extern long double _xlqadd (double a, double b, double c, double d);
extern long double _xlqsub (double a, double b, double c, double d);
extern long double _xlqmul (double a, double b, double c, double d);
extern long double _xlqdiv (double a, double b, double c, double d);
75295Sdes
75295Sdes/* Add two 'long double' values and return the result.	*/
75295Sdeslong double
75295Sdes_xlqadd (double a, double b, double c, double d)
75295Sdes{
75295Sdes  longDblUnion z;
75295Sdes  double t, tau, u, FPR_zero, FPR_PosInf;
75295Sdes
84246Sdes  FPR_zero = 0.0;
84246Sdes  FPR_PosInf = FPKINF;
84246Sdes
75295Sdes  if (unlikely (a != a) || unlikely (c != c))
75295Sdes    return a + c;  /* NaN result.  */
75295Sdes
75295Sdes  /* Ordered operands are arranged in order of their magnitudes.  */
75295Sdes
75295Sdes  /* Switch inputs if |(c,d)| > |(a,b)|. */
75295Sdes  if (fabs (c) > fabs (a))
75295Sdes    {
84246Sdes      t = a;
84386Sdes      tau = b;
84386Sdes      a = c;
84386Sdes      b = d;
75295Sdes      c = t;
75295Sdes      d = tau;
75295Sdes    }
75295Sdes
75295Sdes  /* b <- second largest magnitude double. */
75295Sdes  if (fabs (c) > fabs (b))
75295Sdes    {
77998Sdes      t = b;
77998Sdes      b = c;
75295Sdes      c = t;
77998Sdes    }
75295Sdes
88234Sdillon  /* Thanks to commutivity, sum is invariant w.r.t. the next
88234Sdillon     conditional exchange. */
88234Sdillon  tau = d + c;
88234Sdillon
88234Sdillon  /* Order the smallest magnitude doubles.  */
75295Sdes  if (fabs (d) > fabs (c))
84246Sdes    {
77998Sdes      t = c;
84246Sdes      c = d;
75295Sdes      d = t;
84246Sdes    }
75295Sdes
88234Sdillon  t = (tau + b) + a;	     /* Sum values in ascending magnitude order.  */
88234Sdillon
75295Sdes  /* Infinite or zero result.  */
75295Sdes  if (unlikely (t == FPR_zero) || unlikely (fabs (t) == FPR_PosInf))
77998Sdes    return t;
77998Sdes
77998Sdes  /* Usual case.  */
77998Sdes  tau = (((a-t) + b) + c) + d;
77998Sdes  u = t + tau;
75295Sdes  z.dval[0] = u;	       /* Final fixup for long double result.  */
75295Sdes  z.dval[1] = (t - u) + tau;
75295Sdes  return z.ldval;
77998Sdes}
84246Sdes
/* Subtract the long double (C, D) from the long double (A, B) and
   return the result.  Implemented by negating both halves of the
   second operand and handing the work to _xlqadd.  */
long double
_xlqsub (double a, double b, double c, double d)
{
  const double neg_hi = -c;
  const double neg_lo = -d;

  return _xlqadd (a, b, neg_hi, neg_lo);
}
77998Sdes
77998Sdeslong double
75295Sdes_xlqmul (double a, double b, double c, double d)
75295Sdes{
75295Sdes  longDblUnion z;
75295Sdes  double t, tau, u, v, w, FPR_zero, FPR_PosInf;
75295Sdes
75295Sdes  FPR_zero = 0.0;
84246Sdes  FPR_PosInf = FPKINF;
75295Sdes
75295Sdes  t = a * c;			/* Highest order double term.  */
75295Sdes
77998Sdes  if (unlikely (t != t) || unlikely (t == FPR_zero)
75295Sdes      || unlikely (fabs (t) == FPR_PosInf))
75295Sdes    return t;
75295Sdes
75295Sdes  /* Finite nonzero result requires summing of terms of two highest
75295Sdes     orders.	*/
75295Sdes
75295Sdes  /* Use fused multiply-add to get low part of a * c.	 */
75295Sdes  asm ("fmsub %0,%1,%2,%3" : "=f"(tau) : "f"(a), "f"(c), "f"(t));
77998Sdes  v = a*d;
77998Sdes  w = b*c;
75295Sdes  tau += v + w;	    /* Add in other second-order terms.	 */
75295Sdes  u = t + tau;
75295Sdes
84246Sdes  /* Construct long double result.  */
77998Sdes  z.dval[0] = u;
84246Sdes  z.dval[1] = (t - u) + tau;
84246Sdes  return z.ldval;
84246Sdes}
84246Sdes
84246Sdeslong double
75295Sdes_xlqdiv (double a, double b, double c, double d)
75295Sdes{
75295Sdes  longDblUnion z;
75295Sdes  double s, sigma, t, tau, u, v, w, FPR_zero, FPR_PosInf;
75295Sdes
75295Sdes  FPR_zero = 0.0;
75295Sdes  FPR_PosInf = FPKINF;
75295Sdes
75295Sdes  t = a / c;                    /* highest order double term */
75295Sdes
77998Sdes  if (unlikely (t != t) || unlikely (t == FPR_zero)
88234Sdillon      || unlikely (fabs (t) == FPR_PosInf))
88234Sdillon    return t;
75295Sdes
75295Sdes  /* Finite nonzero result requires corrections to the highest order term.  */
84246Sdes
84246Sdes  s = c * t;                    /* (s,sigma) = c*t exactly. */
84246Sdes  w = -(-b + d * t);	/* Written to get fnmsub for speed, but not
84246Sdes			   numerically necessary.  */
84246Sdes
84246Sdes  /* Use fused multiply-add to get low part of c * t.	 */
77998Sdes  asm ("fmsub %0,%1,%2,%3" : "=f"(sigma) : "f"(c), "f"(t), "f"(s));
84246Sdes  v = a - s;
77998Sdes
84246Sdes  tau = ((v-sigma)+w)/c;   /* Correction to t. */
84246Sdes  u = t + tau;
77998Sdes
75295Sdes  /* Construct long double result. */
75295Sdes  z.dval[0] = u;
75295Sdes  z.dval[1] = (t - u) + tau;
84246Sdes  return z.ldval;
84246Sdes}
84246Sdes
84246Sdes#endif
84246Sdes