src/math/cbrtl.c

/* origin: FreeBSD /usr/src/lib/msun/src/s_cbrtl.c */
/*-
 * ====================================================
 * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
 * Copyright (c) 2009-2011, Bruce D. Evans, Steven G. Kargl, David Schultz.
 *
 * Developed at SunPro, a Sun Microsystems, Inc. business.
 * Permission to use, copy, modify, and distribute this
 * software is freely granted, provided that this notice
 * is preserved.
 * ====================================================
 *
 * The argument reduction and testing for exceptional cases was
 * written by Steven G. Kargl with input from Bruce D. Evans
 * and David A. Schultz.
 */
33965Sjdp
33965Sjdp#include "libm.h"
33965Sjdp
33965Sjdp#if LDBL_MANT_DIG == 53 && LDBL_MAX_EXP == 1024
33965Sjdplong double cbrtl(long double x)
33965Sjdp{
33965Sjdp	return cbrt(x);
33965Sjdp}
218822Sdim#elif (LDBL_MANT_DIG == 64 || LDBL_MANT_DIG == 113) && LDBL_MAX_EXP == 16384
/*
 * Bias added to (float bit pattern)/3 to form the initial cube-root
 * estimate in cbrtl().
 * B1 = (127-127.0/3-0.03306235651)*2**23
 */
static const unsigned B1 = 709958130;
218822Sdim
33965Sjdplong double cbrtl(long double x)
33965Sjdp{
33965Sjdp	union ldshape u = {x}, v;
33965Sjdp	union {float f; uint32_t i;} uft;
33965Sjdp	long double r, s, t, w;
218822Sdim	double_t dr, dt, dx;
89857Sobrien	float_t ft;
89857Sobrien	int e = u.i.se & 0x7fff;
60484Sobrien	int sign = u.i.se & 0x8000;
33965Sjdp
33965Sjdp	/*
33965Sjdp	 * If x = +-Inf, then cbrt(x) = +-Inf.
33965Sjdp	 * If x = NaN, then cbrt(x) = NaN.
33965Sjdp	 */
33965Sjdp	if (e == 0x7fff)
33965Sjdp		return x + x;
33965Sjdp	if (e == 0) {
33965Sjdp		/* Adjust subnormal numbers. */
33965Sjdp		u.f *= 0x1p120;
33965Sjdp		e = u.i.se & 0x7fff;
33965Sjdp		/* If x = +-0, then cbrt(x) = +-0. */
33965Sjdp		if (e == 0)
33965Sjdp			return x;
33965Sjdp		e -= 120;
33965Sjdp	}
33965Sjdp	e -= 0x3fff;
33965Sjdp	u.i.se = 0x3fff;
33965Sjdp	x = u.f;
33965Sjdp	switch (e % 3) {
68765Sobrien	case 1:
33965Sjdp	case -2:
68765Sobrien		x *= 2;
68765Sobrien		e--;
68765Sobrien		break;
68765Sobrien	case 2:
68765Sobrien	case -1:
68765Sobrien		x *= 4;
68765Sobrien		e -= 2;
77298Sobrien		break;
77298Sobrien	}
77298Sobrien	v.f = 1.0;
68765Sobrien	v.i.se = sign | (0x3fff + e/3);
77298Sobrien
77298Sobrien	/*
77298Sobrien	 * The following is the guts of s_cbrtf, with the handling of
77298Sobrien	 * special values removed and extra care for accuracy not taken,
77298Sobrien	 * but with most of the extra accuracy not discarded.
218822Sdim	 */
77298Sobrien
77298Sobrien	/* ~5-bit estimate: */
77298Sobrien	uft.f = x;
77298Sobrien	uft.i = (uft.i & 0x7fffffff)/3 + B1;
77298Sobrien	ft = uft.f;
68765Sobrien
68765Sobrien	/* ~16-bit estimate: */
68765Sobrien	dx = x;
68765Sobrien	dt = ft;
68765Sobrien	dr = dt * dt * dt;
77298Sobrien	dt = dt * (dx + dx + dr) / (dx + dr + dr);
77298Sobrien
218822Sdim	/* ~47-bit estimate: */
77298Sobrien	dr = dt * dt * dt;
218822Sdim	dt = dt * (dx + dx + dr) / (dx + dr + dr);
68765Sobrien
218822Sdim#if LDBL_MANT_DIG == 64
68765Sobrien	/*
68765Sobrien	 * dt is cbrtl(x) to ~47 bits (after x has been reduced to 1 <= x < 8).
68765Sobrien	 * Round it away from zero to 32 bits (32 so that t*t is exact, and
68765Sobrien	 * away from zero for technical reasons).
68765Sobrien	 */
77298Sobrien	t = dt + (0x1.0p32L + 0x1.0p-31L) - 0x1.0p32;
68765Sobrien#elif LDBL_MANT_DIG == 113
68765Sobrien	/*
68765Sobrien	 * Round dt away from zero to 47 bits.  Since we don't trust the 47,
68765Sobrien	 * add 2 47-bit ulps instead of 1 to round up.  Rounding is slow and
68765Sobrien	 * might be avoidable in this case, since on most machines dt will
218822Sdim	 * have been evaluated in 53-bit precision and the technical reasons
68765Sobrien	 * for rounding up might not apply to either case in cbrtl() since
68765Sobrien	 * dt is much more accurate than needed.
68765Sobrien	 */
68765Sobrien	t = dt + 0x2.0p-46 + 0x1.0p60L - 0x1.0p60;
68765Sobrien#endif
68765Sobrien
68765Sobrien	/*
68765Sobrien	 * Final step Newton iteration to 64 or 113 bits with
68765Sobrien	 * error < 0.667 ulps
68765Sobrien	 */
68765Sobrien	s = t*t;         /* t*t is exact */
68765Sobrien	r = x/s;         /* error <= 0.5 ulps; |r| < |t| */
33965Sjdp	w = t+t;         /* t+t is exact */
33965Sjdp	r = (r-t)/(w+r); /* r-t is exact; w+r ~= 3*t */
33965Sjdp	t = t+t*r;       /* error <= 0.5 + 0.5/3 + epsilon */
33965Sjdp
33965Sjdp	t *= v.f;
33965Sjdp	return t;
218822Sdim}
218822Sdim#endif
218822Sdim