syscons/plasma/fp16.c

293034Sdes/*-
293034Sdes * Copyright (c) 2015 Dag-Erling Smørgrav
293034Sdes * All rights reserved.
293034Sdes *
293034Sdes * Redistribution and use in source and binary forms, with or without
293034Sdes * modification, are permitted provided that the following conditions
293034Sdes * are met:
293034Sdes * 1. Redistributions of source code must retain the above copyright
293034Sdes *    notice, this list of conditions and the following disclaimer.
293034Sdes * 2. Redistributions in binary form must reproduce the above copyright
293034Sdes *    notice, this list of conditions and the following disclaimer in the
293034Sdes *    documentation and/or other materials provided with the distribution.
293034Sdes *
293034Sdes * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
293034Sdes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
293034Sdes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
293034Sdes * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
293034Sdes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
293034Sdes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
293034Sdes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
293034Sdes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
293034Sdes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
293034Sdes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
293034Sdes * SUCH DAMAGE.
293034Sdes *
293034Sdes * $FreeBSD$
293034Sdes */
293034Sdes
293034Sdes#ifdef _KERNEL
293034Sdes#include <sys/libkern.h>
293034Sdes#else
293034Sdes#include <stdio.h>
293034Sdes#include <strings.h>
293034Sdes#endif
293034Sdes
293034Sdes#include "fp16.h"
293034Sdes
293034Sdes/*
293034Sdes * Compute the quare root of x, using Newton's method with 2^(log2(x)/2)
293034Sdes * as the initial estimate.
293034Sdes */
293034Sdesfp16_t
293034Sdesfp16_sqrt(fp16_t x)
293034Sdes{
293034Sdes	fp16_t y, delta;
293034Sdes	signed int log2x;
293034Sdes
293034Sdes	/* special case */
293034Sdes	if (x == 0)
293034Sdes		return (0);
293034Sdes
293034Sdes	/* shift toward 0 by half the logarithm */
293034Sdes	log2x = flsl(x) - 1;
293034Sdes	if (log2x >= 16) {
293034Sdes		y = x >> (log2x - 16) / 2;
293034Sdes	} else {
293034Sdes#if 0
293034Sdes		y = x << (16 - log2x) / 2;
293034Sdes#else
293034Sdes		/* XXX for now, return 0 for anything < 1 */
293034Sdes		return (0);
293034Sdes#endif
293034Sdes	}
293034Sdes	while (y > 0) {
293034Sdes		/* delta = y^2 / 2y */
293034Sdes		delta = fp16_div(fp16_sub(fp16_mul(y, y), x), y * 2);
293034Sdes		if (delta == 0)
293034Sdes			break;
293034Sdes		y = fp16_sub(y, delta);
293034Sdes	}
293034Sdes	return (y);
293034Sdes}
293034Sdes
293049Sdesstatic fp16_t fp16_sin_table[256] = {
293049Sdes	    0,	  402,	  804,	 1206,	 1608,	 2010,	 2412,	 2814,
293049Sdes	 3215,	 3617,	 4018,	 4420,	 4821,	 5222,	 5622,	 6023,
293049Sdes	 6423,	 6823,	 7223,	 7623,	 8022,	 8421,	 8819,	 9218,
293049Sdes	 9616,	10013,	10410,	10807,	11204,	11600,	11995,	12390,
293049Sdes	12785,	13179,	13573,	13966,	14359,	14751,	15142,	15533,
293049Sdes	15923,	16313,	16702,	17091,	17479,	17866,	18253,	18638,
293049Sdes	19024,	19408,	19792,	20175,	20557,	20938,	21319,	21699,
293049Sdes	22078,	22456,	22833,	23210,	23586,	23960,	24334,	24707,
293049Sdes	25079,	25450,	25820,	26189,	26557,	26925,	27291,	27656,
293049Sdes	28020,	28383,	28745,	29105,	29465,	29824,	30181,	30538,
293049Sdes	30893,	31247,	31600,	31952,	32302,	32651,	32999,	33346,
293049Sdes	33692,	34036,	34379,	34721,	35061,	35400,	35738,	36074,
293049Sdes	36409,	36743,	37075,	37406,	37736,	38064,	38390,	38716,
293049Sdes	39039,	39362,	39682,	40002,	40319,	40636,	40950,	41263,
293049Sdes	41575,	41885,	42194,	42501,	42806,	43110,	43412,	43712,
293049Sdes	44011,	44308,	44603,	44897,	45189,	45480,	45768,	46055,
293049Sdes	46340,	46624,	46906,	47186,	47464,	47740,	48015,	48288,
293049Sdes	48558,	48828,	49095,	49360,	49624,	49886,	50146,	50403,
293049Sdes	50660,	50914,	51166,	51416,	51665,	51911,	52155,	52398,
293049Sdes	52639,	52877,	53114,	53348,	53581,	53811,	54040,	54266,
293049Sdes	54491,	54713,	54933,	55152,	55368,	55582,	55794,	56004,
293049Sdes	56212,	56417,	56621,	56822,	57022,	57219,	57414,	57606,
293049Sdes	57797,	57986,	58172,	58356,	58538,	58718,	58895,	59070,
293049Sdes	59243,	59414,	59583,	59749,	59913,	60075,	60235,	60392,
293049Sdes	60547,	60700,	60850,	60998,	61144,	61288,	61429,	61568,
293049Sdes	61705,	61839,	61971,	62100,	62228,	62353,	62475,	62596,
293049Sdes	62714,	62829,	62942,	63053,	63162,	63268,	63371,	63473,
293049Sdes	63571,	63668,	63762,	63854,	63943,	64030,	64115,	64197,
293049Sdes	64276,	64353,	64428,	64501,	64571,	64638,	64703,	64766,
293049Sdes	64826,	64884,	64939,	64992,	65043,	65091,	65136,	65179,
293049Sdes	65220,	65258,	65294,	65327,	65358,	65386,	65412,	65436,
293049Sdes	65457,	65475,	65491,	65505,	65516,	65524,	65531,	65534,
293034Sdes};
293034Sdes
293034Sdes/*
293049Sdes * Compute the sine of theta.
293049Sdes */
293049Sdesfp16_t
293049Sdesfp16_sin(fp16_t theta)
293049Sdes{
293049Sdes	unsigned int i;
293049Sdes
293049Sdes	i = 1024 * (theta % FP16_2PI) / FP16_2PI;
293049Sdes	switch (i / 256) {
293049Sdes	case 0:
293049Sdes		return (fp16_sin_table[i % 256]);
293049Sdes	case 1:
293049Sdes		return (fp16_sin_table[255 - i % 256]);
293049Sdes	case 2:
293049Sdes		return (-fp16_sin_table[i % 256]);
293049Sdes	case 3:
293049Sdes		return (-fp16_sin_table[255 - i % 256]);
293049Sdes	default:
293049Sdes		/* inconceivable! */
293049Sdes		return (0);
293049Sdes	}
293049Sdes}
293049Sdes
293049Sdes/*
293034Sdes * Compute the cosine of theta.
293034Sdes */
293034Sdesfp16_t
293034Sdesfp16_cos(fp16_t theta)
293034Sdes{
293034Sdes	unsigned int i;
293034Sdes
293034Sdes	i = 1024 * (theta % FP16_2PI) / FP16_2PI;
293034Sdes	switch (i / 256) {
293034Sdes	case 0:
293049Sdes		return (fp16_sin_table[255 - i % 256]);
293034Sdes	case 1:
293049Sdes		return (-fp16_sin_table[i % 256]);
293034Sdes	case 2:
293049Sdes		return (-fp16_sin_table[255 - i % 256]);
293034Sdes	case 3:
293049Sdes		return (fp16_sin_table[i % 256]);
293034Sdes	default:
293034Sdes		/* inconceivable! */
293034Sdes		return (0);
293034Sdes	}
293034Sdes}