Blame - third_party/astc-encoder/Source/astc_mathlib_softfloat.cpp - swiftshader.googlesource.com/SwiftShader

blob: 975db2c7ba0064553bdb408a9771c15e5385d220 [file] [log] [blame]

Alexis Hetu	1b90087	2020-02-24 12:09:16 -0500	[diff] [blame^]	1	// SPDX-License-Identifier: Apache-2.0
				2	// ----------------------------------------------------------------------------
				3	// Copyright 2011-2020 Arm Limited
				4	//
				5	// Licensed under the Apache License, Version 2.0 (the "License"); you may not
				6	// use this file except in compliance with the License. You may obtain a copy
				7	// of the License at:
				8	//
				9	// http://www.apache.org/licenses/LICENSE-2.0
				10	//
				11	// Unless required by applicable law or agreed to in writing, software
				12	// distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
				13	// WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
				14	// License for the specific language governing permissions and limitations
				15	// under the License.
				16	// ----------------------------------------------------------------------------
				17
				18	/**
				19	* @brief Soft-float library for IEEE-754.
				20	*/
				21
				22	#include "astc_mathlib.h"
				23
				24	/******************************************
				25	helper functions and their lookup tables
				26	******************************************/
				27	/* count leading zeros functions. Only used when the input is nonzero. */
				28
				29	#if defined(__GNUC__) && (defined(__i386) \|\| defined(__amd64))
				30	#elif defined(__arm__) && defined(__ARMCC_VERSION)
				31	#elif defined(__arm__) && defined(__GNUC__)
				32	#else
				33	/* table used for the slow default versions. */
				34	static const uint8_t clz_table[256] =
				35	{
				36	8, 7, 6, 6, 5, 5, 5, 5, 4, 4, 4, 4, 4, 4, 4, 4,
				37	3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
				38	2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
				39	2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
				40	1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
				41	1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
				42	1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
				43	1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
				44	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				45	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				46	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				47	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				48	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				49	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				50	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
				51	0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
				52	};
				53	#endif
				54
				55	/*
				56	32-bit count-leading-zeros function: use the Assembly instruction whenever possible. */
				57	uint32_t clz32(uint32_t inp)
				58	{
				59	#if defined(__GNUC__) && (defined(__i386) \|\| defined(__amd64))
				60	uint32_t bsr;
				61	__asm__("bsrl %1, %0": "=r"(bsr):"r"(inp \| 1));
				62	return 31 - bsr;
				63	#else
				64	#if defined(__arm__) && defined(__ARMCC_VERSION)
				65	return __clz(inp); /* armcc builtin */
				66	#else
				67	#if defined(__arm__) && defined(__GNUC__)
				68	uint32_t lz;
				69	__asm__("clz %0, %1": "=r"(lz):"r"(inp));
				70	return lz;
				71	#else
				72	/* slow default version */
				73	uint32_t summa = 24;
				74	if (inp >= UINT32_C(0x10000))
				75	{
				76	inp >>= 16;
				77	summa -= 16;
				78	}
				79	if (inp >= UINT32_C(0x100))
				80	{
				81	inp >>= 8;
				82	summa -= 8;
				83	}
				84	return summa + clz_table[inp];
				85	#endif
				86	#endif
				87	#endif
				88	}
				89
				90	/* convert from FP16 to FP32. */
				91	sf32 sf16_to_sf32(sf16 inp)
				92	{
				93	uint32_t inpx = inp;
				94
				95	/*
				96	This table contains, for every FP16 sign/exponent value combination,
				97	the difference between the input FP16 value and the value obtained
				98	by shifting the correct FP32 result right by 13 bits.
				99	This table allows us to handle every case except denormals and NaN
				100	with just 1 table lookup, 2 shifts and 1 add.
				101	*/
				102
				103	#define WITH_MB(a) INT32_C((a) \| (1 << 31))
				104	static const int32_t tbl[64] =
				105	{
				106	WITH_MB(0x00000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000),
				107	INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000),
				108	INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000),
				109	INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), INT32_C(0x1C000), WITH_MB(0x38000),
				110	WITH_MB(0x38000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000),
				111	INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000),
				112	INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000),
				113	INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), INT32_C(0x54000), WITH_MB(0x70000)
				114	};
				115
				116	int32_t res = tbl[inpx >> 10];
				117	res += inpx;
				118
				119	/* the normal cases: the MSB of 'res' is not set. */
				120	if (res >= 0) /* signed compare */
				121	return res << 13;
				122
				123	/* Infinity and Zero: the bottom 10 bits of 'res' are clear. */
				124	if ((res & UINT32_C(0x3FF)) == 0)
				125	return res << 13;
				126
				127	/* NaN: the exponent field of 'inp' is not zero; NaNs must be quietened. */
				128	if ((inpx & 0x7C00) != 0)
				129	return (res << 13) \| UINT32_C(0x400000);
				130
				131	/* the remaining cases are Denormals. */
				132	{
				133	uint32_t sign = (inpx & UINT32_C(0x8000)) << 16;
				134	uint32_t mskval = inpx & UINT32_C(0x7FFF);
				135	uint32_t leadingzeroes = clz32(mskval);
				136	mskval <<= leadingzeroes;
				137	return (mskval >> 8) + ((0x85 - leadingzeroes) << 23) + sign;
				138	}
				139	}
				140
				141	/* convert from soft-float to native-float */
				142	float sf16_to_float(sf16 p)
				143	{
				144	if32 i;
				145	i.u = sf16_to_sf32(p);
				146	return i.f;
				147	}
				148