1f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/************************************************************************** 2f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 3f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Copyright 2010 Luca Barbieri 4f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 5f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Permission is hereby granted, free of charge, to any person obtaining 6f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * a copy of this software and associated documentation files (the 7f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * "Software"), to deal in the Software without restriction, including 8f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * without limitation the rights to use, copy, modify, merge, publish, 9f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * distribute, sublicense, and/or sell copies of the Software, and to 10f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * permit persons to whom the Software is furnished to do so, subject to 11f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * the following conditions: 12f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 13f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * The above copyright notice and this permission notice (including the 14f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * next paragraph) shall be included in all copies or substantial 15f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * portions of the Software. 16f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 17f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 18f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 19f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 20f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE 21f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION 22f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION 23f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 24f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 25f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org **************************************************************************/ 26f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 27f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 28f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifndef U_HALF_H 29f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#define U_HALF_H 30f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 31f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "pipe/p_compiler.h" 32f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "util/u_math.h" 33f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 34f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifdef __cplusplus 35f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgextern "C" { 36f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif 37f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 38f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/* 39f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * References for float <-> half conversions 40f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 41f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * http://fgiesen.wordpress.com/2012/03/28/half-to-float-done-quic/ 42f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * https://gist.github.com/2156668 43f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * https://gist.github.com/2144712 44f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */ 45f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 46f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgstatic INLINE uint16_t 47f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgutil_float_to_half(float f) 48f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 49f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org uint32_t sign_mask = 0x80000000; 50f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org uint32_t round_mask = ~0xfff; 51f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org uint32_t f32inf = 0xff << 23; 52f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org uint32_t f16inf = 0x1f << 23; 53f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org uint32_t sign; 54f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org union fi magic; 55f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org union fi f32; 56f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org uint16_t f16; 57f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 58f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org magic.ui = 0xf << 23; 59f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 60f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.f = f; 61f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 62f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Sign */ 63f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org sign = f32.ui & sign_mask; 64f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui ^= sign; 65f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 66f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (f32.ui == f32inf) { 67f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Inf */ 68f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f16 = 0x7c00; 69f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } else if (f32.ui > f32inf) { 70f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* NaN */ 71f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f16 = 0x7e00; 72f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } else { 73f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Number */ 74f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui &= round_mask; 75f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.f *= magic.f; 76f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui -= round_mask; 77f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 78f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Clamp to infinity if overflowed */ 79f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (f32.ui > f16inf) 80f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui = f16inf; 81f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 82f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f16 = f32.ui >> 13; 83f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 84f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 85f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Sign */ 86f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f16 |= sign >> 16; 87f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 88f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return f16; 89f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 90f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 91f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgstatic INLINE float 92f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgutil_half_to_float(uint16_t f16) 93f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 94f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org union fi infnan; 95f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org union fi magic; 96f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org union fi f32; 97f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 98f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org infnan.ui = 0x8f << 23; 99f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org infnan.f = 65536.0f; 100f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org magic.ui = 0xef << 23; 101f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 102f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Exponent / Mantissa */ 103f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui = (f16 & 0x7fff) << 13; 104f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 105f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Adjust */ 106f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.f *= magic.f; 107f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 108f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Inf / NaN */ 109f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (f32.f >= infnan.f) 110f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui |= 0xff << 23; 111f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 112f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* Sign */ 113f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org f32.ui |= (f16 & 0x8000) << 16; 114f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 115f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return f32.f; 116f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 117f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 118f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifdef __cplusplus 119f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 120f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif 121f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 122f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif /* U_HALF_H */ 123f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 124