1f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/**************************************************************************
2f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
3f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Copyright 2010 Luca Barbieri
4f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
5f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Permission is hereby granted, free of charge, to any person obtaining
6f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * a copy of this software and associated documentation files (the
7f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * "Software"), to deal in the Software without restriction, including
8f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * without limitation the rights to use, copy, modify, merge, publish,
9f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * distribute, sublicense, and/or sell copies of the Software, and to
10f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * permit persons to whom the Software is furnished to do so, subject to
11f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * the following conditions:
12f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
13f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * The above copyright notice and this permission notice (including the
14f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * next paragraph) shall be included in all copies or substantial
15f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * portions of the Software.
16f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
17f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
18f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
19f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
20f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE
21f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
22f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
23f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
24f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
25f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org **************************************************************************/
26f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
27f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
28f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifndef U_HALF_H
29f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#define U_HALF_H
30f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
31f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "pipe/p_compiler.h"
32f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "util/u_math.h"
33f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
34f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifdef __cplusplus
35f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgextern "C" {
36f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif
37f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
/*
 * References for float <-> half conversions
 *
 *  http://fgiesen.wordpress.com/2012/03/28/half-to-float-done-quic/
 *  https://gist.github.com/2156668
 *  https://gist.github.com/2144712
 */
45f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
46f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgstatic INLINE uint16_t
47f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgutil_float_to_half(float f)
48f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
49f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   uint32_t sign_mask  = 0x80000000;
50f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   uint32_t round_mask = ~0xfff;
51f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   uint32_t f32inf = 0xff << 23;
52f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   uint32_t f16inf = 0x1f << 23;
53f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   uint32_t sign;
54f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   union fi magic;
55f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   union fi f32;
56f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   uint16_t f16;
57f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
58f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   magic.ui = 0xf << 23;
59f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
60f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   f32.f = f;
61f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
62f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Sign */
63f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   sign = f32.ui & sign_mask;
64f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   f32.ui ^= sign;
65f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
66f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if (f32.ui == f32inf) {
67f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      /* Inf */
68f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f16 = 0x7c00;
69f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   } else if (f32.ui > f32inf) {
70f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      /* NaN */
71f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f16 = 0x7e00;
72f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   } else {
73f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      /* Number */
74f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f32.ui &= round_mask;
75f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f32.f  *= magic.f;
76f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f32.ui -= round_mask;
77f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
78f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      /* Clamp to infinity if overflowed */
79f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      if (f32.ui > f16inf)
80f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         f32.ui = f16inf;
81f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
82f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f16 = f32.ui >> 13;
83f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
84f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
85f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Sign */
86f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   f16 |= sign >> 16;
87f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
88f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return f16;
89f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
90f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
91f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgstatic INLINE float
92f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgutil_half_to_float(uint16_t f16)
93f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
94f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   union fi infnan;
95f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   union fi magic;
96f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   union fi f32;
97f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
98f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   infnan.ui = 0x8f << 23;
99f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   infnan.f = 65536.0f;
100f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   magic.ui  = 0xef << 23;
101f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
102f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Exponent / Mantissa */
103f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   f32.ui = (f16 & 0x7fff) << 13;
104f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
105f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Adjust */
106f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   f32.f *= magic.f;
107f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
108f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Inf / NaN */
109f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if (f32.f >= infnan.f)
110f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      f32.ui |= 0xff << 23;
111f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
112f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   /* Sign */
113f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   f32.ui |= (f16 & 0x8000) << 16;
114f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
115f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return f32.f;
116f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
117f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
118f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#ifdef __cplusplus
119f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
120f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif
121f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
122f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#endif /* U_HALF_H */
123f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
124