| // Copyright 2016 The SwiftShader Authors. All Rights Reserved. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #ifndef sw_Half_hpp |
| #define sw_Half_hpp |
| |
| #include <algorithm> |
| #include <cmath> |
| |
| namespace sw |
| { |
| class half |
| { |
| public: |
| half() = default; |
| explicit half(float f); |
| |
| operator float() const; |
| |
| half &operator=(half h); |
| half &operator=(float f); |
| |
| private: |
| unsigned short fp16i; |
| }; |
| |
| inline half shortAsHalf(short s) |
| { |
| union |
| { |
| half h; |
| short s; |
| } hs; |
| |
| hs.s = s; |
| |
| return hs.h; |
| } |
| |
| class RGB9E5 |
| { |
| unsigned int R : 9; |
| unsigned int G : 9; |
| unsigned int B : 9; |
| unsigned int E : 5; |
| |
| public: |
| RGB9E5(float rgb[3]) |
| { |
| // B is the exponent bias (15) |
| constexpr int g_sharedexp_bias = 15; |
| |
| // N is the number of mantissa bits per component (9) |
| constexpr int g_sharedexp_mantissabits = 9; |
| |
| // Emax is the maximum allowed biased exponent value (31) |
| constexpr int g_sharedexp_maxexponent = 31; |
| |
| constexpr float g_sharedexp_max = |
| ((static_cast<float>(1 << g_sharedexp_mantissabits) - 1) / |
| static_cast<float>(1 << g_sharedexp_mantissabits)) * |
| static_cast<float>(1 << (g_sharedexp_maxexponent - g_sharedexp_bias)); |
| |
| const float red_c = std::max<float>(0, std::min(g_sharedexp_max, rgb[0])); |
| const float green_c = std::max<float>(0, std::min(g_sharedexp_max, rgb[1])); |
| const float blue_c = std::max<float>(0, std::min(g_sharedexp_max, rgb[2])); |
| |
| const float max_c = std::max<float>(std::max<float>(red_c, green_c), blue_c); |
| const float exp_p = |
| std::max<float>(-g_sharedexp_bias - 1, floor(log(max_c))) + 1 + g_sharedexp_bias; |
| const int max_s = static_cast<int>( |
| floor((max_c / (pow(2.0f, exp_p - g_sharedexp_bias - g_sharedexp_mantissabits))) + 0.5f)); |
| const int exp_s = |
| static_cast<int>((max_s < pow(2.0f, g_sharedexp_mantissabits)) ? exp_p : exp_p + 1); |
| |
| R = static_cast<unsigned int>( |
| floor((red_c / (pow(2.0f, exp_s - g_sharedexp_bias - g_sharedexp_mantissabits))) + 0.5f)); |
| G = static_cast<unsigned int>( |
| floor((green_c / (pow(2.0f, exp_s - g_sharedexp_bias - g_sharedexp_mantissabits))) + 0.5f)); |
| B = static_cast<unsigned int>( |
| floor((blue_c / (pow(2.0f, exp_s - g_sharedexp_bias - g_sharedexp_mantissabits))) + 0.5f)); |
| E = exp_s; |
| } |
| |
| operator unsigned int() const |
| { |
| return *reinterpret_cast<const unsigned int*>(this); |
| } |
| |
| void toRGB16F(half rgb[3]) const |
| { |
| constexpr int offset = 24; // Exponent bias (15) + number of mantissa bits per component (9) = 24 |
| |
| const float factor = (1u << E) * (1.0f / (1 << offset)); |
| rgb[0] = half(R * factor); |
| rgb[1] = half(G * factor); |
| rgb[2] = half(B * factor); |
| } |
| }; |
| |
| class R11G11B10F |
| { |
| unsigned int R : 11; |
| unsigned int G : 11; |
| unsigned int B : 10; |
| |
| static inline half float11ToFloat16(unsigned short fp11) |
| { |
| return shortAsHalf(fp11 << 4); // Sign bit 0 |
| } |
| |
| static inline half float10ToFloat16(unsigned short fp10) |
| { |
| return shortAsHalf(fp10 << 5); // Sign bit 0 |
| } |
| |
| inline unsigned short float32ToFloat11(float fp32) |
| { |
| const unsigned int float32MantissaMask = 0x7FFFFF; |
| const unsigned int float32ExponentMask = 0x7F800000; |
| const unsigned int float32SignMask = 0x80000000; |
| const unsigned int float32ValueMask = ~float32SignMask; |
| const unsigned int float32ExponentFirstBit = 23; |
| const unsigned int float32ExponentBias = 127; |
| |
| const unsigned short float11Max = 0x7BF; |
| const unsigned short float11MantissaMask = 0x3F; |
| const unsigned short float11ExponentMask = 0x7C0; |
| const unsigned short float11BitMask = 0x7FF; |
| const unsigned int float11ExponentBias = 14; |
| |
| const unsigned int float32Maxfloat11 = 0x477E0000; |
| const unsigned int float32Minfloat11 = 0x38800000; |
| |
| const unsigned int float32Bits = *reinterpret_cast<unsigned int*>(&fp32); |
| const bool float32Sign = (float32Bits & float32SignMask) == float32SignMask; |
| |
| unsigned int float32Val = float32Bits & float32ValueMask; |
| |
| if((float32Val & float32ExponentMask) == float32ExponentMask) |
| { |
| // INF or NAN |
| if((float32Val & float32MantissaMask) != 0) |
| { |
| return float11ExponentMask | |
| (((float32Val >> 17) | (float32Val >> 11) | (float32Val >> 6) | (float32Val)) & |
| float11MantissaMask); |
| } |
| else if(float32Sign) |
| { |
| // -INF is clamped to 0 since float11 is positive only |
| return 0; |
| } |
| else |
| { |
| return float11ExponentMask; |
| } |
| } |
| else if(float32Sign) |
| { |
| // float11 is positive only, so clamp to zero |
| return 0; |
| } |
| else if(float32Val > float32Maxfloat11) |
| { |
| // The number is too large to be represented as a float11, set to max |
| return float11Max; |
| } |
| else |
| { |
| if(float32Val < float32Minfloat11) |
| { |
| // The number is too small to be represented as a normalized float11 |
| // Convert it to a denormalized value. |
| const unsigned int shift = (float32ExponentBias - float11ExponentBias) - |
| (float32Val >> float32ExponentFirstBit); |
| float32Val = |
| ((1 << float32ExponentFirstBit) | (float32Val & float32MantissaMask)) >> shift; |
| } |
| else |
| { |
| // Rebias the exponent to represent the value as a normalized float11 |
| float32Val += 0xC8000000; |
| } |
| |
| return ((float32Val + 0xFFFF + ((float32Val >> 17) & 1)) >> 17) & float11BitMask; |
| } |
| } |
| |
| inline unsigned short float32ToFloat10(float fp32) |
| { |
| const unsigned int float32MantissaMask = 0x7FFFFF; |
| const unsigned int float32ExponentMask = 0x7F800000; |
| const unsigned int float32SignMask = 0x80000000; |
| const unsigned int float32ValueMask = ~float32SignMask; |
| const unsigned int float32ExponentFirstBit = 23; |
| const unsigned int float32ExponentBias = 127; |
| |
| const unsigned short float10Max = 0x3DF; |
| const unsigned short float10MantissaMask = 0x1F; |
| const unsigned short float10ExponentMask = 0x3E0; |
| const unsigned short float10BitMask = 0x3FF; |
| const unsigned int float10ExponentBias = 14; |
| |
| const unsigned int float32Maxfloat10 = 0x477C0000; |
| const unsigned int float32Minfloat10 = 0x38800000; |
| |
| const unsigned int float32Bits = *reinterpret_cast<unsigned int*>(&fp32); |
| const bool float32Sign = (float32Bits & float32SignMask) == float32SignMask; |
| |
| unsigned int float32Val = float32Bits & float32ValueMask; |
| |
| if((float32Val & float32ExponentMask) == float32ExponentMask) |
| { |
| // INF or NAN |
| if((float32Val & float32MantissaMask) != 0) |
| { |
| return float10ExponentMask | |
| (((float32Val >> 18) | (float32Val >> 13) | (float32Val >> 3) | (float32Val)) & |
| float10MantissaMask); |
| } |
| else if(float32Sign) |
| { |
| // -INF is clamped to 0 since float11 is positive only |
| return 0; |
| } |
| else |
| { |
| return float10ExponentMask; |
| } |
| } |
| else if(float32Sign) |
| { |
| // float10 is positive only, so clamp to zero |
| return 0; |
| } |
| else if(float32Val > float32Maxfloat10) |
| { |
| // The number is too large to be represented as a float11, set to max |
| return float10Max; |
| } |
| else |
| { |
| if(float32Val < float32Minfloat10) |
| { |
| // The number is too small to be represented as a normalized float11 |
| // Convert it to a denormalized value. |
| const unsigned int shift = (float32ExponentBias - float10ExponentBias) - |
| (float32Val >> float32ExponentFirstBit); |
| float32Val = |
| ((1 << float32ExponentFirstBit) | (float32Val & float32MantissaMask)) >> shift; |
| } |
| else |
| { |
| // Rebias the exponent to represent the value as a normalized float11 |
| float32Val += 0xC8000000; |
| } |
| |
| return ((float32Val + 0x1FFFF + ((float32Val >> 18) & 1)) >> 18) & float10BitMask; |
| } |
| } |
| |
| public: |
| R11G11B10F(float rgb[3]) |
| { |
| R = float32ToFloat11(rgb[0]); |
| G = float32ToFloat11(rgb[1]); |
| B = float32ToFloat10(rgb[2]); |
| } |
| |
| operator unsigned int() const |
| { |
| return *reinterpret_cast<const unsigned int*>(this); |
| } |
| |
| void toRGB16F(half rgb[3]) const |
| { |
| rgb[0] = float11ToFloat16(R); |
| rgb[1] = float11ToFloat16(G); |
| rgb[2] = float10ToFloat16(B); |
| } |
| }; |
| } |
| |
| #endif // sw_Half_hpp |