hikogui/0.6.0/a00401_source.html

// Copyright Take Vos 2020-2021.

// Distributed under the Boost Software License, Version 1.0.

// (See accompanying file LICENSE_1_0.txt or copy at https://www.boost.org/LICENSE_1_0.txt)


#pragma once


#include "required.hpp"

#include <algorithm>
#include <bit>
#include <cstddef>
#include <cstdint>
#include <functional>
#include <limits>
#include <type_traits>


namespace hi::inline v1 {


constexpr uint32_t float16_bias = 15;

constexpr uint32_t float32_bias = 127;

constexpr uint32_t f32_to_f16_adjustment_exponent = float32_bias - float16_bias;

constexpr uint32_t f32_to_f16_lowest_normal_exponent = 0x01 + f32_to_f16_adjustment_exponent;

constexpr uint32_t f32_to_f16_infinite_exponent = 0x1f + f32_to_f16_adjustment_exponent;

constexpr uint32_t f32_to_f16_adjustment = f32_to_f16_adjustment_exponent << 23;

constexpr uint32_t f32_to_f16_lowest_normal = f32_to_f16_lowest_normal_exponent << 23;

constexpr uint32_t f32_to_f16_infinite = f32_to_f16_infinite_exponent << 23;


constexpr float cvtsh_ss(uint16_t value) noexcept

{

    // Convert the 16 bit values to 32 bit with leading zeros.

    uint32_t u = value;


    // Extract the sign bit.

    hilet sign = (u >> 15) << 31;


    // Strip the sign bit and align the exponent/mantissa boundary to a float 32.

    u = (u << 17) >> 4;


    // Adjust the bias. f32_to_f16_adjustment

    u = u + f32_to_f16_adjustment;


    // Get a mask of '1' bits when the half-float would be normal or infinite.

    hilet is_normal = u > (f32_to_f16_lowest_normal - 1);


    // Add the sign bit back in.

    u = u | sign;


    // Keep the value if normal, if denormal make it zero.

    u = is_normal ? u : 0;


    return std::bit_cast<float>(u);

}


constexpr uint16_t cvtss_sh(float value) noexcept

{

    // Interpret the floating point number as 32 bit-field.

    auto u = std::bit_cast<uint32_t>(value);


    // Get the sign of the floating point number as a bit mask of the upper 17 bits.

    hilet sign = static_cast<uint32_t>(static_cast<int32_t>(u) >> 31) << 15;


    // Strip sign bit.

    u = (u << 1) >> 1;


    // Get a mask of '1' bits when the half-float would be normal or infinite.

    hilet is_normal = u > (f32_to_f16_lowest_normal - 1);


    // Clamp the floating point number to where the half-float would be infinite.

    u = std::min(u, f32_to_f16_infinite); // SSE4.1


    // Convert the bias from float to half-float.

    u = u - f32_to_f16_adjustment;


    // Shift the float until it becomes a half-float. This truncates the mantissa.

    u = u >> 13;


    // Keep the value if normal, if denormal make it zero.

    u = is_normal ? u : 0;


    // Add the sign bit back in, also set the upper 16 bits so that saturated pack

    // will work correctly when converting to int16.

    u = u | sign;


    // Saturate and pack the 32 bit integers to 16 bit integers.

    return static_cast<uint16_t>(u);

}


class float16 {

    uint16_t v;


public:

    constexpr float16() noexcept : v(0) {}

    constexpr float16(float16 const &) noexcept = default;

    constexpr float16(float16 &&) noexcept = default;

    constexpr float16 &operator=(float16 const &) noexcept = default;

    constexpr float16 &operator=(float16 &&) noexcept = default;


    constexpr explicit float16(float other) noexcept : v(cvtss_sh(other)) {}

    constexpr explicit float16(double other) noexcept : float16(static_cast<float>(other)) {}

    constexpr explicit float16(long double other) noexcept : float16(static_cast<float>(other)) {}


    constexpr float16 &operator=(float other) noexcept

    {

        v = cvtss_sh(other);

        return *this;

    }


    constexpr operator float() const noexcept

    {

        return cvtsh_ss(v);

    }


    [[nodiscard]] static constexpr float16 from_uint16_t(uint16_t const rhs) noexcept

    {

        auto r = float16{};

        r.v = rhs;

        return r;

    }


    [[nodiscard]] constexpr uint16_t get() const noexcept

    {

        return v;

    }


    constexpr float16 &set(uint16_t rhs) noexcept

    {

        v = rhs;

        return *this;

    }


    [[nodiscard]] std::size_t hash() const noexcept

    {

        return std::hash<uint16_t>{}(v);

    }


    [[nodiscard]] constexpr friend bool operator==(float16 const &lhs, float16 const &rhs) noexcept = default;


    [[nodiscard]] constexpr friend float16 operator*(float16 const &lhs, float16 const &rhs) noexcept

    {

        return float16{static_cast<float>(lhs) * static_cast<float>(rhs)};

    }

};


} // namespace hi::inline v1


template<>


struct std::hash<hi::float16> {

    std::size_t operator()(hi::float16 const &rhs) noexcept

    {

        return rhs.hash();

    }

};


template<>


struct std::numeric_limits<hi::float16> {

    using value_type = hi::float16;


    static constexpr bool is_specialized = true;

    static constexpr bool is_signed = true;

    static constexpr bool is_integer = false;

    static constexpr bool is_exact = false;

    static constexpr bool has_infinity = true;

    static constexpr bool has_quiet_NaN = true;

    static constexpr bool has_signaling_NaN = false;

    static constexpr float_denorm_style has_denorm = std::denorm_present;

    static constexpr bool has_denorm_loss = false;

    static constexpr float_round_style round_style = std::round_to_nearest;

    static constexpr bool is_iec559 = true;

    static constexpr bool is_bounded = true;

    static constexpr bool is_modulo = false;

    static constexpr int digits = 10;

    static constexpr int digits10 = 4;

    static constexpr int max_digits10 = 4;

    static constexpr int min_exponent = -14;

    static constexpr int min_exponent10 = -3;

    static constexpr int max_exponent = 15;

    static constexpr int max_exponent10 = 3;

    static constexpr bool traps = false;

    static constexpr bool tinyness_before = false;


    static constexpr value_type min() noexcept

    {

        return hi::float16::from_uint16_t(0x0400);

    }


    static constexpr value_type lowest() noexcept

    {

        return hi::float16::from_uint16_t(0xfbff);

    }


    static constexpr value_type max() noexcept

    {

        return hi::float16::from_uint16_t(0x7bff);

    }


    static constexpr value_type epsilon() noexcept

    {

        return hi::float16::from_uint16_t(0xfbff);

    }


    static constexpr value_type round_error() noexcept

    {

        return hi::float16::from_uint16_t(0x3800); // 0.5

    }


    static constexpr value_type infinity() noexcept

    {

        return hi::float16::from_uint16_t(0x7c00);

    }


    static constexpr value_type quiet_NaN() noexcept

    {

        return hi::float16::from_uint16_t(0x7c01);

    }


    static constexpr value_type signaling_NaN() noexcept

    {

        return hi::float16::from_uint16_t(0x7e01);

    }


    static constexpr value_type denorm_min() noexcept

    {

        return hi::float16::from_uint16_t(0x0001);

    }

};


required.hpp
This file includes required definitions.

hilet
#define hilet
Invariant should be the default for variables.
Definition required.hpp:23

v1::float16
Definition float16.hpp:82

std::numeric_limits::denorm_min
T denorm_min(T... args)

std::numeric_limits::epsilon
T epsilon(T... args)

std::hash

std::numeric_limits::infinity
T infinity(T... args)

std::is_signed

std::numeric_limits::lowest
T lowest(T... args)

std::numeric_limits::max
T max(T... args)

std::min
T min(T... args)

std::numeric_limits

std::hash::operator()
T operator()(T... args)

std::numeric_limits::quiet_NaN
T quiet_NaN(T... args)

std::numeric_limits::round_error
T round_error(T... args)

std::numeric_limits::signaling_NaN
T signaling_NaN(T... args)

std::size_t