apalak
/
luna_mobile_online


								#pragma once


								#include <cmath>
								#include <cstdint>
								#include <cstring>


								/// 16-bit "brain float": the upper 16 bits of an IEEE-754 binary32 value
								/// (1 sign bit, 8 exponent bits, 7 mantissa bits).
								///
								/// Converts implicitly from and to float. Conversion from float rounds
								/// normal values to nearest-even, flushes subnormals to signed zero and
								/// forces NaNs to be quiet.
								class bfloat16
								{
								    static_assert(sizeof(float) == sizeof(uint32_t),
								                  "bfloat16 requires a 32-bit float");

								    // Raw bfloat16 bit pattern (the high half of the float representation).
								    uint16_t value;

								    // Bit pattern of a float. memcpy is used instead of a union so the
								    // conversion is well-defined C++ and independent of byte order.
								    static uint32_t to_bits(float x)
								    {
								        uint32_t bits;
								        std::memcpy(&bits, &x, sizeof bits);
								        return bits;
								    }

								    // Float whose bit pattern is `bits`.
								    static float from_bits(uint32_t bits)
								    {
								        float x;
								        std::memcpy(&x, &bits, sizeof x);
								        return x;
								    }

								    // Builds a value directly from a raw bit pattern; the bool is only a
								    // tag that keeps this overload distinct from the float constructor.
								    bfloat16(uint16_t x, bool) : value(x)
								    {}

								public:
								    /// Leaves the stored bits uninitialised (trivial default constructor).
								    bfloat16() = default;

								    /// Converts from float; see operator=(float) for the rounding rules.
								    bfloat16(float x)
								    {
								        *this = x;
								    }

								    /// Assigns from a float.
								    /// - zero / subnormal: signed zero (subnormals are flushed)
								    /// - infinity: kept as is
								    /// - NaN: truncated, with the mantissa MSB set so the result is a quiet NaN
								    /// - normal: rounded to nearest, ties to even
								    /// @return reference to *this
								    bfloat16& operator = (float x)
								    {
								        uint32_t bits = to_bits(x);
								        const uint16_t upper = static_cast<uint16_t>(bits >> 16);

								        switch (std::fpclassify(x))
								        {
								        case FP_INFINITE:
								            value = upper;
								            break;
								        case FP_NAN:
								            // Bit 6 is the most significant of the 7 mantissa bits; setting
								            // it guarantees the truncated mantissa is non-zero (quiet NaN).
								            value = static_cast<uint16_t>(upper | 0x0040u);
								            break;
								        case FP_NORMAL:
								            // Round to nearest even: add 0x7FFF plus the lowest kept bit,
								            // then drop the low 16 bits. A carry may propagate into the
								            // exponent, rounding the largest values up to infinity.
								            bits += 0x00007FFFu + (upper & 0x1u);
								            value = static_cast<uint16_t>(bits >> 16);
								            break;
								        case FP_SUBNORMAL:
								        case FP_ZERO:
								        default:
								            // Sign-preserving zero. Any implementation-defined category
								            // also lands here so `value` is never left unassigned.
								            value = static_cast<uint16_t>(upper & 0x8000u);
								            break;
								        }

								        return *this;
								    }

								    /// Widens to float by placing the stored bits in the high half of a
								    /// 32-bit pattern whose low half is zero.
								    operator float() const
								    {
								        return from_bits(static_cast<uint32_t>(value) << 16);
								    }

								    /// Negation: flips the sign bit of the stored pattern.
								    bfloat16 operator - () const
								    {
								        return bfloat16(static_cast<uint16_t>(value ^ 0x8000u), true);
								    }
								};


								/// Sum of two bfloat16 values: both operands are widened to float, added,
								/// and the float result is converted back to bfloat16 on return.
								inline bfloat16 operator + (bfloat16 a, bfloat16 b)
								{
								    const float lhs = a;
								    const float rhs = b;
								    return lhs + rhs;
								}


								/// Difference of two bfloat16 values, evaluated as a + (-b) in float and
								/// converted back to bfloat16 on return.
								inline bfloat16 operator - (bfloat16 a, bfloat16 b)
								{
								    const bfloat16 negated = -b;
								    const float lhs = a;
								    const float rhs = negated;
								    return lhs + rhs;
								}


								/// Product of two bfloat16 values: both operands are widened to float,
								/// multiplied, and the float result is converted back to bfloat16 on return.
								inline bfloat16 operator * (bfloat16 a, bfloat16 b)
								{
								    const float lhs = a;
								    const float rhs = b;
								    return lhs * rhs;
								}


								/// Quotient of two bfloat16 values: both operands are widened to float,
								/// divided, and the float result is converted back to bfloat16 on return.
								inline bfloat16 operator / (bfloat16 a, bfloat16 b)
								{
								    const float numerator = a;
								    const float denominator = b;
								    return numerator / denominator;
								}


								/// In-place addition: stores a + b into a and returns a reference to a.
								inline bfloat16& operator += (bfloat16& a, const bfloat16 b)
								{
									return a = a + b;
								}


								/// In-place subtraction: stores a - b into a and returns a reference to a.
								inline bfloat16& operator -= (bfloat16& a, const bfloat16 b)
								{
									return a = a - b;
								}


								/// In-place multiplication: stores a * b into a and returns a reference to a.
								inline bfloat16& operator *= (bfloat16& a, const bfloat16 b)
								{
									return a = a * b;
								}


								/// In-place division: stores a / b into a and returns a reference to a.
								inline bfloat16& operator /= (bfloat16& a, const bfloat16 b)
								{
									return a = a / b;
								}


								// Comparison operators

								inline bfloat16 operator == (const bfloat16 a, const bfloat16 b)

								{

									return float(a) == float(b);

								}


								inline bfloat16 operator != (const bfloat16 a, const bfloat16 b)

								{

									return !(a == b);

								}


								inline bfloat16 operator < (const bfloat16 a, const bfloat16 b)

								{

									return float(a) < float(b);

								}


								inline bfloat16 operator <= (const bfloat16 a, const bfloat16 b)

								{

									return float(a) <= float(b);

								}


								inline bfloat16 operator > (const bfloat16 a, const bfloat16 b)

								{

									return float(a) > float(b);

								}


								inline bfloat16 operator >= (const bfloat16 a, const bfloat16 b)

								{

									return float(a) >= float(b);

								}