d6/d82/GPUORTFloat16_8h_source.html

// Copyright (c) Microsoft Corporation. All rights reserved.

// Licensed under the MIT License.


// This code was created from:

//    - https://github.com/microsoft/onnxruntime/blob/main/include/onnxruntime/core/session/onnxruntime_float16.h

//    - https://github.com/microsoft/onnxruntime/blob/main/include/onnxruntime/core/session/onnxruntime_cxx_api.h


#ifndef GPUORTFLOAT16_H

#define GPUORTFLOAT16_H


#ifndef GPUCA_GPUCODE_DEVICE

#include <stdint.h>

#include <cmath>

#include <cstring>

#include <limits>

#endif


#include "GPUCommonDef.h"

#include "GPUCommonMath.h"


namespace o2

{


namespace OrtDataType

{


namespace detail

{


// Byte-order tags used to pick the correct half of a float when converting to/from bfloat16.
// `native` is the byte order of the build target:
//  - on _WIN32 it is hard-coded to `little`;
//  - on GCC/Clang it is taken from the compiler's predefined __BYTE_ORDER__ macro;
//  - any other toolchain is rejected at preprocessing time by the #error below.
enum class endian {

#if defined(_WIN32)

  little = 0,

  big = 1,

  native = little,

#elif defined(__GNUC__) || defined(__clang__)

  little = __ORDER_LITTLE_ENDIAN__,

  big = __ORDER_BIG_ENDIAN__,

  native = __BYTE_ORDER__,

#else

#error OrtDataType::detail::endian is not implemented in this environment.

#endif

};


// Reject byte orders that are neither little- nor big-endian, because the
// conversion code only distinguishes between these two cases.
static_assert(

  endian::native == endian::little || endian::native == endian::big,

  "Only little-endian or big-endian native byte orders are supported.");


} // namespace detail


/// Shared implementation of an IEEE 754 half-precision (binary16) value, written as a CRTP base.
///
/// The value is stored as its raw 16-bit pattern in `val`. `Derived` must expose a static
/// `FromBits(uint16_t)` factory, which Abs() and Negate() use to build their results.
template <class Derived>
struct Float16Impl {
 protected:
  /// Converts a float to the binary16 bit pattern (declared here, defined out of class).
  GPUd() constexpr static uint16_t ToUint16Impl(float v) noexcept;

  /// Converts the stored bit pattern to float (declared here, defined out of class).
  GPUd() float ToFloatImpl() const noexcept;

  /// Returns the stored bits with the sign bit cleared.
  GPUd() uint16_t AbsImpl() const noexcept
  {
    return static_cast<uint16_t>(val & ~kSignMask);
  }

  /// Returns the stored bits with the sign bit flipped. NaN patterns are returned unchanged.
  GPUd() uint16_t NegateImpl() const noexcept
  {
    return IsNaN() ? val : static_cast<uint16_t>(val ^ kSignMask);
  }

 public:
  // uint16_t special values
  static constexpr uint16_t kSignMask = 0x8000U;
  static constexpr uint16_t kBiasedExponentMask = 0x7C00U;
  static constexpr uint16_t kPositiveInfinityBits = 0x7C00U;
  static constexpr uint16_t kNegativeInfinityBits = 0xFC00U;
  static constexpr uint16_t kPositiveQNaNBits = 0x7E00U;
  static constexpr uint16_t kNegativeQNaNBits = 0xFE00U;
  // NOTE(review): 0x4170 decodes to 2.71875 (exponent field 16, mantissa 0x170), which is not the
  // machine epsilon of binary16 (2^-10 = 0x1400). Value kept as-is; confirm the intended meaning.
  static constexpr uint16_t kEpsilonBits = 0x4170U;
  static constexpr uint16_t kMinValueBits = 0xFBFFU; // Most negative finite value (-65504)
  static constexpr uint16_t kMaxValueBits = 0x7BFFU; // Largest finite value (65504)
  static constexpr uint16_t kOneBits = 0x3C00U;
  static constexpr uint16_t kMinusOneBits = 0xBC00U;

  /// Raw binary16 bit pattern; zero-initialised, i.e. +0.0.
  uint16_t val{0};

  GPUdDefault() Float16Impl() = default;

  /// True when the sign bit is set (this includes -0 and NaNs with the sign bit set).
  GPUd() bool IsNegative() const noexcept
  {
    return static_cast<int16_t>(val) < 0;
  }

  /// True when the value is NaN (magnitude bits above the infinity pattern).
  GPUd() bool IsNaN() const noexcept
  {
    return AbsImpl() > kPositiveInfinityBits;
  }

  /// True when the value is neither infinite nor NaN.
  GPUd() bool IsFinite() const noexcept
  {
    return AbsImpl() < kPositiveInfinityBits;
  }

  /// True when the value is exactly +infinity.
  GPUd() bool IsPositiveInfinity() const noexcept
  {
    return val == kPositiveInfinityBits;
  }

  /// True when the value is exactly -infinity.
  GPUd() bool IsNegativeInfinity() const noexcept
  {
    return val == kNegativeInfinityBits;
  }

  /// True when the value is +infinity or -infinity.
  GPUd() bool IsInfinity() const noexcept
  {
    return AbsImpl() == kPositiveInfinityBits;
  }

  /// True when the value is NaN or (positive or negative) zero.
  GPUd() bool IsNaNOrZero() const noexcept
  {
    auto abs = AbsImpl();
    return (abs == 0 || abs > kPositiveInfinityBits);
  }

  /// True when the value is normal: not zero, subnormal, infinite or NaN.
  GPUd() bool IsNormal() const noexcept
  {
    auto abs = AbsImpl();
    return (abs < kPositiveInfinityBits)          // is finite
           && (abs != 0)                          // is not zero
           && ((abs & kBiasedExponentMask) != 0); // is not subnormal (has a non-zero exponent)
  }

  /// True when the value is subnormal (non-zero with a zero exponent field).
  GPUd() bool IsSubnormal() const noexcept
  {
    auto abs = AbsImpl();
    return (abs < kPositiveInfinityBits)          // is finite
           && (abs != 0)                          // is not zero
           && ((abs & kBiasedExponentMask) == 0); // is subnormal (has a zero exponent)
  }

  /// Returns a `Derived` holding the absolute value.
  GPUd() Derived Abs() const noexcept { return Derived::FromBits(AbsImpl()); }

  /// Returns a `Derived` with the sign flipped (NaN is returned unchanged).
  GPUd() Derived Negate() const noexcept { return Derived::FromBits(NegateImpl()); }

  /// True when both operands are zero, regardless of their signs.
  /// OR-ing the two patterns and stripping the sign bit leaves zero only if both were +/-0.
  GPUd() static bool AreZero(const Float16Impl& lhs, const Float16Impl& rhs) noexcept
  {
    return static_cast<uint16_t>((lhs.val | rhs.val) & ~kSignMask) == 0;
  }

  /// IEEE 754 equality: NaN is unequal to everything (itself included) and +0 equals -0.
  GPUd() bool operator==(const Float16Impl& rhs) const noexcept
  {
    if (IsNaN() || rhs.IsNaN()) {
      // IEEE defines that NaN is not equal to anything, including itself.
      return false;
    }
    // +0 (0x0000) and -0 (0x8000) differ in their bits but must compare equal; this also keeps
    // operator== consistent with operator<, which already treats the two zeros as equal.
    return val == rhs.val || AreZero(*this, rhs);
  }

  /// Negation of operator==, so it is true whenever either operand is NaN.
  GPUd() bool operator!=(const Float16Impl& rhs) const noexcept { return !(*this == rhs); }

  /// IEEE 754 ordering: false whenever either operand is NaN; +0 and -0 are not ordered
  /// relative to each other.
  GPUd() bool operator<(const Float16Impl& rhs) const noexcept
  {
    if (IsNaN() || rhs.IsNaN()) {
      // IEEE defines that NaN is unordered with respect to everything, including itself.
      return false;
    }

    const bool left_is_negative = IsNegative();
    if (left_is_negative != rhs.IsNegative()) {
      // When the signs of left and right differ, we know that left is less than right if it is
      // the negative value. The exception to this is if both values are zero, in which case IEEE
      // says they should be equal, even if the signs differ.
      return left_is_negative && !AreZero(*this, rhs);
    }
    // Same sign: for positive values a larger bit pattern is a larger value, and for negative
    // values the relation is reversed, hence the XOR with the sign.
    return (val != rhs.val) && ((val < rhs.val) ^ left_is_negative);
  }
};


// The following Float16_t conversions are based on the code from

// Eigen library.


// The conversion routines are Copyright (c) Fabian Giesen, 2016.

// The original license follows:

//

// Copyright (c) Fabian Giesen, 2016

// All rights reserved.

// Redistribution and use in source and binary forms, with or without

// modification, are permitted.

// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

// HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


namespace detail

{


// Overlay of a float and an unsigned integer, used by the Float16 conversion routines to read
// and modify the raw bits of a float. Assumes `unsigned int` and `float` are both 32 bits wide.
union float32_bits {

  unsigned int u; // integer view; declared first, so `float32_bits x = {bits}` initialises this member

  float f; // floating-point view of the same storage

};


}; // namespace detail


/// Converts a float to the bit pattern of a half-precision value.
///
/// The sign is split off first so that all range checks run on the magnitude only:
///  - magnitudes at or above 2^16 become infinity, NaN inputs become the quiet NaN 0x7e00;
///  - magnitudes below 2^-14 are produced as half subnormals (or zero) through a float addition;
///  - everything else is re-biased and rounded to nearest, ties to even, in integer arithmetic.
template <class Derived>
GPUdi() constexpr uint16_t Float16Impl<Derived>::ToUint16Impl(float v) noexcept
{
  constexpr detail::float32_bits kInfinity32 = {255 << 23};
  constexpr detail::float32_bits kHalfOverflow = {(127 + 16) << 23};
  constexpr detail::float32_bits kSubnormalMagic = {((127 - 15) + (23 - 10) + 1) << 23};
  constexpr unsigned int kSignBit32 = 0x80000000u;

  detail::float32_bits bits{};
  bits.f = v;

  // Remember the sign and continue with the magnitude. From here on every operand is below
  // 0x80000000, so the unsigned compares may safely be compiled as signed ones
  // (relevant for SSE2, which has no unsigned PCMPGTD).
  const unsigned int sign_bit = bits.u & kSignBit32;
  bits.u ^= sign_bit;

  uint16_t half = static_cast<uint16_t>(0x0u);
  if (bits.u >= kHalfOverflow.u) {
    // Too large for half, infinite, or NaN: NaN -> qNaN, anything else -> Inf.
    half = (bits.u > kInfinity32.u) ? 0x7e00 : 0x7c00;
  } else if (bits.u < (113 << 23)) {
    // The half result is subnormal or zero. Adding the magic constant lines the 10 mantissa
    // bits up at the bottom of the float; this relies on float addition rounding to nearest even.
    bits.f += kSubnormalMagic.f;
    // Subtracting the magic constant's bit pattern leaves exactly the half bits.
    half = static_cast<uint16_t>(bits.u - kSubnormalMagic.u);
  } else {
    // Normal half result. Note whether the lowest mantissa bit that is kept is set
    // (needed for the ties-to-even rounding below).
    const unsigned int kept_lsb = (bits.u >> 13) & 1;

    // Exponent re-bias plus rounding bias, part 1. Same as adding
    // ((unsigned int)(15 - 127) << 23) + 0xfff, but written without arithmetic overflow.
    bits.u += 0xc8000fffU;
    // Rounding bias, part 2.
    bits.u += kept_lsb;
    // Drop the 13 mantissa bits that half cannot hold.
    half = static_cast<uint16_t>(bits.u >> 13);
  }

  // Put the sign back at bit 15.
  half |= static_cast<uint16_t>(sign_bit >> 16);
  return half;
}


/// Converts the stored half-precision bit pattern to float.
///
/// Exponent and mantissa are shifted into their float positions and the exponent is re-biased;
/// Inf/NaN and zero/subnormal inputs get an additional correction, and the sign is applied last.
template <class Derived>
GPUdi() float Float16Impl<Derived>::ToFloatImpl() const noexcept
{
  constexpr unsigned int kShiftedExponentMask = 0x7c00 << 13; // half exponent field after the shift
  constexpr detail::float32_bits kRenormalize = {113 << 23};

  detail::float32_bits out{};
  out.u = (val & 0x7fff) << 13;                                 // exponent and mantissa, sign dropped
  const unsigned int exponent_field = kShiftedExponentMask & out.u; // exponent only
  out.u += (127 - 15) << 23;                                    // switch from half bias to float bias

  if (exponent_field == kShiftedExponentMask) {
    // Inf or NaN: push the exponent up to all ones.
    out.u += (128 - 16) << 23;
  } else if (exponent_field == 0) {
    // Zero or subnormal: bump the exponent once more, then re-normalise with a float subtraction.
    out.u += 1 << 23;
    out.f -= kRenormalize.f;
  }

  // MSVC on ARM/ARM64 hits an internal compiler error on the bitwise OR (std::bitset included),
  // so on those targets the sign is applied by negating the float instead.
#if (defined _MSC_VER) && (defined _M_ARM || defined _M_ARM64 || defined _M_ARM64EC)
  if (IsNegative()) {
    return -out.f;
  }
#else
  // Regular path: move the half sign bit into bit 31.
  out.u |= (val & 0x8000U) << 16U;
#endif
  return out.f;
}


/// Shared implementation of a bfloat16 value (1 sign bit, 8 exponent bits, 7 mantissa bits),
/// written as a CRTP base.
///
/// The value is stored as its raw 16-bit pattern in `val`. `Derived` must expose a static
/// `FromBits(uint16_t)` factory, which Abs() and Negate() use to build their results.
template <class Derived>
struct BFloat16Impl {
 protected:
  /// Converts a float to the bfloat16 bit pattern (declared here, defined out of class).
  GPUd() static uint16_t ToUint16Impl(float v) noexcept;

  /// Converts the stored bit pattern to float (declared here, defined out of class).
  GPUd() float ToFloatImpl() const noexcept;

  /// Stored bits without the sign bit.
  GPUd() uint16_t AbsImpl() const noexcept
  {
    return static_cast<uint16_t>(val & ~kSignMask);
  }

  /// Stored bits with the sign bit toggled; a NaN pattern is handed back untouched.
  GPUd() uint16_t NegateImpl() const noexcept
  {
    if (IsNaN()) {
      return val;
    }
    return static_cast<uint16_t>(val ^ kSignMask);
  }

 public:
  // uint16_t special values
  static constexpr uint16_t kSignMask = 0x8000U;
  static constexpr uint16_t kBiasedExponentMask = 0x7F80U;
  static constexpr uint16_t kPositiveInfinityBits = 0x7F80U;
  static constexpr uint16_t kNegativeInfinityBits = 0xFF80U;
  static constexpr uint16_t kPositiveQNaNBits = 0x7FC1U;
  static constexpr uint16_t kNegativeQNaNBits = 0xFFC1U;
  // NOTE(review): identical to kPositiveInfinityBits, so IsNaN() is false for this pattern.
  // Confirm whether a real signaling-NaN pattern was intended.
  static constexpr uint16_t kSignaling_NaNBits = 0x7F80U;
  // NOTE(review): 0x0080 decodes to 2^-126 (smallest positive normal), not the bfloat16
  // machine epsilon. Confirm the intended meaning.
  static constexpr uint16_t kEpsilonBits = 0x0080U;
  static constexpr uint16_t kMinValueBits = 0xFF7FU; // most negative finite value
  static constexpr uint16_t kMaxValueBits = 0x7F7FU; // largest finite value
  static constexpr uint16_t kRoundToNearest = 0x7FFFU; // rounding bias used by ToUint16Impl
  static constexpr uint16_t kOneBits = 0x3F80U;
  static constexpr uint16_t kMinusOneBits = 0xBF80U;

  /// Raw bfloat16 bit pattern; zero-initialised, i.e. +0.0.
  uint16_t val{0};

  GPUdDefault() BFloat16Impl() = default;

  /// Sign bit set? True for -0 and for NaNs with the sign bit set as well.
  GPUd() bool IsNegative() const noexcept
  {
    return (val & kSignMask) != 0;
  }

  /// NaN check: the magnitude bits lie above the infinity pattern.
  GPUd() bool IsNaN() const noexcept
  {
    const uint16_t magnitude = AbsImpl();
    return magnitude > kPositiveInfinityBits;
  }

  /// Finite check: neither infinity nor NaN.
  GPUd() bool IsFinite() const noexcept
  {
    const uint16_t magnitude = AbsImpl();
    return magnitude < kPositiveInfinityBits;
  }

  /// Exactly +infinity?
  GPUd() bool IsPositiveInfinity() const noexcept
  {
    return kPositiveInfinityBits == val;
  }

  /// Exactly -infinity?
  GPUd() bool IsNegativeInfinity() const noexcept
  {
    return kNegativeInfinityBits == val;
  }

  /// Infinity of either sign?
  GPUd() bool IsInfinity() const noexcept
  {
    const uint16_t magnitude = AbsImpl();
    return magnitude == kPositiveInfinityBits;
  }

  /// NaN, or zero of either sign?
  GPUd() bool IsNaNOrZero() const noexcept
  {
    const uint16_t magnitude = AbsImpl();
    if (magnitude == 0) {
      return true;
    }
    return magnitude > kPositiveInfinityBits;
  }

  /// Normal number: finite, non-zero and with a non-zero exponent field.
  GPUd() bool IsNormal() const noexcept
  {
    const uint16_t magnitude = AbsImpl();
    if (magnitude >= kPositiveInfinityBits || magnitude == 0) {
      return false; // infinite, NaN or zero
    }
    return (magnitude & kBiasedExponentMask) != 0;
  }

  /// Subnormal number: finite, non-zero and with a zero exponent field.
  GPUd() bool IsSubnormal() const noexcept
  {
    const uint16_t magnitude = AbsImpl();
    if (magnitude >= kPositiveInfinityBits || magnitude == 0) {
      return false; // infinite, NaN or zero
    }
    return (magnitude & kBiasedExponentMask) == 0;
  }

  /// Absolute value as a `Derived`.
  GPUd() Derived Abs() const noexcept
  {
    return Derived::FromBits(AbsImpl());
  }

  /// Sign-flipped value as a `Derived` (NaN stays as it is).
  GPUd() Derived Negate() const noexcept
  {
    return Derived::FromBits(NegateImpl());
  }

  /// True when both operands are zero, whatever their signs.
  GPUd() static bool AreZero(const BFloat16Impl& lhs, const BFloat16Impl& rhs) noexcept
  {
    // Positive and negative zero are equal under IEEE rules. OR the two patterns together and
    // strip the sign: the result is zero only when both inputs were +/-0.
    const uint16_t merged = static_cast<uint16_t>(lhs.val | rhs.val);
    return static_cast<uint16_t>(merged & ~kSignMask) == 0;
  }
};


/// Converts a float to the bfloat16 bit pattern.
///
/// NaN inputs map to kPositiveQNaNBits. Every other input keeps the most significant 16 bits of
/// the float after adding a rounding bias (kRoundToNearest plus the lowest kept bit), which
/// rounds to nearest with ties going to even.
template <class Derived>
GPUdi() uint16_t BFloat16Impl<Derived>::ToUint16Impl(float v) noexcept
{
  if (o2::gpu::CAMath::IsNaN(v)) {
    return kPositiveQNaNBits;
  }

  // Copies out the 16 most significant bits of a float. The GPU build always reads the upper
  // two bytes (i.e. it assumes little-endian); the host build picks the half by native byte order.
  auto upper_half_of = [](float number) {
    uint16_t half;
#ifdef GPUCA_GPUCODE
    o2::gpu::CAMath::memcpy(&half, reinterpret_cast<char*>(&number) + sizeof(uint16_t), sizeof(uint16_t));
#else
#ifdef __cpp_if_constexpr
    if constexpr (detail::endian::native == detail::endian::little)
#else
    if (detail::endian::native == detail::endian::little)
#endif
    {
      std::memcpy(&half, reinterpret_cast<char*>(&number) + sizeof(uint16_t), sizeof(uint16_t));
    } else {
      std::memcpy(&half, &number, sizeof(uint16_t));
    }
#endif
    return half;
  };

  // Lowest bit that survives the truncation; it decides which way an exact tie is rounded.
  const uint16_t truncated = upper_half_of(v);

  union {
    uint32_t word;
    float number;
  };
  number = v;
  word += (truncated & 1) + kRoundToNearest;
  return upper_half_of(number);
}


/// Converts the stored bfloat16 bit pattern to float.
///
/// Any NaN pattern yields CAMath::QuietNaN(). Otherwise the 16 stored bits become the most
/// significant half of the float and the remaining half is zero-filled.
template <class Derived>
GPUdi() float BFloat16Impl<Derived>::ToFloatImpl() const noexcept
{
  if (IsNaN()) {
    return o2::gpu::CAMath::QuietNaN();
  }

  float widened;
  char* const head = reinterpret_cast<char*>(&widened); // bytes 0..1 of the float
  char* const tail = head + sizeof(uint16_t);           // bytes 2..3 of the float
#ifdef GPUCA_GPUCODE
  // GPU build: little-endian layout is assumed, so the stored bits go into the upper two bytes.
  head[0] = 0;
  head[1] = 0;
  o2::gpu::CAMath::memcpy(tail, &val, sizeof(uint16_t));
#else
#ifdef __cpp_if_constexpr
  if constexpr (detail::endian::native == detail::endian::little)
#else
  if (detail::endian::native == detail::endian::little)
#endif
  {
    // Little-endian: the most significant half sits in the trailing bytes.
    std::memset(head, 0, sizeof(uint16_t));
    std::memcpy(tail, &val, sizeof(uint16_t));
  } else {
    // Big-endian: the most significant half sits in the leading bytes.
    std::memcpy(head, &val, sizeof(uint16_t));
    std::memset(tail, 0, sizeof(uint16_t));
  }
#endif
  return widened;
}


/// IEEE 754 half-precision value type built on Float16Impl.
///
/// Instances are created from a float (explicit constructor) or from a raw bit pattern
/// (FromBits); conversion back to float is explicit as well.
struct Float16_t : OrtDataType::Float16Impl<Float16_t> {
 private:
  /// Wraps a raw bit pattern. Private: callers go through FromBits().
  constexpr explicit Float16_t(uint16_t v) noexcept { val = v; }

 public:
  using Base = OrtDataType::Float16Impl<Float16_t>;

  /// Default value is +0.0 (the base zero-initialises `val`).
  GPUdDefault() Float16_t() = default;

  /// Builds an instance directly from a raw half-precision bit pattern.
  GPUd() constexpr static Float16_t FromBits(uint16_t v) noexcept { return Float16_t{v}; }

  /// Converts a float to half precision.
  GPUd() explicit Float16_t(float v) noexcept { val = Base::ToUint16Impl(v); }

  /// Converts the stored half-precision value to float.
  GPUd() float ToFloat() const noexcept { return this->ToFloatImpl(); }

  // Classification helpers re-exported from the base.
  using Base::IsNegative;
  using Base::IsNaN;
  using Base::IsFinite;
  using Base::IsPositiveInfinity;
  using Base::IsNegativeInfinity;
  using Base::IsInfinity;
  using Base::IsNaNOrZero;
  using Base::IsNormal;
  using Base::IsSubnormal;

  // Value helpers re-exported from the base.
  using Base::Abs;
  using Base::Negate;
  using Base::AreZero;

  /// Explicit conversion to float; same result as ToFloat().
  GPUdi() explicit operator float() const noexcept { return Base::ToFloatImpl(); }

  // Comparison operators re-exported from the base.
  using Base::operator==;
  using Base::operator!=;
  using Base::operator<;
};

// The type must stay a plain 16-bit wrapper.
static_assert(sizeof(Float16_t) == sizeof(uint16_t), "Sizes must match");


/// bfloat16 (Brain Floating Point) value type built on BFloat16Impl.
///
/// Instances are created from a float (explicit constructor) or from a raw bit pattern
/// (FromBits); conversion back to float is explicit as well.
struct BFloat16_t : OrtDataType::BFloat16Impl<BFloat16_t> {
 private:
  /// Wraps a raw bit pattern. Private: callers go through FromBits().
  constexpr explicit BFloat16_t(uint16_t v) noexcept { val = v; }

 public:
  using Base = OrtDataType::BFloat16Impl<BFloat16_t>;

  /// Default value is +0.0 (the base zero-initialises `val`).
  GPUdDefault() BFloat16_t() = default;

  /// Builds an instance directly from a raw bfloat16 bit pattern.
  GPUd() static constexpr BFloat16_t FromBits(uint16_t v) noexcept { return BFloat16_t(v); }

  /// Converts a float to bfloat16.
  GPUd() explicit BFloat16_t(float v) noexcept { val = Base::ToUint16Impl(v); }

  /// Converts the stored bfloat16 value to float.
  GPUd() float ToFloat() const noexcept { return Base::ToFloatImpl(); }

  using Base::IsNegative;

  using Base::IsNaN;

  using Base::IsFinite;

  using Base::IsPositiveInfinity;

  using Base::IsNegativeInfinity;

  using Base::IsInfinity;

  using Base::IsNaNOrZero;

  using Base::IsNormal;

  using Base::IsSubnormal;

  using Base::Abs;

  using Base::Negate;

  using Base::AreZero;

  /// Explicit conversion to float; same result as ToFloat().
  GPUdi() explicit operator float() const noexcept { return ToFloat(); }

  // BFloat16Impl provides no comparison operators, so they are defined here. They were
  // previously only declared, which left any use (operator!= included) without a definition.
  // They carry GPUd() like every other member function of this type.

  /// IEEE 754 equality: NaN is unequal to everything (itself included) and +0 equals -0.
  GPUd() bool operator==(const BFloat16_t& rhs) const noexcept
  {
    if (IsNaN() || rhs.IsNaN()) {
      // IEEE defines that NaN is not equal to anything, including itself.
      return false;
    }
    // +0 (0x0000) and -0 (0x8000) differ in their bits but must compare equal.
    return val == rhs.val || AreZero(*this, rhs);
  }

  /// Negation of operator==, so it is true whenever either operand is NaN.
  GPUd() bool operator!=(const BFloat16_t& rhs) const noexcept { return !(*this == rhs); }

  /// IEEE 754 ordering: false whenever either operand is NaN; +0 and -0 are not ordered
  /// relative to each other.
  GPUd() bool operator<(const BFloat16_t& rhs) const noexcept
  {
    if (IsNaN() || rhs.IsNaN()) {
      // IEEE defines that NaN is unordered with respect to everything, including itself.
      return false;
    }

    const bool left_is_negative = IsNegative();
    if (left_is_negative != rhs.IsNegative()) {
      // Different signs: the negative operand is the smaller one, unless both are zero,
      // in which case they are equal.
      return left_is_negative && !AreZero(*this, rhs);
    }
    // Same sign: for positive values a larger bit pattern is a larger value, and for negative
    // values the relation is reversed, hence the XOR with the sign.
    return (val != rhs.val) && ((val < rhs.val) ^ left_is_negative);
  }
};

// The type must stay a plain 16-bit wrapper.
static_assert(sizeof(BFloat16_t) == sizeof(uint16_t), "Sizes must match");


} // namespace OrtDataType


} // namespace o2

#endif

exp
uint64_t exp(uint64_t base, uint8_t exp) noexcept
Definition StringUtils.cxx:192

GPUdi
#define GPUdi()
Definition GPUCommonDefAPI.h:34

GPUdDefault
#define GPUdDefault()
Definition GPUCommonDefAPI.h:32

GPUd
#define GPUd()
Definition GPUCommonDefAPI.h:31

GPUCommonDef.h

GPUCommonMath.h

o
bool o
Definition GPUTPCGMMerger.cxx:1437

int

result
GLuint64EXT * result
Definition glcorearb.h:5662

v
const GLdouble * v
Definition glcorearb.h:832

f
GLdouble f
Definition glcorearb.h:310

val
GLuint GLfloat * val
Definition glcorearb.h:1582

Catch::Matchers::IsNaN
IsNaNMatcher IsNaN()
Definition catch_amalgamated.cxx:7764

o2::OrtDataType::detail::endian
endian
Definition GPUORTFloat16.h:30

o2::OrtDataType::GPUdi
GPUdi() const expr uint16_t Float16Impl< Derived > GPUdi() uint16_t BFloat16Impl< Derived >
IEEE 754 half-precision floating point data type.
Definition GPUORTFloat16.h:531

o2::framework::Abs
@ Abs
Definition BasicOps.h:44

o2::math_utils::detail::rhs
D const SVectorGPU< T, D > & rhs
Definition SMatrixGPU.h:191

o2::math_utils::detail::lhs
D & lhs
Definition SMatrixGPU.h:190

o2
a couple of static helper functions to create timestamp values for CCDB queries or override obsolete ...
Definition BitstreamReader.h:24

Base
Definition testAbstractRefAccessor.cxx:23

o2::OrtDataType::BFloat16_t
bfloat16 (Brain Floating Point) data type
Definition GPUORTFloat16.h:757

o2::OrtDataType::BFloat16_t::GPUdDefault
GPUdDefault() BFloat16_t()=default

o2::OrtDataType::BFloat16_t::Base
OrtDataType::BFloat16Impl< BFloat16_t > Base
Definition GPUORTFloat16.h:769

o2::OrtDataType::BFloat16_t::GPUdi
GPUdi() explicit operator float() const noexcept
User defined conversion operator. Converts BFloat16_t to float.
Definition GPUORTFloat16.h:871

o2::OrtDataType::BFloat16_t::GPUd
GPUd() float ToFloat() const noexcept
Converts bfloat16 to float.
Definition GPUORTFloat16.h:790

o2::OrtDataType::BFloat16_t::operator!=
bool operator!=(const BFloat16_t &rhs) const noexcept
Definition GPUORTFloat16.h:876

o2::OrtDataType::BFloat16_t::GPUd
GPUd() explicit BFloat16_t(float v) noexcept
__ctor from float. Float is converted into bfloat16 16-bit representation.
Definition GPUORTFloat16.h:784

o2::OrtDataType::BFloat16_t::operator==
bool operator==(const BFloat16_t &rhs) const noexcept

o2::OrtDataType::BFloat16_t::operator<
bool operator<(const BFloat16_t &rhs) const noexcept

o2::OrtDataType::BFloat16_t::GPUd
GPUd() static const expr BFloat16_t FromBits(uint16_t v) noexcept
Explicit conversion to uint16_t representation of bfloat16.
Definition GPUORTFloat16.h:778

o2::OrtDataType::Float16Impl
Shared implementation between public and internal classes. CRTP pattern.
Definition GPUORTFloat16.h:54

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsNaNOrZero() const noexcept
Tests if the value is NaN or zero. Useful for comparisons.
Definition GPUORTFloat16.h:163

o2::OrtDataType::Float16Impl::noexcept
const Float16Impl &rhs noexcept
Definition GPUORTFloat16.h:214

o2::OrtDataType::Float16Impl::kSignMask
static constexpr uint16_t kSignMask
Definition GPUORTFloat16.h:89

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsPositiveInfinity() const noexcept
Tests if the value represents positive infinity.
Definition GPUORTFloat16.h:136

o2::OrtDataType::Float16Impl::kNegativeInfinityBits
static constexpr uint16_t kNegativeInfinityBits
Definition GPUORTFloat16.h:92

o2::OrtDataType::Float16Impl::val
uint16_t val
Definition GPUORTFloat16.h:101

o2::OrtDataType::Float16Impl::GPUd
GPUd() Derived Abs() const noexcept
Creates an instance that represents absolute value.
Definition GPUORTFloat16.h:197

o2::OrtDataType::Float16Impl::kNegativeQNaNBits
static constexpr uint16_t kNegativeQNaNBits
Definition GPUORTFloat16.h:94

o2::OrtDataType::Float16Impl::kPositiveInfinityBits
static constexpr uint16_t kPositiveInfinityBits
Definition GPUORTFloat16.h:91

o2::OrtDataType::Float16Impl::kMinusOneBits
static constexpr uint16_t kMinusOneBits
Definition GPUORTFloat16.h:99

o2::OrtDataType::Float16Impl::GPUd
GPUd() uint16_t NegateImpl() const noexcept
Creates a new instance with the sign flipped.
Definition GPUORTFloat16.h:82

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsNegativeInfinity() const noexcept
Tests if the value represents negative infinity.
Definition GPUORTFloat16.h:145

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsNaN() const noexcept
Tests if the value is NaN.
Definition GPUORTFloat16.h:118

o2::OrtDataType::Float16Impl::kBiasedExponentMask
static constexpr uint16_t kBiasedExponentMask
Definition GPUORTFloat16.h:90

o2::OrtDataType::Float16Impl::kOneBits
static constexpr uint16_t kOneBits
Definition GPUORTFloat16.h:98

o2::OrtDataType::Float16Impl::kEpsilonBits
static constexpr uint16_t kEpsilonBits
Definition GPUORTFloat16.h:95

o2::OrtDataType::Float16Impl::kMaxValueBits
static constexpr uint16_t kMaxValueBits
Definition GPUORTFloat16.h:97

o2::OrtDataType::Float16Impl::kMinValueBits
static constexpr uint16_t kMinValueBits
Definition GPUORTFloat16.h:96

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsSubnormal() const noexcept
Tests if the value is subnormal (denormal).
Definition GPUORTFloat16.h:185

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsInfinity() const noexcept
Tests if the value is either positive or negative infinity.
Definition GPUORTFloat16.h:154

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsNormal() const noexcept
Tests if the value is normal (not zero, subnormal, infinite, or NaN).
Definition GPUORTFloat16.h:173

o2::OrtDataType::Float16Impl::GPUd
GPUd() static bool AreZero(const Float16Impl &lhs
IEEE defines that positive and negative zero are equal, this gives us a quick equality check for two ...

o2::OrtDataType::Float16Impl::GPUdDefault
GPUdDefault() Float16Impl()=default

o2::OrtDataType::Float16Impl::GPUd
GPUd() bool IsFinite() const noexcept
Tests if the value is finite.
Definition GPUORTFloat16.h:127

o2::OrtDataType::Float16Impl::GPUd
GPUd() const expr static uint16_t ToUint16Impl(float v) noexcept
Converts from float to uint16_t float16 representation.

o2::OrtDataType::Float16Impl::kPositiveQNaNBits
static constexpr uint16_t kPositiveQNaNBits
Definition GPUORTFloat16.h:93

o2::OrtDataType::Float16Impl::GPUd
GPUd() Derived Negate() const noexcept
Creates a new instance with the sign flipped.
Definition GPUORTFloat16.h:203

o2::OrtDataType::detail::float32_bits
Definition GPUORTFloat16.h:271

o2::OrtDataType::detail::float32_bits::f
float f
Definition GPUORTFloat16.h:273

o2::OrtDataType::detail::float32_bits::u
unsigned int u
Definition GPUORTFloat16.h:272