hipCUB
bfloat16.hpp
Go to the documentation of this file.
1 /******************************************************************************
2  * Copyright (c) 2021, NVIDIA CORPORATION. All rights reserved.
3  *
4  * Redistribution and use in source and binary forms, with or without
5  * modification, are permitted provided that the following conditions are met:
6  * * Redistributions of source code must retain the above copyright
7  * notice, this list of conditions and the following disclaimer.
8  * * Redistributions in binary form must reproduce the above copyright
9  * notice, this list of conditions and the following disclaimer in the
10  * documentation and/or other materials provided with the distribution.
11  * * Neither the name of the NVIDIA CORPORATION nor the
12  * names of its contributors may be used to endorse or promote products
13  * derived from this software without specific prior written permission.
14  *
15  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
16  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
17  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
18  * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
19  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
20  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
21  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
22  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
23  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
24  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25  *
26  ******************************************************************************/
27 
28 #pragma once
29 
35 #include <stdint.h>
36 #include <hipcub/util_type.hpp>
37 
38 #include <iosfwd>
39 
40 #if defined(__HIP_PLATFORM_NVIDIA__)
41 #include <cuda_bf16.h>
42 #endif
43 
44 #ifdef __GNUC__
45 // There's a ton of type-punning going on in this file.
46 #pragma GCC diagnostic push
47 #pragma GCC diagnostic ignored "-Wstrict-aliasing"
48 #endif
49 
50 
51 /******************************************************************************
52  * bfloat16_t
53  ******************************************************************************/
54 
58 struct bfloat16_t
59 {
60  uint16_t __x;
61 
62 #ifdef __HIP_PLATFORM_AMD__
63 
65  __host__ __device__ __forceinline__
66  bfloat16_t(const hip_bfloat16 &other)
67  {
68  __x = reinterpret_cast<const uint16_t&>(other);
69  }
70 
71 #elif defined(__HIP_PLATFORM_NVIDIA__)
72 
74  __host__ __device__ __forceinline__
75  bfloat16_t(const __nv_bfloat16 &other)
76  {
77  __x = reinterpret_cast<const uint16_t&>(other);
78  }
79 
80 #endif
81 
83  __host__ __device__ __forceinline__
84  bfloat16_t(int a)
85  {
86  *this = bfloat16_t(float(a));
87  }
88 
90  bfloat16_t() = default;
91 
93  __host__ __device__ __forceinline__
94  bfloat16_t(float a)
95  {
96  // Reference:
97  // https://github.com/pytorch/pytorch/blob/44cc873fba5e5ffc4d4d4eef3bd370b653ce1ce1/c10/util/BFloat16.h#L51
98  uint16_t ir;
99  if (a != a) {
100  ir = UINT16_C(0x7FFF);
101  } else {
102  union {
103  uint32_t U32;
104  float F32;
105  };
106 
107  F32 = a;
108  uint32_t rounding_bias = ((U32 >> 16) & 1) + UINT32_C(0x7FFF);
109  ir = static_cast<uint16_t>((U32 + rounding_bias) >> 16);
110  }
111  this->__x = ir;
112  }
113 
114 #ifdef __HIP_PLATFORM_AMD__
115 
117  __host__ __device__ __forceinline__
118  operator hip_bfloat16 () const
119  {
120  return reinterpret_cast<const hip_bfloat16 &>(__x);
121  }
122 
123 #elif defined(__HIP_PLATFORM_NVIDIA__)
124 
126  __host__ __device__ __forceinline__
127  operator __nv_bfloat16() const
128  {
129  return reinterpret_cast<const __nv_bfloat16&>(__x);
130  }
131 
132 #endif
133 
135  __host__ __device__ __forceinline__
136  operator float() const
137  {
138  float f = 0;
139  uint32_t *p = reinterpret_cast<uint32_t *>(&f);
140  *p = uint32_t(__x) << 16;
141  return f;
142  }
143 
145  __host__ __device__ __forceinline__
146  uint16_t raw() const
147  {
148  return this->__x;
149  }
150 
152  __host__ __device__ __forceinline__
153  friend bool operator ==(const bfloat16_t &a, const bfloat16_t &b){
154  return (a.__x == b.__x);
155  }
156 
158  __host__ __device__ __forceinline__
159  bool operator !=(const bfloat16_t &other) const
160  {
161  return (this->__x != other.__x);
162  }
163 
165  __host__ __device__ __forceinline__
167  {
168  *this = bfloat16_t(float(*this) + float(rhs));
169  return *this;
170  }
171 
173  __host__ __device__ __forceinline__
175  {
176  return bfloat16_t(float(*this) * float(other));
177  }
178 
180  __host__ __device__ __forceinline__
182  {
183  return bfloat16_t(float(*this) + float(other));
184  }
185 
187  __host__ __device__ __forceinline__
189  {
190  return bfloat16_t(float(*this) - float(other));
191  }
192 
194  __host__ __device__ __forceinline__
195  bool operator<(const bfloat16_t &other) const
196  {
197  return float(*this) < float(other);
198  }
199 
201  __host__ __device__ __forceinline__
202  bool operator<=(const bfloat16_t &other) const
203  {
204  return float(*this) <= float(other);
205  }
206 
208  __host__ __device__ __forceinline__
209  bool operator>(const bfloat16_t &other) const
210  {
211  return float(*this) > float(other);
212  }
213 
215  __host__ __device__ __forceinline__
216  bool operator>=(const bfloat16_t &other) const
217  {
218  return float(*this) >= float(other);
219  }
220 
222  __host__ __device__ __forceinline__
223  static bfloat16_t max() {
224  uint16_t max_word = 0x7F7F;
225  return reinterpret_cast<bfloat16_t&>(max_word);
226  }
227 
229  __host__ __device__ __forceinline__
230  static bfloat16_t lowest() {
231  uint16_t lowest_word = 0xFF7F;
232  return reinterpret_cast<bfloat16_t&>(lowest_word);
233  }
234 };
235 
236 
237 /******************************************************************************
238  * I/O stream overloads
239  ******************************************************************************/
240 
242 inline std::ostream& operator<<(std::ostream &out, const bfloat16_t &x)
243 {
244  out << (float)x;
245  return out;
246 }
247 
#if defined(__HIP_PLATFORM_NVIDIA__)

    /// Insert a formatted \p __nv_bfloat16 into the output stream (printed as float).
    inline std::ostream& operator<<(std::ostream &out, const __nv_bfloat16 &x)
    {
        const bfloat16_t value(x);
        out << value;
        return out;
    }

#endif
257 
258 
259 
260 
261 /******************************************************************************
262  * Traits overloads
263  ******************************************************************************/
264 
265 template <>
266 struct hipcub::FpLimits<bfloat16_t>
267 {
268  static __host__ __device__ __forceinline__ bfloat16_t Max() { return bfloat16_t::max(); }
269 
270  static __host__ __device__ __forceinline__ bfloat16_t Lowest() { return bfloat16_t::lowest(); }
271 };
272 
273 template <> struct hipcub::NumericTraits<bfloat16_t> : hipcub::BaseTraits<FLOATING_POINT, true, false, unsigned short, bfloat16_t> {};
274 
275 #ifdef __GNUC__
276 #pragma GCC diagnostic pop
277 #endif
__host__ __device__ __forceinline__ bfloat16_t & operator+=(const bfloat16_t &rhs)
Assignment by sum.
Definition: bfloat16.hpp:166
__host__ __device__ __forceinline__ bool operator<=(const bfloat16_t &other) const
Less-than-equal.
Definition: bfloat16.hpp:202
Host-based bfloat16 data type compatible and convertible with __nv_bfloat16 or hip_bfloat16.
Definition: bfloat16.hpp:58
Definition: thread_operators.hpp:105
__host__ __device__ __forceinline__ uint16_t raw() const
Get raw storage.
Definition: bfloat16.hpp:146
__host__ __device__ __forceinline__ bfloat16_t(float a)
Constructor from float.
Definition: bfloat16.hpp:94
__host__ __device__ __forceinline__ bfloat16_t operator+(const bfloat16_t &other)
Add.
Definition: bfloat16.hpp:181
__host__ __device__ __forceinline__ bool operator>=(const bfloat16_t &other) const
Greater-than-equal.
Definition: bfloat16.hpp:216
__host__ __device__ __forceinline__ bool operator>(const bfloat16_t &other) const
Greater-than.
Definition: bfloat16.hpp:209
bfloat16_t()=default
Default constructor.
__host__ __device__ __forceinline__ bfloat16_t(int a)
Constructor from integer.
Definition: bfloat16.hpp:84
__host__ __device__ __forceinline__ friend bool operator==(const bfloat16_t &a, const bfloat16_t &b)
Equality.
Definition: bfloat16.hpp:153
__host__ __device__ static __forceinline__ bfloat16_t max()
numeric_traits<bfloat16_t>::max
Definition: bfloat16.hpp:223
__host__ __device__ __forceinline__ bfloat16_t operator*(const bfloat16_t &other)
Multiply.
Definition: bfloat16.hpp:174
std::ostream & operator<<(std::ostream &out, const bfloat16_t &x)
Insert formatted bfloat16_t into the output stream.
Definition: bfloat16.hpp:242
__host__ __device__ static __forceinline__ bfloat16_t lowest()
numeric_traits<bfloat16_t>::lowest
Definition: bfloat16.hpp:230
__host__ __device__ __forceinline__ bfloat16_t operator-(const bfloat16_t &other)
Subtract.
Definition: bfloat16.hpp:188
__host__ __device__ __forceinline__ bool operator<(const bfloat16_t &other) const
Less-than.
Definition: bfloat16.hpp:195
__host__ __device__ __forceinline__ bool operator!=(const bfloat16_t &other) const
Inequality.
Definition: bfloat16.hpp:159