ROCmSoftwarePlatform/hipCUB/half_8hpp_source.html

 /******************************************************************************
  * Copyright (c) 2011, Duane Merrill.  All rights reserved.
  * Copyright (c) 2011-2023, NVIDIA CORPORATION.  All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are met:
  *     * Redistributions of source code must retain the above copyright
  *       notice, this list of conditions and the following disclaimer.
  *     * Redistributions in binary form must reproduce the above copyright
  *       notice, this list of conditions and the following disclaimer in the
  *       documentation and/or other materials provided with the distribution.
  *     * Neither the name of the NVIDIA CORPORATION nor the
  *       names of its contributors may be used to endorse or promote products
  *       derived from this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  * DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE FOR ANY
  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
  * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  *
  ******************************************************************************/

 #pragma once

  #include <stdint.h>
  #include <hipcub/util_type.hpp>

  #if defined(__HIP_PLATFORM_NVIDIA__)
      #include <cuda_fp16.h>
  #endif

  #include <iosfwd>

 #ifdef __GNUC__
 // There's a ton of type-punning going on in this file.
 #pragma GCC diagnostic push
 #pragma GCC diagnostic ignored "-Wstrict-aliasing"
 #endif


 /******************************************************************************
  * half_t
  ******************************************************************************/

 /**
  * Host-based fp16 data type compatible and convertible with __half.
  *
  * Stores the raw 16-bit pattern (1 sign bit, 5 exponent bits, 10 mantissa
  * bits) and implements arithmetic and ordering by converting to float and
  * back. Equality and inequality compare the raw bit patterns.
  */
 struct half_t
 {
     /// Raw 16-bit storage.
     uint16_t __x;

     /// Constructor from __half: copies the 16-bit pattern unchanged.
     __host__ __device__ __forceinline__
     half_t(const __half &other)
     {
         __x = reinterpret_cast<const uint16_t&>(other);
     }

     /// Constructor from integer (converted through float).
     __host__ __device__ __forceinline__
     half_t(int a)
     {
         *this = half_t(float(a));
     }

     /// Default constructor (leaves the storage uninitialized).
     half_t() = default;

     /**
      * Constructor from float.
      *
      * Rounds to nearest, ties to even. Magnitudes too large for fp16 become
      * signed infinity, any NaN becomes the canonical pattern 0x7fff, and
      * magnitudes below 2^-25 become signed zero.
      */
     __host__ __device__ __forceinline__
     half_t(float a)
     {
         // Stolen from Norbert Juffa
         uint32_t ia = *reinterpret_cast<uint32_t*>(&a);
         uint16_t ir;

         // Start with just the sign bit moved into fp16 position.
         ir = (ia >> 16) & 0x8000;

         if ((ia & 0x7f800000) == 0x7f800000)
         {
             // Float exponent all ones: infinity or NaN.
             if ((ia & 0x7fffffff) == 0x7f800000)
             {
                 ir |= 0x7c00; /* infinity */
             }
             else
             {
                 ir = 0x7fff; /* canonical NaN */
             }
         }
         else if ((ia & 0x7f800000) >= 0x33000000)
         {
             // Unbiased float exponent.
             int32_t shift = (int32_t) ((ia >> 23) & 0xff) - 127;
             if (shift > 15)
             {
                 ir |= 0x7c00; /* infinity */
             }
             else
             {
                 ia = (ia & 0x007fffff) | 0x00800000; /* extract mantissa */
                 if (shift < -14)
                 { /* denormal */
                     ir |= ia >> (-1 - shift);
                     // Keep the discarded bits left-aligned for rounding.
                     ia = ia << (32 - (-1 - shift));
                 }
                 else
                 { /* normal */
                     ir |= ia >> (24 - 11);
                     // Keep the discarded bits left-aligned for rounding.
                     ia = ia << (32 - (24 - 11));
                     // The implicit leading one already landed in bit 10, so
                     // adding (14 + shift) yields the biased exponent 15 + shift.
                     ir = static_cast<uint16_t>(ir + ((14 + shift) << 10));
                 }
                 /* IEEE-754 round to nearest, ties to even */
                 if ((ia > 0x80000000) || ((ia == 0x80000000) && (ir & 1)))
                 {
                     ir++;
                 }
             }
         }

         this->__x = ir;
     }

     /// Cast to float. Every fp16 value converts exactly.
     __host__ __device__ __forceinline__
     operator float() const
     {
         // Stolen from Andrew Kerr

         // Unsigned fields so that moving the sign into bit 31 cannot overflow
         // a signed int.
         const uint32_t sign     = (this->__x >> 15) & 1u;
         int            exponent = (this->__x >> 10) & 0x1f;
         uint32_t       mantissa = this->__x & 0x3ffu;
         uint32_t       f        = 0;

         if (exponent > 0 && exponent < 31)
         {
             // normal: rebias the exponent from 15 to 127
             exponent += 112;
             f = (sign << 31) | (static_cast<uint32_t>(exponent) << 23) | (mantissa << 13);
         }
         else if (exponent == 0)
         {
             if (mantissa)
             {
                 // subnormal: shift left until the leading one reaches bit 10,
                 // lowering the exponent once per shift
                 exponent += 113;
                 while ((mantissa & (1u << 10)) == 0)
                 {
                     mantissa <<= 1;
                     exponent--;
                 }
                 mantissa &= 0x3ffu;
                 f = (sign << 31) | (static_cast<uint32_t>(exponent) << 23) | (mantissa << 13);
             }
             else if (sign)
             {
                 f = 0x80000000u; // negative zero
             }
             else
             {
                 f = 0x0;         // zero
             }
         }
         else if (exponent == 31)
         {
             if (mantissa)
             {
                 f = 0x7fffffffu | (sign << 31);    // not a number
             }
             else
             {
                 f = (0xffu << 23) | (sign << 31);  // inf
             }
         }
         return *reinterpret_cast<float const *>(&f);
     }


     /// Get raw storage.
     __host__ __device__ __forceinline__
     uint16_t raw() const
     {
         return this->__x;
     }

     /// Equality (bitwise comparison of the raw storage).
     __host__ __device__ __forceinline__
     bool operator ==(const half_t &other) const
     {
         return (this->__x == other.__x);
     }

     /// Inequality (bitwise comparison of the raw storage).
     __host__ __device__ __forceinline__
     bool operator !=(const half_t &other) const
     {
         return (this->__x != other.__x);
     }

     /// Assignment by sum.
     __host__ __device__ __forceinline__
     half_t& operator +=(const half_t &rhs)
     {
         *this = half_t(float(*this) + float(rhs));
         return *this;
     }

     /// Multiply. Const-qualified so that const operands use this overload
     /// rather than built-in float arithmetic through operator float().
     __host__ __device__ __forceinline__
     half_t operator*(const half_t &other) const
     {
         return half_t(float(*this) * float(other));
     }

     /// Divide.
     __host__ __device__ __forceinline__ half_t operator/(const half_t& other) const
     {
         return half_t(float(*this) / float(other));
     }

     /// Add. Const-qualified for the same reason as operator*.
     __host__ __device__ __forceinline__
     half_t operator+(const half_t &other) const
     {
         return half_t(float(*this) + float(other));
     }

     /// Subtract. Const-qualified for the same reason as operator*.
     __host__ __device__ __forceinline__
     half_t operator-(const half_t &other) const
     {
         return half_t(float(*this) - float(other));
     }

     /// Less-than (compared as float).
     __host__ __device__ __forceinline__
     bool operator<(const half_t &other) const
     {
         return float(*this) < float(other);
     }

     /// Less-than-or-equal (compared as float).
     __host__ __device__ __forceinline__
     bool operator<=(const half_t &other) const
     {
         return float(*this) <= float(other);
     }

     /// Greater-than (compared as float).
     __host__ __device__ __forceinline__
     bool operator>(const half_t &other) const
     {
         return float(*this) > float(other);
     }

     /// Greater-than-or-equal (compared as float).
     __host__ __device__ __forceinline__
     bool operator>=(const half_t &other) const
     {
         return float(*this) >= float(other);
     }

     /// Largest finite value (bit pattern 0x7BFF).
     __host__ __device__ __forceinline__
     static half_t max() {
         half_t result;
         result.__x = 0x7BFF;
         return result;
     }

     /// Lowest finite value (bit pattern 0xFBFF).
     __host__ __device__ __forceinline__
     static half_t lowest() {
         half_t result;
         result.__x = 0xFBFF;
         return result;
     }
 };


 /******************************************************************************
  * I/O stream overloads
  ******************************************************************************/

 /// Insert formatted half_t into the output stream.
 inline std::ostream& operator<<(std::ostream &out, const half_t &x)
 {
     // Stream the value through its float conversion and hand back the same
     // stream so insertions can be chained.
     return out << static_cast<float>(x);
 }

 /******************************************************************************
  * Traits overloads
  ******************************************************************************/

 /// hipcub::FpLimits specialization that forwards to half_t's own limit helpers.
 template <>
 struct hipcub::FpLimits<half_t>
 {
     /// Returns half_t::max().
     static __host__ __device__ __forceinline__ half_t Max()
     {
         return half_t::max();
     }

     /// Returns half_t::lowest().
     static __host__ __device__ __forceinline__ half_t Lowest()
     {
         return half_t::lowest();
     }
 };

 // Specializes hipcub::NumericTraits for half_t by deriving from hipcub::BaseTraits.
 // NOTE(review): the meaning of each BaseTraits argument (category, the two bool
 // flags, the unsigned-bits type) is defined in hipcub/util_type.hpp - confirm there.
 template <> struct hipcub::NumericTraits<half_t> : hipcub::BaseTraits<FLOATING_POINT, true, false, unsigned short, half_t> {};


 #ifdef __GNUC__
 #pragma GCC diagnostic pop
 #endif
half_t::operator>
__host__ __device__ __forceinline__ bool operator>(const half_t &other) const
Greater-than.
Definition: half.hpp:260

half_t::operator>=
__host__ __device__ __forceinline__ bool operator>=(const half_t &other) const
Greater-than-or-equal.
Definition: half.hpp:267

half_t::half_t
__host__ __device__ __forceinline__ half_t(int a)
Constructor from integer.
Definition: half.hpp:72

half_t::operator+
__host__ __device__ __forceinline__ half_t operator+(const half_t &other)
Add.
Definition: half.hpp:232

half_t::raw
__host__ __device__ __forceinline__ uint16_t raw() const
Get raw storage.
Definition: half.hpp:190

half_t::operator<=
__host__ __device__ __forceinline__ bool operator<=(const half_t &other) const
Less-than-or-equal.
Definition: half.hpp:253

half_t::half_t
half_t()=default
Default constructor.

Max
Definition: thread_operators.hpp:105

half_t::operator+=
__host__ __device__ __forceinline__ half_t & operator+=(const half_t &rhs)
Assignment by sum.
Definition: half.hpp:211

operator<<
std::ostream & operator<<(std::ostream &out, const half_t &x)
Insert formatted half_t into the output stream.
Definition: half.hpp:293

half_t::half_t
__host__ __device__ __forceinline__ half_t(float a)
Constructor from float.
Definition: half.hpp:82

half_t
Host-based fp16 data type compatible and convertible with __half.
Definition: half.hpp:59

half_t::half_t
__host__ __device__ __forceinline__ half_t(const __half &other)
Constructor from __half.
Definition: half.hpp:65

half_t::lowest
__host__ __device__ static __forceinline__ half_t lowest()
Returns the lowest finite half_t value (numeric_traits<half_t>::lowest).
Definition: half.hpp:281

half_t::operator==
__host__ __device__ __forceinline__ bool operator==(const half_t &other) const
Equality.
Definition: half.hpp:197

half_t::operator!=
__host__ __device__ __forceinline__ bool operator!=(const half_t &other) const
Inequality.
Definition: half.hpp:204

half_t::operator/
__host__ __device__ __forceinline__ half_t operator/(const half_t &other) const
Divide.
Definition: half.hpp:225

half_t::operator-
__host__ __device__ __forceinline__ half_t operator-(const half_t &other)
Subtract.
Definition: half.hpp:239

half_t::max
__host__ __device__ static __forceinline__ half_t max()
Returns the largest finite half_t value (numeric_traits<half_t>::max).
Definition: half.hpp:274

half_t::operator<
__host__ __device__ __forceinline__ bool operator<(const half_t &other) const
Less-than.
Definition: half.hpp:246

half_t::operator*
__host__ __device__ __forceinline__ half_t operator*(const half_t &other)
Multiply.
Definition: half.hpp:219