release/current/mxfp_8hh_source.html

/*

 * Copyright (c) 2024 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#ifndef __ARCH_AMDGPU_COMMON_DTYPE_MXFP_HH__

#define __ARCH_AMDGPU_COMMON_DTYPE_MXFP_HH__


#include <cmath>

#include <cstdint>

#include <iostream>


#include "arch/amdgpu/common/dtype/mxfp_convert.hh"


namespace gem5

{


namespace AMDGPU

{


// Base class for all microscaling types. The sizes of everything are

// determined by the enum fields in the FMT struct. All of these share the

// same operator overloads which convert to float before arithmetic and

// convert back if assigned to a microscaling type.

template<typename FMT>


class mxfp

{

  public:

    mxfp() = default;


    mxfp(float f) : mode(roundTiesToEven)

    {

        data = float_to_mxfp(f);

    }

    mxfp(float f) : mode(roundTiesToEven) {…}


    // Set raw bits, used by gem5 to set a raw value read from VGPRs.


    mxfp(const uint32_t& raw)

    {

        // The info unions end up being "left" aligned. For example, in FP4

        // only the bits 31:28 are used. Shift the input by the storage size

        // of 32 by the type size (sign + exponent + mantissa bits).

        data = raw;

        data <<= (32 - int(FMT::sbits) - int(FMT::ebits) - int(FMT::mbits));

    }

    mxfp(const uint32_t& raw) {…}


    mxfp(const mxfp& f)

    {

        FMT conv_out;

        conv_out = convertMXFP<FMT, decltype(f.getFmt())>(f.getFmt());

        data = conv_out.storage;

    }

    mxfp(const mxfp& f) {…}


    mxfp&


    operator=(const float& f)

    {

       data = float_to_mxfp(f);

       return *this;

    }

    operator=(const float& f) {…}


    mxfp&


    operator=(const mxfp& f)

    {

        FMT conv_out;

        conv_out = convertMXFP<FMT, decltype(f.getFmt())>(f.getFmt());

        data = conv_out.storage;

        return *this;

    }

    operator=(const mxfp& f) {…}


    operator float() const

    {

        binary32 out;

        FMT in;

        in.storage = data;

        out = convertMXFP<binary32, FMT>(in, mode);


        return out.fp32;

    }

    operator float() const {…}


    constexpr static int


    size()

    {

        return int(FMT::mbits) + int(FMT::ebits) + int(FMT::sbits);

    }

    size() {…}


    // Intentionally use storage > size() so that a storage type is not needed

    // as a template parameter.

    uint32_t data = 0;


    FMT


    getFmt() const

    {

        FMT out;

        out.storage = data;

        return out;

    }

    getFmt() const {…}


    void


    setFmt(FMT in)

    {

        data = in.storage;

    }

    setFmt(FMT in) {…}


    // Used for upcasting

    void


    scaleMul(const float& f)

    {

        binary32 bfp;

        bfp.fp32 = f;

        int scale_val = bfp.exp;


        // Scale value of 0xFF is NaN. Scaling by NaN returns NaN.

        // In this implementation, types without NaN define it as max().

        if (scale_val == 0xFF) {

            data = FMT::nan;

            return;

        }


        scale_val -= bfp.bias;


        FMT in = getFmt();

        int exp = in.exp;


        if (exp + scale_val > max_exp<FMT>()) {

            in.exp = max_exp<FMT>();

        } else if (exp + scale_val < min_exp<FMT>()) {

            in.exp = min_exp<FMT>();

        } else {

            in.exp = exp + scale_val;

        }


        data = in.storage;

    }

    scaleMul(const float& f) {…}


    // Used for downcasting

    void


    scaleDiv(const float& f)

    {

        binary32 bfp;

        bfp.fp32 = f;

        int scale_val = bfp.exp;


        // Scale value of 0xFF is NaN. Scaling by NaN returns NaN.

        // In this implementation, types without NaN define it as max().

        if (scale_val == 0xFF) {

            data = FMT::nan;

            return;

        }


        scale_val -= bfp.bias;


        FMT in = getFmt();

        int exp = in.exp;


        if (exp - scale_val > max_exp<FMT>()) {

            in.exp = max_exp<FMT>();

        } else if (exp - scale_val < min_exp<FMT>()) {

            in.exp = min_exp<FMT>();

        } else {

            in.exp = exp - scale_val;


            // Output become denorm

            if (in.exp == 0) {

                uint32_t m = in.mant | 1 << FMT::mbits;

                m >>= 1;

                in.mant = m & mask(FMT::mbits);

            }

        }


        data = in.storage;

    }

    scaleDiv(const float& f) {…}


  private:

    mxfpRoundingMode mode = roundTiesToEven;


    uint32_t


    float_to_mxfp(float f)

    {

        binary32 in;

        in.fp32 = f;


        FMT out;

        out.storage = 0;


        out = convertMXFP<FMT, binary32>(in, mode);


        return out.storage;

    }

    float_to_mxfp(float f) {…}

};

class mxfp {…};


// Unary operators

/** Unary plus: returns the operand unchanged. */
template<typename T>
inline T operator+(T a)
{
    return a;
}


/**
 * Unary minus: returns a copy of the operand with bit 31 of its `data`
 * word toggled. The operand itself is not modified.
 */
template<typename T>
inline T operator-(T a)
{
    // Flip sign bit
    constexpr uint32_t sign_bit = 0x80000000u;
    a.data ^= sign_bit;
    return a;
}


/**
 * Prefix increment: adds T(1.0f) to the operand in place.
 *
 * The operand is taken by reference so that the caller's object is the one
 * that gets updated; taking it by value would only change a local copy.
 *
 * @return Reference to the updated operand.
 */
template<typename T>
inline T& operator++(T& a)
{
    a = a + T(1.0f);
    return a;
}


/**
 * Prefix decrement: subtracts T(1.0f) from the operand in place.
 *
 * The operand is taken by reference so that the caller's object is the one
 * that gets updated; taking it by value would only change a local copy.
 *
 * @return Reference to the updated operand.
 */
template<typename T>
inline T& operator--(T& a)
{
    a = a - T(1.0f);
    return a;
}


/**
 * Postfix increment: adds T(1.0f) to the operand in place.
 *
 * The operand is taken by reference so that the caller's object is the one
 * that gets updated; taking it by value would only change a local copy.
 *
 * @return Copy of the operand as it was before the increment.
 */
template<typename T>
inline T operator++(T& a, int)
{
    T original = a;
    a = a + T(1.0f);
    return original;
}


/**
 * Postfix decrement: subtracts T(1.0f) from the operand in place.
 *
 * The operand is taken by reference so that the caller's object is the one
 * that gets updated; taking it by value would only change a local copy.
 *
 * @return Copy of the operand as it was before the decrement.
 */
template<typename T>
inline T operator--(T& a, int)
{
    T original = a;
    a = a - T(1.0f);
    return original;
}


// Math operators

/**
 * Addition. Both operands are converted to float, added as floats, and the
 * sum is converted back to T.
 */
template<typename T>
inline T operator+(T a, T b)
{
    const float sum = float(a) + float(b);
    return T(sum);
}


/**
 * Subtraction. Both operands are converted to float, subtracted as floats,
 * and the difference is converted back to T.
 */
template<typename T>
inline T operator-(T a, T b)
{
    const float difference = float(a) - float(b);
    return T(difference);
}


/**
 * Multiplication. Both operands are converted to float, multiplied as
 * floats, and the product is converted back to T.
 */
template<typename T>
inline T operator*(T a, T b)
{
    const float product = float(a) * float(b);
    return T(product);
}


/**
 * Division. Both operands are converted to float, divided as floats, and
 * the quotient is converted back to T. No check is made for a zero
 * divisor; the result is whatever float division produces.
 */
template<typename T>
inline T operator/(T a, T b)
{
    const float quotient = float(a) / float(b);
    return T(quotient);
}


/**
 * Compound addition: stores a + b into a.
 *
 * @return Reference to the updated left operand.
 */
template<typename T>
inline T& operator+=(T &a, T b)
{
    a = a + b;
    return a;
}


/**
 * Compound subtraction: stores a - b into a.
 *
 * @return Reference to the updated left operand.
 */
template<typename T>
inline T& operator-=(T &a, T b)
{
    a = a - b;
    return a;
}


/**
 * Compound multiplication: stores a * b into a.
 *
 * @return Reference to the updated left operand.
 */
template<typename T>
inline T& operator*=(T &a, T b)
{
    a = a * b;
    return a;
}


/**
 * Compound division: stores a / b into a.
 *
 * @return Reference to the updated left operand.
 */
template<typename T>
inline T& operator/=(T &a, T b)
{
    a = a / b;
    return a;
}


// Comparison operators

/**
 * Less-than. Both operands are converted to float and compared as floats,
 * so the result is false whenever either conversion yields NaN.
 */
template<typename T>
inline bool operator<(T a, T b)
{
    const float lhs = float(a);
    const float rhs = float(b);
    return lhs < rhs;
}


/**
 * Greater-than. Both operands are converted to float and compared as
 * floats, so the result is false whenever either conversion yields NaN.
 */
template<typename T>
inline bool operator>(T a, T b)
{
    const float lhs = float(a);
    const float rhs = float(b);
    return lhs > rhs;
}


/**
 * Less-than-or-equal. Both operands are converted to float and compared as
 * floats, so the result is false whenever either conversion yields NaN.
 */
template<typename T>
inline bool operator<=(T a, T b)
{
    const float lhs = float(a);
    const float rhs = float(b);
    return lhs <= rhs;
}


/**
 * Greater-than-or-equal. Both operands are converted to float and compared
 * as floats, so the result is false whenever either conversion yields NaN.
 */
template<typename T>
inline bool operator>=(T a, T b)
{
    const float lhs = float(a);
    const float rhs = float(b);
    return lhs >= rhs;
}


/**
 * Equality. Compares the float conversions of the operands rather than
 * their raw bits, so float rules apply: a NaN never compares equal (not
 * even to itself) and +0.0f equals -0.0f.
 */
template<typename T>
inline bool operator==(T a, T b)
{
    const float lhs = float(a);
    const float rhs = float(b);
    return lhs == rhs;
}


/**
 * Inequality. Compares the float conversions of the operands rather than
 * their raw bits, so float rules apply: a NaN is unequal to everything
 * (including itself) and +0.0f is not unequal to -0.0f.
 */
template<typename T>
inline bool operator!=(T a, T b)
{
    const float lhs = float(a);
    const float rhs = float(b);
    return lhs != rhs;
}


} // namespace AMDGPU


} // namespace gem5


#endif // __ARCH_AMDGPU_COMMON_DTYPE_MXFP_HH__

gem5::AMDGPU::mxfp
Definition mxfp.hh:53

gem5::AMDGPU::mxfp::mxfp
mxfp(const mxfp &f)
Definition mxfp.hh:71

gem5::AMDGPU::mxfp::getFmt
FMT getFmt() const
Definition mxfp.hh:115

gem5::AMDGPU::mxfp::scaleMul
void scaleMul(const float &f)
Definition mxfp.hh:130

gem5::AMDGPU::mxfp::setFmt
void setFmt(FMT in)
Definition mxfp.hh:123

gem5::AMDGPU::mxfp::operator=
mxfp & operator=(const mxfp &f)
Definition mxfp.hh:86

gem5::AMDGPU::mxfp::float_to_mxfp
uint32_t float_to_mxfp(float f)
Definition mxfp.hh:201

gem5::AMDGPU::mxfp::size
static constexpr int size()
Definition mxfp.hh:105

gem5::AMDGPU::mxfp::mxfp
mxfp(const uint32_t &raw)
Definition mxfp.hh:62

gem5::AMDGPU::mxfp::mode
mxfpRoundingMode mode
Definition mxfp.hh:198

gem5::AMDGPU::mxfp::scaleDiv
void scaleDiv(const float &f)
Definition mxfp.hh:161

gem5::AMDGPU::mxfp::mxfp
mxfp()=default

gem5::AMDGPU::mxfp::operator=
mxfp & operator=(const float &f)
Definition mxfp.hh:79

gem5::AMDGPU::mxfp::mxfp
mxfp(float f)
Definition mxfp.hh:56

gem5::AMDGPU::mxfp::data
uint32_t data
Definition mxfp.hh:112

mxfp_convert.hh

gem5::AMDGPU::operator-=
T operator-=(T &a, T b)
Definition mxfp.hh:293

gem5::AMDGPU::operator<
bool operator<(T a, T b)
Definition mxfp.hh:315

gem5::AMDGPU::operator==
bool operator==(T a, T b)
Definition mxfp.hh:339

gem5::AMDGPU::operator*=
T operator*=(T &a, T b)
Definition mxfp.hh:300

gem5::AMDGPU::operator--
T operator--(T a)
Definition mxfp.hh:238

gem5::AMDGPU::operator++
T operator++(T a)
Definition mxfp.hh:231

gem5::AMDGPU::operator*
T operator*(T a, T b)
Definition mxfp.hh:274

gem5::AMDGPU::operator-
T operator-(T a)
Definition mxfp.hh:223

gem5::AMDGPU::operator+
T operator+(T a)
Definition mxfp.hh:217

gem5::AMDGPU::operator+=
T operator+=(T &a, T b)
Definition mxfp.hh:286

gem5::AMDGPU::convertMXFP
dFMT convertMXFP(sFMT in, mxfpRoundingMode mode=roundTiesToEven, uint32_t seed=0)
Definition mxfp_convert.hh:62

gem5::AMDGPU::operator!=
bool operator!=(T a, T b)
Definition mxfp.hh:345

gem5::AMDGPU::operator<=
bool operator<=(T a, T b)
Definition mxfp.hh:327

gem5::AMDGPU::operator/
T operator/(T a, T b)
Definition mxfp.hh:280

gem5::AMDGPU::operator>=
bool operator>=(T a, T b)
Definition mxfp.hh:333

gem5::AMDGPU::operator>
bool operator>(T a, T b)
Definition mxfp.hh:321

gem5::AMDGPU::mxfpRoundingMode
mxfpRoundingMode
Definition mxfp_convert.hh:49

gem5::AMDGPU::roundTiesToEven
@ roundTiesToEven
Definition mxfp_convert.hh:50

gem5::AMDGPU::operator/=
T operator/=(T &a, T b)
Definition mxfp.hh:307

gem5::ArmISA::mask
Bitfield< 3, 0 > mask
Definition pcstate.hh:63

gem5::ArmISA::b
Bitfield< 7 > b
Definition misc_types.hh:468

gem5::ArmISA::a
Bitfield< 8 > a
Definition misc_types.hh:66

gem5::ArmISA::f
Bitfield< 6 > f
Definition misc_types.hh:68

gem5::ArmISA::m
Bitfield< 0 > m
Definition misc_types.hh:479

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::AMDGPU::binary32_u
Definition binary32.hh:46

gem5::AMDGPU::binary32_u::storage
uint32_t storage
Definition binary32.hh:59

gem5::AMDGPU::binary32_u::fp32
float fp32
Definition binary32.hh:60