develop/vfp_8hh_source.html

/*

 * Copyright (c) 2010-2013, 2019, 2024-2025 Arm Limited

 * All rights reserved

 *

 * The license below extends only to copyright in the software and shall

 * not be construed as granting a license to any other intellectual

 * property including but not limited to intellectual property relating

 * to a hardware implementation of the functionality of the software

 * licensed hereunder.  You may use the software subject to the license

 * terms below provided that you ensure that this notice is replicated

 * unmodified and in its entirety in all distributions of the software,

 * modified or unmodified, in source code or in binary form.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are

 * met: redistributions of source code must retain the above copyright

 * notice, this list of conditions and the following disclaimer;

 * redistributions in binary form must reproduce the above copyright

 * notice, this list of conditions and the following disclaimer in the

 * documentation and/or other materials provided with the distribution;

 * neither the name of the copyright holders nor the names of its

 * contributors may be used to endorse or promote products derived from

 * this software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 */


#ifndef __ARCH_ARM_INSTS_VFP_HH__

#define __ARCH_ARM_INSTS_VFP_HH__


#include <fenv.h>

#include <cmath>
#include <cstring>

#include "arch/arm/insts/misc.hh"
#include "arch/arm/pcstate.hh"
#include "arch/arm/regs/misc.hh"
#include "cpu/thread_context.hh"


namespace gem5

{


namespace ArmISA

{


// Describes where a VFP instruction sits inside a micro-op sequence.
// setVfpMicroFlags() translates a value of this enum into StaticInst flags.
enum VfpMicroMode
{
    // Not a micro-op: setVfpMicroFlags() sets no flag.
    VfpNotAMicroop,
    // Micro-op that is neither first nor last: IsMicroop + IsDelayedCommit.
    VfpMicroop,
    // First micro-op: IsMicroop + IsFirstMicroop + IsDelayedCommit.
    VfpFirstMicroop,
    // Last micro-op: IsMicroop + IsLastMicroop (no delayed commit).
    VfpLastMicroop
};


/**
 * Set the micro-op related StaticInst flags that correspond to @p mode.
 *
 * Flags are only ever set to true; nothing is cleared. VfpNotAMicroop
 * leaves @p flags untouched.
 *
 * @param mode  Position of the instruction in its micro-op sequence.
 * @param flags Flag container indexable by StaticInst flag ids.
 */
template<class T>
static inline void
setVfpMicroFlags(VfpMicroMode mode, T &flags)
{
    const bool isMiddle = (mode == VfpMicroop);
    const bool isFirst = (mode == VfpFirstMicroop);
    const bool isLast = (mode == VfpLastMicroop);

    if (isFirst)
        flags[StaticInst::IsFirstMicroop] = true;
    if (isLast)
        flags[StaticInst::IsLastMicroop] = true;
    if (isMiddle || isFirst || isLast)
        flags[StaticInst::IsMicroop] = true;

    // Every micro-op except the last one is marked as delayed-commit.
    if (isMiddle || isFirst)
        flags[StaticInst::IsDelayedCommit] = true;
}


// Host floating-point exception flags, aliased from the <fenv.h> FE_*
// macros so they can be combined and passed to feclearexcept(),
// feraiseexcept() and fetestexcept().
enum FeExceptionBit
{
    FeDivByZero = FE_DIVBYZERO,
    FeInexact = FE_INEXACT,
    FeInvalid = FE_INVALID,
    FeOverflow = FE_OVERFLOW,
    FeUnderflow = FE_UNDERFLOW,
    // Union of all exception flags supported by the host.
    FeAllExceptions = FE_ALL_EXCEPT
};


// Host rounding modes, aliased from the <fenv.h> FE_* macros; these are the
// values handed to fesetround() / returned by fegetround() in this file.
enum FeRoundingMode
{
    FeRoundDown = FE_DOWNWARD,
    FeRoundNearest = FE_TONEAREST,
    FeRoundZero = FE_TOWARDZERO,
    FeRoundUpward = FE_UPWARD
};


// Rounding modes as requested by the simulated instruction.
// vfpFpToFixed() and vfpFpRint() map these onto FeRoundingMode values.
// NOTE(review): the numeric values presumably mirror an architectural
// encoding -- confirm before renumbering.
enum VfpRoundingMode
{
    VfpRoundNearest = 0,
    VfpRoundUpward = 1,
    VfpRoundDown = 2,
    VfpRoundZero = 3,
    // No host equivalent: emulated with round-down plus a manual fix-up.
    VfpRoundAway = 4
};


// Forward declarations of the bit-pattern <-> floating-point helpers that
// are defined further down; the templates in between need them visible.
// The second argument of bitsToFp() only selects the overload (float vs
// double); its value is not used by the definitions below.
static inline float bitsToFp(uint64_t, float);
static inline double bitsToFp(uint64_t, double);
static inline uint32_t fpToBits(float);
static inline uint64_t fpToBits(double);


/**
 * Classify a half-precision value given as its raw 16-bit encoding.
 *
 * Only the exponent (bits 14..10) and fraction (bits 9..0) are examined;
 * the sign bit does not influence the result.
 *
 * @param __x Raw 16-bit pattern.
 * @return One of FP_ZERO, FP_SUBNORMAL, FP_INFINITE, FP_NAN or FP_NORMAL.
 */
constexpr int
fpclassifyFpH(uint16_t __x)
{
    const uint16_t expField = bits(__x, 14, 10);
    const bool fracIsZero = (bits(__x, 9, 0) == 0);

    // All-zero exponent: zero or subnormal depending on the fraction.
    if (expField == 0)
        return fracIsZero ? FP_ZERO : FP_SUBNORMAL;

    // All-ones exponent: infinity or NaN depending on the fraction.
    if (expField == 0x1F)
        return fracIsZero ? FP_INFINITE : FP_NAN;

    return FP_NORMAL;
}


/**
 * Replace a subnormal operand with a zero of the same sign.
 *
 * @param op Operand, modified in place only when it is subnormal.
 * @return true if @p op was subnormal and has been flushed.
 */
template <class fpType>
static inline bool
flushToZero(fpType &op)
{
    if (std::fpclassify(op) != FP_SUBNORMAL)
        return false;

    // Keep only the most significant (sign) bit of the encoding.
    const uint64_t signOnly = 0x1ULL << (sizeof(fpType) * 8 - 1);
    const fpType overloadTag = 0.0;
    op = bitsToFp(fpToBits(op) & signOnly, overloadTag);
    return true;
}


/**
 * Half-precision variant of flushToZero(): a subnormal raw encoding is
 * replaced by a zero that keeps the original sign bit (bit 15).
 *
 * @param op Raw 16-bit encoding, modified in place only when subnormal.
 * @return true if @p op was subnormal and has been flushed.
 */
static inline bool
flushToZeroFpH(uint16_t& op)
{
    const bool wasSubnormal = (fpclassifyFpH(op) == FP_SUBNORMAL);
    if (wasSubnormal)
        op &= 0x8000;
    return wasSubnormal;
}


/**
 * Flush two operands to zero. Both operands are always processed, even if
 * the first one was already flushed.
 *
 * @return true if at least one of the operands was subnormal.
 */
template <class fpType>
static inline bool
flushToZero(fpType &op1, fpType &op2)
{
    bool anyFlushed = flushToZero(op1);
    // '|=' (not '||') so the second operand is flushed unconditionally.
    anyFlushed |= flushToZero(op2);
    return anyFlushed;
}


/**
 * Flush @p op to zero when FPSCR.FZ is set, recording the event in
 * FPSCR.IDC. When FZ is clear the operand is not touched.
 *
 * @param fpscr Status/control register; idc is set to 1 on a flush.
 * @param op    Operand, possibly replaced by a signed zero.
 */
template <class fpType>
static inline void
vfpFlushToZero(FPSCR &fpscr, fpType &op)
{
    if (fpscr.fz != 1)
        return;

    if (flushToZero(op))
        fpscr.idc = 1;
}


/**
 * Half-precision counterpart of vfpFlushToZero(): controlled by
 * FPSCR.FZ16 rather than FPSCR.FZ. A flush sets FPSCR.IDC.
 *
 * @param fpscr Status/control register; idc is set to 1 on a flush.
 * @param op    Raw 16-bit operand, possibly replaced by a signed zero.
 */
static inline void
vfpFlushToZeroFpH(FPSCR &fpscr, uint16_t& op)
{
    if (fpscr.fz16 != 1)
        return;

    if (flushToZeroFpH(op))
        fpscr.idc = 1;
}


// Two-operand convenience wrapper: applies the single-operand
// vfpFlushToZero() to op1 and then op2, so FPSCR.IDC ends up set if either
// operand was flushed.
template <class fpType>
static inline void
vfpFlushToZero(FPSCR &fpscr, fpType &op1, fpType &op2)
{
    vfpFlushToZero(fpscr, op1);
    vfpFlushToZero(fpscr, op2);
}


/**
 * Return the raw 32-bit encoding of a single-precision value.
 *
 * The copy goes through std::memcpy: reading the inactive member of a
 * union (the previous implementation) is undefined behaviour in ISO C++.
 *
 * @param fp Value to reinterpret.
 * @return The object representation of @p fp as an unsigned integer.
 */
static inline uint32_t
fpToBits(float fp)
{
    static_assert(sizeof(uint32_t) == sizeof(float),
                  "float is expected to be 32 bits wide");
    uint32_t raw;
    std::memcpy(&raw, &fp, sizeof(raw));
    return raw;
}


/**
 * Return the raw 64-bit encoding of a double-precision value.
 *
 * The copy goes through std::memcpy: reading the inactive member of a
 * union (the previous implementation) is undefined behaviour in ISO C++.
 *
 * @param fp Value to reinterpret.
 * @return The object representation of @p fp as an unsigned integer.
 */
static inline uint64_t
fpToBits(double fp)
{
    static_assert(sizeof(uint64_t) == sizeof(double),
                  "double is expected to be 64 bits wide");
    uint64_t raw;
    std::memcpy(&raw, &fp, sizeof(raw));
    return raw;
}


/**
 * Build a single-precision value from its raw encoding.
 *
 * Only the low 32 bits of @p bits are used. The copy goes through
 * std::memcpy: reading the inactive member of a union (the previous
 * implementation) is undefined behaviour in ISO C++.
 *
 * @param bits Raw encoding; the upper 32 bits are discarded.
 * @param junk Unused; only selects this overload over the double one.
 * @return The float whose object representation equals the low 32 bits.
 */
static inline float
bitsToFp(uint64_t bits, float junk)
{
    static_assert(sizeof(uint32_t) == sizeof(float),
                  "float is expected to be 32 bits wide");
    const uint32_t low = static_cast<uint32_t>(bits);
    float fp;
    std::memcpy(&fp, &low, sizeof(fp));
    return fp;
}


/**
 * Build a double-precision value from its raw 64-bit encoding.
 *
 * The copy goes through std::memcpy: reading the inactive member of a
 * union (the previous implementation) is undefined behaviour in ISO C++.
 *
 * @param bits Raw encoding.
 * @param junk Unused; only selects this overload over the float one.
 * @return The double whose object representation equals @p bits.
 */
static inline double
bitsToFp(uint64_t bits, double junk)
{
    static_assert(sizeof(uint64_t) == sizeof(double),
                  "double is expected to be 64 bits wide");
    double fp;
    std::memcpy(&fp, &bits, sizeof(fp));
    return fp;
}


/**
 * Tell whether @p val is a signalling NaN.
 *
 * A NaN is treated as signalling when its encoding does not contain the
 * full quiet-NaN pattern (exponent all ones plus the top fraction bit).
 *
 * @param val Value to test (float or double).
 * @return true for a signalling NaN, false for quiet NaNs and non-NaNs.
 */
template <class fpType>
static inline bool
isSnan(fpType val)
{
    if (!std::isnan(val))
        return false;

    const uint64_t quietPattern = (sizeof(fpType) == sizeof(float)) ?
        0x7fc00000 : 0x7ff8000000000000ULL;
    return (fpToBits(val) & quietPattern) != quietPattern;
}


// Opaque token returned by prepFpState() and handed back to finishVfp().
// NOTE(review): presumably the saved host rounding mode -- confirm in the
// implementation file.
typedef int VfpSavedState;

// Declarations only; the definitions are not part of this header.
// prepFpState()/finishVfp() bracket an emulated FP operation: the former
// takes the guest rounding mode, the latter updates fpscr (restricted by
// 'mask', which defaults to FpscrExcMask).
VfpSavedState prepFpState(uint32_t rMode);
void finishVfp(FPSCR &fpscr, VfpSavedState state, bool flush, FPSCR mask = FpscrExcMask);

// Result fix-up helpers for one-operand, two-operand and division results.
// NOTE(review): exact fix-up rules (NaN handling, flush-to-zero) are defined
// in the implementation -- not visible here.
template <class fpType>
fpType fixDest(FPSCR fpscr, fpType val, fpType op1);

template <class fpType>
fpType fixDest(FPSCR fpscr, fpType val, fpType op1, fpType op2);

template <class fpType>
fpType fixDivDest(FPSCR fpscr, fpType val, fpType op1, fpType op2);

// Fix-ups for precision-changing conversions (double -> float, float -> double).
float fixFpDFpSDest(FPSCR fpscr, double val);
double fixFpSFpDDest(FPSCR fpscr, float val);

// Conversions to half precision; the result is the raw 16-bit encoding.
// NOTE(review): 'ahp' presumably selects the alternative half-precision
// format -- confirm.
uint16_t vcvtFpSFpH(FPSCR &fpscr, bool flush, bool defaultNan,
                    uint32_t rMode, bool ahp, float op);
uint16_t vcvtFpDFpH(FPSCR &fpscr, bool flush, bool defaultNan,
                    uint32_t rMode, bool ahp, double op);

// Conversions from a raw 16-bit half-precision encoding.
float  vcvtFpHFpS(FPSCR &fpscr, bool defaultNan, bool ahp, uint16_t op);
double vcvtFpHFpD(FPSCR &fpscr, bool defaultNan, bool ahp, uint16_t op);


/**
 * Assemble a double from the two 32-bit halves of its raw encoding.
 *
 * @param low  Bits 31..0 of the encoding.
 * @param high Bits 63..32 of the encoding.
 */
static inline double
makeDouble(uint32_t low, uint32_t high)
{
    const uint64_t packed = (static_cast<uint64_t>(high) << 32) |
                            static_cast<uint64_t>(low);
    // The 0.0 argument only selects the double overload of bitsToFp().
    return bitsToFp(packed, 0.0);
}


/**
 * Return bits 31..0 of the raw encoding of @p val.
 */
static inline uint32_t
lowFromDouble(double val)
{
    const uint64_t raw = fpToBits(val);
    return static_cast<uint32_t>(raw);
}


/**
 * Return bits 63..32 of the raw encoding of @p val.
 */
static inline uint32_t
highFromDouble(double val)
{
    const uint64_t raw = fpToBits(val);
    return static_cast<uint32_t>(raw >> 32);
}


// Make the host FP exception state equal to exactly 'exceptions' (a
// combination of FeExceptionBit values): all flags are cleared first, then
// the requested ones are raised. The order of the two calls matters.
static inline void
setFPExceptions(int exceptions) {
    feclearexcept(FeAllExceptions);
    feraiseexcept(exceptions);
}


// Convert a floating-point value to a fixed-point integer.
//
// The value is first scaled by 2^imm (under round-to-nearest), then rounded
// to an integer with rint() under the selected rounding mode, and finally
// range-checked against 'width' bits and saturated.
//
// Parameters:
//   val       value to convert
//   isSigned  produce a signed (true) or unsigned (false) result
//   width     result width in bits; the signed non-aarch64 path accepts
//             only 16, 32 or 64 and panics otherwise
//   imm       number of fractional bits (scale factor is 2^imm)
//   useRmode  true: use 'roundMode'; false: use the host's current
//             rounding mode as returned by fegetround()
//   roundMode requested rounding mode (ignored when useRmode is false)
//   aarch64   selects the second of the two signed range-check paths
//
// Returns the (possibly saturated) result in a uint64_t.
//
// Side effects: the host exception flags are replaced via
// setFPExceptions(); the host rounding mode is left set to the mode used
// for the conversion (it is not restored here).
//
// NaN inputs yield 0 with FeInvalid; a subnormal rounded value yields 0.
// Out-of-range results set FeInvalid and clear FeInexact.
//
// NOTE(review): the empty asm statements with memory constraints look like
// compiler barriers that keep FP operations from being moved across the
// fenv calls -- keep statement order intact.
template <typename T>
uint64_t
GEM5_NO_OPTIMIZE
vfpFpToFixed(T val, bool isSigned, uint8_t width, uint8_t imm, bool
             useRmode = true, VfpRoundingMode roundMode = VfpRoundZero,
             bool aarch64 = false)
{
    int  rmode;
    bool roundAwayFix = false;

    // Pick the host rounding mode to use for the rint() below.
    if (!useRmode) {
        rmode = fegetround();
    } else {
        switch (roundMode)
        {
          case VfpRoundNearest:
            rmode = FeRoundNearest;
            break;
          case VfpRoundUpward:
            rmode = FeRoundUpward;
            break;
          case VfpRoundDown:
            rmode = FeRoundDown;
            break;
          case VfpRoundZero:
            rmode = FeRoundZero;
            break;
          case VfpRoundAway:
            // There is no equivalent rounding mode, use round down and we'll
            // fix it later
            rmode        = FeRoundDown;
            roundAwayFix = true;
            break;
          default:
            panic("Unsupported roundMode %d\n", roundMode);
        }
    }
    __asm__ __volatile__("" : "=m" (rmode) : "m" (rmode));
    // Scale by 2^imm under round-to-nearest, independent of rmode.
    fesetround(FeRoundNearest);
    val = val * pow(2.0, imm);
    __asm__ __volatile__("" : "=m" (val) : "m" (val));
    // Switch to the requested mode and start from a clean exception state so
    // that fetestexcept() below reports only what rint() raised.
    fesetround(rmode);
    feclearexcept(FeAllExceptions);
    __asm__ __volatile__("" : "=m" (val) : "m" (val));
    T origVal = val;
    val = rint(val);
    __asm__ __volatile__("" : "=m" (val) : "m" (val));

    int exceptions = fetestexcept(FeAllExceptions);

    int fpType = std::fpclassify(val);
    if (fpType == FP_SUBNORMAL || fpType == FP_NAN) {
        // NaN converts to 0 and is reported as an invalid operation.
        if (fpType == FP_NAN) {
            exceptions |= FeInvalid;
        }
        val = 0.0;
    } else if (origVal != val) {
        // Rounding changed the value: apply per-mode corrections and record
        // the result as inexact.
        switch (rmode) {
          case FeRoundNearest:
            if (origVal - val > 0.5)
                val += 1.0;
            else if (val - origVal > 0.5)
                val -= 1.0;
            break;
          case FeRoundDown:
            if (roundAwayFix) {
                // The ordering on the subtraction looks a bit odd in that we
                // don't do the obvious origVal - val, instead we do
                // -(val - origVal). This is required to get the correct bit
                // exact behaviour when very close to the 0.5 threshold.
                volatile T error = val;
                error -= origVal;
                error = -error;
                if ( (error >  0.5) ||
                    ((error == 0.5) && (val >= 0)) )
                    val += 1.0;
            } else {
                if (origVal < val)
                    val -= 1.0;
            }
            break;
          case FeRoundUpward:
            if (origVal > val)
                val += 1.0;
            break;
        }
        exceptions |= FeInexact;
    }

    __asm__ __volatile__("" : "=m" (val) : "m" (val));

    if (isSigned) {
        bool     outOfRange = false;
        int64_t  result     = (int64_t) val;
        uint64_t finalVal;

        if (!aarch64) {
            if (width == 16) {
                finalVal = (int16_t)val;
            } else if (width == 32) {
                finalVal =(int32_t)val;
            } else if (width == 64) {
                finalVal = result;
            } else {
                panic("Unsupported width %d\n", width);
            }

            // check if value is in range
            int64_t minVal = ~mask(width-1);
            if ((double)val < minVal) {
                outOfRange = true;
                finalVal = minVal;
            }
            int64_t maxVal = mask(width-1);
            if ((double)val > maxVal) {
                outOfRange = true;
                finalVal = maxVal;
            }
        } else {
            bool isNeg = val < 0;
            finalVal = result & mask(width);
            // If the result is supposed to be less than 64 bits check that the
            // upper bits that got thrown away are just sign extension bits
            if (width != 64) {
                outOfRange = ((uint64_t) result >> (width - 1)) !=
                             (isNeg ? mask(64-width+1) : 0);
            }
            // If the original floating point value doesn't match the
            // integer version we are also out of range. So create a saturated
            // result.
            if (isNeg) {
                outOfRange |= val < result;
                if (outOfRange) {
                    finalVal = 1LL << (width-1);
                }
            } else {
                outOfRange |= val > result;
                if (outOfRange) {
                    finalVal = mask(width-1);
                }
            }
        }

        // Raise an exception if the value was out of range
        if (outOfRange) {
            exceptions |= FeInvalid;
            exceptions &= ~FeInexact;
        }
        setFPExceptions(exceptions);
        return finalVal;
    } else {
        // Unsigned: negative values saturate to 0 and are invalid.
        if ((double)val < 0) {
            exceptions |= FeInvalid;
            exceptions &= ~FeInexact;
            setFPExceptions(exceptions);
            return 0;
        }

        // Values that do not survive the truncation to 'width' bits saturate
        // to mask(width) and are invalid.
        uint64_t result = ((uint64_t) val) & mask(width);
        if (val > result) {
            exceptions |= FeInvalid;
            exceptions &= ~FeInexact;
            setFPExceptions(exceptions);
            return mask(width);
        }

        setFPExceptions(exceptions);
        return result;
    }
};


// Round a floating-point value to an integral value of the same type.
//
// Parameters:
//   val        value to round
//   exact      when true, FeInexact is reported if rounding changed the
//              value; when false, FeInexact is always suppressed
//   defaultNan when true, any NaN result is replaced by the default quiet
//              NaN pattern
//   useRmode   true: use 'roundMode'; false: use the host's current
//              rounding mode as returned by fegetround()
//   roundMode  requested rounding mode (ignored when useRmode is false)
//
// Returns the rounded value. A zero result takes the sign of the input.
//
// Side effects: the host exception flags are replaced via
// setFPExceptions(); the host rounding mode is left set to the mode used
// for the rounding (it is not restored here).
//
// NOTE(review): the empty asm statements with memory constraints look like
// compiler barriers that keep FP operations from being moved across the
// fenv calls -- keep statement order intact.
template <typename T>
T
GEM5_NO_OPTIMIZE
vfpFpRint(T val, bool exact, bool defaultNan, bool useRmode = true,
          VfpRoundingMode roundMode = VfpRoundZero)
{
    int  rmode;
    bool roundAwayFix = false;

    // Pick the host rounding mode to use for the rint() below.
    if (!useRmode) {
        rmode = fegetround();
    } else {
        switch (roundMode)
        {
          case VfpRoundNearest:
            rmode = FeRoundNearest;
            break;
          case VfpRoundUpward:
            rmode = FeRoundUpward;
            break;
          case VfpRoundDown:
            rmode = FeRoundDown;
            break;
          case VfpRoundZero:
            rmode = FeRoundZero;
            break;
          case VfpRoundAway:
            // There is no equivalent rounding mode, use round down and we'll
            // fix it later
            rmode        = FeRoundDown;
            roundAwayFix = true;
            break;
          default:
            panic("Unsupported roundMode %d\n", roundMode);
        }
    }
    __asm__ __volatile__("" : "=m" (rmode) : "m" (rmode));
    __asm__ __volatile__("" : "=m" (val) : "m" (val));
    // Start from a clean exception state so that fetestexcept() below
    // reports only what rint() raised.
    fesetround(rmode);
    feclearexcept(FeAllExceptions);
    __asm__ __volatile__("" : "=m" (val) : "m" (val));
    T origVal = val;
    val = rint(val);
    __asm__ __volatile__("" : "=m" (val) : "m" (val));

    int exceptions = fetestexcept(FeAllExceptions);
    if (!exact) {
        exceptions &= ~FeInexact;
    }

    int fpType = std::fpclassify(val);
    if (fpType == FP_SUBNORMAL || fpType == FP_NAN) {
        if (fpType == FP_NAN) {
            // A signalling NaN is reported as an invalid operation.
            if (isSnan(val)) {
                exceptions |= FeInvalid;
            }
            // Default-NaN mode, or a quiet NaN: return the default quiet NaN
            // pattern for this precision.
            if (defaultNan || !isSnan(val)) {
                bool single = (sizeof(T) == sizeof(float));
                uint64_t qnan = single ? 0x7fc00000 : 0x7ff8000000000000ULL;
                val = bitsToFp(qnan, (T)0.0);
            }
        } else {
            val = 0.0;
        }
    } else if (origVal != val) {
        // Rounding changed the value: apply per-mode corrections.
        switch (rmode) {
          case FeRoundNearest:
            if (origVal - val > 0.5)
                val += 1.0;
            else if (val - origVal > 0.5)
                val -= 1.0;
            break;
          case FeRoundDown:
            if (roundAwayFix) {
                // The ordering on the subtraction looks a bit odd in that we
                // don't do the obvious origVal - val, instead we do
                // -(val - origVal). This is required to get the correct bit
                // exact behaviour when very close to the 0.5 threshold.
                volatile T error = val;
                error -= origVal;
                error = -error;
                if ( (error >  0.5) ||
                    ((error == 0.5) && (val >= 0)) )
                    val += 1.0;
            } else {
                if (origVal < val)
                    val -= 1.0;
            }
            break;
          case FeRoundUpward:
            if (origVal > val)
                val += 1.0;
            break;
        }
        if (exact) {
            exceptions |= FeInexact;
        }
    }
    // Fix the sign of zero: a zero result inherits the sign bit of the
    // original input.
    fpType = std::fpclassify(val);
    if (fpType == FP_ZERO) {
        bool single = (sizeof(T) == sizeof(float));
        uint64_t mask = single ? 0x80000000 : 0x8000000000000000ULL;
        val = bitsToFp((fpToBits(val) & (~mask)) | (fpToBits(origVal) & mask),
                       (T)0.0);
    }

    // __asm__ __volatile__("" : "=m" (val) : "m" (val));
    setFPExceptions(exceptions);

    return val;
};


// Declarations only; the definitions are not part of this header.

// Fixed-point to floating-point conversions. By name: U/S = unsigned/signed
// source, FpS/FpD = single/double result. 'width' and 'imm' mirror the
// parameters of vfpFpToFixed() (value width and number of fractional bits).
// NOTE(review): confirm the exact semantics in the implementation.
float vfpUFixedToFpS(bool flush, bool defaultNan,
        uint64_t val, uint8_t width, uint8_t imm);
float vfpSFixedToFpS(bool flush, bool defaultNan,
        int64_t val, uint8_t width, uint8_t imm);

double vfpUFixedToFpD(bool flush, bool defaultNan,
        uint64_t val, uint8_t width, uint8_t imm);
double vfpSFixedToFpD(bool flush, bool defaultNan,
        int64_t val, uint8_t width, uint8_t imm);

// Reciprocal square-root estimates for float, raw half-precision and
// unsigned integer operands.
float fprSqrtEstimate(FPSCR &fpscr, float op);
uint16_t fprSqrtEstimateFpH(FPSCR &fpscr, uint16_t op);
uint32_t unsignedRSqrtEstimate(uint32_t op);

// Reciprocal estimates for float, raw half-precision and unsigned integer
// operands.
float fpRecipEstimate(FPSCR &fpscr, float op);
uint16_t fpRecipEstimateFpH(FPSCR &fpscr, uint16_t op);
uint32_t unsignedRecipEstimate(uint32_t op);

// Derives an FPSCR value from the given one.
// NOTE(review): presumably the "standard FPSCR value" used by Advanced SIMD
// -- confirm.
FPSCR
fpStandardFPSCRValue(const FPSCR &fpscr);


/**
 * Base class for VFP macro-ops. Carries the 'wide' flag and declares the
 * register-index stepping helpers (addStride / nextIdxs) that are defined
 * outside this header.
 */
class VfpMacroOp : public PredMacroOp
{
  public:
    /**
     * @return true when @p idx, taken modulo 32, is one of the first
     *         eight indices (0..7).
     */
    static bool
    inScalarBank(RegIndex idx)
    {
        const auto offset = idx % 32;
        return offset < 8;
    }

  protected:
    /** Value of the constructor's _wide argument. */
    bool wide;

    VfpMacroOp(const char *mnem, ExtMachInst _machInst,
               OpClass __opClass, bool _wide)
        : PredMacroOp(mnem, _machInst, __opClass),
          wide(_wide)
    {
    }

    /** Returns a register index derived from @p idx and @p stride. */
    RegIndex addStride(RegIndex idx, unsigned stride);

    /** Update the given register indices in place for the next step. */
    void nextIdxs(RegIndex &dest, RegIndex &op1, RegIndex &op2);
    void nextIdxs(RegIndex &dest, RegIndex &op1);
    void nextIdxs(RegIndex &dest);
};


/** Plain host addition of two values of the same type: a + b. */
template <typename T>
static inline T
fpAdd(T a, T b)
{
    const T sum = a + b;
    return sum;
}


/** Plain host subtraction of two values of the same type: a - b. */
template <typename T>
static inline T
fpSub(T a, T b)
{
    const T difference = a - b;
    return difference;
}


/** Single-precision addition: a + b. */
static inline float
fpAddS(float a, float b)
{
    const float sum = a + b;
    return sum;
}


/** Double-precision addition: a + b. */
static inline double
fpAddD(double a, double b)
{
    const double sum = a + b;
    return sum;
}


/** Single-precision subtraction: a - b. */
static inline float
fpSubS(float a, float b)
{
    const float difference = a - b;
    return difference;
}


/** Double-precision subtraction: a - b. */
static inline double
fpSubD(double a, double b)
{
    const double difference = a - b;
    return difference;
}


/** Single-precision division: a / b. */
static inline float
fpDivS(float a, float b)
{
    const float quotient = a / b;
    return quotient;
}


/** Double-precision division: a / b. */
static inline double
fpDivD(double a, double b)
{
    const double quotient = a / b;
    return quotient;
}


/** Plain host division of two values of the same type: a / b. */
template <typename T>
static inline T
fpDiv(T a, T b)
{
    const T quotient = a / b;
    return quotient;
}


/**
 * Multiply with a special case for infinity times zero.
 *
 * When one operand is an infinity and the other a zero, the result is 2.0
 * with the sign given by the XOR of the operand signs; every other pair of
 * operands yields the ordinary product a * b.
 */
template <typename T>
static inline T
fpMulX(T a, T b)
{
    // The sign lives in the top bit of the encoding (bit 31 or bit 63).
    const unsigned signPos = sizeof(T) * 8 - 1;
    const bool negA = ((fpToBits(a) >> signPos) & 1) != 0;
    const bool negB = ((fpToBits(b) >> signPos) & 1) != 0;

    const int classA = std::fpclassify(a);
    const int classB = std::fpclassify(b);
    const bool infTimesZero =
        (classA == FP_INFINITE && classB == FP_ZERO) ||
        (classA == FP_ZERO && classB == FP_INFINITE);

    if (!infTimesZero)
        return (a * b);

    if (negA != negB)
        return (T)(-2.0);
    return (T)(2.0);
}


/** Plain host multiplication of two values of the same type: a * b. */
template <typename T>
static inline T
fpMul(T a, T b)
{
    const T product = a * b;
    return product;
}


/** Single-precision multiplication: a * b. */
static inline float
fpMulS(float a, float b)
{
    const float product = a * b;
    return product;
}


/** Double-precision multiplication: a * b. */
static inline double
fpMulD(double a, double b)
{
    const double product = a * b;
    return product;
}


/**
 * Fused multiply-add: op1 * op2 + addend, computed with fmaf() for
 * float-sized T and fma() otherwise.
 *
 * If the operation itself produced a NaN (none of the inputs was one), the
 * sign bit of that NaN is cleared.
 *
 * @todo remove this when all calls to it have been replaced with the new
 *       fplib implementation
 */
template <typename T>
static inline T
fpMulAdd(T op1, T op2, T addend)
{
    T fused;
    if (sizeof(T) == sizeof(float))
        fused = fmaf(op1, op2, addend);
    else
        fused = fma(op1, op2, addend);

    const bool nanInput =
        std::isnan(op1) || std::isnan(op2) || std::isnan(addend);

    // ARM doesn't generate signed NaNs from this operation, so strip the
    // sign from a freshly generated NaN.
    if (std::isnan(fused) && !nanInput) {
        const uint64_t signBit = 0x1ULL << ((sizeof(T) * 8) - 1);
        fused = bitsToFp(fpToBits(fused) & ~signBit, op1);
    }
    return fused;
}


/**
 * Round @p a to an integral value with rint() (current host rounding mode)
 * and record inexactness in FPSCR.IXC.
 *
 * @param a     Value to round.
 * @param fpscr ixc is set to 1 when the rounded value differs from a
 *              non-NaN input; it is never cleared here.
 * @return The rounded value.
 */
template <typename T>
static inline T
fpRIntX(T a, FPSCR &fpscr)
{
    const T rounded = rint(a);
    const bool changed = (rounded != a);
    if (changed && !std::isnan(a))
        fpscr.ixc = 1;
    return rounded;
}


/**
 * Maximum of two values with "number wins over quiet NaN" semantics.
 *
 * - a is NaN: returns b if a is quiet, otherwise a.
 * - else b is NaN: returns a if b is quiet, otherwise b.
 * - a has a clear sign bit and b a set one: returns a (this also orders
 *   +0 above -0).
 * - otherwise: fmax(a, b).
 */
template <typename T>
static inline T
fpMaxNum(T a, T b)
{
    const uint64_t quietPattern = (sizeof(T) == sizeof(float)) ?
        0x7fc00000 : 0x7ff8000000000000ULL;
    auto carriesQuietPattern = [quietPattern](T v) {
        return (fpToBits(v) & quietPattern) == quietPattern;
    };

    if (std::isnan(a)) {
        if (carriesQuietPattern(a))
            return b;
        return a;
    }
    if (std::isnan(b)) {
        if (carriesQuietPattern(b))
            return a;
        return b;
    }

    // Handle comparisons of +0 and -0.
    const bool aNonNegBNeg = !std::signbit(a) && std::signbit(b);
    if (aNonNegBNeg)
        return a;
    return fmax(a, b);
}


/**
 * Maximum of two values where any NaN operand is returned as the result
 * (a takes priority over b); otherwise defers to fpMaxNum().
 */
template <typename T>
static inline T
fpMax(T a, T b)
{
    const bool aIsNan = std::isnan(a);
    if (aIsNan || std::isnan(b))
        return aIsNan ? a : b;
    return fpMaxNum<T>(a, b);
}


/**
 * Minimum of two values with "number wins over quiet NaN" semantics.
 *
 * - a is NaN: returns b if a is quiet, otherwise a.
 * - else b is NaN: returns a if b is quiet, otherwise b.
 * - a has a set sign bit and b a clear one: returns a (this also orders
 *   -0 below +0).
 * - otherwise: fmin(a, b).
 */
template <typename T>
static inline T
fpMinNum(T a, T b)
{
    const uint64_t quietPattern = (sizeof(T) == sizeof(float)) ?
        0x7fc00000 : 0x7ff8000000000000ULL;
    auto carriesQuietPattern = [quietPattern](T v) {
        return (fpToBits(v) & quietPattern) == quietPattern;
    };

    if (std::isnan(a)) {
        if (carriesQuietPattern(a))
            return b;
        return a;
    }
    if (std::isnan(b)) {
        if (carriesQuietPattern(b))
            return a;
        return b;
    }

    // Handle comparisons of +0 and -0.
    const bool aNegBNonNeg = std::signbit(a) && !std::signbit(b);
    if (aNegBNonNeg)
        return a;
    return fmin(a, b);
}


/**
 * Minimum of two values where any NaN operand is returned as the result
 * (a takes priority over b); otherwise defers to fpMinNum().
 */
template <typename T>
static inline T
fpMin(T a, T b)
{
    const bool aIsNan = std::isnan(a);
    if (aIsNan || std::isnan(b))
        return aIsNan ? a : b;
    return fpMinNum<T>(a, b);
}


/**
 * Reciprocal square-root step: (3.0 - a * b) / 2.0.
 *
 * Special cases, both returning 1.5:
 *  - one operand is zero and the other infinite;
 *  - the product a * b is subnormal (FeUnderflow is raised as well).
 */
template <typename T>
static inline T
fpRSqrts(T a, T b)
{
    const int classA = std::fpclassify(a);
    const int classB = std::fpclassify(b);
    const bool zeroTimesInf =
        (classA == FP_ZERO && classB == FP_INFINITE) ||
        (classA == FP_INFINITE && classB == FP_ZERO);
    if (zeroTimesInf)
        return 1.5;

    const T product = a * b;
    if (std::fpclassify(product) == FP_SUBNORMAL) {
        feraiseexcept(FeUnderflow);
        return 1.5;
    }
    return (3.0 - (a * b)) / 2.0;
}


/**
 * Reciprocal step: 2.0 - a * b.
 *
 * Special cases, both returning 2.0:
 *  - one operand is zero and the other infinite;
 *  - the product a * b is subnormal (FeUnderflow is raised as well).
 */
template <typename T>
static inline T
fpRecps(T a, T b)
{
    const int classA = std::fpclassify(a);
    const int classB = std::fpclassify(b);
    const bool zeroTimesInf =
        (classA == FP_ZERO && classB == FP_INFINITE) ||
        (classA == FP_INFINITE && classB == FP_ZERO);
    if (zeroTimesInf)
        return 2.0;

    const T product = a * b;
    if (std::fpclassify(product) == FP_SUBNORMAL) {
        feraiseexcept(FeUnderflow);
        return 2.0;
    }
    return 2.0 - (a * b);
}


/**
 * Single-precision reciprocal square-root step: (3.0 - a * b) / 2.0.
 *
 * Special cases, both returning 1.5:
 *  - one operand is zero and the other infinite;
 *  - the product a * b is subnormal (FeUnderflow is raised as well).
 */
static inline float
fpRSqrtsS(float a, float b)
{
    const int classA = std::fpclassify(a);
    const int classB = std::fpclassify(b);
    const bool zeroTimesInf =
        (classA == FP_ZERO && classB == FP_INFINITE) ||
        (classA == FP_INFINITE && classB == FP_ZERO);
    if (zeroTimesInf)
        return 1.5;

    const float product = a * b;
    if (std::fpclassify(product) == FP_SUBNORMAL) {
        feraiseexcept(FeUnderflow);
        return 1.5;
    }
    return (3.0 - (a * b)) / 2.0;
}


/**
 * Single-precision reciprocal step: 2.0 - a * b.
 *
 * Special cases, both returning 2.0:
 *  - one operand is zero and the other infinite;
 *  - the product a * b is subnormal (FeUnderflow is raised as well).
 */
static inline float
fpRecpsS(float a, float b)
{
    const int classA = std::fpclassify(a);
    const int classB = std::fpclassify(b);
    const bool zeroTimesInf =
        (classA == FP_ZERO && classB == FP_INFINITE) ||
        (classA == FP_INFINITE && classB == FP_ZERO);
    if (zeroTimesInf)
        return 2.0;

    const float product = a * b;
    if (std::fpclassify(product) == FP_SUBNORMAL) {
        feraiseexcept(FeUnderflow);
        return 2.0;
    }
    return 2.0 - (a * b);
}


/**
 * Round to the nearest integral value, ties to even.
 *
 * round() resolves ties away from zero, so an exact tie is detected
 * afterwards (|a - round(a)| == 0.5) and pulled back by one when the
 * integer part of @p a is even.
 *
 * The parity test is done in floating point: converting @p a to int is
 * undefined once |a| >= 2^31, which made large ties (e.g. 2147483649.5)
 * round to an odd value on some hosts.
 *
 * @param a Value to round.
 * @return @p a rounded to the nearest integral value, ties to even.
 */
template <typename T>
static inline T
roundNEven(T a)
{
    T val = round(a);
    const T delta = a - val;

    if (delta == 0.5 || delta == -0.5) {
        // trunc(a) is the integer part of a; a tie needs correcting exactly
        // when that integer part is even.
        const bool truncIsEven = (std::fmod(std::trunc(a), T(2)) == 0);
        if (truncIsEven) {
            if (delta == 0.5)
                val += 1.0;     // negative tie: round() went one too low
            else
                val -= 1.0;     // positive tie: round() went one too high
        }
    }
    return val;
}


class FpOp : public PredOp

{

  protected:


    FpOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass) :

        PredOp(mnem, _machInst, __opClass)

    {}


    virtual float


    doOp(float op1, float op2) const

    {

        panic("Unimplemented version of doOp called.\n");

    }


    virtual float


    doOp(float op1) const

    {

        panic("Unimplemented version of doOp called.\n");

    }


    virtual double


    doOp(double op1, double op2) const

    {

        panic("Unimplemented version of doOp called.\n");

    }


    virtual double


    doOp(double op1) const

    {

        panic("Unimplemented version of doOp called.\n");

    }


    double


    dbl(uint32_t low, uint32_t high) const

    {

        double junk = 0.0;

        return bitsToFp((uint64_t)low | ((uint64_t)high << 32), junk);

    }


    uint32_t


    dblLow(double val) const

    {

        return fpToBits(val);

    }


    uint32_t


    dblHi(double val) const

    {

        return fpToBits(val) >> 32;

    }


    template <class fpType>

    fpType

    processNans(FPSCR &fpscr, bool &done, bool defaultNan,

                fpType op1, fpType op2) const;


    template <class fpType>

    fpType

    ternaryOp(FPSCR &fpscr, fpType op1, fpType op2, fpType op3,

              fpType (*func)(fpType, fpType, fpType),

              bool flush, bool defaultNan, uint32_t rMode) const;


    template <class fpType>

    fpType

    binaryOp(FPSCR &fpscr, fpType op1, fpType op2,

            fpType (*func)(fpType, fpType),

            bool flush, bool defaultNan, uint32_t rMode) const;


    template <class fpType>

    fpType

    unaryOp(FPSCR &fpscr, fpType op1,

            fpType (*func)(fpType),

            bool flush, uint32_t rMode) const;


    void


    advancePC(PCStateBase &pcState) const override

    {

        auto &apc = pcState.as<PCState>();

        if (flags[IsLastMicroop]) {

            apc.uEnd();

        } else if (flags[IsMicroop]) {

            apc.uAdvance();

        } else {

            apc.advance();

        }

    }


    void


    advancePC(ThreadContext *tc) const override

    {

        PCState pc = tc->pcState().as<PCState>();

        if (flags[IsLastMicroop]) {

            pc.uEnd();

        } else if (flags[IsMicroop]) {

            pc.uAdvance();

        } else {

            pc.advance();

        }

        tc->pcState(pc);

    }


    float


    fpSqrt (FPSCR fpscr,float x) const

    {


        return unaryOp(fpscr,x,sqrtf,fpscr.fz,fpscr.rMode);


    }


    double


    fpSqrt (FPSCR fpscr,double x) const

    {


        return unaryOp(fpscr,x,sqrt,fpscr.fz,fpscr.rMode);


    }


};


// FP operation with two source registers, a condition code and a
// 'defCc' byte; generateDisassembly() is defined outside this header.
// NOTE(review): by name this is the FP conditional-compare form and defCc
// is presumably the flag value used when the condition fails -- confirm.
class FpCondCompRegOp : public FpOp
{
  protected:
    // Source register indices.
    RegIndex op1, op2;
    // Condition evaluated by the instruction.
    ConditionCode condCode;
    uint8_t defCc;

    // Stores the operands verbatim; no micro-op flags are set here.
    FpCondCompRegOp(const char *mnem, ExtMachInst _machInst,
                       OpClass __opClass, RegIndex _op1, RegIndex _op2,
                       ConditionCode _condCode, uint8_t _defCc) :
        FpOp(mnem, _machInst, __opClass),
        op1(_op1), op2(_op2), condCode(_condCode), defCc(_defCc)
    {}

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with a destination register, two source registers and a
// condition code; generateDisassembly() is defined outside this header.
// NOTE(review): by name this is the FP conditional-select form -- confirm.
class FpCondSelOp : public FpOp
{
  protected:
    // Destination and source register indices.
    RegIndex dest, op1, op2;
    // Condition evaluated by the instruction.
    ConditionCode condCode;

    // Stores the operands verbatim; no micro-op flags are set here.
    FpCondSelOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass,
                RegIndex _dest, RegIndex _op1, RegIndex _op2,
                ConditionCode _condCode) :
        FpOp(mnem, _machInst, __opClass),
        dest(_dest), op1(_op1), op2(_op2), condCode(_condCode)
    {}

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with one destination and one source register.
// generateDisassembly() is defined outside this header.
class FpRegRegOp : public FpOp
{
  protected:
    // Destination register index.
    RegIndex dest;
    // Source register index.
    RegIndex op1;

    // Stores the operands and sets the micro-op flags that correspond to
    // 'mode' (none for the default VfpNotAMicroop).
    FpRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass,
               RegIndex _dest, RegIndex _op1,
               VfpMicroMode mode = VfpNotAMicroop) :
        FpOp(mnem, _machInst, __opClass), dest(_dest), op1(_op1)
    {
        setVfpMicroFlags(mode, flags);
    }

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with one destination register and a 64-bit immediate.
// generateDisassembly() is defined outside this header.
class FpRegImmOp : public FpOp
{
  protected:
    // Destination register index.
    RegIndex dest;
    // Immediate operand.
    uint64_t imm;

    // Stores the operands and sets the micro-op flags that correspond to
    // 'mode' (none for the default VfpNotAMicroop).
    FpRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass,
               RegIndex _dest, uint64_t _imm,
               VfpMicroMode mode = VfpNotAMicroop) :
        FpOp(mnem, _machInst, __opClass), dest(_dest), imm(_imm)
    {
        setVfpMicroFlags(mode, flags);
    }

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with one destination register, one source register and a
// 64-bit immediate. generateDisassembly() is defined outside this header.
class FpRegRegImmOp : public FpOp
{
  protected:
    // Destination register index.
    RegIndex dest;
    // Source register index.
    RegIndex op1;
    // Immediate operand.
    uint64_t imm;

    // Stores the operands and sets the micro-op flags that correspond to
    // 'mode' (none for the default VfpNotAMicroop).
    FpRegRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass,
                  RegIndex _dest, RegIndex _op1,
                  uint64_t _imm, VfpMicroMode mode = VfpNotAMicroop) :
        FpOp(mnem, _machInst, __opClass), dest(_dest), op1(_op1), imm(_imm)
    {
        setVfpMicroFlags(mode, flags);
    }

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with one destination and two source registers.
// generateDisassembly() is defined outside this header.
class FpRegRegRegOp : public FpOp
{
  protected:
    // Destination register index.
    RegIndex dest;
    // First source register index.
    RegIndex op1;
    // Second source register index.
    RegIndex op2;

    // Stores the operands and sets the micro-op flags that correspond to
    // 'mode' (none for the default VfpNotAMicroop).
    FpRegRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass,
                  RegIndex _dest, RegIndex _op1, RegIndex _op2,
                  VfpMicroMode mode = VfpNotAMicroop) :
        FpOp(mnem, _machInst, __opClass), dest(_dest), op1(_op1), op2(_op2)
    {
        setVfpMicroFlags(mode, flags);
    }

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with one destination register, two source registers and a
// condition code. generateDisassembly() is defined outside this header.
class FpRegRegRegCondOp : public FpOp
{
  protected:
    // Destination register index.
    RegIndex dest;
    // First source register index.
    RegIndex op1;
    // Second source register index.
    RegIndex op2;
    // Condition associated with the instruction.
    ConditionCode cond;

    // Stores the operands and sets the micro-op flags that correspond to
    // 'mode' (none for the default VfpNotAMicroop).
    FpRegRegRegCondOp(const char *mnem, ExtMachInst _machInst,
                      OpClass __opClass, RegIndex _dest, RegIndex _op1,
                      RegIndex _op2, ConditionCode _cond,
                      VfpMicroMode mode = VfpNotAMicroop) :
        FpOp(mnem, _machInst, __opClass), dest(_dest), op1(_op1), op2(_op2),
        cond(_cond)
    {
        setVfpMicroFlags(mode, flags);
    }

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


// FP operation with one destination and three source registers.
// generateDisassembly() is defined outside this header.
class FpRegRegRegRegOp : public FpOp
{
  protected:
    // Destination register index.
    RegIndex dest;
    // First source register index.
    RegIndex op1;
    // Second source register index.
    RegIndex op2;
    // Third source register index.
    RegIndex op3;

    // Stores the operands and sets the micro-op flags that correspond to
    // 'mode' (none for the default VfpNotAMicroop).
    FpRegRegRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass,
                     RegIndex _dest, RegIndex _op1, RegIndex _op2,
                     RegIndex _op3, VfpMicroMode mode = VfpNotAMicroop) :
        FpOp(mnem, _machInst, __opClass), dest(_dest), op1(_op1), op2(_op2),
        op3(_op3)
    {
        setVfpMicroFlags(mode, flags);
    }

    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


/**
 * FpOp specialisation that carries one destination register index, two
 * operand register indices and a 64-bit immediate. The constructor is
 * protected, so the class can only be instantiated through a derived
 * class.
 */
class FpRegRegRegImmOp : public FpOp
{
  protected:
    /// Register index of the destination.
    RegIndex dest;
    /// Register index of the first operand.
    RegIndex op1;
    /// Register index of the second operand.
    RegIndex op2;
    /// Immediate value, stored as an unsigned 64-bit integer.
    uint64_t imm;

    /**
     * Record the register indices and immediate, then apply the
     * micro-op mode.
     *
     * @param mnem Mnemonic, forwarded unchanged to FpOp.
     * @param _machInst Machine instruction, forwarded unchanged to FpOp.
     * @param __opClass Operation class, forwarded unchanged to FpOp.
     * @param _dest Value stored in dest.
     * @param _op1 Value stored in op1.
     * @param _op2 Value stored in op2.
     * @param _imm Value stored in imm.
     * @param mode Micro-op mode handed to setVfpMicroFlags(); defaults
     *             to VfpNotAMicroop.
     */
    FpRegRegRegImmOp(const char *mnem, ExtMachInst _machInst,
                     OpClass __opClass, RegIndex _dest, RegIndex _op1,
                     RegIndex _op2, uint64_t _imm,
                     VfpMicroMode mode = VfpNotAMicroop)
        : FpOp{mnem, _machInst, __opClass},
          dest{_dest},
          op1{_op1},
          op2{_op2},
          imm{_imm}
    {
        // Update this instruction's flags according to the requested mode.
        setVfpMicroFlags(mode, flags);
    }

    /// Internal function to generate the disassembly string.
    std::string generateDisassembly(
            Addr pc, const loader::SymbolTable *symtab) const override;
};


/**
 * Takes an FPSCR by const reference and returns a new FPSCR by value.
 * The implementation is out of line and not visible in this header.
 * NOTE(review): presumably yields the FPSCR value to use while executing
 * a vector/Advanced SIMD operation -- confirm against vfp.cc.
 *
 * @param fpscr Input FPSCR; not modified.
 * @return FPSCR value produced by the implementation.
 */
FPSCR fpVASimdFPSCRValue(const FPSCR &fpscr);

/**
 * Takes an FPSCR by const reference and returns a new FPSCR by value.
 * The implementation is out of line and not visible in this header.
 * NOTE(review): presumably the conversion-instruction counterpart of
 * fpVASimdFPSCRValue() -- confirm against vfp.cc.
 *
 * @param fpscr Input FPSCR; not modified.
 * @return FPSCR value produced by the implementation.
 */
FPSCR fpVASimdCvtFPSCRValue(const FPSCR &fpscr);

/**
 * Takes two FPSCR values and returns a new FPSCR by value. The
 * implementation is out of line and not visible in this header.
 * NOTE(review): presumably combines the FPSCR used during execution
 * with the original one to obtain the value to write back -- confirm
 * against vfp.cc.
 *
 * fpscr_exec is passed by value. A top-level const on a by-value
 * parameter is not part of the function's type, so it is left out of
 * this declaration; the definition may still mark its local copy const.
 *
 * @param fpscr_exec First FPSCR input, copied by the call.
 * @param fpscr Second FPSCR input; not modified.
 * @return FPSCR value produced by the implementation.
 */
FPSCR fpRestoreFPSCRValue(FPSCR fpscr_exec, const FPSCR &fpscr);


} // namespace ArmISA

} // namespace gem5


#endif //__ARCH_ARM_INSTS_VFP_HH__

misc.hh

misc.hh

pcstate.hh

gem5::ArmISA::FpCondCompRegOp::condCode
ConditionCode condCode
Definition vfp.hh:1065

gem5::ArmISA::FpCondCompRegOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:52

gem5::ArmISA::FpCondCompRegOp::FpCondCompRegOp
FpCondCompRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _op1, RegIndex _op2, ConditionCode _condCode, uint8_t _defCc)
Definition vfp.hh:1068

gem5::ArmISA::FpCondCompRegOp::defCc
uint8_t defCc
Definition vfp.hh:1066

gem5::ArmISA::FpCondCompRegOp::op2
RegIndex op2
Definition vfp.hh:1064

gem5::ArmISA::FpCondCompRegOp::op1
RegIndex op1
Definition vfp.hh:1064

gem5::ArmISA::FpCondSelOp::op2
RegIndex op2
Definition vfp.hh:1082

gem5::ArmISA::FpCondSelOp::op1
RegIndex op1
Definition vfp.hh:1082

gem5::ArmISA::FpCondSelOp::FpCondSelOp
FpCondSelOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, RegIndex _op2, ConditionCode _condCode)
Definition vfp.hh:1085

gem5::ArmISA::FpCondSelOp::condCode
ConditionCode condCode
Definition vfp.hh:1083

gem5::ArmISA::FpCondSelOp::dest
RegIndex dest
Definition vfp.hh:1082

gem5::ArmISA::FpCondSelOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:67

gem5::ArmISA::FpOp::advancePC
void advancePC(ThreadContext *tc) const override
Definition vfp.hh:1031

gem5::ArmISA::FpOp::advancePC
void advancePC(PCStateBase &pcState) const override
Definition vfp.hh:1018

gem5::ArmISA::FpOp::fpSqrt
float fpSqrt(FPSCR fpscr, float x) const
Definition vfp.hh:1045

gem5::ArmISA::FpOp::dblLow
uint32_t dblLow(double val) const
Definition vfp.hh:983

gem5::ArmISA::FpOp::unaryOp
fpType unaryOp(FPSCR &fpscr, fpType op1, fpType(*func)(fpType), bool flush, uint32_t rMode) const
Definition vfp.cc:1236

gem5::ArmISA::FpOp::processNans
fpType processNans(FPSCR &fpscr, bool &done, bool defaultNan, fpType op1, fpType op2) const
Definition vfp.cc:1043

gem5::ArmISA::FpOp::dblHi
uint32_t dblHi(double val) const
Definition vfp.hh:989

gem5::ArmISA::FpOp::doOp
virtual double doOp(double op1) const
Definition vfp.hh:970

gem5::ArmISA::FpOp::ternaryOp
fpType ternaryOp(FPSCR &fpscr, fpType op1, fpType op2, fpType op3, fpType(*func)(fpType, fpType, fpType), bool flush, bool defaultNan, uint32_t rMode) const
Definition vfp.cc:1087

gem5::ArmISA::FpOp::doOp
virtual float doOp(float op1) const
Definition vfp.hh:958

gem5::ArmISA::FpOp::binaryOp
fpType binaryOp(FPSCR &fpscr, fpType op1, fpType op2, fpType(*func)(fpType, fpType), bool flush, bool defaultNan, uint32_t rMode) const
Definition vfp.cc:1165

gem5::ArmISA::FpOp::doOp
virtual double doOp(double op1, double op2) const
Definition vfp.hh:964

gem5::ArmISA::FpOp::fpSqrt
double fpSqrt(FPSCR fpscr, double x) const
Definition vfp.hh:1053

gem5::ArmISA::FpOp::FpOp
FpOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass)
Definition vfp.hh:947

gem5::ArmISA::FpOp::doOp
virtual float doOp(float op1, float op2) const
Definition vfp.hh:952

gem5::ArmISA::FpOp::dbl
double dbl(uint32_t low, uint32_t high) const
Definition vfp.hh:976

gem5::ArmISA::FpRegImmOp::dest
RegIndex dest
Definition vfp.hh:1117

gem5::ArmISA::FpRegImmOp::imm
uint64_t imm
Definition vfp.hh:1118

gem5::ArmISA::FpRegImmOp::FpRegImmOp
FpRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, uint64_t _imm, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1120

gem5::ArmISA::FpRegImmOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:95

gem5::ArmISA::FpRegRegImmOp::dest
RegIndex dest
Definition vfp.hh:1135

gem5::ArmISA::FpRegRegImmOp::op1
RegIndex op1
Definition vfp.hh:1136

gem5::ArmISA::FpRegRegImmOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:106

gem5::ArmISA::FpRegRegImmOp::FpRegRegImmOp
FpRegRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, uint64_t _imm, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1139

gem5::ArmISA::FpRegRegImmOp::imm
uint64_t imm
Definition vfp.hh:1137

gem5::ArmISA::FpRegRegOp::FpRegRegOp
FpRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1102

gem5::ArmISA::FpRegRegOp::dest
RegIndex dest
Definition vfp.hh:1099

gem5::ArmISA::FpRegRegOp::op1
RegIndex op1
Definition vfp.hh:1100

gem5::ArmISA::FpRegRegOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:83

gem5::ArmISA::FpRegRegRegCondOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:133

gem5::ArmISA::FpRegRegRegCondOp::op1
RegIndex op1
Definition vfp.hh:1174

gem5::ArmISA::FpRegRegRegCondOp::FpRegRegRegCondOp
FpRegRegRegCondOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, RegIndex _op2, ConditionCode _cond, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1178

gem5::ArmISA::FpRegRegRegCondOp::op2
RegIndex op2
Definition vfp.hh:1175

gem5::ArmISA::FpRegRegRegCondOp::dest
RegIndex dest
Definition vfp.hh:1173

gem5::ArmISA::FpRegRegRegCondOp::cond
ConditionCode cond
Definition vfp.hh:1176

gem5::ArmISA::FpRegRegRegImmOp::FpRegRegRegImmOp
FpRegRegRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, RegIndex _op2, uint64_t _imm, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1221

gem5::ArmISA::FpRegRegRegImmOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:164

gem5::ArmISA::FpRegRegRegImmOp::dest
RegIndex dest
Definition vfp.hh:1216

gem5::ArmISA::FpRegRegRegImmOp::op1
RegIndex op1
Definition vfp.hh:1217

gem5::ArmISA::FpRegRegRegImmOp::op2
RegIndex op2
Definition vfp.hh:1218

gem5::ArmISA::FpRegRegRegImmOp::imm
uint64_t imm
Definition vfp.hh:1219

gem5::ArmISA::FpRegRegRegOp::dest
RegIndex dest
Definition vfp.hh:1154

gem5::ArmISA::FpRegRegRegOp::op2
RegIndex op2
Definition vfp.hh:1156

gem5::ArmISA::FpRegRegRegOp::FpRegRegRegOp
FpRegRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, RegIndex _op2, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1158

gem5::ArmISA::FpRegRegRegOp::op1
RegIndex op1
Definition vfp.hh:1155

gem5::ArmISA::FpRegRegRegOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:119

gem5::ArmISA::FpRegRegRegRegOp::FpRegRegRegRegOp
FpRegRegRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, RegIndex _dest, RegIndex _op1, RegIndex _op2, RegIndex _op3, VfpMicroMode mode=VfpNotAMicroop)
Definition vfp.hh:1200

gem5::ArmISA::FpRegRegRegRegOp::op3
RegIndex op3
Definition vfp.hh:1198

gem5::ArmISA::FpRegRegRegRegOp::dest
RegIndex dest
Definition vfp.hh:1195

gem5::ArmISA::FpRegRegRegRegOp::op2
RegIndex op2
Definition vfp.hh:1197

gem5::ArmISA::FpRegRegRegRegOp::op1
RegIndex op1
Definition vfp.hh:1196

gem5::ArmISA::FpRegRegRegRegOp::generateDisassembly
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
Definition vfp.cc:148

gem5::ArmISA::PredMacroOp::PredMacroOp
PredMacroOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass)
Constructor.
Definition pred_inst.hh:350

gem5::ArmISA::PredOp::PredOp
PredOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass)
Constructor.
Definition pred_inst.hh:223

gem5::ArmISA::VfpMacroOp::inScalarBank
static bool inScalarBank(RegIndex idx)
Definition vfp.hh:621

gem5::ArmISA::VfpMacroOp::nextIdxs
void nextIdxs(RegIndex &dest, RegIndex &op1, RegIndex &op2)
Definition vfp.cc:1306

gem5::ArmISA::VfpMacroOp::addStride
RegIndex addStride(RegIndex idx, unsigned stride)
Definition vfp.cc:1293

gem5::ArmISA::VfpMacroOp::VfpMacroOp
VfpMacroOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, bool _wide)
Definition vfp.hh:629

gem5::ArmISA::VfpMacroOp::wide
bool wide
Definition vfp.hh:627

gem5::PCStateBase
Definition pcstate.hh:59

gem5::PCStateBase::as
Target & as()
Definition pcstate.hh:73

gem5::PowerISA::PCState
Definition pcstate.hh:43

gem5::StaticInst::flags
std::bitset< Num_Flags > flags
Flag values for this instruction.
Definition static_inst.hh:103

gem5::ThreadContext
ThreadContext is the external interface to all thread state for anything outside of the CPU.
Definition thread_context.hh:89

gem5::ThreadContext::pcState
virtual const PCStateBase & pcState() const =0

gem5::loader::SymbolTable
Definition symtab.hh:152

GEM5_NO_OPTIMIZE
#define GEM5_NO_OPTIMIZE
Definition compiler.hh:141

thread_context.hh

gem5::bits
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
Definition bitfield.hh:79

panic
#define panic(...)
This implements a cprintf based panic() function.
Definition logging.hh:220

gem5::ArmISA
Definition decoder.cc:55

gem5::ArmISA::flushToZero
flushToZero
Definition misc_types.hh:585

gem5::ArmISA::unsignedRecipEstimate
uint32_t unsignedRecipEstimate(uint32_t op)
Definition vfp.cc:1015

gem5::ArmISA::FeRoundingMode
FeRoundingMode
Definition vfp.hh:99

gem5::ArmISA::FeRoundZero
@ FeRoundZero
Definition vfp.hh:102

gem5::ArmISA::FeRoundNearest
@ FeRoundNearest
Definition vfp.hh:101

gem5::ArmISA::FeRoundUpward
@ FeRoundUpward
Definition vfp.hh:103

gem5::ArmISA::FeRoundDown
@ FeRoundDown
Definition vfp.hh:100

gem5::ArmISA::fpToBits
static uint32_t fpToBits(float)
Definition vfp.hh:203

gem5::ArmISA::fixDivDest
fpType fixDivDest(bool flush, bool defaultNan, fpType val, fpType op1, fpType op2)
Definition vfp.cc:301

gem5::ArmISA::highFromDouble
static uint32_t highFromDouble(double val)
Definition vfp.hh:299

gem5::ArmISA::fpMulD
static double fpMulD(double a, double b)
Definition vfp.hh:745

gem5::ArmISA::fpMin
static T fpMin(T a, T b)
Definition vfp.hh:831

gem5::ArmISA::mask
Bitfield< 3, 0 > mask
Definition pcstate.hh:63

gem5::ArmISA::fpMax
static T fpMax(T a, T b)
Definition vfp.hh:803

gem5::ArmISA::fpRecipEstimateFpH
uint16_t fpRecipEstimateFpH(FPSCR &fpscr, uint16_t op)
Definition vfp.cc:948

gem5::ArmISA::vfpSFixedToFpD
double vfpSFixedToFpD(bool flush, bool defaultNan, int64_t val, uint8_t width, uint8_t imm)
Definition vfp.cc:731

gem5::ArmISA::vfpFpRint
T GEM5_NO_OPTIMIZE vfpFpRint(T val, bool exact, bool defaultNan, bool useRmode=true, VfpRoundingMode roundMode=VfpRoundZero)
Definition vfp.hh:485

gem5::ArmISA::mode
Bitfield< 4, 0 > mode
Definition misc_types.hh:74

gem5::ArmISA::width
Bitfield< 4 > width
Definition misc_types.hh:72

gem5::ArmISA::stride
Bitfield< 21, 20 > stride
Definition misc_types.hh:533

gem5::ArmISA::fpRIntX
static T fpRIntX(T a, FPSCR &fpscr)
Definition vfp.hh:774

gem5::ArmISA::fpSub
static T fpSub(T a, T b)
Definition vfp.hh:649

gem5::ArmISA::imm
Bitfield< 7, 0 > imm
Definition types.hh:132

gem5::ArmISA::b
Bitfield< 7 > b
Definition misc_types.hh:471

gem5::ArmISA::FpscrExcMask
static const uint32_t FpscrExcMask
Definition misc.hh:3021

gem5::ArmISA::fpRSqrtsS
static float fpRSqrtsS(float a, float b)
Definition vfp.hh:886

gem5::ArmISA::fpDivS
static float fpDivS(float a, float b)
Definition vfp.hh:679

gem5::ArmISA::vcvtFpHFpD
double vcvtFpHFpD(FPSCR &fpscr, bool defaultNan, bool ahp, uint16_t op)
Definition vfp.cc:654

gem5::ArmISA::rMode
Bitfield< 23, 22 > rMode
Definition misc_types.hh:534

gem5::ArmISA::fpMulX
static T fpMulX(T a, T b)
Definition vfp.hh:699

gem5::ArmISA::fprSqrtEstimateFpH
uint16_t fprSqrtEstimateFpH(FPSCR &fpscr, uint16_t op)
Definition vfp.cc:813

gem5::ArmISA::fpRecpsS
static float fpRecpsS(float a, float b)
Definition vfp.hh:907

gem5::ArmISA::vfpUFixedToFpS
float vfpUFixedToFpS(bool flush, bool defaultNan, uint64_t val, uint8_t width, uint8_t imm)
Definition vfp.cc:674

gem5::ArmISA::unsignedRSqrtEstimate
uint32_t unsignedRSqrtEstimate(uint32_t op)
Definition vfp.cc:873

gem5::ArmISA::prepFpState
VfpSavedState prepFpState(uint32_t rMode)
Definition vfp.cc:182

gem5::ArmISA::fixFpDFpSDest
float fixFpDFpSDest(FPSCR fpscr, double val)
Definition vfp.cc:336

gem5::ArmISA::flushToZeroFpH
static bool flushToZeroFpH(uint16_t &op)
Definition vfp.hh:159

gem5::ArmISA::VfpSavedState
int VfpSavedState
Definition vfp.hh:260

gem5::ArmISA::fpMul
static T fpMul(T a, T b)
Definition vfp.hh:733

gem5::ArmISA::fpMulS
static float fpMulS(float a, float b)
Definition vfp.hh:739

gem5::ArmISA::fpDiv
static T fpDiv(T a, T b)
Definition vfp.hh:692

gem5::ArmISA::finishVfp
void finishVfp(FPSCR &fpscr, VfpSavedState state, bool flush, FPSCR mask)
Definition vfp.cc:204

gem5::ArmISA::fixFpSFpDDest
double fixFpSFpDDest(FPSCR fpscr, float val)
Definition vfp.cc:372

gem5::ArmISA::FeExceptionBit
FeExceptionBit
Definition vfp.hh:89

gem5::ArmISA::FeUnderflow
@ FeUnderflow
Definition vfp.hh:94

gem5::ArmISA::FeDivByZero
@ FeDivByZero
Definition vfp.hh:90

gem5::ArmISA::FeInvalid
@ FeInvalid
Definition vfp.hh:92

gem5::ArmISA::FeOverflow
@ FeOverflow
Definition vfp.hh:93

gem5::ArmISA::FeAllExceptions
@ FeAllExceptions
Definition vfp.hh:95

gem5::ArmISA::FeInexact
@ FeInexact
Definition vfp.hh:91

gem5::ArmISA::vcvtFpHFpS
float vcvtFpHFpS(FPSCR &fpscr, bool defaultNan, bool ahp, uint16_t op)
Definition vfp.cc:664

gem5::ArmISA::roundNEven
static T roundNEven(T a)
Definition vfp.hh:929

gem5::ArmISA::VfpMicroMode
VfpMicroMode
Definition vfp.hh:57

gem5::ArmISA::VfpNotAMicroop
@ VfpNotAMicroop
Definition vfp.hh:58

gem5::ArmISA::VfpMicroop
@ VfpMicroop
Definition vfp.hh:59

gem5::ArmISA::VfpFirstMicroop
@ VfpFirstMicroop
Definition vfp.hh:60

gem5::ArmISA::VfpLastMicroop
@ VfpLastMicroop
Definition vfp.hh:61

gem5::ArmISA::fpMinNum
static T fpMinNum(T a, T b)
Definition vfp.hh:814

gem5::ArmISA::ConditionCode
ConditionCode
Definition cc.hh:104

gem5::ArmISA::vfpSFixedToFpS
float vfpSFixedToFpS(bool flush, bool defaultNan, int64_t val, uint8_t width, uint8_t imm)
Definition vfp.cc:692

gem5::ArmISA::lowFromDouble
static uint32_t lowFromDouble(double val)
Definition vfp.hh:293

gem5::ArmISA::fixDest
fpType fixDest(bool flush, bool defaultNan, fpType val, fpType op1)
Definition vfp.cc:230

gem5::ArmISA::a
Bitfield< 8 > a
Definition misc_types.hh:66

gem5::ArmISA::vfpUFixedToFpD
double vfpUFixedToFpD(bool flush, bool defaultNan, uint64_t val, uint8_t width, uint8_t imm)
Definition vfp.cc:712

gem5::ArmISA::bitsToFp
static float bitsToFp(uint64_t, float)
Definition vfp.hh:227

gem5::ArmISA::fpclassifyFpH
constexpr int fpclassifyFpH(uint16_t __x)
Definition vfp.hh:121

gem5::ArmISA::fpMulAdd
static T fpMulAdd(T op1, T op2, T addend)
Definition vfp.hh:753

gem5::ArmISA::fpAddD
static double fpAddD(double a, double b)
Definition vfp.hh:661

gem5::ArmISA::fpSubS
static float fpSubS(float a, float b)
Definition vfp.hh:667

gem5::ArmISA::fpVASimdCvtFPSCRValue
FPSCR fpVASimdCvtFPSCRValue(const FPSCR &fpscr)
Definition vfp.cc:1349

gem5::ArmISA::vcvtFpDFpH
uint16_t vcvtFpDFpH(FPSCR &fpscr, bool flush, bool defaultNan, uint32_t rMode, bool ahp, double op)
Definition vfp.cc:584

gem5::ArmISA::fpSubD
static double fpSubD(double a, double b)
Definition vfp.hh:673

gem5::ArmISA::vfpFpToFixed
uint64_t GEM5_NO_OPTIMIZE vfpFpToFixed(T val, bool isSigned, uint8_t width, uint8_t imm, bool useRmode=true, VfpRoundingMode roundMode=VfpRoundZero, bool aarch64=false)
Definition vfp.hh:313

gem5::ArmISA::fpStandardFPSCRValue
FPSCR fpStandardFPSCRValue(const FPSCR &fpscr)
Definition vfp.cc:1031

gem5::ArmISA::fpRSqrts
static T fpRSqrts(T a, T b)
Definition vfp.hh:842

gem5::ArmISA::isSnan
static bool isSnan(fpType val)
Definition vfp.hh:252

gem5::ArmISA::vfpFlushToZeroFpH
static void vfpFlushToZeroFpH(FPSCR &fpscr, uint16_t &op)
Definition vfp.hh:187

gem5::ArmISA::vcvtFpSFpH
uint16_t vcvtFpSFpH(FPSCR &fpscr, bool flush, bool defaultNan, uint32_t rMode, bool ahp, float op)
Definition vfp.cc:576

gem5::ArmISA::setFPExceptions
static void setFPExceptions(int exceptions)
Definition vfp.hh:305

gem5::ArmISA::fpAdd
static T fpAdd(T a, T b)
Definition vfp.hh:642

gem5::ArmISA::fpAddS
static float fpAddS(float a, float b)
Definition vfp.hh:655

gem5::ArmISA::makeDouble
static double makeDouble(uint32_t low, uint32_t high)
Definition vfp.hh:286

gem5::ArmISA::vfpFlushToZero
static void vfpFlushToZero(FPSCR &fpscr, fpType &op)
Definition vfp.hh:179

gem5::ArmISA::aarch64
Bitfield< 34 > aarch64
Definition types.hh:81

gem5::ArmISA::fpDivD
static double fpDivD(double a, double b)
Definition vfp.hh:685

gem5::ArmISA::setVfpMicroFlags
static void setVfpMicroFlags(VfpMicroMode mode, T &flags)
Definition vfp.hh:66

gem5::ArmISA::fp
Bitfield< 19, 16 > fp
Definition misc_types.hh:225

gem5::ArmISA::fpRecps
static T fpRecps(T a, T b)
Definition vfp.hh:864

gem5::ArmISA::ahp
Bitfield< 26 > ahp
Definition misc_types.hh:537

gem5::ArmISA::fprSqrtEstimate
float fprSqrtEstimate(FPSCR &fpscr, float op)
Definition vfp.cc:770

gem5::ArmISA::fpRecipEstimate
float fpRecipEstimate(FPSCR &fpscr, float op)
Definition vfp.cc:912

gem5::ArmISA::VfpRoundingMode
VfpRoundingMode
Definition vfp.hh:107

gem5::ArmISA::VfpRoundNearest
@ VfpRoundNearest
Definition vfp.hh:108

gem5::ArmISA::VfpRoundZero
@ VfpRoundZero
Definition vfp.hh:111

gem5::ArmISA::VfpRoundAway
@ VfpRoundAway
Definition vfp.hh:112

gem5::ArmISA::VfpRoundUpward
@ VfpRoundUpward
Definition vfp.hh:109

gem5::ArmISA::VfpRoundDown
@ VfpRoundDown
Definition vfp.hh:110

gem5::ArmISA::fpRestoreFPSCRValue
FPSCR fpRestoreFPSCRValue(const FPSCR fpscr_exec, const FPSCR &fpscr)
Definition vfp.cc:1361

gem5::ArmISA::fpVASimdFPSCRValue
FPSCR fpVASimdFPSCRValue(const FPSCR &fpscr)
Definition vfp.cc:1337

gem5::ArmISA::fpMaxNum
static T fpMaxNum(T a, T b)
Definition vfp.hh:786

gem5::MipsISA::pc
Bitfield< 4 > pc
Definition pra_constants.hh:243

gem5::RiscvISA::fmin
FloatType fmin(FloatType a, FloatType b)
Definition utility.hh:377

gem5::RiscvISA::x
Bitfield< 3 > x
Definition pagetable.hh:78

gem5::RiscvISA::fmax
FloatType fmax(FloatType a, FloatType b)
Definition utility.hh:389

gem5::X86ISA::op
Bitfield< 4 > op
Definition types.hh:83

gem5::X86ISA::val
Bitfield< 63 > val
Definition misc.hh:804

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::RegIndex
uint16_t RegIndex
Definition types.hh:176

gem5::Addr
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition types.hh:147

std::isnan
constexpr bool isnan(gem5::AMDGPU::fp16_e5m10_info a)
Definition fp16_e5m10.hh:83

gem5::X86ISA::ExtMachInst
Definition types.hh:213