Go to the documentation of this file.
38 #ifndef __ARCH_ARM_INSTS_VFP_HH__
39 #define __ARCH_ARM_INSTS_VFP_HH__
68 flags[StaticInst::IsMicroop] =
true;
71 flags[StaticInst::IsMicroop] =
72 flags[StaticInst::IsFirstMicroop] =
true;
75 flags[StaticInst::IsMicroop] =
76 flags[StaticInst::IsLastMicroop] =
true;
82 flags[StaticInst::IsDelayedCommit] =
true;
113 static inline float bitsToFp(uint64_t,
float);
114 static inline double bitsToFp(uint64_t,
double);
115 static inline uint32_t
fpToBits(
float);
116 static inline uint64_t
fpToBits(
double);
118 template <
class fpType>
123 if (std::fpclassify(
op) == FP_SUBNORMAL) {
124 uint64_t bitMask = 0x1ULL << (
sizeof(fpType) * 8 - 1);
131 template <
class fpType>
137 return flush1 || flush2;
140 template <
class fpType>
149 template <
class fpType>
157 static inline uint32_t
169 static inline uint64_t
205 template <
class fpType>
209 const bool single = (
sizeof(fpType) ==
sizeof(
float));
210 const uint64_t qnan =
211 single ? 0x7fc00000 : 0x7ff8000000000000ULL;
220 template <
class fpType>
221 fpType
fixDest(FPSCR fpscr, fpType
val, fpType op1);
223 template <
class fpType>
224 fpType
fixDest(FPSCR fpscr, fpType
val, fpType op1, fpType op2);
226 template <
class fpType>
227 fpType
fixDivDest(FPSCR fpscr, fpType
val, fpType op1, fpType op2);
232 uint16_t
vcvtFpSFpH(FPSCR &fpscr,
bool flush,
bool defaultNan,
234 uint16_t
vcvtFpDFpH(FPSCR &fpscr,
bool flush,
bool defaultNan,
237 float vcvtFpHFpS(FPSCR &fpscr,
bool defaultNan,
bool ahp, uint16_t
op);
238 double vcvtFpHFpD(FPSCR &fpscr,
bool defaultNan,
bool ahp, uint16_t
op);
244 return bitsToFp((uint64_t)low | ((uint64_t)
high << 32), junk);
247 static inline uint32_t
253 static inline uint32_t
262 feraiseexcept(exceptions);
265 template <
typename T>
272 bool roundAwayFix =
false;
275 rmode = fegetround();
298 panic(
"Unsupported roundMode %d\n", roundMode);
301 __asm__ __volatile__(
"" :
"=m" (rmode) :
"m" (rmode));
304 __asm__ __volatile__(
"" :
"=m" (
val) :
"m" (
val));
307 __asm__ __volatile__(
"" :
"=m" (
val) :
"m" (
val));
310 __asm__ __volatile__(
"" :
"=m" (
val) :
"m" (
val));
314 int fpType = std::fpclassify(
val);
315 if (fpType == FP_SUBNORMAL || fpType == FP_NAN) {
316 if (fpType == FP_NAN) {
320 }
else if (origVal !=
val) {
323 if (origVal -
val > 0.5)
325 else if (
val - origVal > 0.5)
337 if ( (
error > 0.5) ||
353 __asm__ __volatile__(
"" :
"=m" (
val) :
"m" (
val));
356 bool outOfRange =
false;
357 int64_t result = (int64_t)
val;
362 finalVal = (int16_t)
val;
363 }
else if (
width == 32) {
364 finalVal =(int32_t)
val;
365 }
else if (
width == 64) {
373 if ((
double)
val < minVal) {
378 if ((
double)
val > maxVal) {
383 bool isNeg =
val < 0;
388 outOfRange = ((uint64_t) result >> (
width - 1)) !=
395 outOfRange |=
val < result;
397 finalVal = 1LL << (
width-1);
400 outOfRange |=
val > result;
415 if ((
double)
val < 0) {
461 return (idx % 32) < 8;
468 OpClass __opClass,
bool _wide) :
473 void nextIdxs(IntRegIndex &dest, IntRegIndex &op1, IntRegIndex &op2);
474 void nextIdxs(IntRegIndex &dest, IntRegIndex &op1);
478 template <
typename T>
485 template <
typename T>
528 template <
typename T>
535 template <
typename T>
542 const bool single = (
sizeof(T) ==
sizeof(
float));
554 bool inf1 = (std::fpclassify(
a) == FP_INFINITE);
555 bool inf2 = (std::fpclassify(
b) == FP_INFINITE);
556 bool zero1 = (std::fpclassify(
a) == FP_ZERO);
557 bool zero2 = (std::fpclassify(
b) == FP_ZERO);
558 if ((inf1 && zero2) || (zero1 && inf2)) {
569 template <
typename T>
588 template <
typename T>
595 if (
sizeof(T) ==
sizeof(
float))
596 result = fmaf(op1, op2, addend);
598 result = fma(op1, op2, addend);
601 if (std::isnan(result) && !std::isnan(op1) &&
602 !std::isnan(op2) && !std::isnan(addend))
604 uint64_t bitMask = 0x1ULL << ((
sizeof(T) * 8) - 1);
610 template <
typename T>
617 if (rVal !=
a && !std::isnan(
a))
622 template <
typename T>
626 const bool single = (
sizeof(T) ==
sizeof(
float));
627 const uint64_t qnan = single ? 0x7fc00000 : 0x7ff8000000000000ULL;
634 if (!std::signbit(
a) && std::signbit(
b))
639 template <
typename T>
647 return fpMaxNum<T>(
a,
b);
650 template <
typename T>
654 const bool single = (
sizeof(T) ==
sizeof(
float));
655 const uint64_t qnan = single ? 0x7fc00000 : 0x7ff8000000000000ULL;
662 if (std::signbit(
a) && !std::signbit(
b))
667 template <
typename T>
675 return fpMinNum<T>(
a,
b);
678 template <
typename T>
682 int fpClassA = std::fpclassify(
a);
683 int fpClassB = std::fpclassify(
b);
687 if ((fpClassA == FP_ZERO && fpClassB == FP_INFINITE) ||
688 (fpClassA == FP_INFINITE && fpClassB == FP_ZERO)) {
692 fpClassAxB = std::fpclassify(aXb);
693 if (fpClassAxB == FP_SUBNORMAL) {
697 return (3.0 - (
a *
b)) / 2.0;
700 template <
typename T>
704 int fpClassA = std::fpclassify(
a);
705 int fpClassB = std::fpclassify(
b);
709 if ((fpClassA == FP_ZERO && fpClassB == FP_INFINITE) ||
710 (fpClassA == FP_INFINITE && fpClassB == FP_ZERO)) {
714 fpClassAxB = std::fpclassify(aXb);
715 if (fpClassAxB == FP_SUBNORMAL) {
719 return 2.0 - (
a *
b);
726 int fpClassA = std::fpclassify(
a);
727 int fpClassB = std::fpclassify(
b);
731 if ((fpClassA == FP_ZERO && fpClassB == FP_INFINITE) ||
732 (fpClassA == FP_INFINITE && fpClassB == FP_ZERO)) {
736 fpClassAxB = std::fpclassify(aXb);
737 if (fpClassAxB == FP_SUBNORMAL) {
741 return (3.0 - (
a *
b)) / 2.0;
747 int fpClassA = std::fpclassify(
a);
748 int fpClassB = std::fpclassify(
b);
752 if ((fpClassA == FP_ZERO && fpClassB == FP_INFINITE) ||
753 (fpClassA == FP_INFINITE && fpClassB == FP_ZERO)) {
757 fpClassAxB = std::fpclassify(aXb);
758 if (fpClassAxB == FP_SUBNORMAL) {
762 return 2.0 - (
a *
b);
765 template <
typename T>
771 if (
a -
val == 0.5) {
772 if ( (((
int)
a) & 1) == 0 )
val += 1.0;
774 else if (
a -
val == -0.5) {
775 if ( (((
int)
a) & 1) == 0 )
val -= 1.0;
786 PredOp(mnem, _machInst, __opClass)
790 doOp(
float op1,
float op2)
const
792 panic(
"Unimplemented version of doOp called.\n");
798 panic(
"Unimplemented version of doOp called.\n");
802 doOp(
double op1,
double op2)
const
804 panic(
"Unimplemented version of doOp called.\n");
810 panic(
"Unimplemented version of doOp called.\n");
817 return bitsToFp((uint64_t)low | ((uint64_t)
high << 32), junk);
832 template <
class fpType>
834 processNans(FPSCR &fpscr,
bool &done,
bool defaultNan,
835 fpType op1, fpType op2)
const;
837 template <
class fpType>
839 ternaryOp(FPSCR &fpscr, fpType op1, fpType op2, fpType op3,
840 fpType (*func)(fpType, fpType, fpType),
841 bool flush,
bool defaultNan, uint32_t
rMode)
const;
843 template <
class fpType>
845 binaryOp(FPSCR &fpscr, fpType op1, fpType op2,
846 fpType (*func)(fpType, fpType),
847 bool flush,
bool defaultNan, uint32_t
rMode)
const;
849 template <
class fpType>
851 unaryOp(FPSCR &fpscr, fpType op1,
852 fpType (*func)(fpType),
853 bool flush, uint32_t
rMode)
const;
858 if (
flags[IsLastMicroop]) {
860 }
else if (
flags[IsMicroop]) {
871 return unaryOp(fpscr,
x,sqrtf,fpscr.fz,fpscr.rMode);
879 return unaryOp(fpscr,
x,sqrt,fpscr.fz,fpscr.rMode);
892 OpClass __opClass, IntRegIndex _op1, IntRegIndex _op2,
894 FpOp(mnem, _machInst, __opClass),
909 IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2,
911 FpOp(mnem, _machInst, __opClass),
926 IntRegIndex _dest, IntRegIndex _op1,
928 FpOp(mnem, _machInst, __opClass),
dest(_dest),
op1(_op1)
944 IntRegIndex _dest, uint64_t _imm,
946 FpOp(mnem, _machInst, __opClass),
dest(_dest),
imm(_imm)
963 IntRegIndex _dest, IntRegIndex _op1,
965 FpOp(mnem, _machInst, __opClass),
dest(_dest),
op1(_op1),
imm(_imm)
982 IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2,
984 FpOp(mnem, _machInst, __opClass),
dest(_dest),
op1(_op1),
op2(_op2)
1002 OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1,
1005 FpOp(mnem, _machInst, __opClass),
dest(_dest),
op1(_op1),
op2(_op2),
1024 IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2,
1026 FpOp(mnem, _machInst, __opClass),
dest(_dest),
op1(_op1),
op2(_op2),
1045 OpClass __opClass, IntRegIndex _dest,
1046 IntRegIndex _op1, IntRegIndex _op2,
1048 FpOp(mnem, _machInst, __opClass),
1061 #endif //__ARCH_ARM_INSTS_VFP_HH__
uint32_t unsignedRSqrtEstimate(uint32_t op)
fpType binaryOp(FPSCR &fpscr, fpType op1, fpType op2, fpType(*func)(fpType, fpType), bool flush, bool defaultNan, uint32_t rMode) const
FpOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass)
static T fpMinNum(T a, T b)
static T fpRecps(T a, T b)
static float bitsToFp(uint64_t, float)
float vfpUFixedToFpS(bool flush, bool defaultNan, uint64_t val, uint8_t width, uint8_t imm)
float fixFpDFpSDest(FPSCR fpscr, double val)
double fpSqrt(FPSCR fpscr, double x) const
float fprSqrtEstimate(FPSCR &fpscr, float op)
static void setVfpMicroFlags(VfpMicroMode mode, T &flags)
static float fpRSqrtsS(float a, float b)
double dbl(uint32_t low, uint32_t high) const
static T fpMaxNum(T a, T b)
FpRegRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, uint64_t _imm, VfpMicroMode mode=VfpNotAMicroop)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
static float fpMulS(float a, float b)
static double fpSubD(double a, double b)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
uint32_t dblHi(double val) const
static T fpRSqrts(T a, T b)
static void setFPExceptions(int exceptions)
uint64_t vfpFpToFixed(T val, bool isSigned, uint8_t width, uint8_t imm, bool useRmode=true, VfpRoundingMode roundMode=VfpRoundZero, bool aarch64=false)
static double fpAddD(double a, double b)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
static void vfpFlushToZero(FPSCR &fpscr, fpType &op)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
FpRegRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2, VfpMicroMode mode=VfpNotAMicroop)
void advancePC(PCState &pcState) const override
static float fpSubS(float a, float b)
float vfpSFixedToFpS(bool flush, bool defaultNan, int64_t val, uint8_t width, uint8_t imm)
static const uint32_t FpscrExcMask
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
FpRegRegRegCondOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2, ConditionCode _cond, VfpMicroMode mode=VfpNotAMicroop)
virtual float doOp(float op1) const
fpType processNans(FPSCR &fpscr, bool &done, bool defaultNan, fpType op1, fpType op2) const
FpRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, uint64_t _imm, VfpMicroMode mode=VfpNotAMicroop)
void finishVfp(FPSCR &fpscr, VfpSavedState state, bool flush, FPSCR mask)
VfpMacroOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, bool _wide)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
static float fpDivS(float a, float b)
FpRegRegRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2, IntRegIndex _op3, VfpMicroMode mode=VfpNotAMicroop)
static double makeDouble(uint32_t low, uint32_t high)
double vfpUFixedToFpD(bool flush, bool defaultNan, uint64_t val, uint8_t width, uint8_t imm)
uint16_t vcvtFpSFpH(FPSCR &fpscr, bool flush, bool defaultNan, uint32_t rMode, bool ahp, float op)
FpCondCompRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _op1, IntRegIndex _op2, ConditionCode _condCode, uint8_t _defCc)
float vcvtFpHFpS(FPSCR &fpscr, bool defaultNan, bool ahp, uint16_t op)
virtual float doOp(float op1, float op2) const
FpCondSelOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2, ConditionCode _condCode)
static T fpMulAdd(T op1, T op2, T addend)
std::bitset< Num_Flags > flags
Flag values for this instruction.
IntRegIndex addStride(IntRegIndex idx, unsigned stride)
uint32_t dblLow(double val) const
static float fpAddS(float a, float b)
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
double vfpSFixedToFpD(bool flush, bool defaultNan, int64_t val, uint8_t width, uint8_t imm)
void nextIdxs(IntRegIndex &dest, IntRegIndex &op1, IntRegIndex &op2)
static T fpRIntX(T a, FPSCR &fpscr)
double vcvtFpHFpD(FPSCR &fpscr, bool defaultNan, bool ahp, uint16_t op)
static uint32_t fpToBits(float)
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
static bool inScalarBank(IntRegIndex idx)
Base class for predicated macro-operations.
virtual double doOp(double op1) const
fpType fixDivDest(bool flush, bool defaultNan, fpType val, fpType op1, fpType op2)
static T fpMulX(T a, T b)
virtual double doOp(double op1, double op2) const
float fpRecipEstimate(FPSCR &fpscr, float op)
static uint32_t highFromDouble(double val)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
VfpSavedState prepFpState(uint32_t rMode)
FpRegRegRegImmOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, IntRegIndex _op2, uint64_t _imm, VfpMicroMode mode=VfpNotAMicroop)
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
static double fpMulD(double a, double b)
fpType unaryOp(FPSCR &fpscr, fpType op1, fpType(*func)(fpType), bool flush, uint32_t rMode) const
FPSCR fpStandardFPSCRValue(const FPSCR &fpscr)
fpType ternaryOp(FPSCR &fpscr, fpType op1, fpType op2, fpType op3, fpType(*func)(fpType, fpType, fpType), bool flush, bool defaultNan, uint32_t rMode) const
uint32_t unsignedRecipEstimate(uint32_t op)
static float fpRecpsS(float a, float b)
Base class for predicated integer operations.
fpType fixDest(bool flush, bool defaultNan, fpType val, fpType op1)
static bool isSnan(fpType val)
Reference material can be found at the JEDEC website: UFS standard http://www.jedec....
static uint32_t lowFromDouble(double val)
float fpSqrt(FPSCR fpscr, float x) const
Bitfield< 21, 20 > stride
std::string generateDisassembly(Addr pc, const loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
FpRegRegOp(const char *mnem, ExtMachInst _machInst, OpClass __opClass, IntRegIndex _dest, IntRegIndex _op1, VfpMicroMode mode=VfpNotAMicroop)
uint16_t vcvtFpDFpH(FPSCR &fpscr, bool flush, bool defaultNan, uint32_t rMode, bool ahp, double op)
#define panic(...)
This implements a cprintf based panic() function.
static double fpDivD(double a, double b)
double fixFpSFpDDest(FPSCR fpscr, float val)
Generated on Tue Sep 7 2021 14:53:41 for gem5 by doxygen 1.8.17