gem5
v20.0.0.2
|
#include <op_encodings.hh>
Classes | |
struct | BufferRsrcDescriptor |
Public Member Functions | |
Inst_MUBUF (InFmt_MUBUF *, const std::string &opcode) | |
~Inst_MUBUF () | |
int | instSize () const override |
void | generateDisassembly () override |
bool | isScalarRegister (int opIdx) override |
bool | isVectorRegister (int opIdx) override |
int | getRegisterIndex (int opIdx, GPUDynInstPtr gpuDynInst) override |
![]() | |
GCN3GPUStaticInst (const std::string &opcode) | |
~GCN3GPUStaticInst () | |
bool | isFlatScratchRegister (int opIdx) override |
bool | isExecMaskRegister (int opIdx) override |
bool | isSrcOperand (int opIdx) override |
bool | isDstOperand (int opIdx) override |
int | getOperandSize (int opIdx) override |
int | coalescerTokenCount () const override |
Return the number of tokens needed by the coalescer. More... | |
ScalarRegU32 | srcLiteral () const override |
![]() | |
GPUStaticInst (const std::string &opcode) | |
void | instAddr (int inst_addr) |
int | instAddr () const |
int | nextInstAddr () const |
void | instNum (int num) |
int | instNum () |
void | ipdInstNum (int num) |
int | ipdInstNum () const |
virtual void | execute (GPUDynInstPtr gpuDynInst)=0 |
const std::string & | disassemble () |
virtual int | getNumOperands ()=0 |
virtual bool | isCondRegister (int operandIndex)=0 |
virtual int | numDstRegOperands ()=0 |
virtual int | numSrcRegOperands ()=0 |
virtual bool | isValid () const =0 |
bool | isALU () const |
bool | isBranch () const |
bool | isNop () const |
bool | isReturn () const |
bool | isUnconditionalJump () const |
bool | isSpecialOp () const |
bool | isWaitcnt () const |
bool | isBarrier () const |
bool | isMemFence () const |
bool | isMemRef () const |
bool | isFlat () const |
bool | isLoad () const |
bool | isStore () const |
bool | isAtomic () const |
bool | isAtomicNoRet () const |
bool | isAtomicRet () const |
bool | isScalar () const |
bool | readsSCC () const |
bool | writesSCC () const |
bool | readsVCC () const |
bool | writesVCC () const |
bool | isAtomicAnd () const |
bool | isAtomicOr () const |
bool | isAtomicXor () const |
bool | isAtomicCAS () const |
bool | isAtomicExch () const |
bool | isAtomicAdd () const |
bool | isAtomicSub () const |
bool | isAtomicInc () const |
bool | isAtomicDec () const |
bool | isAtomicMax () const |
bool | isAtomicMin () const |
bool | isArgLoad () const |
bool | isGlobalMem () const |
bool | isLocalMem () const |
bool | isArgSeg () const |
bool | isGlobalSeg () const |
bool | isGroupSeg () const |
bool | isKernArgSeg () const |
bool | isPrivateSeg () const |
bool | isReadOnlySeg () const |
bool | isSpillSeg () const |
bool | isWorkitemScope () const |
bool | isWavefrontScope () const |
bool | isWorkgroupScope () const |
bool | isDeviceScope () const |
bool | isSystemScope () const |
bool | isNoScope () const |
bool | isRelaxedOrder () const |
bool | isAcquire () const |
bool | isRelease () const |
bool | isAcquireRelease () const |
bool | isNoOrder () const |
bool | isGloballyCoherent () const |
Coherence domain of a memory instruction. More... | |
bool | isSystemCoherent () const |
virtual void | initiateAcc (GPUDynInstPtr gpuDynInst) |
virtual void | completeAcc (GPUDynInstPtr gpuDynInst) |
virtual uint32_t | getTargetPc () |
void | setFlag (Flags flag) |
virtual void | execLdAcq (GPUDynInstPtr gpuDynInst) |
virtual void | execSt (GPUDynInstPtr gpuDynInst) |
virtual void | execAtomic (GPUDynInstPtr gpuDynInst) |
virtual void | execAtomicAcq (GPUDynInstPtr gpuDynInst) |
Protected Member Functions | |
template<typename T > | |
void | initMemRead (GPUDynInstPtr gpuDynInst) |
template<typename T > | |
void | initMemWrite (GPUDynInstPtr gpuDynInst) |
void | injectGlobalMemFence (GPUDynInstPtr gpuDynInst) |
template<typename VOFF , typename VIDX , typename SRSRC , typename SOFF > | |
void | calcAddr (GPUDynInstPtr gpuDynInst, VOFF v_off, VIDX v_idx, SRSRC s_rsrc_desc, SOFF s_offset, int inst_offset) |
MUBUF insructions calculate their addresses as follows: More... | |
![]() | |
void | panicUnimplemented () const |
Protected Attributes | |
InFmt_MUBUF | instData |
InFmt_MUBUF_1 | extData |
![]() | |
ScalarRegU32 | _srcLiteral |
if the instruction has a src literal - an immediate value that is part of the instruction stream - we store that here More... | |
![]() | |
const std::string | opcode |
std::string | disassembly |
int | _instNum |
int | _instAddr |
int | _ipdInstNum |
Identifier of the immediate post-dominator instruction. More... | |
std::bitset< Num_Flags > | _flags |
Additional Inherited Members | |
![]() | |
Enums::StorageClassType | executed_as |
![]() | |
static uint64_t | dynamic_id_count |
Definition at line 530 of file op_encodings.hh.
Gcn3ISA::Inst_MUBUF::Inst_MUBUF | ( | InFmt_MUBUF * | iFmt, |
const std::string & | opcode | ||
) |
Definition at line 1862 of file op_encodings.cc.
References Gcn3ISA::GCN3GPUStaticInst::_srcLiteral, extData, Gcn3ISA::InFmt_MUBUF::GLC, instData, GPUStaticInst::setFlag(), and Gcn3ISA::InFmt_MUBUF::SLC.
Gcn3ISA::Inst_MUBUF::~Inst_MUBUF | ( | ) |
Definition at line 1878 of file op_encodings.cc.
|
inlineprotected |
MUBUF insructions calculate their addresses as follows:
index = (IDXEN ? vgpr_idx : 0) + (const_add_tid_en ? TID : 0) offset = (OFFEN ? vgpr_off : 0) + inst_off
/ ====================== LINEAR ADDRESSING ====================== / VADDR = base + sgpr_off + offset + stride * index
/ ===================== SWIZZLED ADDRESSING ===================== / index_msb = index / const_index_stride index_lsb = index % const_index_stride offset_msb = offset / const_element_size offset_lsb = offset % const_element_size buffer_offset = ((index_msb * stride + offset_msb * const_element_size) * const_index_stride + index_lsb * const_element_size + offset_lsb)
VADDR = base + sgpr_off + buffer_offset
first we calculate the buffer's index and offset. these will be used for either linear or swizzled buffers.
Definition at line 653 of file op_encodings.hh.
References Gcn3ISA::NumVecElemPerVecReg(), ArmISA::stride, and MipsISA::vaddr.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute().
|
overridevirtual |
Reimplemented from Gcn3ISA::GCN3GPUStaticInst.
Definition at line 1889 of file op_encodings.cc.
References GPUStaticInst::disassembly, extData, instData, Gcn3ISA::InFmt_MUBUF::OFFSET, Gcn3ISA::InFmt_MUBUF_1::SOFFSET, Gcn3ISA::InFmt_MUBUF_1::SRSRC, Gcn3ISA::InFmt_MUBUF_1::VADDR, and Gcn3ISA::InFmt_MUBUF_1::VDATA.
|
overridevirtual |
Reimplemented from Gcn3ISA::GCN3GPUStaticInst.
Definition at line 1949 of file op_encodings.cc.
References extData, fatal, GPUStaticInst::getNumOperands(), Gcn3ISA::InFmt_MUBUF_1::SOFFSET, Gcn3ISA::InFmt_MUBUF_1::SRSRC, Gcn3ISA::InFmt_MUBUF_1::VADDR, and Gcn3ISA::InFmt_MUBUF_1::VDATA.
|
inlineprotected |
Definition at line 569 of file op_encodings.hh.
References Packet::dataStatic(), Gcn3ISA::NumVecElemPerVecReg(), MemCmd::ReadReq, and MipsISA::vaddr.
|
inlineprotected |
Definition at line 595 of file op_encodings.hh.
References Packet::dataStatic(), Gcn3ISA::NumVecElemPerVecReg(), MipsISA::vaddr, and MemCmd::WriteReq.
|
inlineprotected |
Definition at line 618 of file op_encodings.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::initiateAcc(), and Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::initiateAcc().
|
overridevirtual |
Implements GPUStaticInst.
Definition at line 1883 of file op_encodings.cc.
|
overridevirtual |
Reimplemented from Gcn3ISA::GCN3GPUStaticInst.
Definition at line 1907 of file op_encodings.cc.
References fatal, and GPUStaticInst::getNumOperands().
|
overridevirtual |
Reimplemented from Gcn3ISA::GCN3GPUStaticInst.
Definition at line 1928 of file op_encodings.cc.
References fatal, and GPUStaticInst::getNumOperands().
|
protected |
Definition at line 705 of file op_encodings.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), generateDisassembly(), getRegisterIndex(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::initiateAcc(), and Inst_MUBUF().
|
protected |
Definition at line 703 of file op_encodings.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), generateDisassembly(), Inst_MUBUF(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_ADD::Inst_MUBUF__BUFFER_ATOMIC_ADD(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_ADD_X2::Inst_MUBUF__BUFFER_ATOMIC_ADD_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_AND::Inst_MUBUF__BUFFER_ATOMIC_AND(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_AND_X2::Inst_MUBUF__BUFFER_ATOMIC_AND_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP::Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP_X2::Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_DEC::Inst_MUBUF__BUFFER_ATOMIC_DEC(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_DEC_X2::Inst_MUBUF__BUFFER_ATOMIC_DEC_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_INC::Inst_MUBUF__BUFFER_ATOMIC_INC(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_INC_X2::Inst_MUBUF__BUFFER_ATOMIC_INC_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_OR::Inst_MUBUF__BUFFER_ATOMIC_OR(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_OR_X2::Inst_MUBUF__BUFFER_ATOMIC_OR_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SMAX::Inst_MUBUF__BUFFER_ATOMIC_SMAX(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SMAX_X2::Inst_MUBUF__BUFFER_ATOMIC_SMAX_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SMIN::Inst_MUBUF__BUFFER_ATOMIC_SMIN(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SMIN_X2::Inst_MUBUF__BUFFER_ATOMIC_SMIN_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SUB::Inst_MUBUF__BUFFER_ATOMIC_SUB(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SUB_X2::Inst_MUBUF__BUFFER_ATOMIC_SUB_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SWAP::Inst_MUBUF__BUFFER_ATOMIC_SWAP(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_SWAP_X2::Inst_MUBUF__BUFFER_ATOMIC_SWAP_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_UMAX::Inst_MUBUF__BUFFER_ATOMIC_UMAX(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_UMAX_X2::Inst_MUBUF__BUFFER_ATOMIC_UMAX_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_UMIN::Inst_MUBUF__BUFFER_ATOMIC_UMIN(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_UMIN_X2::Inst_MUBUF__BUFFER_ATOMIC_UMIN_X2(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_XOR::Inst_MUBUF__BUFFER_ATOMIC_XOR(), Gcn3ISA::Inst_MUBUF__BUFFER_ATOMIC_XOR_X2::Inst_MUBUF__BUFFER_ATOMIC_XOR_X2(), and Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::Inst_MUBUF__BUFFER_STORE_DWORD().