| gem5
    v21.1.0.2
    | 
#include <instructions.hh>
 
  
| Public Member Functions | |
| Inst_DS__DS_BPERMUTE_B32 (InFmt_DS *) | |
| ~Inst_DS__DS_BPERMUTE_B32 () | |
| int | getNumOperands () override | 
| int | numDstRegOperands () override | 
| int | numSrcRegOperands () override | 
| int | getOperandSize (int opIdx) override | 
| void | execute (GPUDynInstPtr) override | 
|  Public Member Functions inherited from gem5::Gcn3ISA::Inst_DS | |
| Inst_DS (InFmt_DS *, const std::string &opcode) | |
| ~Inst_DS () | |
| int | instSize () const override | 
| void | generateDisassembly () override | 
| void | initOperandInfo () override | 
|  Public Member Functions inherited from gem5::Gcn3ISA::GCN3GPUStaticInst | |
| GCN3GPUStaticInst (const std::string &opcode) | |
| ~GCN3GPUStaticInst () | |
| bool | isFlatScratchRegister (int opIdx) override | 
| bool | isExecMaskRegister (int opIdx) override | 
| int | coalescerTokenCount () const override | 
| Return the number of tokens needed by the coalescer.  More... | |
| ScalarRegU32 | srcLiteral () const override | 
|  Public Member Functions inherited from gem5::GPUStaticInst | |
| GPUStaticInst (const std::string &opcode) | |
| virtual | ~GPUStaticInst () | 
| void | instAddr (int inst_addr) | 
| int | instAddr () const | 
| int | nextInstAddr () const | 
| void | instNum (int num) | 
| int | instNum () | 
| void | ipdInstNum (int num) | 
| int | ipdInstNum () const | 
| void | initDynOperandInfo (Wavefront *wf, ComputeUnit *cu) | 
| const std::string & | disassemble () | 
| int | numSrcVecOperands () | 
| int | numDstVecOperands () | 
| int | numSrcVecDWords () | 
| int | numDstVecDWords () | 
| int | numSrcScalarOperands () | 
| int | numDstScalarOperands () | 
| int | numSrcScalarDWords () | 
| int | numDstScalarDWords () | 
| int | maxOperandSize () | 
| bool | isALU () const | 
| bool | isBranch () const | 
| bool | isCondBranch () const | 
| bool | isNop () const | 
| bool | isReturn () const | 
| bool | isEndOfKernel () const | 
| bool | isKernelLaunch () const | 
| bool | isSDWAInst () const | 
| bool | isDPPInst () const | 
| bool | isUnconditionalJump () const | 
| bool | isSpecialOp () const | 
| bool | isWaitcnt () const | 
| bool | isSleep () const | 
| bool | isBarrier () const | 
| bool | isMemSync () const | 
| bool | isMemRef () const | 
| bool | isFlat () const | 
| bool | isLoad () const | 
| bool | isStore () const | 
| bool | isAtomic () const | 
| bool | isAtomicNoRet () const | 
| bool | isAtomicRet () const | 
| bool | isScalar () const | 
| bool | readsSCC () const | 
| bool | writesSCC () const | 
| bool | readsVCC () const | 
| bool | writesVCC () const | 
| bool | readsEXEC () const | 
| bool | writesEXEC () const | 
| bool | readsMode () const | 
| bool | writesMode () const | 
| bool | ignoreExec () const | 
| bool | isAtomicAnd () const | 
| bool | isAtomicOr () const | 
| bool | isAtomicXor () const | 
| bool | isAtomicCAS () const | 
| bool | isAtomicExch () const | 
| bool | isAtomicAdd () const | 
| bool | isAtomicSub () const | 
| bool | isAtomicInc () const | 
| bool | isAtomicDec () const | 
| bool | isAtomicMax () const | 
| bool | isAtomicMin () const | 
| bool | isArgLoad () const | 
| bool | isGlobalMem () const | 
| bool | isLocalMem () const | 
| bool | isArgSeg () const | 
| bool | isGlobalSeg () const | 
| bool | isGroupSeg () const | 
| bool | isKernArgSeg () const | 
| bool | isPrivateSeg () const | 
| bool | isReadOnlySeg () const | 
| bool | isSpillSeg () const | 
| bool | isGloballyCoherent () const | 
| Coherence domain of a memory instruction.  More... | |
| bool | isSystemCoherent () const | 
| bool | isF16 () const | 
| bool | isF32 () const | 
| bool | isF64 () const | 
| bool | isFMA () const | 
| bool | isMAC () const | 
| bool | isMAD () const | 
| virtual void | initiateAcc (GPUDynInstPtr gpuDynInst) | 
| virtual void | completeAcc (GPUDynInstPtr gpuDynInst) | 
| virtual uint32_t | getTargetPc () | 
| void | setFlag (Flags flag) | 
| const std::string & | opcode () const | 
| const std::vector< OperandInfo > & | srcOperands () const | 
| const std::vector< OperandInfo > & | dstOperands () const | 
| const std::vector< OperandInfo > & | srcVecRegOperands () const | 
| const std::vector< OperandInfo > & | dstVecRegOperands () const | 
| const std::vector< OperandInfo > & | srcScalarRegOperands () const | 
| const std::vector< OperandInfo > & | dstScalarRegOperands () const | 
| Additional Inherited Members | |
|  Public Types inherited from gem5::GPUStaticInst | |
| enum | OpType { SRC_VEC, SRC_SCALAR, DST_VEC, DST_SCALAR } | 
| typedef int(RegisterManager::* | MapRegFn) (Wavefront *, int) | 
|  Public Attributes inherited from gem5::GPUStaticInst | |
| enums::StorageClassType | executed_as | 
|  Static Public Attributes inherited from gem5::GPUStaticInst | |
| static uint64_t | dynamic_id_count | 
|  Protected Member Functions inherited from gem5::Gcn3ISA::Inst_DS | |
| template<typename T > | |
| void | initMemRead (GPUDynInstPtr gpuDynInst, Addr offset) | 
| template<int N> | |
| void | initMemRead (GPUDynInstPtr gpuDynInst, Addr offset) | 
| template<typename T > | |
| void | initDualMemRead (GPUDynInstPtr gpuDynInst, Addr offset0, Addr offset1) | 
| template<typename T > | |
| void | initMemWrite (GPUDynInstPtr gpuDynInst, Addr offset) | 
| template<int N> | |
| void | initMemWrite (GPUDynInstPtr gpuDynInst, Addr offset) | 
| template<typename T > | |
| void | initDualMemWrite (GPUDynInstPtr gpuDynInst, Addr offset0, Addr offset1) | 
| void | calcAddr (GPUDynInstPtr gpuDynInst, ConstVecOperandU32 &addr) | 
|  Protected Member Functions inherited from gem5::Gcn3ISA::GCN3GPUStaticInst | |
| void | panicUnimplemented () const | 
|  Protected Attributes inherited from gem5::Gcn3ISA::Inst_DS | |
| InFmt_DS | instData | 
| InFmt_DS_1 | extData | 
|  Protected Attributes inherited from gem5::Gcn3ISA::GCN3GPUStaticInst | |
| ScalarRegU32 | _srcLiteral | 
| if the instruction has a src literal - an immediate value that is part of the instruction stream - we store that here  More... | |
|  Protected Attributes inherited from gem5::GPUStaticInst | |
| const std::string | _opcode | 
| std::string | disassembly | 
| int | _instNum | 
| int | _instAddr | 
| std::vector< OperandInfo > | srcOps | 
| std::vector< OperandInfo > | dstOps | 
Definition at line 32491 of file instructions.hh.
| gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::Inst_DS__DS_BPERMUTE_B32 | ( | InFmt_DS * | iFmt | ) | 
While this operation doesn't actually use DS storage, we classify it as a load here because it does a writeback to a VGPR, which fits better with the LDS pipeline logic.
Definition at line 32492 of file instructions.cc.
References gem5::GPUStaticInst::setFlag().
| gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::~Inst_DS__DS_BPERMUTE_B32 | ( | ) | 
Definition at line 32504 of file instructions.cc.
| void gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::execute | ( | GPUDynInstPtr | ) | 
 | override virtual | 
One of the offset fields can be used for the index. It is assumed OFFSET0 would be used, as OFFSET1 is typically only used for DS ops that operate on two disparate pieces of data.
The address provided is a byte address, but VGPRs are 4 bytes, so we must divide by 4 to get the actual VGPR index. Additionally, the index is calculated modulo the WF size, 64 in this case, so we simply extract bits 7-2.
If the shuffled index corresponds to a lane that is inactive then this instruction writes a 0 to the active lane in VDST.
This is needed because we treat this instruction as a load, but it's not an actual memory request. Without this, the destination register never gets marked as free, leading to a possible deadlock.
Implements gem5::GPUStaticInst.
Definition at line 32510 of file instructions.cc.
References gem5::X86ISA::addr, gem5::Gcn3ISA::InFmt_DS_1::ADDR, gem5::bits(), gem5::Wavefront::computeUnit, data, gem5::Gcn3ISA::InFmt_DS_1::DATA0, gem5::Wavefront::decLGKMInstsIssued(), gem5::Wavefront::execMask(), gem5::Wavefront::execUnitId, gem5::Gcn3ISA::Inst_DS::extData, gem5::MipsISA::index, gem5::Gcn3ISA::Inst_DS::instData, gem5::Gcn3ISA::NumVecElemPerVecReg(), gem5::Gcn3ISA::InFmt_DS::OFFSET0, gem5::Gcn3ISA::InFmt_DS::OFFSET1, panic_if, gem5::Wavefront::rdLmReqsInPipe, gem5::Wavefront::simdId, gem5::Wavefront::validateRequestCounters(), gem5::Gcn3ISA::InFmt_DS_1::VDST, gem5::ComputeUnit::vrf, and gem5::Gcn3ISA::VecOperand< DataType, Const, NumDwords >::write().
| int gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::getNumOperands | ( | ) | 
 | inline override virtual | 
Implements gem5::GPUStaticInst.
Definition at line 32498 of file instructions.hh.
References numDstRegOperands(), and numSrcRegOperands().
| int gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::getOperandSize | ( | int | opIdx | ) | 
 | inline override virtual | 
Reimplemented from gem5::Gcn3ISA::GCN3GPUStaticInst.
Definition at line 32507 of file instructions.hh.
References fatal.
| int gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::numDstRegOperands | ( | ) | 
 | inline override virtual | 
Implements gem5::GPUStaticInst.
Definition at line 32503 of file instructions.hh.
Referenced by getNumOperands().
| int gem5::Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::numSrcRegOperands | ( | ) | 
 | inline override virtual | 
Implements gem5::GPUStaticInst.
Definition at line 32504 of file instructions.hh.
Referenced by getNumOperands().