gem5 v23.0.0.1
Loading...
Searching...
No Matches
Public Member Functions | List of all members
gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32 Class Reference

#include <instructions.hh>

Inheritance diagram for gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32:
gem5::VegaISA::Inst_DS gem5::VegaISA::VEGAGPUStaticInst gem5::GPUStaticInst

Public Member Functions

 Inst_DS__DS_SWIZZLE_B32 (InFmt_DS *)
 
 ~Inst_DS__DS_SWIZZLE_B32 ()
 
int getNumOperands () override
 
int numDstRegOperands () override
 
int numSrcRegOperands () override
 
int getOperandSize (int opIdx) override
 
void execute (GPUDynInstPtr) override
 
- Public Member Functions inherited from gem5::VegaISA::Inst_DS
 Inst_DS (InFmt_DS *, const std::string &opcode)
 
 ~Inst_DS ()
 
int instSize () const override
 
void generateDisassembly () override
 
void initOperandInfo () override
 
- Public Member Functions inherited from gem5::VegaISA::VEGAGPUStaticInst
 VEGAGPUStaticInst (const std::string &opcode)
 
 ~VEGAGPUStaticInst ()
 
void generateDisassembly () override
 
bool isFlatScratchRegister (int opIdx) override
 
bool isExecMaskRegister (int opIdx) override
 
void initOperandInfo () override
 
int getOperandSize (int opIdx) override
 
int coalescerTokenCount () const override
 Return the number of tokens needed by the coalescer.
 
ScalarRegU32 srcLiteral () const override
 
- Public Member Functions inherited from gem5::GPUStaticInst
 GPUStaticInst (const std::string &opcode)
 
virtual ~GPUStaticInst ()
 
void instAddr (int inst_addr)
 
int instAddr () const
 
int nextInstAddr () const
 
void instNum (int num)
 
int instNum ()
 
void ipdInstNum (int num)
 
int ipdInstNum () const
 
virtual TheGpuISA::ScalarRegU32 srcLiteral () const
 
void initDynOperandInfo (Wavefront *wf, ComputeUnit *cu)
 
virtual void initOperandInfo ()=0
 
virtual void execute (GPUDynInstPtr gpuDynInst)=0
 
virtual void generateDisassembly ()=0
 
const std::string & disassemble ()
 
virtual int getNumOperands ()=0
 
virtual bool isFlatScratchRegister (int opIdx)=0
 
virtual bool isExecMaskRegister (int opIdx)=0
 
virtual int getOperandSize (int operandIndex)=0
 
virtual int numDstRegOperands ()=0
 
virtual int numSrcRegOperands ()=0
 
int numSrcVecOperands ()
 
int numDstVecOperands ()
 
int numSrcVecDWords ()
 
int numDstVecDWords ()
 
int numSrcScalarOperands ()
 
int numDstScalarOperands ()
 
int numSrcScalarDWords ()
 
int numDstScalarDWords ()
 
int maxOperandSize ()
 
virtual int coalescerTokenCount () const
 
bool isALU () const
 
bool isBranch () const
 
bool isCondBranch () const
 
bool isNop () const
 
bool isReturn () const
 
bool isEndOfKernel () const
 
bool isKernelLaunch () const
 
bool isSDWAInst () const
 
bool isDPPInst () const
 
bool isUnconditionalJump () const
 
bool isSpecialOp () const
 
bool isWaitcnt () const
 
bool isSleep () const
 
bool isBarrier () const
 
bool isMemSync () const
 
bool isMemRef () const
 
bool isFlat () const
 
bool isFlatGlobal () const
 
bool isLoad () const
 
bool isStore () const
 
bool isAtomic () const
 
bool isAtomicNoRet () const
 
bool isAtomicRet () const
 
bool isScalar () const
 
bool readsSCC () const
 
bool writesSCC () const
 
bool readsVCC () const
 
bool writesVCC () const
 
bool readsEXEC () const
 
bool writesEXEC () const
 
bool readsMode () const
 
bool writesMode () const
 
bool ignoreExec () const
 
bool isAtomicAnd () const
 
bool isAtomicOr () const
 
bool isAtomicXor () const
 
bool isAtomicCAS () const
 
bool isAtomicExch () const
 
bool isAtomicAdd () const
 
bool isAtomicSub () const
 
bool isAtomicInc () const
 
bool isAtomicDec () const
 
bool isAtomicMax () const
 
bool isAtomicMin () const
 
bool isArgLoad () const
 
bool isGlobalMem () const
 
bool isLocalMem () const
 
bool isArgSeg () const
 
bool isGlobalSeg () const
 
bool isGroupSeg () const
 
bool isKernArgSeg () const
 
bool isPrivateSeg () const
 
bool isReadOnlySeg () const
 
bool isSpillSeg () const
 
bool isGloballyCoherent () const
 Coherence domain of a memory instruction.
 
bool isSystemCoherent () const
 
bool isF16 () const
 
bool isF32 () const
 
bool isF64 () const
 
bool isFMA () const
 
bool isMAC () const
 
bool isMAD () const
 
virtual int instSize () const =0
 
virtual void initiateAcc (GPUDynInstPtr gpuDynInst)
 
virtual void completeAcc (GPUDynInstPtr gpuDynInst)
 
virtual uint32_t getTargetPc ()
 
void setFlag (Flags flag)
 
const std::string & opcode () const
 
const std::vector< OperandInfo > & srcOperands () const
 
const std::vector< OperandInfo > & dstOperands () const
 
const std::vector< OperandInfo > & srcVecRegOperands () const
 
const std::vector< OperandInfo > & dstVecRegOperands () const
 
const std::vector< OperandInfo > & srcScalarRegOperands () const
 
const std::vector< OperandInfo > & dstScalarRegOperands () const
 

Additional Inherited Members

- Public Types inherited from gem5::GPUStaticInst
enum  OpType { SRC_VEC , SRC_SCALAR , DST_VEC , DST_SCALAR }
 
typedef int(RegisterManager::* MapRegFn) (Wavefront *, int)
 
- Public Attributes inherited from gem5::GPUStaticInst
enums::StorageClassType executed_as
 
- Static Public Attributes inherited from gem5::GPUStaticInst
static uint64_t dynamic_id_count
 
- Protected Member Functions inherited from gem5::VegaISA::Inst_DS
template<typename T >
void initMemRead (GPUDynInstPtr gpuDynInst, Addr offset)
 
template<int N>
void initMemRead (GPUDynInstPtr gpuDynInst, Addr offset)
 
template<typename T >
void initDualMemRead (GPUDynInstPtr gpuDynInst, Addr offset0, Addr offset1)
 
template<typename T >
void initMemWrite (GPUDynInstPtr gpuDynInst, Addr offset)
 
template<int N>
void initMemWrite (GPUDynInstPtr gpuDynInst, Addr offset)
 
template<typename T >
void initDualMemWrite (GPUDynInstPtr gpuDynInst, Addr offset0, Addr offset1)
 
template<typename T >
void initAtomicAccess (GPUDynInstPtr gpuDynInst, Addr offset)
 
void calcAddr (GPUDynInstPtr gpuDynInst, ConstVecOperandU32 &addr)
 
- Protected Member Functions inherited from gem5::VegaISA::VEGAGPUStaticInst
void panicUnimplemented () const
 
- Protected Attributes inherited from gem5::VegaISA::Inst_DS
InFmt_DS instData
 
InFmt_DS_1 extData
 
- Protected Attributes inherited from gem5::VegaISA::VEGAGPUStaticInst
ScalarRegU32 _srcLiteral
 if the instruction has a src literal - an immediate value that is part of the instruction stream - we store that here
 
- Protected Attributes inherited from gem5::GPUStaticInst
const std::string _opcode
 
std::string disassembly
 
int _instNum
 
int _instAddr
 
std::vector< OperandInfosrcOps
 
std::vector< OperandInfodstOps
 

Detailed Description

Definition at line 32989 of file instructions.hh.

Constructor & Destructor Documentation

◆ Inst_DS__DS_SWIZZLE_B32()

gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::Inst_DS__DS_SWIZZLE_B32 ( InFmt_DS iFmt)

While this operation doesn't actually use DS storage we classify it as a load here because it does a writeback to a VGPR, which fits in better with the LDS pipeline logic.

Definition at line 35893 of file instructions.cc.

References gem5::GPUStaticInst::setFlag().

◆ ~Inst_DS__DS_SWIZZLE_B32()

gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::~Inst_DS__DS_SWIZZLE_B32 ( )

Definition at line 35904 of file instructions.cc.

Member Function Documentation

◆ execute()

void gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::execute ( GPUDynInstPtr  gpuDynInst)
overridevirtual

The "DS pattern" is comprised of both offset fields. That is, the swizzle pattern between lanes. Bit 15 of the DS pattern dictates which swizzle mode to use. There are two different swizzle patterns: 1) QDMode and 2) Bit-masks mode. If bit 15 is set use QDMode else use Bit-masks mode. The remaining bits dictate how to swizzle the lanes.

QDMode: Chunks the lanes into 4s and swizzles among them. Bits 7:6 dictate where lane 3 (of the current chunk) gets its date, 5:4 lane 2, etc.

Bit-mask: This mode breaks bits 14:0 into 3 equal-sized chunks. 14:10 is the xor_mask, 9:5 is the or_mask, and 4:0 is the and_mask. Each lane is swizzled by performing the appropriate operation using these masks.

This operation allows data sharing between groups of four consecutive threads. Note the increment by 4 in the for loop.

This is needed because we treat this instruction as a load but it's not an actual memory request. Without this, the destination register never gets marked as free, leading to a possible deadlock

Implements gem5::GPUStaticInst.

Definition at line 35913 of file instructions.cc.

References gem5::bits(), gem5::Wavefront::computeUnit, data, gem5::VegaISA::InFmt_DS_1::DATA0, gem5::Wavefront::decLGKMInstsIssued(), gem5::Wavefront::execUnitId, gem5::VegaISA::Inst_DS::extData, gem5::MipsISA::index, gem5::VegaISA::Inst_DS::instData, gem5::ArmISA::NumVecElemPerVecReg, gem5::VegaISA::InFmt_DS::OFFSET0, gem5::VegaISA::InFmt_DS::OFFSET1, panic_if, gem5::Wavefront::simdId, gem5::VegaISA::InFmt_DS_1::VDST, gem5::ComputeUnit::vrf, and gem5::VegaISA::VecOperand< DataType, Const, NumDwords >::write().

◆ getNumOperands()

int gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::getNumOperands ( )
inlineoverridevirtual

Implements gem5::GPUStaticInst.

Definition at line 32996 of file instructions.hh.

References numDstRegOperands(), and numSrcRegOperands().

◆ getOperandSize()

int gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::getOperandSize ( int  opIdx)
inlineoverridevirtual

Implements gem5::GPUStaticInst.

Definition at line 33005 of file instructions.hh.

References fatal.

◆ numDstRegOperands()

int gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::numDstRegOperands ( )
inlineoverridevirtual

Implements gem5::GPUStaticInst.

Definition at line 33001 of file instructions.hh.

Referenced by getNumOperands().

◆ numSrcRegOperands()

int gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::numSrcRegOperands ( )
inlineoverridevirtual

Implements gem5::GPUStaticInst.

Definition at line 33002 of file instructions.hh.

Referenced by getNumOperands().


The documentation for this class was generated from the following files:

Generated on Mon Jul 10 2023 15:33:26 for gem5 by doxygen 1.9.7