gem5
v20.0.0.0
|
#include <wavefront.hh>
Public Types | |
enum | itype_e { I_ALU, I_GLOBAL, I_SHARED, I_FLAT, I_PRIVATE } |
enum | status_e { S_STOPPED, S_RETURNING, S_RUNNING } |
typedef WavefrontParams | Params |
![]() | |
typedef SimObjectParams | Params |
Public Member Functions | |
uint32_t | remap (uint32_t vgprIndex, uint32_t size, uint8_t mode=0) |
void | resizeRegFiles (int num_cregs, int num_sregs, int num_dregs) |
bool | isGmInstruction (GPUDynInstPtr ii) |
bool | isLmInstruction (GPUDynInstPtr ii) |
bool | isOldestInstGMem () |
bool | isOldestInstLMem () |
bool | isOldestInstPrivMem () |
bool | isOldestInstFlatMem () |
bool | isOldestInstALU () |
bool | isOldestInstBarrier () |
void | computeActualWgSz (NDRange *ndr) |
void | initCallArgMem (int func_args_size_per_item, int wf_size) |
template<typename CType > | |
CType | readCallArgMem (int lane, int addr) |
template<typename CType > | |
void | writeCallArgMem (int lane, int addr, CType val) |
Wavefront (const Params *p) | |
~Wavefront () | |
virtual void | init () |
init() is called after all C++ SimObjects have been created and all ports are connected. More... | |
void | setParent (ComputeUnit *cu) |
void | start (uint64_t _wfDynId, uint64_t _base_ptr) |
void | exec () |
void | updateResources () |
int | ready (itype_e type) |
bool | instructionBufferHasBranch () |
void | regStats () |
Callback to set stat parameters. More... | |
VectorMask | getPred () |
bool | waitingAtBarrier (int lane) |
void | pushToReconvergenceStack (uint32_t pc, uint32_t rpc, const VectorMask &exec_mask) |
void | popFromReconvergenceStack () |
uint32_t | pc () const |
uint32_t | rpc () const |
VectorMask | execMask () const |
bool | execMask (int lane) const |
void | pc (uint32_t new_pc) |
void | discardFetch () |
uint32_t | getStaticContextSize () const |
Returns the size of the static hardware context of a particular wavefront This should be updated everytime the context is changed. More... | |
void | getContext (const void *out) |
Returns the hardware context as a stream of bytes This method is designed for HSAIL execution. More... | |
void | setContext (const void *in) |
Sets the hardware context fromt a stream of bytes This method is designed for HSAIL execution. More... | |
TheGpuISA::GPUISA & | gpuISA () |
![]() | |
virtual | ~SimObject () |
virtual const std::string | name () const |
virtual void | loadState (CheckpointIn &cp) |
loadState() is called on each SimObject when restoring from a checkpoint. More... | |
virtual void | initState () |
initState() is called on each SimObject when not restoring from a checkpoint. More... | |
virtual void | regProbePoints () |
Register probe points for this object. More... | |
virtual void | regProbeListeners () |
Register probe listeners for this object. More... | |
ProbeManager * | getProbeManager () |
Get the probe manager for this object. More... | |
virtual Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) |
Get a port with a given name and index. More... | |
virtual void | startup () |
startup() is the final initialization call before simulation. More... | |
DrainState | drain () override |
Provide a default implementation of the drain interface for objects that don't need draining. More... | |
virtual void | memWriteback () |
Write back dirty buffers to memory using functional writes. More... | |
virtual void | memInvalidate () |
Invalidate the contents of memory buffers. More... | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
const Params * | params () const |
SimObject (const Params *_params) | |
![]() | |
EventQueue * | eventQueue () const |
void | schedule (Event &event, Tick when) |
void | deschedule (Event &event) |
void | reschedule (Event &event, Tick when, bool always=false) |
void | schedule (Event *event, Tick when) |
void | deschedule (Event *event) |
void | reschedule (Event *event, Tick when, bool always=false) |
void | wakeupEventQueue (Tick when=(Tick) -1) |
void | setCurTick (Tick newVal) |
EventManager (EventManager &em) | |
EventManager (EventManager *em) | |
EventManager (EventQueue *eq) | |
![]() | |
Serializable () | |
virtual | ~Serializable () |
void | serializeSection (CheckpointOut &cp, const char *name) const |
Serialize an object into a new section. More... | |
void | serializeSection (CheckpointOut &cp, const std::string &name) const |
void | unserializeSection (CheckpointIn &cp, const char *name) |
Unserialize an a child object. More... | |
void | unserializeSection (CheckpointIn &cp, const std::string &name) |
![]() | |
DrainState | drainState () const |
Return the current drain state of an object. More... | |
virtual void | notifyFork () |
Notify a child process of a fork. More... | |
![]() | |
Group (Group *parent, const char *name=nullptr) | |
Construct a new statistics group. More... | |
virtual | ~Group () |
virtual void | resetStats () |
Callback to reset stats. More... | |
virtual void | preDumpStats () |
Callback before stats are dumped. More... | |
void | addStat (Stats::Info *info) |
Register a stat with this group. More... | |
const std::map< std::string, Group * > & | getStatGroups () const |
Get all child groups associated with this object. More... | |
const std::vector< Info * > & | getStats () const |
Get all stats associated with this object. More... | |
void | addStatGroup (const char *name, Group *block) |
Add a stat block as a child of this block. More... | |
const Info * | resolveStat (std::string name) const |
Resolve a stat by its name within this group. More... | |
Group ()=delete | |
Group (const Group &)=delete | |
Group & | operator= (const Group &)=delete |
Private Attributes | |
TheGpuISA::GPUISA | _gpuISA |
std::deque< std::unique_ptr< ReconvergenceStackEntry > > | reconvergenceStack |
Stack containing Control Flow Graph nodes (i.e., kernel instructions) to be visited by the wavefront, and the associated execution masks. More... | |
Additional Inherited Members | |
![]() | |
static void | serializeAll (CheckpointOut &cp) |
Serialize all SimObjects in the system. More... | |
static SimObject * | find (const char *name) |
Find the SimObject with the given name and return a pointer to it. More... | |
![]() | |
static const std::string & | currentSection () |
Gets the fully-qualified name of the active section. More... | |
static void | serializeAll (const std::string &cpt_dir) |
static void | unserializeGlobals (CheckpointIn &cp) |
![]() | |
Drainable () | |
virtual | ~Drainable () |
virtual void | drainResume () |
Resume execution after a successful drain. More... | |
void | signalDrainDone () const |
Signal that an object is drained. More... | |
![]() | |
const SimObjectParams * | _params |
Cached copy of the object parameters. More... | |
![]() | |
EventQueue * | eventq |
A pointer to this object's event queue. More... | |
Definition at line 145 of file wavefront.hh.
typedef WavefrontParams Wavefront::Params |
Definition at line 319 of file wavefront.hh.
enum Wavefront::itype_e |
Enumerator | |
---|---|
I_ALU | |
I_GLOBAL | |
I_SHARED | |
I_FLAT | |
I_PRIVATE |
Definition at line 148 of file wavefront.hh.
enum Wavefront::status_e |
Enumerator | |
---|---|
S_STOPPED | |
S_RETURNING | |
S_RUNNING |
Definition at line 149 of file wavefront.hh.
Wavefront::Wavefront | ( | const Params * | p | ) |
Definition at line 49 of file wavefront.cc.
References barCnt, barrierCnt, condRegState, dropFetch, ArmISA::i, lastAddr, lastTrace, maxDpVgprs, maxSpVgprs, memReqsInPipe, memTraceBusy, oldBarrierCnt, oldDgpr, oldDgprTcnt, oldVgpr, oldVgprTcnt, outstandingReqs, outstandingReqsRdGm, outstandingReqsRdLm, outstandingReqsWrGm, outstandingReqsWrLm, pendingFetch, rdGmReqsInPipe, rdLmReqsInPipe, reservedVectorRegs, S_STOPPED, simdId, stalledAtBarrier, startVgprIndex, status, wfSlotId, workItemFlatId, workItemId, wrGmReqsInPipe, and wrLmReqsInPipe.
Wavefront::~Wavefront | ( | ) |
Definition at line 147 of file wavefront.cc.
References callArgMem, and condRegState.
void Wavefront::computeActualWgSz | ( | NDRange * | ndr | ) |
Definition at line 980 of file wavefront.cc.
References actualWgSz, actualWgSzTotal, ArmISA::d, gridSz, NDRange::wgId, and workGroupSz.
Referenced by ComputeUnit::fillKernelState().
void Wavefront::discardFetch | ( | ) |
Definition at line 807 of file wavefront.cc.
References dropFetch, instructionBuffer, and pendingFetch.
Referenced by exec().
void Wavefront::exec | ( | ) |
Definition at line 640 of file wavefront.cc.
References _gpuISA, ComputeUnit::activeLanesPerGMemInstrDist, ComputeUnit::activeLanesPerLMemInstrDist, ComputeUnit::aluPipe, computeUnit, ComputeUnit::controlFlowDivergenceDist, ComputeUnit::cu_id, discardFetch(), DPRINTF, dstRegOpDist, execMask(), ComputeUnit::execRateDist, ComputeUnit::GlbMemUnitId(), Shader::hsail_mode, instructionBuffer, isGmInstruction(), isLmInstruction(), ComputeUnit::issuePeriod, ComputeUnit::lastExecCycle, ComputeUnit::nextGlbRdBus(), ComputeUnit::nextLocRdBus(), ComputeUnit::numInstrExecuted, ComputeUnit::numVecOpsExecuted, pc(), popFromReconvergenceStack(), rpc(), S_RETURNING, S_STOPPED, Stats::DistBase< Derived, Stor >::sample(), sc_core::SC_NONE, ComputeUnit::shader, ComputeUnit::ShrMemUnitId(), simdId, Shader::SIMT, ComputeUnit::spBypassLength(), srcRegOpDist, status, Shader::ticks(), ComputeUnit::totalCycles, ComputeUnit::updateInstStats(), Stats::ScalarBase< Derived, Stor >::value(), ComputeUnit::vrf, ComputeUnit::vrfToGlobalMemPipeBus, ComputeUnit::vrfToLocalMemPipeBus, wfDynId, wfSlotId, and ComputeUnit::wfWait.
VectorMask Wavefront::execMask | ( | ) | const |
Definition at line 826 of file wavefront.cc.
References reconvergenceStack.
Referenced by Gcn3ISA::Inst_DS::calcAddr(), RegAddrOperand< RegOperandType >::calcVector(), exec(), HsailISA::CbrInstBase< SRegOperand >::execute(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOP1__S_AND_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_OR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_XOR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_ANDN2_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_ORN2_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_NAND_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_NOR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_XNOR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECNZ::execute(), Gcn3ISA::Inst_VOP2__V_CNDMASK_B32::execute(), Gcn3ISA::Inst_VOP2__V_ADD_F32::execute(), Gcn3ISA::Inst_VOP2__V_SUB_F32::execute(), Gcn3ISA::Inst_VOP2__V_SUBREV_F32::execute(), Gcn3ISA::Inst_VOP2__V_MUL_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP2__V_MUL_F32::execute(), Gcn3ISA::Inst_VOP2__V_MUL_I32_I24::execute(), Gcn3ISA::Inst_VOP2__V_MUL_HI_I32_I24::execute(), Gcn3ISA::Inst_VOP2__V_MUL_U32_U24::execute(), Gcn3ISA::Inst_VOP2__V_MUL_HI_U32_U24::execute(), Gcn3ISA::Inst_VOP2__V_MIN_F32::execute(), Gcn3ISA::Inst_VOP2__V_MAX_F32::execute(), Gcn3ISA::Inst_VOP2__V_MIN_I32::execute(), Gcn3ISA::Inst_VOP2__V_MAX_I32::execute(), Gcn3ISA::Inst_VOP2__V_MIN_U32::execute(), Gcn3ISA::Inst_VOP2__V_MAX_U32::execute(), Gcn3ISA::Inst_VOP2__V_LSHRREV_B32::execute(), Gcn3ISA::Inst_VOP2__V_ASHRREV_I32::execute(), Gcn3ISA::Inst_VOP2__V_LSHLREV_B32::execute(), Gcn3ISA::Inst_VOP2__V_AND_B32::execute(), Gcn3ISA::Inst_VOP2__V_OR_B32::execute(), Gcn3ISA::Inst_VOP2__V_XOR_B32::execute(), Gcn3ISA::Inst_VOP2__V_MAC_F32::execute(), Gcn3ISA::Inst_VOP2__V_MADMK_F32::execute(), Gcn3ISA::Inst_VOP2__V_MADAK_F32::execute(), Gcn3ISA::Inst_VOP2__V_ADD_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUB_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUBREV_U32::execute(), Gcn3ISA::Inst_VOP2__V_ADDC_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUBB_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUBBREV_U32::execute(), Gcn3ISA::Inst_VOP2__V_ADD_U16::execute(), Gcn3ISA::Inst_VOP2__V_SUB_U16::execute(), Gcn3ISA::Inst_VOP2__V_SUBREV_U16::execute(), Gcn3ISA::Inst_VOP2__V_MUL_LO_U16::execute(), Gcn3ISA::Inst_VOP2__V_LSHLREV_B16::execute(), Gcn3ISA::Inst_VOP2__V_LSHRREV_B16::execute(), Gcn3ISA::Inst_VOP2__V_ASHRREV_I16::execute(), Gcn3ISA::Inst_VOP2__V_MAX_U16::execute(), Gcn3ISA::Inst_VOP2__V_MAX_I16::execute(), Gcn3ISA::Inst_VOP2__V_MIN_U16::execute(), Gcn3ISA::Inst_VOP2__V_MIN_I16::execute(), Gcn3ISA::Inst_VOP1__V_MOV_B32::execute(), Gcn3ISA::Inst_VOP1__V_READFIRSTLANE_B32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_I32_F64::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F64_I32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_I32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_U32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_U32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_RPI_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_FLR_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_F64::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F64_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE0::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE1::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE2::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE3::execute(), Gcn3ISA::Inst_VOP1__V_CVT_U32_F64::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F64_U32::execute(), Gcn3ISA::Inst_VOP1__V_TRUNC_F64::execute(), Gcn3ISA::Inst_VOP1__V_CEIL_F64::execute(), Gcn3ISA::Inst_VOP1__V_RNDNE_F64::execute(), Gcn3ISA::Inst_VOP1__V_FLOOR_F64::execute(), Gcn3ISA::Inst_VOP1__V_FRACT_F32::execute(), Gcn3ISA::Inst_VOP1__V_TRUNC_F32::execute(), Gcn3ISA::Inst_VOP1__V_CEIL_F32::execute(), Gcn3ISA::Inst_VOP1__V_RNDNE_F32::execute(), Gcn3ISA::Inst_VOP1__V_FLOOR_F32::execute(), Gcn3ISA::Inst_VOP1__V_EXP_F32::execute(), Gcn3ISA::Inst_VOP1__V_LOG_F32::execute(), Gcn3ISA::Inst_VOP1__V_RCP_F32::execute(), Gcn3ISA::Inst_VOP1__V_RCP_IFLAG_F32::execute(), Gcn3ISA::Inst_VOP1__V_RSQ_F32::execute(), Gcn3ISA::Inst_VOP1__V_RCP_F64::execute(), Gcn3ISA::Inst_VOP1__V_RSQ_F64::execute(), Gcn3ISA::Inst_VOP1__V_SQRT_F32::execute(), Gcn3ISA::Inst_VOP1__V_SQRT_F64::execute(), Gcn3ISA::Inst_VOP1__V_SIN_F32::execute(), Gcn3ISA::Inst_VOP1__V_COS_F32::execute(), Gcn3ISA::Inst_VOP1__V_NOT_B32::execute(), Gcn3ISA::Inst_VOP1__V_BFREV_B32::execute(), Gcn3ISA::Inst_VOP1__V_FFBH_U32::execute(), Gcn3ISA::Inst_VOP1__V_FFBL_B32::execute(), Gcn3ISA::Inst_VOP1__V_FFBH_I32::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_EXP_I32_F64::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_MANT_F64::execute(), Gcn3ISA::Inst_VOP1__V_FRACT_F64::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_EXP_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_MANT_F32::execute(), Gcn3ISA::Inst_VOP1__V_EXP_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP1__V_LOG_LEGACY_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_CLASS_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_CLASS_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_CLASS_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_CLASS_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_O_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_U_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NEQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_TRU_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_O_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_U_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NEQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_TRU_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_O_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_U_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NEQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_TRU_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_O_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_U_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NEQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_TRU_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_CLASS_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_CLASS_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_CLASS_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_CLASS_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_TRU_F16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_F16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_TRU_F16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_O_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_U_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NEQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_TRU_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_O_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_U_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NEQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_TRU_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_O_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_U_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NEQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_TRU_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_O_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_U_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NEQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_TRU_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_U64::execute(), Gcn3ISA::Inst_VOP3__V_CNDMASK_B32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_F32::execute(), Gcn3ISA::Inst_VOP3__V_SUB_F32::execute(), Gcn3ISA::Inst_VOP3__V_SUBREV_F32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_F32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_I32_I24::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_I32_I24::execute(), Gcn3ISA::Inst_VOP3__V_MUL_U32_U24::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_U32_U24::execute(), Gcn3ISA::Inst_VOP3__V_MIN_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAX_F32::execute(), Gcn3ISA::Inst_VOP3__V_MIN_I32::execute(), Gcn3ISA::Inst_VOP3__V_MAX_I32::execute(), Gcn3ISA::Inst_VOP3__V_MIN_U32::execute(), Gcn3ISA::Inst_VOP3__V_MAX_U32::execute(), Gcn3ISA::Inst_VOP3__V_LSHRREV_B32::execute(), Gcn3ISA::Inst_VOP3__V_ASHRREV_I32::execute(), Gcn3ISA::Inst_VOP3__V_LSHLREV_B32::execute(), Gcn3ISA::Inst_VOP3__V_AND_B32::execute(), Gcn3ISA::Inst_VOP3__V_OR_B32::execute(), Gcn3ISA::Inst_VOP3__V_XOR_B32::execute(), Gcn3ISA::Inst_VOP3__V_MAC_F32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUB_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUBREV_U32::execute(), Gcn3ISA::Inst_VOP3__V_ADDC_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUBB_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUBBREV_U32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_U16::execute(), Gcn3ISA::Inst_VOP3__V_SUB_U16::execute(), Gcn3ISA::Inst_VOP3__V_SUBREV_U16::execute(), Gcn3ISA::Inst_VOP3__V_MUL_LO_U16::execute(), Gcn3ISA::Inst_VOP3__V_LSHLREV_B16::execute(), Gcn3ISA::Inst_VOP3__V_LSHRREV_B16::execute(), Gcn3ISA::Inst_VOP3__V_ASHRREV_I16::execute(), Gcn3ISA::Inst_VOP3__V_MAX_U16::execute(), Gcn3ISA::Inst_VOP3__V_MAX_I16::execute(), Gcn3ISA::Inst_VOP3__V_MIN_U16::execute(), Gcn3ISA::Inst_VOP3__V_MIN_I16::execute(), Gcn3ISA::Inst_VOP3__V_MOV_B32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_I32_F64::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F64_I32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_I32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_U32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_U32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_RPI_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_FLR_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_F64::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F64_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE0::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE1::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE2::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE3::execute(), Gcn3ISA::Inst_VOP3__V_CVT_U32_F64::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F64_U32::execute(), Gcn3ISA::Inst_VOP3__V_TRUNC_F64::execute(), Gcn3ISA::Inst_VOP3__V_CEIL_F64::execute(), Gcn3ISA::Inst_VOP3__V_RNDNE_F64::execute(), Gcn3ISA::Inst_VOP3__V_FLOOR_F64::execute(), Gcn3ISA::Inst_VOP3__V_FRACT_F32::execute(), Gcn3ISA::Inst_VOP3__V_TRUNC_F32::execute(), Gcn3ISA::Inst_VOP3__V_CEIL_F32::execute(), Gcn3ISA::Inst_VOP3__V_RNDNE_F32::execute(), Gcn3ISA::Inst_VOP3__V_FLOOR_F32::execute(), Gcn3ISA::Inst_VOP3__V_EXP_F32::execute(), Gcn3ISA::Inst_VOP3__V_LOG_F32::execute(), Gcn3ISA::Inst_VOP3__V_RCP_F32::execute(), Gcn3ISA::Inst_VOP3__V_RCP_IFLAG_F32::execute(), Gcn3ISA::Inst_VOP3__V_RSQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_RCP_F64::execute(), Gcn3ISA::Inst_VOP3__V_RSQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_SQRT_F32::execute(), Gcn3ISA::Inst_VOP3__V_SQRT_F64::execute(), Gcn3ISA::Inst_VOP3__V_SIN_F32::execute(), Gcn3ISA::Inst_VOP3__V_COS_F32::execute(), Gcn3ISA::Inst_VOP3__V_NOT_B32::execute(), Gcn3ISA::Inst_VOP3__V_BFREV_B32::execute(), Gcn3ISA::Inst_VOP3__V_FFBH_U32::execute(), Gcn3ISA::Inst_VOP3__V_FFBL_B32::execute(), Gcn3ISA::Inst_VOP3__V_FFBH_I32::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_EXP_I32_F64::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_MANT_F64::execute(), Gcn3ISA::Inst_VOP3__V_FRACT_F64::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_EXP_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_MANT_F32::execute(), Gcn3ISA::Inst_VOP3__V_EXP_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_LOG_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_I32_I24::execute(), Gcn3ISA::Inst_VOP3__V_MAD_U32_U24::execute(), Gcn3ISA::Inst_VOP3__V_BFE_U32::execute(), Gcn3ISA::Inst_VOP3__V_BFE_I32::execute(), Gcn3ISA::Inst_VOP3__V_BFI_B32::execute(), Gcn3ISA::Inst_VOP3__V_FMA_F32::execute(), Gcn3ISA::Inst_VOP3__V_FMA_F64::execute(), Gcn3ISA::Inst_VOP3__V_LERP_U8::execute(), Gcn3ISA::Inst_VOP3__V_ALIGNBIT_B32::execute(), Gcn3ISA::Inst_VOP3__V_ALIGNBYTE_B32::execute(), Gcn3ISA::Inst_VOP3__V_MIN3_F32::execute(), Gcn3ISA::Inst_VOP3__V_MIN3_I32::execute(), Gcn3ISA::Inst_VOP3__V_MIN3_U32::execute(), Gcn3ISA::Inst_VOP3__V_MAX3_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAX3_I32::execute(), Gcn3ISA::Inst_VOP3__V_MAX3_U32::execute(), Gcn3ISA::Inst_VOP3__V_MED3_F32::execute(), Gcn3ISA::Inst_VOP3__V_MED3_I32::execute(), Gcn3ISA::Inst_VOP3__V_MED3_U32::execute(), Gcn3ISA::Inst_VOP3__V_SAD_U8::execute(), Gcn3ISA::Inst_VOP3__V_SAD_HI_U8::execute(), Gcn3ISA::Inst_VOP3__V_SAD_U16::execute(), Gcn3ISA::Inst_VOP3__V_SAD_U32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_PK_U8_F32::execute(), Gcn3ISA::Inst_VOP3__V_DIV_FIXUP_F64::execute(), Gcn3ISA::Inst_VOP3__V_DIV_SCALE_F64::execute(), Gcn3ISA::Inst_VOP3__V_DIV_FMAS_F64::execute(), Gcn3ISA::Inst_VOP3__V_MAD_U64_U32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_I64_I32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_U16::execute(), Gcn3ISA::Inst_VOP3__V_MAD_I16::execute(), Gcn3ISA::Inst_VOP3__V_PERM_B32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_F64::execute(), Gcn3ISA::Inst_VOP3__V_MUL_F64::execute(), Gcn3ISA::Inst_VOP3__V_MIN_F64::execute(), Gcn3ISA::Inst_VOP3__V_MAX_F64::execute(), Gcn3ISA::Inst_VOP3__V_LDEXP_F64::execute(), Gcn3ISA::Inst_VOP3__V_MUL_LO_U32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_U32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_I32::execute(), Gcn3ISA::Inst_VOP3__V_LDEXP_F32::execute(), Gcn3ISA::Inst_VOP3__V_BCNT_U32_B32::execute(), Gcn3ISA::Inst_VOP3__V_LSHLREV_B64::execute(), Gcn3ISA::Inst_VOP3__V_LSHRREV_B64::execute(), Gcn3ISA::Inst_VOP3__V_ASHRREV_I64::execute(), Gcn3ISA::Inst_VOP3__V_BFM_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), HsailISA::Call::MagicSimBreak(), popFromReconvergenceStack(), and Gcn3ISA::ScalarOperand< DataType, Const, NumDwords >::write().
bool Wavefront::execMask | ( | int | lane | ) | const |
Definition at line 832 of file wavefront.cc.
References reconvergenceStack.
void Wavefront::getContext | ( | const void * | out | ) |
Returns the hardware context as a stream of bytes This method is designed for HSAIL execution.
Definition at line 855 of file wavefront.cc.
References barCnt, barrierCnt, barrierId, computeUnit, condRegState, ComputeUnit::cu_id, ArmISA::i, initMask, ldsChunk, maxBarCnt, maxDpVgprs, maxSpVgprs, ConditionRegisterState::numRegs(), oldBarrierCnt, privBase, ConditionRegisterState::read(), LdsChunk::read(), reconvergenceStack, remap(), simdId, LdsChunk::size(), spillBase, X86ISA::val, ComputeUnit::vrf, wfId, ComputeUnit::wfSize(), wgId, and workItemId.
|
inline |
Definition at line 336 of file wavefront.hh.
References ReconvergenceStackEntry::execMask, ReconvergenceStackEntry::pc, and ReconvergenceStackEntry::rpc.
Referenced by HsailISA::Call::execPseudoInst(), HsailISA::LdaInst< DestDataType, AddrOperandType >::execute(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::Call::MagicJoinWFBar(), HsailISA::Call::MagicMaskLower(), HsailISA::Call::MagicMaskUpper(), HsailISA::Call::MagicMostSigBroadcast(), HsailISA::Call::MagicMostSigThread(), HsailISA::Call::MagicPanic(), HsailISA::Call::MagicPrefixSum(), HsailISA::Call::MagicPrintLane(), HsailISA::Call::MagicPrintLane64(), HsailISA::Call::MagicPrintWF32(), HsailISA::Call::MagicPrintWF32ID(), HsailISA::Call::MagicPrintWF64(), HsailISA::Call::MagicPrintWFFloat(), HsailISA::Call::MagicPrintWFID64(), HsailISA::Call::MagicReduction(), HsailISA::Call::MagicWaitWFBar(), and HsailISA::Call::MagicXactCasLd().
uint32_t Wavefront::getStaticContextSize | ( | ) | const |
Returns the size of the static hardware context of a particular wavefront This should be updated everytime the context is changed.
Definition at line 845 of file wavefront.cc.
References barCnt, barrierCnt, barrierId, computeUnit, ComputeUnit::cu_id, initMask, ldsChunk, maxBarCnt, oldBarrierCnt, privBase, spillBase, wfId, ComputeUnit::wfSize(), and wgId.
|
inline |
Definition at line 376 of file wavefront.hh.
|
virtual |
init() is called after all C++ SimObjects have been created and all ports are connected.
Initializations that are independent of unserialization but rely on a fully instantiated and connected SimObject graph should be done here.
Reimplemented from SimObject.
Definition at line 133 of file wavefront.cc.
References reservedVectorRegs, and startVgprIndex.
Referenced by Gcn3ISA::Inst_SMEM__S_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX16::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX2::execute(), and Gcn3ISA::Inst_SMEM__S_STORE_DWORDX4::execute().
|
inline |
Definition at line 300 of file wavefront.hh.
bool Wavefront::instructionBufferHasBranch | ( | ) |
Definition at line 264 of file wavefront.cc.
References instructionBuffer.
Referenced by FetchUnit::exec().
bool Wavefront::isGmInstruction | ( | GPUDynInstPtr | ii | ) |
Definition at line 163 of file wavefront.cc.
Referenced by exec().
bool Wavefront::isLmInstruction | ( | GPUDynInstPtr | ii | ) |
Definition at line 172 of file wavefront.cc.
Referenced by exec().
bool Wavefront::isOldestInstALU | ( | ) |
Definition at line 182 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
Referenced by ScoreboardCheckStage::collectStatistics().
bool Wavefront::isOldestInstBarrier | ( | ) |
Definition at line 197 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstFlatMem | ( | ) |
Definition at line 249 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
Referenced by ScoreboardCheckStage::collectStatistics().
bool Wavefront::isOldestInstGMem | ( | ) |
Definition at line 210 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
Referenced by ScoreboardCheckStage::collectStatistics().
bool Wavefront::isOldestInstLMem | ( | ) |
Definition at line 223 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
Referenced by ScoreboardCheckStage::collectStatistics().
bool Wavefront::isOldestInstPrivMem | ( | ) |
Definition at line 236 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
Referenced by ScoreboardCheckStage::collectStatistics().
uint32_t Wavefront::pc | ( | ) | const |
Definition at line 814 of file wavefront.cc.
References reconvergenceStack.
Referenced by Gcn3ISA::GPUISA::advancePC(), exec(), HsailISA::BrnInstBase< SRegOperand >::execute(), HsailISA::CbrInstBase< SRegOperand >::execute(), HsailISA::BrInstBase< SRegOperand >::execute(), Gcn3ISA::Inst_SOP1__S_GETPC_B64::execute(), Gcn3ISA::Inst_SOP1__S_SETPC_B64::execute(), Gcn3ISA::Inst_SOP1__S_SWAPPC_B64::execute(), Gcn3ISA::Inst_SOPP__S_BRANCH::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_SCC0::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_SCC1::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_VCCZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_VCCNZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECNZ::execute(), FetchUnit::initiateFetch(), popFromReconvergenceStack(), and pushToReconvergenceStack().
void Wavefront::pc | ( | uint32_t | new_pc | ) |
Definition at line 839 of file wavefront.cc.
References reconvergenceStack.
void Wavefront::popFromReconvergenceStack | ( | ) |
Definition at line 789 of file wavefront.cc.
References computeUnit, ComputeUnit::cu_id, DPRINTF, execMask(), pc(), reconvergenceStack, simdId, sc_dt::to_string(), wfDynId, and wfSlotId.
Referenced by exec(), HsailISA::BrnInstBase< SRegOperand >::execute(), HsailISA::CbrInstBase< SRegOperand >::execute(), and HsailISA::BrInstBase< SRegOperand >::execute().
void Wavefront::pushToReconvergenceStack | ( | uint32_t | pc, |
uint32_t | rpc, | ||
const VectorMask & | exec_mask | ||
) |
Definition at line 781 of file wavefront.cc.
References pc(), reconvergenceStack, and rpc().
Referenced by HsailISA::CbrInstBase< SRegOperand >::execute(), setContext(), and ComputeUnit::startWavefront().
|
inline |
Definition at line 307 of file wavefront.hh.
References CallArgMem::getLaneAddr().
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), and ListOperand::get().
int Wavefront::ready | ( | itype_e | type | ) |
Definition at line 303 of file wavefront.cc.
References ComputeUnit::AllAtBarrier(), barrierCnt, barrierId, computeUnit, ComputeUnit::cu_id, dispatchId, DPRINTF, ComputeUnit::getRefCounter(), ComputeUnit::globalMemoryPipe, I_ALU, I_FLAT, I_GLOBAL, I_PRIVATE, I_SHARED, instructionBuffer, ArmISA::j, ComputeUnit::localMemoryPipe, memReqsInPipe, ComputeUnit::numGlbMemUnits, ComputeUnit::numLocMemUnits, oldBarrierCnt, outstandingReqs, outstandingReqsRdGm, outstandingReqsRdLm, outstandingReqsWrGm, outstandingReqsWrLm, panic, RD_WR, rdGmReqsInPipe, rdLmReqsInPipe, S_RETURNING, S_STOPPED, simdId, stalledAtBarrier, status, ComputeUnit::vrf, ComputeUnit::vrfToGlobalMemPipeBus, ComputeUnit::vrfToLocalMemPipeBus, wfSlotId, ComputeUnit::wfWait, wgId, wrGmReqsInPipe, and wrLmReqsInPipe.
Referenced by ScoreboardCheckStage::exec().
|
virtual |
Callback to set stat parameters.
This callback is typically used for complex stats (e.g., distributions) that need parameters in addition to a name and a description. Stat names and descriptions should typically be set from the constructor usingo from the constructor using the ADD_STAT macro.
Reimplemented from Stats::Group.
Definition at line 93 of file wavefront.cc.
References Stats::DataWrap< Derived, InfoProxyType >::desc(), dstRegOpDist, Stats::Distribution::init(), SimObject::name(), Stats::DataWrap< Derived, InfoProxyType >::name(), numTimesBlockedDueRAWDependencies, numTimesBlockedDueVrfPortAvail, numTimesBlockedDueWAXDependencies, Stats::Group::regStats(), and srcRegOpDist.
uint32_t Wavefront::remap | ( | uint32_t | vgprIndex, |
uint32_t | size, | ||
uint8_t | mode = 0 |
||
) |
Definition at line 280 of file wavefront.cc.
References computeUnit, maxSpVgprs, reservedVectorRegs, simdId, startVgprIndex, and ComputeUnit::vrf.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), VectorRegisterFile::exec(), SRegOperand::get(), DRegOperand::get(), getContext(), VectorRegisterFile::operandsReady(), SRegOperand::set(), DRegOperand::set(), setContext(), and VectorRegisterFile::updateResources().
void Wavefront::resizeRegFiles | ( | int | num_cregs, |
int | num_sregs, | ||
int | num_dregs | ||
) |
Definition at line 140 of file wavefront.cc.
References condRegState, ConditionRegisterState::init(), maxDpVgprs, and maxSpVgprs.
Referenced by ComputeUnit::fillKernelState().
uint32_t Wavefront::rpc | ( | ) | const |
Definition at line 820 of file wavefront.cc.
References reconvergenceStack.
Referenced by exec(), HsailISA::BrnInstBase< SRegOperand >::execute(), HsailISA::CbrInstBase< SRegOperand >::execute(), HsailISA::BrInstBase< SRegOperand >::execute(), and pushToReconvergenceStack().
void Wavefront::setContext | ( | const void * | in | ) |
Sets the hardware context fromt a stream of bytes This method is designed for HSAIL execution.
Restoring LDS contents
Definition at line 922 of file wavefront.cc.
References barCnt, barrierCnt, barrierId, computeUnit, condRegState, ComputeUnit::cu_id, ReconvergenceStackEntry::execMask, ArmISA::i, initMask, ldsChunk, maxBarCnt, maxDpVgprs, maxSpVgprs, ConditionRegisterState::numRegs(), oldBarrierCnt, ReconvergenceStackEntry::pc, privBase, pushToReconvergenceStack(), remap(), ReconvergenceStackEntry::rpc, simdId, LdsChunk::size(), spillBase, X86ISA::val, ComputeUnit::vrf, wfId, ComputeUnit::wfSize(), wgId, workItemId, ConditionRegisterState::write(), and LdsChunk::write().
|
inline |
Definition at line 325 of file wavefront.hh.
References ConditionRegisterState::exec(), ConditionRegisterState::regStats(), and type.
void Wavefront::start | ( | uint64_t | _wfDynId, |
uint64_t | _base_ptr | ||
) |
Definition at line 155 of file wavefront.cc.
References basePtr, S_RUNNING, status, and wfDynId.
Referenced by ComputeUnit::startWavefront().
void Wavefront::updateResources | ( | ) |
Definition at line 540 of file wavefront.cc.
References ComputeUnit::aluPipe, computeUnit, ComputeUnit::GlbMemUnitId(), instructionBuffer, ComputeUnit::issuePeriod, memReqsInPipe, ComputeUnit::nextGlbRdBus(), ComputeUnit::nextLocRdBus(), rdGmReqsInPipe, rdLmReqsInPipe, sc_core::SC_NONE, ComputeUnit::shader, ComputeUnit::ShrMemUnitId(), simdId, ComputeUnit::spBypassLength(), Shader::ticks(), ComputeUnit::vrf, ComputeUnit::vrfToGlobalMemPipeBus, ComputeUnit::vrfToLocalMemPipeBus, ComputeUnit::wfWait, wrGmReqsInPipe, and wrLmReqsInPipe.
Referenced by ScheduleStage::exec().
bool Wavefront::waitingAtBarrier | ( | int | lane | ) |
Definition at line 775 of file wavefront.cc.
|
inline |
Definition at line 314 of file wavefront.hh.
References addr, CallArgMem::setLaneAddr(), and X86ISA::val.
Referenced by ListOperand::set().
|
private |
Definition at line 382 of file wavefront.hh.
Referenced by exec().
uint32_t Wavefront::actualWgSz[3] |
Definition at line 200 of file wavefront.hh.
Referenced by computeActualWgSz(), and ComputeUnit::startWavefront().
uint32_t Wavefront::actualWgSzTotal |
Definition at line 201 of file wavefront.hh.
Referenced by computeActualWgSz(), ComputeUnit::startWavefront(), and ComputeUnit::StartWorkgroup().
std::vector<int> Wavefront::barCnt |
Definition at line 251 of file wavefront.hh.
Referenced by getContext(), getStaticContextSize(), HsailISA::Call::MagicJoinWFBar(), HsailISA::Call::MagicWaitWFBar(), setContext(), ComputeUnit::startWavefront(), waitingAtBarrier(), and Wavefront().
uint32_t Wavefront::barrierCnt |
Definition at line 155 of file wavefront.hh.
Referenced by ComputeUnit::AllAtBarrier(), HsailISA::Barrier::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), getContext(), getStaticContextSize(), ready(), ComputeUnit::DataPort::recvTimingResp(), setContext(), ComputeUnit::startWavefront(), and Wavefront().
uint32_t Wavefront::barrierId |
Definition at line 156 of file wavefront.hh.
Referenced by ComputeUnit::AllAtBarrier(), getContext(), getStaticContextSize(), ready(), setContext(), and ComputeUnit::startWavefront().
uint32_t Wavefront::barrierSlots |
Definition at line 157 of file wavefront.hh.
Referenced by ComputeUnit::startWavefront().
uint64_t Wavefront::basePtr |
Definition at line 152 of file wavefront.hh.
Referenced by FetchUnit::initiateFetch(), and start().
CallArgMem* Wavefront::callArgMem |
Definition at line 298 of file wavefront.hh.
Referenced by ~Wavefront().
ComputeUnit* Wavefront::computeUnit |
Definition at line 165 of file wavefront.hh.
Referenced by HsailISA::Call::calcAddr(), HsailISA::calcPrivAddr(), RegAddrOperand< RegOperandType >::calcVector(), NoRegAddrOperand::calcVector(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), LocalMemPipeline::exec(), GlobalMemPipeline::exec(), ConditionRegisterState::exec(), exec(), HsailISA::Call::execPseudoInst(), HsailISA::LdaInst< DestDataType, AddrOperandType >::execute(), HsailISA::CbrInstBase< SRegOperand >::execute(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), SRegOperand::get(), DRegOperand::get(), getContext(), getStaticContextSize(), HsailISA::MemFence::initiateAcc(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicJoinWFBar(), HsailISA::Call::MagicLoadGlobalU32Reg(), HsailISA::Call::MagicMaskLower(), HsailISA::Call::MagicMaskUpper(), HsailISA::Call::MagicMostSigBroadcast(), HsailISA::Call::MagicMostSigThread(), HsailISA::Call::MagicPanic(), HsailISA::Call::MagicPrefixSum(), HsailISA::Call::MagicPrintLane(), HsailISA::Call::MagicPrintLane64(), HsailISA::Call::MagicPrintWF32(), HsailISA::Call::MagicPrintWF32ID(), HsailISA::Call::MagicPrintWF64(), HsailISA::Call::MagicPrintWFFloat(), HsailISA::Call::MagicPrintWFID64(), HsailISA::Call::MagicReduction(), HsailISA::Call::MagicSimBreak(), HsailISA::Call::MagicWaitWFBar(), HsailISA::Call::MagicXactCasLd(), popFromReconvergenceStack(), ready(), remap(), SRegOperand::set(), DRegOperand::set(), CRegOperand::set(), ListOperand::set(), setContext(), and updateResources().
class ConditionRegisterState* Wavefront::condRegState |
Definition at line 173 of file wavefront.hh.
Referenced by CRegOperand::get(), getContext(), resizeRegFiles(), CRegOperand::set(), setContext(), Wavefront(), and ~Wavefront().
uint32_t Wavefront::dispatchId |
Definition at line 206 of file wavefront.hh.
Referenced by HsailISA::Ret::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), ready(), and ComputeUnit::startWavefront().
bool Wavefront::dropFetch |
Definition at line 170 of file wavefront.hh.
Referenced by discardFetch(), HsailISA::Ret::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), HsailISA::Call::MagicWaitWFBar(), ComputeUnit::startWavefront(), and Wavefront().
Stats::Distribution Wavefront::dstRegOpDist |
Definition at line 294 of file wavefront.hh.
Referenced by exec(), and regStats().
uint32_t Wavefront::gridSz[3] |
Definition at line 196 of file wavefront.hh.
Referenced by computeActualWgSz(), and ComputeUnit::fillKernelState().
VectorMask Wavefront::initMask |
Definition at line 248 of file wavefront.hh.
Referenced by HsailISA::Ret::execute(), getContext(), getStaticContextSize(), setContext(), and ComputeUnit::startWavefront().
std::deque<GPUDynInstPtr> Wavefront::instructionBuffer |
Definition at line 167 of file wavefront.hh.
Referenced by ScoreboardCheckStage::collectStatistics(), discardFetch(), FetchUnit::exec(), exec(), HsailISA::Ret::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchUnit::initiateFetch(), instructionBufferHasBranch(), isOldestInstALU(), isOldestInstBarrier(), isOldestInstFlatMem(), isOldestInstGMem(), isOldestInstLMem(), isOldestInstPrivMem(), HsailISA::Call::MagicWaitWFBar(), ready(), ComputeUnit::startWavefront(), and updateResources().
uint8_t* Wavefront::kernelArgs |
Definition at line 278 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), and ComputeUnit::fillKernelState().
int Wavefront::kernId |
Definition at line 161 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), HsailISA::Call::MagicSimBreak(), GpuDispatcher::notifyWgCompl(), ComputeUnit::DataPort::recvTimingResp(), and ComputeUnit::startWavefront().
std::vector<Addr> Wavefront::lastAddr |
Definition at line 190 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), and Wavefront().
uint64_t Wavefront::lastTrace |
Definition at line 226 of file wavefront.hh.
Referenced by Wavefront().
LdsChunk* Wavefront::ldsChunk |
Definition at line 258 of file wavefront.hh.
Referenced by HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execAtomic(), getContext(), getStaticContextSize(), Gcn3ISA::Inst_DS::initDualMemRead(), Gcn3ISA::Inst_DS::initDualMemWrite(), Gcn3ISA::Inst_DS::initMemRead(), Gcn3ISA::Inst_DS::initMemWrite(), setContext(), and ComputeUnit::startWavefront().
int Wavefront::maxBarCnt |
Definition at line 252 of file wavefront.hh.
Referenced by getContext(), getStaticContextSize(), HsailISA::Call::MagicJoinWFBar(), HsailISA::Call::MagicWaitWFBar(), setContext(), ComputeUnit::startWavefront(), and waitingAtBarrier().
uint32_t Wavefront::maxDpVgprs |
Definition at line 177 of file wavefront.hh.
Referenced by getContext(), resizeRegFiles(), setContext(), and Wavefront().
uint32_t Wavefront::maxDynWaveId |
Definition at line 205 of file wavefront.hh.
uint32_t Wavefront::maxSpVgprs |
Definition at line 175 of file wavefront.hh.
Referenced by getContext(), remap(), resizeRegFiles(), setContext(), and Wavefront().
uint32_t Wavefront::memReqsInPipe |
Definition at line 211 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), ready(), updateResources(), and Wavefront().
int Wavefront::memTraceBusy |
Definition at line 225 of file wavefront.hh.
Referenced by Wavefront().
Stats::Scalar Wavefront::numTimesBlockedDueRAWDependencies |
Definition at line 290 of file wavefront.hh.
Referenced by VectorRegisterFile::operandsReady(), and regStats().
Stats::Scalar Wavefront::numTimesBlockedDueVrfPortAvail |
Definition at line 284 of file wavefront.hh.
Referenced by regStats().
Stats::Scalar Wavefront::numTimesBlockedDueWAXDependencies |
Definition at line 287 of file wavefront.hh.
Referenced by VectorRegisterFile::operandsReady(), and regStats().
uint32_t Wavefront::oldBarrierCnt |
Definition at line 154 of file wavefront.hh.
Referenced by HsailISA::Barrier::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), getContext(), getStaticContextSize(), ready(), setContext(), ComputeUnit::startWavefront(), and Wavefront().
std::vector<uint64_t> Wavefront::oldDgpr |
Definition at line 241 of file wavefront.hh.
Referenced by Wavefront().
uint32_t Wavefront::oldDgprId |
Definition at line 243 of file wavefront.hh.
uint64_t Wavefront::oldDgprTcnt |
Definition at line 245 of file wavefront.hh.
Referenced by Wavefront().
std::vector<uint32_t> Wavefront::oldVgpr |
Definition at line 234 of file wavefront.hh.
Referenced by Wavefront().
uint32_t Wavefront::oldVgprId |
Definition at line 236 of file wavefront.hh.
uint64_t Wavefront::oldVgprTcnt |
Definition at line 238 of file wavefront.hh.
Referenced by Wavefront().
uint32_t Wavefront::outstandingReqs |
Definition at line 208 of file wavefront.hh.
Referenced by ComputeUnit::AllAtBarrier(), LocalMemPipeline::exec(), GlobalMemPipeline::exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX16::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX4::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), ready(), ComputeUnit::DataPort::recvTimingResp(), and Wavefront().
uint32_t Wavefront::outstandingReqsRdGm |
Definition at line 217 of file wavefront.hh.
Referenced by GlobalMemPipeline::exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), ready(), and Wavefront().
uint32_t Wavefront::outstandingReqsRdLm |
Definition at line 219 of file wavefront.hh.
Referenced by LocalMemPipeline::exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), ready(), and Wavefront().
uint32_t Wavefront::outstandingReqsWrGm |
Definition at line 213 of file wavefront.hh.
Referenced by GlobalMemPipeline::exec(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), ready(), and Wavefront().
uint32_t Wavefront::outstandingReqsWrLm |
Definition at line 215 of file wavefront.hh.
Referenced by LocalMemPipeline::exec(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), ready(), and Wavefront().
bool Wavefront::pendingFetch |
Definition at line 169 of file wavefront.hh.
Referenced by discardFetch(), FetchUnit::exec(), HsailISA::Ret::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), HsailISA::Call::MagicWaitWFBar(), ComputeUnit::startWavefront(), and Wavefront().
Addr Wavefront::privBase |
Definition at line 268 of file wavefront.hh.
Referenced by HsailISA::calcPrivAddr(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), getContext(), getStaticContextSize(), setContext(), and ComputeUnit::startWavefront().
uint32_t Wavefront::privSizePerItem |
Definition at line 270 of file wavefront.hh.
Referenced by HsailISA::calcPrivAddr(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), and ComputeUnit::fillKernelState().
uint32_t Wavefront::rdGmReqsInPipe |
Definition at line 221 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::MemFence::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), ready(), updateResources(), and Wavefront().
uint32_t Wavefront::rdLmReqsInPipe |
Definition at line 220 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), ready(), updateResources(), and Wavefront().
|
private |
Stack containing Control Flow Graph nodes (i.e., kernel instructions) to be visited by the wavefront, and the associated execution masks.
The reconvergence stack grows every time the wavefront reaches a divergence point (branch instruction), and shrinks every time the wavefront reaches a reconvergence point (immediate post-dominator instruction).
Definition at line 390 of file wavefront.hh.
Referenced by execMask(), getContext(), pc(), popFromReconvergenceStack(), pushToReconvergenceStack(), and rpc().
int Wavefront::reservedVectorRegs |
Definition at line 228 of file wavefront.hh.
Referenced by HsailISA::Ret::execute(), init(), remap(), ComputeUnit::StartWorkgroup(), and Wavefront().
Addr Wavefront::roBase |
Definition at line 273 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), and ComputeUnit::fillKernelState().
uint32_t Wavefront::roSize |
Definition at line 275 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), and ComputeUnit::fillKernelState().
int Wavefront::simdId |
Definition at line 163 of file wavefront.hh.
Referenced by ScheduleStage::arbitrate(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), LocalMemPipeline::exec(), ScheduleStage::exec(), GlobalMemPipeline::exec(), ConditionRegisterState::exec(), VectorRegisterFile::exec(), exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchStage::fetch(), FetchUnit::fetch(), SRegOperand::get(), DRegOperand::get(), getContext(), FetchUnit::initiateFetch(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), HsailISA::Call::MagicSimBreak(), HsailISA::Call::MagicXactCasLd(), popFromReconvergenceStack(), Gcn3ISA::ScalarOperand< DataType, Const, NumDwords >::read(), ready(), ComputeUnit::DataPort::recvTimingResp(), remap(), SRegOperand::set(), DRegOperand::set(), CRegOperand::set(), ListOperand::set(), setContext(), ComputeUnit::startWavefront(), updateResources(), Wavefront(), and Gcn3ISA::ScalarOperand< DataType, Const, NumDwords >::write().
Addr Wavefront::spillBase |
Definition at line 261 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), getContext(), getStaticContextSize(), setContext(), and ComputeUnit::startWavefront().
uint32_t Wavefront::spillSizePerItem |
Definition at line 263 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), and ComputeUnit::fillKernelState().
uint32_t Wavefront::spillWidth |
Definition at line 265 of file wavefront.hh.
Referenced by HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), and ComputeUnit::startWavefront().
Stats::Distribution Wavefront::srcRegOpDist |
Definition at line 293 of file wavefront.hh.
Referenced by exec(), and regStats().
bool Wavefront::stalledAtBarrier |
Definition at line 254 of file wavefront.hh.
Referenced by HsailISA::Barrier::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), ready(), ComputeUnit::startWavefront(), and Wavefront().
uint32_t Wavefront::startVgprIndex |
Definition at line 231 of file wavefront.hh.
Referenced by HsailISA::Ret::execute(), init(), remap(), ComputeUnit::StartWorkgroup(), and Wavefront().
status_e Wavefront::status |
Definition at line 158 of file wavefront.hh.
Referenced by ComputeUnit::AllAtBarrier(), FetchUnit::exec(), exec(), HsailISA::Ret::execute(), isOldestInstALU(), isOldestInstBarrier(), isOldestInstFlatMem(), isOldestInstGMem(), isOldestInstLMem(), isOldestInstPrivMem(), ready(), ComputeUnit::DataPort::recvTimingResp(), start(), ComputeUnit::StartWorkgroup(), and Wavefront().
uint64_t Wavefront::wfDynId |
Definition at line 280 of file wavefront.hh.
Referenced by OFSchedulingPolicy::__chooseWave(), exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), HsailISA::Call::MagicPrintWF32(), HsailISA::Call::MagicPrintWF32ID(), HsailISA::Call::MagicPrintWF64(), HsailISA::Call::MagicPrintWFFloat(), HsailISA::Call::MagicPrintWFID64(), popFromReconvergenceStack(), ComputeUnit::DataPort::recvTimingResp(), and start().
uint32_t Wavefront::wfId |
Definition at line 204 of file wavefront.hh.
Referenced by getContext(), getStaticContextSize(), setContext(), and ComputeUnit::startWavefront().
int Wavefront::wfSlotId |
Definition at line 160 of file wavefront.hh.
Referenced by ScheduleStage::arbitrate(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), FetchUnit::exec(), ScheduleStage::exec(), exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchUnit::fetch(), FetchUnit::initiateFetch(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), HsailISA::Call::MagicSimBreak(), HsailISA::Call::MagicXactCasLd(), popFromReconvergenceStack(), ready(), ComputeUnit::DataPort::recvTimingResp(), SRegOperand::set(), DRegOperand::set(), CRegOperand::set(), ListOperand::set(), ComputeUnit::startWavefront(), and Wavefront().
uint32_t Wavefront::wgId |
Definition at line 197 of file wavefront.hh.
Referenced by HsailISA::Ret::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), getContext(), getStaticContextSize(), ready(), setContext(), and ComputeUnit::startWavefront().
uint32_t Wavefront::wgSz |
Definition at line 198 of file wavefront.hh.
Referenced by ComputeUnit::fillKernelState().
uint32_t Wavefront::workGroupId[3] |
Definition at line 194 of file wavefront.hh.
Referenced by ComputeUnit::startWavefront().
uint32_t Wavefront::workGroupSz[3] |
Definition at line 195 of file wavefront.hh.
Referenced by computeActualWgSz(), and ComputeUnit::fillKernelState().
std::vector<uint32_t> Wavefront::workItemFlatId |
Definition at line 192 of file wavefront.hh.
Referenced by ComputeUnit::startWavefront(), and Wavefront().
std::vector<uint32_t> Wavefront::workItemId[3] |
Definition at line 191 of file wavefront.hh.
Referenced by getContext(), setContext(), ComputeUnit::startWavefront(), and Wavefront().
uint32_t Wavefront::wrGmReqsInPipe |
Definition at line 223 of file wavefront.hh.
Referenced by HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), ready(), updateResources(), and Wavefront().
uint32_t Wavefront::wrLmReqsInPipe |
Definition at line 222 of file wavefront.hh.
Referenced by HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), ready(), updateResources(), and Wavefront().