gem5
v21.0.1.0
|
#include <wavefront.hh>
Classes | |
struct | WavefrontStats |
Public Types | |
enum | status_e { S_STOPPED, S_RETURNING, S_RUNNING, S_STALLED, S_STALLED_SLEEP, S_WAITCNT, S_BARRIER } |
typedef WavefrontParams | Params |
![]() | |
typedef SimObjectParams | Params |
Public Member Functions | |
void | freeResources () |
GPUDynInstPtr | nextInstr () |
void | setStatus (status_e newStatus) |
status_e | getStatus () |
void | resizeRegFiles (int num_vregs, int num_sregs) |
bool | isGmInstruction (GPUDynInstPtr ii) |
bool | isLmInstruction (GPUDynInstPtr ii) |
bool | isOldestInstWaitcnt () |
bool | isOldestInstSleep () |
bool | isOldestInstGMem () |
bool | isOldestInstLMem () |
bool | isOldestInstPrivMem () |
bool | isOldestInstFlatMem () |
bool | isOldestInstVectorALU () |
bool | isOldestInstScalarALU () |
bool | isOldestInstScalarMem () |
bool | isOldestInstBarrier () |
void | computeActualWgSz (HSAQueueEntry *task) |
void | initRegState (HSAQueueEntry *task, int wgSizeInWorkItems) |
Wavefront (const Params &p) | |
~Wavefront () | |
virtual void | init () |
init() is called after all C++ SimObjects have been created and all ports are connected. More... | |
void | setParent (ComputeUnit *cu) |
void | validateRequestCounters () |
void | start (uint64_t _wfDynId, uint64_t _base_ptr) |
void | exec () |
std::vector< int > | reserveResources () |
bool | stopFetch () |
Addr | pc () const |
void | pc (Addr new_pc) |
VectorMask & | execMask () |
bool | execMask (int lane) const |
void | discardFetch () |
bool | waitCntsSatisfied () |
void | setWaitCnts (int vm_wait_cnt, int exp_wait_cnt, int lgkm_wait_cnt) |
void | clearWaitCnts () |
void | incVMemInstsIssued () |
void | incExpInstsIssued () |
void | incLGKMInstsIssued () |
void | decVMemInstsIssued () |
void | decExpInstsIssued () |
void | decLGKMInstsIssued () |
void | freeRegisterFile () |
Freeing VRF space. More... | |
bool | sleepDone () |
void | setSleepTime (int sleep_time) |
TheGpuISA::GPUISA & | gpuISA () |
void | barrierId (int bar_id) |
int | barrierId () const |
bool | hasBarrier () const |
void | releaseBarrier () |
![]() | |
const Params & | params () const |
SimObject (const Params &p) | |
virtual | ~SimObject () |
virtual const std::string | name () const |
virtual void | loadState (CheckpointIn &cp) |
loadState() is called on each SimObject when restoring from a checkpoint. More... | |
virtual void | initState () |
initState() is called on each SimObject when not restoring from a checkpoint. More... | |
virtual void | regProbePoints () |
Register probe points for this object. More... | |
virtual void | regProbeListeners () |
Register probe listeners for this object. More... | |
ProbeManager * | getProbeManager () |
Get the probe manager for this object. More... | |
virtual Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) |
Get a port with a given name and index. More... | |
virtual void | startup () |
startup() is the final initialization call before simulation. More... | |
DrainState | drain () override |
Provide a default implementation of the drain interface for objects that don't need draining. More... | |
virtual void | memWriteback () |
Write back dirty buffers to memory using functional writes. More... | |
virtual void | memInvalidate () |
Invalidate the contents of memory buffers. More... | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
![]() | |
EventQueue * | eventQueue () const |
void | schedule (Event &event, Tick when) |
void | deschedule (Event &event) |
void | reschedule (Event &event, Tick when, bool always=false) |
void | schedule (Event *event, Tick when) |
void | deschedule (Event *event) |
void | reschedule (Event *event, Tick when, bool always=false) |
void | wakeupEventQueue (Tick when=(Tick) -1) |
This function is not needed by the usual gem5 event loop but may be necessary in derived EventQueues which host gem5 on other schedulers. More... | |
void | setCurTick (Tick newVal) |
EventManager (EventManager &em) | |
Event manager manages events in the event queue. More... | |
EventManager (EventManager *em) | |
EventManager (EventQueue *eq) | |
![]() | |
Serializable () | |
virtual | ~Serializable () |
void | serializeSection (CheckpointOut &cp, const char *name) const |
Serialize an object into a new section. More... | |
void | serializeSection (CheckpointOut &cp, const std::string &name) const |
void | unserializeSection (CheckpointIn &cp, const char *name) |
Unserialize a child object. More... | |
void | unserializeSection (CheckpointIn &cp, const std::string &name) |
![]() | |
DrainState | drainState () const |
Return the current drain state of an object. More... | |
virtual void | notifyFork () |
Notify a child process of a fork. More... | |
![]() | |
Group (Group *parent, const char *name=nullptr) | |
Construct a new statistics group. More... | |
virtual | ~Group () |
virtual void | regStats () |
Callback to set stat parameters. More... | |
virtual void | resetStats () |
Callback to reset stats. More... | |
virtual void | preDumpStats () |
Callback before stats are dumped. More... | |
void | addStat (Stats::Info *info) |
Register a stat with this group. More... | |
const std::map< std::string, Group * > & | getStatGroups () const |
Get all child groups associated with this object. More... | |
const std::vector< Info * > & | getStats () const |
Get all stats associated with this object. More... | |
void | addStatGroup (const char *name, Group *block) |
Add a stat block as a child of this block. More... | |
const Info * | resolveStat (std::string name) const |
Resolve a stat by its name within this group. More... | |
void | mergeStatGroup (Group *block) |
Merge the contents (stats & children) of a block to this block. More... | |
Group ()=delete | |
Group (const Group &)=delete | |
Group & | operator= (const Group &)=delete |
Private Member Functions | |
void | reserveGmResource (GPUDynInstPtr ii) |
void | reserveLmResource (GPUDynInstPtr ii) |
Private Attributes | |
TheGpuISA::GPUISA | _gpuISA |
int | vmWaitCnt |
The following are used for waitcnt instructions. vmWaitCnt: once set, we wait for the outstanding number of vector mem instructions to be at, or below, vmWaitCnt. More... | |
int | expWaitCnt |
int | lgkmWaitCnt |
int | vmemInstsIssued |
int | expInstsIssued |
int | lgkmInstsIssued |
int | sleepCnt |
status_e | status |
Addr | _pc |
VectorMask | _execMask |
int | barId |
Additional Inherited Members | |
![]() | |
static void | serializeAll (CheckpointOut &cp) |
Serialize all SimObjects in the system. More... | |
static SimObject * | find (const char *name) |
Find the SimObject with the given name and return a pointer to it. More... | |
![]() | |
static const std::string & | currentSection () |
Gets the fully-qualified name of the active section. More... | |
static void | serializeAll (const std::string &cpt_dir) |
Serializes all the SimObjects. More... | |
static void | unserializeGlobals (CheckpointIn &cp) |
![]() | |
Drainable () | |
virtual | ~Drainable () |
virtual void | drainResume () |
Resume execution after a successful drain. More... | |
void | signalDrainDone () const |
Signal that an object is drained. More... | |
![]() | |
const SimObjectParams & | _params |
Cached copy of the object parameters. More... | |
![]() | |
EventQueue * | eventq |
A pointer to this object's event queue. More... | |
Definition at line 59 of file wavefront.hh.
typedef WavefrontParams Wavefront::Params |
Definition at line 242 of file wavefront.hh.
enum Wavefront::status_e |
Definition at line 62 of file wavefront.hh.
Wavefront::Wavefront | ( | const Params & | p | ) |
Definition at line 47 of file wavefront.cc.
References _execMask, dropFetch, execUnitId, ArmISA::i, lastAddr, lastInstExec, lastNonIdleTick, lastTrace, ldsChunk, maxSgprs, maxVgprs, memTraceBusy, oldDgpr, oldDgprTcnt, oldVgpr, oldVgprTcnt, outstandingReqs, outstandingReqsRdGm, outstandingReqsRdLm, outstandingReqsWrGm, outstandingReqsWrLm, MipsISA::p, pendingFetch, rawDist, rdGmReqsInPipe, rdLmReqsInPipe, reservedScalarRegs, reservedVectorRegs, S_STOPPED, scalarOutstandingReqsRdGm, scalarOutstandingReqsWrGm, scalarRdGmReqsInPipe, scalarWrGmReqsInPipe, startSgprIndex, startVgprIndex, status, vecReads, workItemFlatId, workItemId, wrGmReqsInPipe, and wrLmReqsInPipe.
Wavefront::~Wavefront | ( | ) |
Definition at line 512 of file wavefront.cc.
int Wavefront::barrierId | ( | ) | const |
Definition at line 1424 of file wavefront.cc.
References barId.
void Wavefront::barrierId | ( | int | bar_id | ) |
Definition at line 1416 of file wavefront.cc.
References barId, and WFBarrier::InvalidID.
Referenced by Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), and ComputeUnit::releaseWFsFromBarrier().
void Wavefront::clearWaitCnts | ( | ) |
Definition at line 1315 of file wavefront.cc.
References expWaitCnt, lgkmWaitCnt, S_RUNNING, status, and vmWaitCnt.
Referenced by waitCntsSatisfied().
void Wavefront::computeActualWgSz | ( | HSAQueueEntry * | task | ) |
Definition at line 1405 of file wavefront.cc.
References actualWgSz, actualWgSzTotal, ArmISA::d, gridSz, HSAQueueEntry::MAX_DIM, HSAQueueEntry::wgId(), and workGroupSz.
void Wavefront::decExpInstsIssued | ( | ) |
Definition at line 1353 of file wavefront.cc.
References expInstsIssued.
void Wavefront::decLGKMInstsIssued | ( | ) |
Definition at line 1359 of file wavefront.cc.
References lgkmInstsIssued.
Referenced by Gcn3ISA::Inst_DS__DS_PERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), and GPUDynInst::resolveFlatSegment().
void Wavefront::decVMemInstsIssued | ( | ) |
Definition at line 1347 of file wavefront.cc.
References vmemInstsIssued.
Referenced by Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), and GPUDynInst::resolveFlatSegment().
void Wavefront::discardFetch | ( | ) |
clear the fetch buffer for this wave in order to remove any stale inst data
Definition at line 1188 of file wavefront.cc.
References computeUnit, dropFetch, ComputeUnit::fetchStage, FetchStage::fetchUnit(), FetchUnit::flushBuf(), instructionBuffer, pendingFetch, simdId, and wfSlotId.
Referenced by exec().
void Wavefront::exec | ( | ) |
If this wave is in S_WAITCNT state, then it should enter exec() precisely one time before the waitcnts are satisfied, in order to execute the waitcnt instruction itself; thus we assert that the waitcnt is the oldest instruction. If we enter exec() with active waitcnts, and we're not executing the waitcnt instruction, something must be wrong.
we return here to avoid spurious errors related to flat insts and their address segment resolution.
Definition at line 861 of file wavefront.cc.
References _gpuISA, ComputeUnit::ComputeUnitStats::activeLanesPerGMemInstrDist, ComputeUnit::ComputeUnitStats::activeLanesPerLMemInstrDist, computeUnit, ComputeUnit::ComputeUnitStats::controlFlowDivergenceDist, ComputeUnit::cu_id, Clocked::cyclesToTicks(), ComputeUnit::deleteFromPipeMap(), discardFetch(), DPRINTF, execMask(), ComputeUnit::ComputeUnitStats::execRateDist, fatal, ComputeUnit::getTokenManager(), Shader::hsail_mode, ArmISA::i, Shader::incVectorInstDstOperand(), Shader::incVectorInstSrcOperand(), ComputeUnit::ComputeUnitStats::instCyclesLdsPerSimd, ComputeUnit::ComputeUnitStats::instCyclesScMemPerSimd, ComputeUnit::ComputeUnitStats::instCyclesVMemPerSimd, ComputeUnit::instExecPerSimd, ComputeUnit::ComputeUnitStats::instInterleave, instructionBuffer, isGmInstruction(), isLmInstruction(), isOldestInstWaitcnt(), ComputeUnit::issuePeriod, ComputeUnit::lastExecCycle, lastInstExec, ArmISA::n, Stats::none, Wavefront::WavefrontStats::numInstrExecuted, ComputeUnit::ComputeUnitStats::numInstrExecuted, ComputeUnit::ComputeUnitStats::numVecOpsExecuted, ComputeUnit::ComputeUnitStats::numVecOpsExecutedF16, ComputeUnit::ComputeUnitStats::numVecOpsExecutedF32, ComputeUnit::ComputeUnitStats::numVecOpsExecutedF64, ComputeUnit::ComputeUnitStats::numVecOpsExecutedFMA16, ComputeUnit::ComputeUnitStats::numVecOpsExecutedFMA32, ComputeUnit::ComputeUnitStats::numVecOpsExecutedFMA64, ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAC16, ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAC32, ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAC64, ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAD16, ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAD32, ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAD64, ComputeUnit::ComputeUnitStats::numVecOpsExecutedTwoOpFP, panic, pc(), rawDist, Wavefront::WavefrontStats::readsPerWrite, TokenManager::recvTokens(), S_RETURNING, S_STALLED, S_STOPPED, S_WAITCNT, Stats::DistBase< Derived, Stor >::sample(), scalarAlu, ComputeUnit::scalarALUs, 
ComputeUnit::scalarMemUnit, WaitClass::set(), ComputeUnit::shader, simdId, Shader::SIMT, ComputeUnit::srf, ComputeUnit::srf_scm_bus_latency, ComputeUnit::srfToScalarMemPipeBus, stats, ComputeUnit::stats, status, ComputeUnit::ComputeUnitStats::totalCycles, ComputeUnit::updateInstStats(), Stats::ScalarBase< Derived, Stor >::value(), Wavefront::WavefrontStats::vecRawDistance, vecReads, ComputeUnit::vectorALUs, ComputeUnit::vectorGlobalMemUnit, ComputeUnit::vectorSharedMemUnit, ComputeUnit::vrf, ComputeUnit::vrf_gm_bus_latency, ComputeUnit::vrf_lm_bus_latency, ComputeUnit::vrfToGlobalMemPipeBus, ComputeUnit::vrfToLocalMemPipeBus, wfDynId, and wfSlotId.
Referenced by ExecStage::exec().
VectorMask & Wavefront::execMask | ( | ) |
Definition at line 1377 of file wavefront.cc.
References _execMask.
Referenced by Gcn3ISA::Inst_DS::calcAddr(), exec(), Gcn3ISA::Inst_SOP1__S_AND_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_OR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_XOR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_ANDN2_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_ORN2_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_NAND_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_NOR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOP1__S_XNOR_SAVEEXEC_B64::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECNZ::execute(), Gcn3ISA::Inst_VOP2__V_CNDMASK_B32::execute(), Gcn3ISA::Inst_VOP2__V_ADD_F32::execute(), Gcn3ISA::Inst_VOP2__V_SUB_F32::execute(), Gcn3ISA::Inst_VOP2__V_SUBREV_F32::execute(), Gcn3ISA::Inst_VOP2__V_MUL_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP2__V_MUL_F32::execute(), Gcn3ISA::Inst_VOP2__V_MUL_I32_I24::execute(), Gcn3ISA::Inst_VOP2__V_MUL_HI_I32_I24::execute(), Gcn3ISA::Inst_VOP2__V_MUL_U32_U24::execute(), Gcn3ISA::Inst_VOP2__V_MUL_HI_U32_U24::execute(), Gcn3ISA::Inst_VOP2__V_MIN_F32::execute(), Gcn3ISA::Inst_VOP2__V_MAX_F32::execute(), Gcn3ISA::Inst_VOP2__V_MIN_I32::execute(), Gcn3ISA::Inst_VOP2__V_MAX_I32::execute(), Gcn3ISA::Inst_VOP2__V_MIN_U32::execute(), Gcn3ISA::Inst_VOP2__V_MAX_U32::execute(), Gcn3ISA::Inst_VOP2__V_LSHRREV_B32::execute(), Gcn3ISA::Inst_VOP2__V_ASHRREV_I32::execute(), Gcn3ISA::Inst_VOP2__V_LSHLREV_B32::execute(), Gcn3ISA::Inst_VOP2__V_AND_B32::execute(), Gcn3ISA::Inst_VOP2__V_OR_B32::execute(), Gcn3ISA::Inst_VOP2__V_XOR_B32::execute(), Gcn3ISA::Inst_VOP2__V_MAC_F32::execute(), Gcn3ISA::Inst_VOP2__V_MADMK_F32::execute(), Gcn3ISA::Inst_VOP2__V_MADAK_F32::execute(), Gcn3ISA::Inst_VOP2__V_ADD_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUB_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUBREV_U32::execute(), Gcn3ISA::Inst_VOP2__V_ADDC_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUBB_U32::execute(), Gcn3ISA::Inst_VOP2__V_SUBBREV_U32::execute(), Gcn3ISA::Inst_VOP2__V_ADD_U16::execute(), 
Gcn3ISA::Inst_VOP2__V_SUB_U16::execute(), Gcn3ISA::Inst_VOP2__V_SUBREV_U16::execute(), Gcn3ISA::Inst_VOP2__V_MUL_LO_U16::execute(), Gcn3ISA::Inst_VOP2__V_LSHLREV_B16::execute(), Gcn3ISA::Inst_VOP2__V_LSHRREV_B16::execute(), Gcn3ISA::Inst_VOP2__V_ASHRREV_I16::execute(), Gcn3ISA::Inst_VOP2__V_MAX_U16::execute(), Gcn3ISA::Inst_VOP2__V_MAX_I16::execute(), Gcn3ISA::Inst_VOP2__V_MIN_U16::execute(), Gcn3ISA::Inst_VOP2__V_MIN_I16::execute(), Gcn3ISA::Inst_VOP1__V_MOV_B32::execute(), Gcn3ISA::Inst_VOP1__V_READFIRSTLANE_B32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_I32_F64::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F64_I32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_I32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_U32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_U32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_RPI_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_FLR_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_F64::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F64_F32::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE0::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE1::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE2::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F32_UBYTE3::execute(), Gcn3ISA::Inst_VOP1__V_CVT_U32_F64::execute(), Gcn3ISA::Inst_VOP1__V_CVT_F64_U32::execute(), Gcn3ISA::Inst_VOP1__V_TRUNC_F64::execute(), Gcn3ISA::Inst_VOP1__V_CEIL_F64::execute(), Gcn3ISA::Inst_VOP1__V_RNDNE_F64::execute(), Gcn3ISA::Inst_VOP1__V_FLOOR_F64::execute(), Gcn3ISA::Inst_VOP1__V_FRACT_F32::execute(), Gcn3ISA::Inst_VOP1__V_TRUNC_F32::execute(), Gcn3ISA::Inst_VOP1__V_CEIL_F32::execute(), Gcn3ISA::Inst_VOP1__V_RNDNE_F32::execute(), Gcn3ISA::Inst_VOP1__V_FLOOR_F32::execute(), Gcn3ISA::Inst_VOP1__V_EXP_F32::execute(), Gcn3ISA::Inst_VOP1__V_LOG_F32::execute(), Gcn3ISA::Inst_VOP1__V_RCP_F32::execute(), Gcn3ISA::Inst_VOP1__V_RCP_IFLAG_F32::execute(), Gcn3ISA::Inst_VOP1__V_RSQ_F32::execute(), Gcn3ISA::Inst_VOP1__V_RCP_F64::execute(), Gcn3ISA::Inst_VOP1__V_RSQ_F64::execute(), 
Gcn3ISA::Inst_VOP1__V_SQRT_F32::execute(), Gcn3ISA::Inst_VOP1__V_SQRT_F64::execute(), Gcn3ISA::Inst_VOP1__V_SIN_F32::execute(), Gcn3ISA::Inst_VOP1__V_COS_F32::execute(), Gcn3ISA::Inst_VOP1__V_NOT_B32::execute(), Gcn3ISA::Inst_VOP1__V_BFREV_B32::execute(), Gcn3ISA::Inst_VOP1__V_FFBH_U32::execute(), Gcn3ISA::Inst_VOP1__V_FFBL_B32::execute(), Gcn3ISA::Inst_VOP1__V_FFBH_I32::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_EXP_I32_F64::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_MANT_F64::execute(), Gcn3ISA::Inst_VOP1__V_FRACT_F64::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_EXP_I32_F32::execute(), Gcn3ISA::Inst_VOP1__V_FREXP_MANT_F32::execute(), Gcn3ISA::Inst_VOP1__V_EXP_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP1__V_LOG_LEGACY_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_CLASS_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_CLASS_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_CLASS_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_CLASS_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_O_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_U_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NEQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_TRU_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_F32::execute(), 
Gcn3ISA::Inst_VOPC__V_CMPX_O_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_U_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLG_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLE_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NEQ_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLT_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_TRU_F32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_O_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_U_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NGT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NEQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NLT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_TRU_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_O_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_U_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLG_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NGT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLE_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NEQ_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NLT_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_TRU_F64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_I16::execute(), 
Gcn3ISA::Inst_VOPC__V_CMP_EQ_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_I16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_U16::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_U32::execute(), 
Gcn3ISA::Inst_VOPC__V_CMP_GE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_I32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_U32::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_F_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_EQ_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_LE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_NE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_GE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMP_T_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_EQ_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_I64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_F_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LT_U64::execute(), 
Gcn3ISA::Inst_VOPC__V_CMPX_EQ_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_LE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GT_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_NE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_GE_U64::execute(), Gcn3ISA::Inst_VOPC__V_CMPX_T_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_CLASS_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_CLASS_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_CLASS_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_CLASS_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_TRU_F16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_F16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_TRU_F16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_O_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_U_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NEQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_TRU_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_O_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_U_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLG_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLE_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NEQ_F32::execute(), 
Gcn3ISA::Inst_VOP3__V_CMPX_NLT_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_TRU_F32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_O_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_U_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NGT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NEQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NLT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_TRU_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_O_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_U_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLG_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NGT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLE_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NEQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NLT_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_TRU_F64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_U16::execute(), 
Gcn3ISA::Inst_VOP3__V_CMP_LT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_I16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_U16::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_I32::execute(), 
Gcn3ISA::Inst_VOP3__V_CMPX_NE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_I32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_U32::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_F_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_EQ_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_LE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_NE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_GE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMP_T_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_I64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_F_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_EQ_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_LE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GT_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_NE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_GE_U64::execute(), Gcn3ISA::Inst_VOP3__V_CMPX_T_U64::execute(), Gcn3ISA::Inst_VOP3__V_CNDMASK_B32::execute(), 
Gcn3ISA::Inst_VOP3__V_ADD_F32::execute(), Gcn3ISA::Inst_VOP3__V_SUB_F32::execute(), Gcn3ISA::Inst_VOP3__V_SUBREV_F32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_F32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_I32_I24::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_I32_I24::execute(), Gcn3ISA::Inst_VOP3__V_MUL_U32_U24::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_U32_U24::execute(), Gcn3ISA::Inst_VOP3__V_MIN_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAX_F32::execute(), Gcn3ISA::Inst_VOP3__V_MIN_I32::execute(), Gcn3ISA::Inst_VOP3__V_MAX_I32::execute(), Gcn3ISA::Inst_VOP3__V_MIN_U32::execute(), Gcn3ISA::Inst_VOP3__V_MAX_U32::execute(), Gcn3ISA::Inst_VOP3__V_LSHRREV_B32::execute(), Gcn3ISA::Inst_VOP3__V_ASHRREV_I32::execute(), Gcn3ISA::Inst_VOP3__V_LSHLREV_B32::execute(), Gcn3ISA::Inst_VOP3__V_AND_B32::execute(), Gcn3ISA::Inst_VOP3__V_OR_B32::execute(), Gcn3ISA::Inst_VOP3__V_XOR_B32::execute(), Gcn3ISA::Inst_VOP3__V_MAC_F32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUB_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUBREV_U32::execute(), Gcn3ISA::Inst_VOP3__V_ADDC_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUBB_U32::execute(), Gcn3ISA::Inst_VOP3__V_SUBBREV_U32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_U16::execute(), Gcn3ISA::Inst_VOP3__V_SUB_U16::execute(), Gcn3ISA::Inst_VOP3__V_SUBREV_U16::execute(), Gcn3ISA::Inst_VOP3__V_MUL_LO_U16::execute(), Gcn3ISA::Inst_VOP3__V_LSHLREV_B16::execute(), Gcn3ISA::Inst_VOP3__V_LSHRREV_B16::execute(), Gcn3ISA::Inst_VOP3__V_ASHRREV_I16::execute(), Gcn3ISA::Inst_VOP3__V_MAX_U16::execute(), Gcn3ISA::Inst_VOP3__V_MAX_I16::execute(), Gcn3ISA::Inst_VOP3__V_MIN_U16::execute(), Gcn3ISA::Inst_VOP3__V_MIN_I16::execute(), Gcn3ISA::Inst_VOP3__V_MOV_B32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_I32_F64::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F64_I32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_I32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_U32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_U32_F32::execute(), 
Gcn3ISA::Inst_VOP3__V_CVT_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_RPI_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_FLR_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_F64::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F64_F32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE0::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE1::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE2::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F32_UBYTE3::execute(), Gcn3ISA::Inst_VOP3__V_CVT_U32_F64::execute(), Gcn3ISA::Inst_VOP3__V_CVT_F64_U32::execute(), Gcn3ISA::Inst_VOP3__V_TRUNC_F64::execute(), Gcn3ISA::Inst_VOP3__V_CEIL_F64::execute(), Gcn3ISA::Inst_VOP3__V_RNDNE_F64::execute(), Gcn3ISA::Inst_VOP3__V_FLOOR_F64::execute(), Gcn3ISA::Inst_VOP3__V_FRACT_F32::execute(), Gcn3ISA::Inst_VOP3__V_TRUNC_F32::execute(), Gcn3ISA::Inst_VOP3__V_CEIL_F32::execute(), Gcn3ISA::Inst_VOP3__V_RNDNE_F32::execute(), Gcn3ISA::Inst_VOP3__V_FLOOR_F32::execute(), Gcn3ISA::Inst_VOP3__V_EXP_F32::execute(), Gcn3ISA::Inst_VOP3__V_LOG_F32::execute(), Gcn3ISA::Inst_VOP3__V_RCP_F32::execute(), Gcn3ISA::Inst_VOP3__V_RCP_IFLAG_F32::execute(), Gcn3ISA::Inst_VOP3__V_RSQ_F32::execute(), Gcn3ISA::Inst_VOP3__V_RCP_F64::execute(), Gcn3ISA::Inst_VOP3__V_RSQ_F64::execute(), Gcn3ISA::Inst_VOP3__V_SQRT_F32::execute(), Gcn3ISA::Inst_VOP3__V_SQRT_F64::execute(), Gcn3ISA::Inst_VOP3__V_SIN_F32::execute(), Gcn3ISA::Inst_VOP3__V_COS_F32::execute(), Gcn3ISA::Inst_VOP3__V_NOT_B32::execute(), Gcn3ISA::Inst_VOP3__V_BFREV_B32::execute(), Gcn3ISA::Inst_VOP3__V_FFBH_U32::execute(), Gcn3ISA::Inst_VOP3__V_FFBL_B32::execute(), Gcn3ISA::Inst_VOP3__V_FFBH_I32::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_EXP_I32_F64::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_MANT_F64::execute(), Gcn3ISA::Inst_VOP3__V_FRACT_F64::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_EXP_I32_F32::execute(), Gcn3ISA::Inst_VOP3__V_FREXP_MANT_F32::execute(), Gcn3ISA::Inst_VOP3__V_EXP_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_LOG_LEGACY_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_LEGACY_F32::execute(), 
Gcn3ISA::Inst_VOP3__V_MAD_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_I32_I24::execute(), Gcn3ISA::Inst_VOP3__V_MAD_U32_U24::execute(), Gcn3ISA::Inst_VOP3__V_BFE_U32::execute(), Gcn3ISA::Inst_VOP3__V_BFE_I32::execute(), Gcn3ISA::Inst_VOP3__V_BFI_B32::execute(), Gcn3ISA::Inst_VOP3__V_FMA_F32::execute(), Gcn3ISA::Inst_VOP3__V_FMA_F64::execute(), Gcn3ISA::Inst_VOP3__V_LERP_U8::execute(), Gcn3ISA::Inst_VOP3__V_ALIGNBIT_B32::execute(), Gcn3ISA::Inst_VOP3__V_ALIGNBYTE_B32::execute(), Gcn3ISA::Inst_VOP3__V_MIN3_F32::execute(), Gcn3ISA::Inst_VOP3__V_MIN3_I32::execute(), Gcn3ISA::Inst_VOP3__V_MIN3_U32::execute(), Gcn3ISA::Inst_VOP3__V_MAX3_F32::execute(), Gcn3ISA::Inst_VOP3__V_MAX3_I32::execute(), Gcn3ISA::Inst_VOP3__V_MAX3_U32::execute(), Gcn3ISA::Inst_VOP3__V_MED3_F32::execute(), Gcn3ISA::Inst_VOP3__V_MED3_I32::execute(), Gcn3ISA::Inst_VOP3__V_MED3_U32::execute(), Gcn3ISA::Inst_VOP3__V_SAD_U8::execute(), Gcn3ISA::Inst_VOP3__V_SAD_HI_U8::execute(), Gcn3ISA::Inst_VOP3__V_SAD_U16::execute(), Gcn3ISA::Inst_VOP3__V_SAD_U32::execute(), Gcn3ISA::Inst_VOP3__V_CVT_PK_U8_F32::execute(), Gcn3ISA::Inst_VOP3__V_DIV_FIXUP_F32::execute(), Gcn3ISA::Inst_VOP3__V_DIV_FIXUP_F64::execute(), Gcn3ISA::Inst_VOP3__V_DIV_SCALE_F32::execute(), Gcn3ISA::Inst_VOP3__V_DIV_SCALE_F64::execute(), Gcn3ISA::Inst_VOP3__V_DIV_FMAS_F32::execute(), Gcn3ISA::Inst_VOP3__V_DIV_FMAS_F64::execute(), Gcn3ISA::Inst_VOP3__V_MAD_U64_U32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_I64_I32::execute(), Gcn3ISA::Inst_VOP3__V_MAD_U16::execute(), Gcn3ISA::Inst_VOP3__V_MAD_I16::execute(), Gcn3ISA::Inst_VOP3__V_PERM_B32::execute(), Gcn3ISA::Inst_VOP3__V_ADD_F64::execute(), Gcn3ISA::Inst_VOP3__V_MUL_F64::execute(), Gcn3ISA::Inst_VOP3__V_MIN_F64::execute(), Gcn3ISA::Inst_VOP3__V_MAX_F64::execute(), Gcn3ISA::Inst_VOP3__V_LDEXP_F64::execute(), Gcn3ISA::Inst_VOP3__V_MUL_LO_U32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_U32::execute(), Gcn3ISA::Inst_VOP3__V_MUL_HI_I32::execute(), Gcn3ISA::Inst_VOP3__V_LDEXP_F32::execute(), 
Gcn3ISA::Inst_VOP3__V_BCNT_U32_B32::execute(), Gcn3ISA::Inst_VOP3__V_MBCNT_LO_U32_B32::execute(), Gcn3ISA::Inst_VOP3__V_MBCNT_HI_U32_B32::execute(), Gcn3ISA::Inst_VOP3__V_LSHLREV_B64::execute(), Gcn3ISA::Inst_VOP3__V_LSHRREV_B64::execute(), Gcn3ISA::Inst_VOP3__V_ASHRREV_I64::execute(), Gcn3ISA::Inst_VOP3__V_BFM_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_PERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), 
Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), VectorRegisterFile::printReg(), Gcn3ISA::VecOperand< DataType, Const, NumDwords >::write(), and Gcn3ISA::ScalarOperand< DataType, Const, sizeof(DataType)/sizeof(VecElemU32) >::write().
bool Wavefront::execMask | ( | int | lane | ) | const |
Definition at line 1383 of file wavefront.cc.
References _execMask.
void Wavefront::freeRegisterFile | ( | ) |
Freeing VRF space.
Definition at line 1389 of file wavefront.cc.
References computeUnit, ArmISA::i, RegisterManager::mapVgpr(), maxVgprs, ComputeUnit::registerManager, reservedVectorRegs, simdId, startVgprIndex, ComputeUnit::vrf, and RegisterManager::vrfPoolMgrs.
void Wavefront::freeResources | ( | ) |
Definition at line 740 of file wavefront.cc.
References execUnitId.
Referenced by ExecStage::exec().
|
inline |
Definition at line 135 of file wavefront.hh.
References status.
Referenced by FetchUnit::exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), and ComputeUnit::releaseWFsFromBarrier().
|
inline |
Definition at line 287 of file wavefront.hh.
References _gpuISA.
bool Wavefront::hasBarrier | ( | ) | const |
Definition at line 1430 of file wavefront.cc.
References barId, and WFBarrier::InvalidID.
Referenced by ScheduleStage::addToSchList(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), and Gcn3ISA::Inst_SOPP__S_BARRIER::execute().
void Wavefront::incExpInstsIssued | ( | ) |
Definition at line 1335 of file wavefront.cc.
References expInstsIssued.
Referenced by ScheduleStage::exec().
void Wavefront::incLGKMInstsIssued | ( | ) |
Definition at line 1341 of file wavefront.cc.
References lgkmInstsIssued.
Referenced by ScheduleStage::exec().
void Wavefront::incVMemInstsIssued | ( | ) |
Definition at line 1329 of file wavefront.cc.
References vmemInstsIssued.
Referenced by ScheduleStage::exec().
|
virtual |
init() is called after all C++ SimObjects have been created and all ports are connected.
Initializations that are independent of unserialization but rely on a fully instantiated and connected SimObject graph should be done here.
Reimplemented from SimObject.
Definition at line 101 of file wavefront.cc.
References computeUnit, globalMem, localMem, ComputeUnit::mapWaveToGlobalMem(), ComputeUnit::mapWaveToLocalMem(), ComputeUnit::mapWaveToScalarAlu(), ComputeUnit::mapWaveToScalarAluGlobalIdx(), ComputeUnit::mapWaveToScalarMem(), reservedScalarRegs, reservedVectorRegs, scalarAlu, scalarAluGlobalIdx, scalarMem, startSgprIndex, and startVgprIndex.
void Wavefront::initRegState | ( | HSAQueueEntry * | task, |
int | wgSizeInWorkItems | ||
) |
Since flat scratch init is needed for this kernel, this kernel is going to have flat memory instructions and we need to initialize the hidden private base for this queue. scratch_resource_descriptor[0] has this queue's scratch base address. scratch_backing_memory_location has the offset to this queue's scratch base address from the SH_HIDDEN_PRIVATE_BASE_VMID. Ideally, we only require this queue's scratch base address for address calculation (stored in scratch_resource_descriptor[0]). But that address calculation should be done by first finding the queue's scratch base address using the calculation "SH_HIDDEN_PRIVATE_BASE_VMID + offset". So, we initialize SH_HIDDEN_PRIVATE_BASE_VMID.
For more details see: http://rocm-documentation.readthedocs.io/en/latest/ROCm_Compiler_SDK/ROCm-Native-ISA.html#flat-scratch
https://github.com/ROCm-Developer-Tools/ROCm-ComputeABI-Doc/blob/master/AMDGPU-ABI.md#flat-addressing
The compute_tmpring_size_wavesize specifies the number of kB allocated per wavefront, hence the multiplication by 1024.
To get the per-wavefront offset into the scratch memory, we also multiply this by the wfId. The wfId stored in the Wavefront class, however, is the wave ID within the WG, whereas here we need the global WFID because the scratch space will be divided amongst all waves in the kernel. To get the global ID we multiply the WGID by the WG size, then add the WFID of the wave within its WG.
Definition at line 116 of file wavefront.cc.
References HSAQueueEntry::amdQueue, bits(), _amd_queue_s::compute_tmpring_size_wavesize, computeUnit, ComputeUnit::cu_id, DispatchPtr, divCeil(), DPRINTF, fatal, FlatScratchInit, HSAQueueEntry::gridSize(), GridWorkgroupCountX, GridWorkgroupCountY, GridWorkgroupCountZ, HSAQueueEntry::hostAMDQueueAddr, HSAQueueEntry::hostDispPktAddr(), Shader::initShHiddenPrivateBase(), HSAQueueEntry::kernargAddr(), KernargSegPtr, RegisterManager::mapSgpr(), RegisterManager::mapVgpr(), NumScalarInitFields, NumVectorInitFields, PrivateSegBuf, PrivSegWaveByteOffset, QueuePtr, rawDist, ComputeUnit::registerManager, _amd_queue_s::scratch_backing_memory_location, _amd_queue_s::scratch_resource_descriptor, _amd_queue_s::scratch_workitem_byte_size, HSAQueueEntry::sgprBitEnabled(), ComputeUnit::shader, simdId, ComputeUnit::srf, HSAQueueEntry::vgprBitEnabled(), ComputeUnit::vrf, wfDynId, wfId, ComputeUnit::wfSize(), wfSlotId, wgId, HSAQueueEntry::wgSize(), wgSz, workGroupId, WorkgroupIdX, WorkgroupIdY, WorkgroupIdZ, WorkgroupInfo, workItemId, WorkitemIdX, WorkitemIdY, and WorkitemIdZ.
bool Wavefront::isGmInstruction | ( | GPUDynInstPtr | ii | ) |
Definition at line 565 of file wavefront.cc.
Referenced by exec().
bool Wavefront::isLmInstruction | ( | GPUDynInstPtr | ii | ) |
Definition at line 576 of file wavefront.cc.
Referenced by exec().
bool Wavefront::isOldestInstBarrier | ( | ) |
Definition at line 648 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
Referenced by ScheduleStage::addToSchList().
bool Wavefront::isOldestInstFlatMem | ( | ) |
Definition at line 713 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstGMem | ( | ) |
Definition at line 661 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstLMem | ( | ) |
Definition at line 687 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstPrivMem | ( | ) |
Definition at line 700 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstScalarALU | ( | ) |
Definition at line 618 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstScalarMem | ( | ) |
Definition at line 674 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstSleep | ( | ) |
Definition at line 587 of file wavefront.cc.
References instructionBuffer.
Referenced by ScheduleStage::addToSchList().
bool Wavefront::isOldestInstVectorALU | ( | ) |
Definition at line 633 of file wavefront.cc.
References instructionBuffer, S_STOPPED, and status.
bool Wavefront::isOldestInstWaitcnt | ( | ) |
Definition at line 601 of file wavefront.cc.
References instructionBuffer.
Referenced by ScheduleStage::addToSchList(), and exec().
GPUDynInstPtr Wavefront::nextInstr | ( | ) |
Definition at line 1169 of file wavefront.cc.
References computeUnit, instructionBuffer, and ComputeUnit::pipeMap.
Referenced by ScoreboardCheckStage::exec().
Addr Wavefront::pc | ( | ) | const |
Definition at line 1365 of file wavefront.cc.
References _pc.
Referenced by Gcn3ISA::GPUISA::advancePC(), exec(), Gcn3ISA::Inst_SOP1__S_GETPC_B64::execute(), Gcn3ISA::Inst_SOP1__S_SETPC_B64::execute(), Gcn3ISA::Inst_SOP1__S_SWAPPC_B64::execute(), Gcn3ISA::Inst_SOPP__S_BRANCH::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_SCC0::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_SCC1::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_VCCZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_VCCNZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECZ::execute(), Gcn3ISA::Inst_SOPP__S_CBRANCH_EXECNZ::execute(), and FetchUnit::initiateFetch().
void Wavefront::pc | ( | Addr | new_pc | ) |
Definition at line 1371 of file wavefront.cc.
References _pc.
void Wavefront::releaseBarrier | ( | ) |
Definition at line 1436 of file wavefront.cc.
References barId, and WFBarrier::InvalidID.
Referenced by Gcn3ISA::Inst_SOPP__S_ENDPGM::execute().
|
private |
Definition at line 759 of file wavefront.cc.
References execUnitId, globalMem, panic, rdGmReqsInPipe, scalarMem, scalarRdGmReqsInPipe, scalarWrGmReqsInPipe, and wrGmReqsInPipe.
Referenced by reserveResources().
|
private |
Definition at line 789 of file wavefront.cc.
References execUnitId, fatal_if, localMem, panic, rdLmReqsInPipe, and wrLmReqsInPipe.
Referenced by reserveResources().
std::vector< int > Wavefront::reserveResources | ( | ) |
Definition at line 807 of file wavefront.cc.
References execUnitId, fatal_if, flatGmUnitId, flatLmUnitId, instructionBuffer, panic, reserveGmResource(), reserveLmResource(), scalarAluGlobalIdx, and simdId.
Referenced by ScheduleStage::reserveResources().
void Wavefront::resizeRegFiles | ( | int | num_vregs, |
int | num_sregs | ||
) |
Definition at line 506 of file wavefront.cc.
|
inline |
Definition at line 248 of file wavefront.hh.
References computeUnit.
void Wavefront::setSleepTime | ( | int | sleep_time | ) |
Definition at line 1263 of file wavefront.cc.
References sleepCnt.
void Wavefront::setStatus | ( | status_e | newStatus | ) |
Definition at line 517 of file wavefront.cc.
References computeUnit, ComputeUnit::cu_id, curTick(), ComputeUnit::idleCUTimeout, ComputeUnit::idleWfs, lastNonIdleTick, Shader::n_wf, ComputeUnit::numVectorALUs, panic_if, S_BARRIER, S_STALLED, S_STOPPED, S_WAITCNT, ComputeUnit::shader, and status.
Referenced by ScheduleStage::addToSchList(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), and ComputeUnit::releaseWFsFromBarrier().
void Wavefront::setWaitCnts | ( | int | vm_wait_cnt, |
int | exp_wait_cnt, | ||
int | lgkm_wait_cnt | ||
) |
Prior waitcnts should be satisfied, at which time the WF resets them back to -1, indicating they are no longer active.
If the instruction encoding indicates a waitcnt of 0xf, that means the waitcnt is not being used.
Definition at line 1270 of file wavefront.cc.
References expWaitCnt, lgkmWaitCnt, S_WAITCNT, status, and vmWaitCnt.
bool Wavefront::sleepDone | ( | ) |
Definition at line 1244 of file wavefront.cc.
References S_RUNNING, S_STALLED_SLEEP, sleepCnt, and status.
void Wavefront::start | ( | uint64_t | _wfDynId, |
uint64_t | _base_ptr | ||
) |
bool Wavefront::stopFetch | ( | ) |
Definition at line 726 of file wavefront.cc.
References instructionBuffer.
Referenced by FetchUnit::exec().
void Wavefront::validateRequestCounters | ( | ) |
Definition at line 745 of file wavefront.cc.
References outstandingReqs, panic_if, rdGmReqsInPipe, rdLmReqsInPipe, simdId, wfDynId, wfSlotId, wrGmReqsInPipe, and wrLmReqsInPipe.
Referenced by Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_SWIZZLE_B32::execute(), Gcn3ISA::Inst_DS__DS_PERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), and Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute().
bool Wavefront::waitCntsSatisfied | ( | ) |
If we reach here, that means an s_waitcnt instruction was executed and the waitcnts are set by the execute method. Check if waitcnts are satisfied.
Definition at line 1201 of file wavefront.cc.
References clearWaitCnts(), expInstsIssued, expWaitCnt, lgkmInstsIssued, lgkmWaitCnt, vmemInstsIssued, and vmWaitCnt.
|
private |
Definition at line 328 of file wavefront.hh.
Referenced by execMask(), and Wavefront().
|
private |
Definition at line 298 of file wavefront.hh.
|
private |
Definition at line 327 of file wavefront.hh.
uint32_t Wavefront::actualWgSz[3] |
Definition at line 161 of file wavefront.hh.
Referenced by computeActualWgSz().
uint32_t Wavefront::actualWgSzTotal |
Definition at line 162 of file wavefront.hh.
Referenced by computeActualWgSz().
|
private |
Definition at line 329 of file wavefront.hh.
Referenced by barrierId(), hasBarrier(), and releaseBarrier().
ComputeUnit* Wavefront::computeUnit |
Definition at line 104 of file wavefront.hh.
Referenced by discardFetch(), exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), freeRegisterFile(), init(), initRegState(), nextInstr(), GPUDispatcher::notifyWgCompl(), GPUDynInst::resolveFlatSegment(), setParent(), and setStatus().
uint8_t* Wavefront::context |
Definition at line 240 of file wavefront.hh.
uint32_t Wavefront::dispatchId |
Definition at line 167 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_SOPP__S_ENDPGM::execute().
bool Wavefront::dropFetch |
Definition at line 110 of file wavefront.hh.
Referenced by discardFetch(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchUnit::fetch(), FetchUnit::processFetchReturn(), ComputeUnit::ITLBPort::recvTimingResp(), and Wavefront().
int Wavefront::execUnitId |
Definition at line 100 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_SMEM__S_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX16::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX16::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX4::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_SWIZZLE_B32::execute(), Gcn3ISA::Inst_DS__DS_PERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), 
Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), freeResources(), reserveGmResource(), reserveLmResource(), reserveResources(), GPUDynInst::resolveFlatSegment(), and Wavefront().
|
private |
Definition at line 323 of file wavefront.hh.
Referenced by decExpInstsIssued(), incExpInstsIssued(), and waitCntsSatisfied().
|
private |
Definition at line 320 of file wavefront.hh.
Referenced by clearWaitCnts(), setWaitCnts(), and waitCntsSatisfied().
int Wavefront::flatGmUnitId |
Definition at line 102 of file wavefront.hh.
Referenced by reserveResources(), and GPUDynInst::resolveFlatSegment().
int Wavefront::flatLmUnitId |
Definition at line 101 of file wavefront.hh.
Referenced by reserveResources(), and GPUDynInst::resolveFlatSegment().
int Wavefront::globalMem |
Definition at line 124 of file wavefront.hh.
Referenced by init(), reserveGmResource(), and ScheduleStage::reserveResources().
uint32_t Wavefront::gridSz[3] |
Definition at line 157 of file wavefront.hh.
Referenced by computeActualWgSz().
VectorMask Wavefront::initMask |
Definition at line 217 of file wavefront.hh.
std::deque<GPUDynInstPtr> Wavefront::instructionBuffer |
Definition at line 107 of file wavefront.hh.
Referenced by discardFetch(), ExecStage::dumpDispList(), ScheduleStage::exec(), exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), isOldestInstBarrier(), isOldestInstFlatMem(), isOldestInstGMem(), isOldestInstLMem(), isOldestInstPrivMem(), isOldestInstScalarALU(), isOldestInstScalarMem(), isOldestInstSleep(), isOldestInstVectorALU(), isOldestInstWaitcnt(), nextInstr(), FetchUnit::processFetchReturn(), ComputeUnit::ITLBPort::recvTimingResp(), reserveResources(), ScheduleStage::scheduleRfDestOperands(), and stopFetch().
int Wavefront::kernId |
Definition at line 95 of file wavefront.hh.
Referenced by GPUDynInst::GPUDynInst(), GPUDispatcher::isReachingKernelEnd(), and GPUDispatcher::notifyWgCompl().
std::vector<Addr> Wavefront::lastAddr |
Definition at line 151 of file wavefront.hh.
Referenced by Wavefront().
uint64_t Wavefront::lastInstExec |
Definition at line 227 of file wavefront.hh.
Referenced by exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), and Wavefront().
Tick Wavefront::lastNonIdleTick |
Definition at line 112 of file wavefront.hh.
Referenced by setStatus(), and Wavefront().
uint64_t Wavefront::lastTrace |
Definition at line 190 of file wavefront.hh.
Referenced by Wavefront().
LdsChunk* Wavefront::ldsChunk |
Definition at line 221 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_DS::initDualMemRead(), Gcn3ISA::Inst_DS::initDualMemWrite(), Gcn3ISA::Inst_DS::initMemRead(), Gcn3ISA::Inst_DS::initMemWrite(), and Wavefront().
|
private |
Definition at line 324 of file wavefront.hh.
Referenced by decLGKMInstsIssued(), incLGKMInstsIssued(), and waitCntsSatisfied().
|
private |
Definition at line 321 of file wavefront.hh.
Referenced by clearWaitCnts(), setWaitCnts(), and waitCntsSatisfied().
int Wavefront::localMem |
Definition at line 125 of file wavefront.hh.
Referenced by ScheduleStage::arbitrateVrfToLdsBus(), init(), reserveLmResource(), ScheduleStage::reserveResources(), and ScheduleStage::scheduleRfDestOperands().
uint32_t Wavefront::maxDynWaveId |
Definition at line 166 of file wavefront.hh.
int Wavefront::maxIbSize |
Definition at line 105 of file wavefront.hh.
Referenced by FetchUnit::FetchBufDesc::allocateBuf().
uint32_t Wavefront::maxSgprs |
Definition at line 131 of file wavefront.hh.
Referenced by resizeRegFiles(), GPUDynInst::resolveFlatSegment(), and Wavefront().
uint32_t Wavefront::maxVgprs |
Definition at line 129 of file wavefront.hh.
Referenced by freeRegisterFile(), resizeRegFiles(), start(), and Wavefront().
int Wavefront::memTraceBusy |
Definition at line 189 of file wavefront.hh.
Referenced by Wavefront().
std::vector<uint64_t> Wavefront::oldDgpr |
Definition at line 210 of file wavefront.hh.
Referenced by Wavefront().
uint32_t Wavefront::oldDgprId |
Definition at line 212 of file wavefront.hh.
uint64_t Wavefront::oldDgprTcnt |
Definition at line 214 of file wavefront.hh.
Referenced by Wavefront().
std::vector<uint32_t> Wavefront::oldVgpr |
Definition at line 203 of file wavefront.hh.
Referenced by Wavefront().
uint32_t Wavefront::oldVgprId |
Definition at line 205 of file wavefront.hh.
uint64_t Wavefront::oldVgprTcnt |
Definition at line 207 of file wavefront.hh.
Referenced by Wavefront().
int Wavefront::outstandingReqs |
Definition at line 169 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), validateRequestCounters(), and Wavefront().
int Wavefront::outstandingReqsRdGm |
Definition at line 175 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), and Wavefront().
int Wavefront::outstandingReqsRdLm |
Definition at line 177 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), and Wavefront().
int Wavefront::outstandingReqsWrGm |
Definition at line 171 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), and Wavefront().
int Wavefront::outstandingReqsWrLm |
Definition at line 173 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), and Wavefront().
bool Wavefront::pendingFetch |
Definition at line 109 of file wavefront.hh.
Referenced by discardFetch(), FetchUnit::exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchUnit::fetch(), FetchUnit::processFetchReturn(), ComputeUnit::ITLBPort::recvTimingResp(), and Wavefront().
std::unordered_map<int,uint64_t> Wavefront::rawDist |
Definition at line 231 of file wavefront.hh.
Referenced by exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), initRegState(), and Wavefront().
int Wavefront::rdGmReqsInPipe |
Definition at line 183 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), reserveGmResource(), GPUDynInst::resolveFlatSegment(), validateRequestCounters(), and Wavefront().
int Wavefront::rdLmReqsInPipe |
Definition at line 182 of file wavefront.hh.
Referenced by ScheduleStage::dispatchReady(), Gcn3ISA::Inst_DS__DS_READ_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2_B32::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_U8::execute(), Gcn3ISA::Inst_DS__DS_READ_U16::execute(), Gcn3ISA::Inst_DS__DS_SWIZZLE_B32::execute(), Gcn3ISA::Inst_DS__DS_PERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_BPERMUTE_B32::execute(), Gcn3ISA::Inst_DS__DS_READ_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2_B64::execute(), Gcn3ISA::Inst_DS__DS_READ2ST64_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_UBYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_USHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), reserveLmResource(), GPUDynInst::resolveFlatSegment(), validateRequestCounters(), and Wavefront().
int Wavefront::reservedScalarRegs |
Definition at line 194 of file wavefront.hh.
Referenced by init(), Gcn3ISA::ScalarOperand< DataType, Const, sizeof(DataType)/sizeof(VecElemU32) >::regIdx(), and Wavefront().
int Wavefront::reservedVectorRegs |
Definition at line 192 of file wavefront.hh.
Referenced by freeRegisterFile(), init(), and Wavefront().
int Wavefront::scalarAlu |
Definition at line 119 of file wavefront.hh.
Referenced by ScheduleStage::dispatchReady(), exec(), and init().
int Wavefront::scalarAluGlobalIdx |
Definition at line 123 of file wavefront.hh.
Referenced by init(), and reserveResources().
int Wavefront::scalarMem |
Definition at line 126 of file wavefront.hh.
Referenced by init(), and reserveGmResource().
int Wavefront::scalarOutstandingReqsRdGm |
Definition at line 179 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_SMEM__S_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX16::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX16::execute(), and Wavefront().
int Wavefront::scalarOutstandingReqsWrGm |
Definition at line 181 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_SMEM__S_STORE_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX4::execute(), and Wavefront().
int Wavefront::scalarRdGmReqsInPipe |
Definition at line 186 of file wavefront.hh.
Referenced by ScheduleStage::dispatchReady(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_LOAD_DWORDX16::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX8::execute(), Gcn3ISA::Inst_SMEM__S_BUFFER_LOAD_DWORDX16::execute(), reserveGmResource(), and Wavefront().
int Wavefront::scalarWrGmReqsInPipe |
Definition at line 187 of file wavefront.hh.
Referenced by ScheduleStage::dispatchReady(), Gcn3ISA::Inst_SMEM__S_STORE_DWORD::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX2::execute(), Gcn3ISA::Inst_SMEM__S_STORE_DWORDX4::execute(), reserveGmResource(), and Wavefront().
const int Wavefront::simdId |
Definition at line 97 of file wavefront.hh.
Referenced by ScheduleStage::addToSchList(), ScheduleStage::checkRfOperandReadComplete(), discardFetch(), ScheduleStage::dispatchReady(), ExecStage::dumpDispList(), ScoreboardCheckStage::exec(), ExecStage::exec(), exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_UBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_SBYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_USHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_LOAD_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), FetchStage::fetch(), FetchUnit::fetch(), freeRegisterFile(), GPUDynInst::GPUDynInst(), FetchUnit::initiateFetch(), initRegState(), VectorRegisterFile::printReg(), ScalarRegisterFile::printReg(), FetchStage::processFetchReturn(), FetchUnit::processFetchReturn(), Gcn3ISA::VecOperand< DataType, Const, NumDwords >::read(), Gcn3ISA::ScalarOperand< DataType, Const, sizeof(DataType)/sizeof(VecElemU32) >::read(), ScheduleStage::reserveResources(), reserveResources(), ScheduleStage::schedRfWrites(), validateRequestCounters(), Gcn3ISA::VecOperand< DataType, Const, NumDwords >::write(), and Gcn3ISA::ScalarOperand< DataType, Const, sizeof(DataType)/sizeof(VecElemU32) >::write().
int Wavefront::sleepCnt |
private |
Definition at line 325 of file wavefront.hh.
Referenced by setSleepTime(), and sleepDone().
uint32_t Wavefront::startSgprIndex |
Definition at line 200 of file wavefront.hh.
Referenced by init(), and Wavefront().
uint32_t Wavefront::startVgprIndex |
Definition at line 197 of file wavefront.hh.
Referenced by freeRegisterFile(), init(), and Wavefront().
Wavefront::WavefrontStats Wavefront::stats |
status_e Wavefront::status |
private |
Definition at line 326 of file wavefront.hh.
Referenced by clearWaitCnts(), exec(), getStatus(), isOldestInstBarrier(), isOldestInstFlatMem(), isOldestInstGMem(), isOldestInstLMem(), isOldestInstPrivMem(), isOldestInstScalarALU(), isOldestInstScalarMem(), isOldestInstVectorALU(), setStatus(), setWaitCnts(), sleepDone(), start(), and Wavefront().
std::vector<int> Wavefront::vecReads |
Definition at line 235 of file wavefront.hh.
Referenced by exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), start(), and Wavefront().
int Wavefront::vmemInstsIssued |
private |
Definition at line 322 of file wavefront.hh.
Referenced by decVMemInstsIssued(), incVMemInstsIssued(), and waitCntsSatisfied().
int Wavefront::vmWaitCnt |
private |
The following are used for waitcnt instructions. vmWaitCnt: once set, we wait for the outstanding number of vector mem instructions to be at, or below, vmWaitCnt.
expWaitCnt: once set, we wait for the outstanding number of VM writes or EXP insts to be at, or below, expWaitCnt.
lgkmWaitCnt: once set, we wait for the outstanding number of LDS, GDS, scalar memory, and message instructions to be at, or below, lgkmWaitCnt. We currently do not support GDS/message ops.
Definition at line 319 of file wavefront.hh.
Referenced by clearWaitCnts(), setWaitCnts(), and waitCntsSatisfied().
uint64_t Wavefront::wfDynId |
Definition at line 224 of file wavefront.hh.
Referenced by OFSchedulingPolicy::__chooseWave(), ScheduleStage::addToSchList(), ScheduleStage::checkRfOperandReadComplete(), ExecStage::dumpDispList(), ExecStage::exec(), ScoreboardCheckStage::exec(), exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), GPUDynInst::GPUDynInst(), FetchUnit::initiateFetch(), initRegState(), VectorRegisterFile::printReg(), ScalarRegisterFile::printReg(), ScheduleStage::reserveResources(), start(), and validateRequestCounters().
uint32_t Wavefront::wfId |
Definition at line 165 of file wavefront.hh.
Referenced by initRegState().
const int Wavefront::wfSlotId |
Definition at line 94 of file wavefront.hh.
Referenced by discardFetch(), FetchUnit::exec(), exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), Gcn3ISA::Inst_SOPP__S_BARRIER::execute(), FetchUnit::fetch(), GPUDynInst::GPUDynInst(), FetchUnit::init(), FetchUnit::initiateFetch(), initRegState(), VectorRegisterFile::printReg(), ScalarRegisterFile::printReg(), FetchUnit::processFetchReturn(), and validateRequestCounters().
uint32_t Wavefront::wgId |
Definition at line 158 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), GPUDynInst::GPUDynInst(), initRegState(), and GPUDispatcher::notifyWgCompl().
uint32_t Wavefront::wgSz |
Definition at line 159 of file wavefront.hh.
Referenced by initRegState().
uint32_t Wavefront::workGroupId[3] |
Definition at line 155 of file wavefront.hh.
Referenced by initRegState().
uint32_t Wavefront::workGroupSz[3] |
Definition at line 156 of file wavefront.hh.
Referenced by computeActualWgSz().
std::vector<uint32_t> Wavefront::workItemFlatId |
Definition at line 153 of file wavefront.hh.
Referenced by Wavefront().
std::vector<uint32_t> Wavefront::workItemId[3] |
Definition at line 152 of file wavefront.hh.
Referenced by initRegState(), and Wavefront().
int Wavefront::wrGmReqsInPipe |
Definition at line 185 of file wavefront.hh.
Referenced by Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_WBINVL1_VOL::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), reserveGmResource(), GPUDynInst::resolveFlatSegment(), validateRequestCounters(), and Wavefront().
int Wavefront::wrLmReqsInPipe |
Definition at line 184 of file wavefront.hh.
Referenced by ScheduleStage::dispatchReady(), Gcn3ISA::Inst_DS__DS_WRITE_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE2ST64_B32::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B8::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B16::execute(), Gcn3ISA::Inst_DS__DS_WRITE_B64::execute(), Gcn3ISA::Inst_DS__DS_WRITE2_B64::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_BYTE::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_SHORT::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORD::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX2::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX3::execute(), Gcn3ISA::Inst_MUBUF__BUFFER_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_BYTE::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_SHORT::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORD::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX2::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX3::execute(), Gcn3ISA::Inst_FLAT__FLAT_STORE_DWORDX4::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_ADD_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_SUB_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_INC_X2::execute(), Gcn3ISA::Inst_FLAT__FLAT_ATOMIC_DEC_X2::execute(), reserveLmResource(), GPUDynInst::resolveFlatSegment(), validateRequestCounters(), and Wavefront().