gem5
v20.0.0.3
|
#include <compute_unit.hh>
Classes | |
class | CUExitCallback |
class | DataPort |
Data access Port. More... | |
class | DTLBPort |
Data TLB port. More... | |
class | ITLBPort |
class | LDSPort |
The port intended to communicate between the CU and its LDS. More... | |
class | SQCPort |
class | waveIdentifier |
class | waveQueue |
Public Types | |
typedef ComputeUnitParams | Params |
typedef std::unordered_map< Addr, std::pair< int, int > > | pageDataStruct |
![]() | |
typedef ClockedObjectParams | Params |
Parameters of ClockedObject. More... | |
![]() | |
typedef SimObjectParams | Params |
Public Member Functions | |
void | registerEvent (uint32_t simdId, uint32_t regIdx, uint32_t operandSize, uint64_t when, uint8_t newStatus) |
void | updateEvents () |
ComputeUnit (const Params *p) | |
~ComputeUnit () | |
int | spBypassLength () |
int | dpBypassLength () |
int | storeBusLength () |
int | loadBusLength () |
int | wfSize () const |
void | resizeRegFiles (int num_cregs, int num_sregs, int num_dregs) |
void | exec () |
void | initiateFetch (Wavefront *wavefront) |
void | fetch (PacketPtr pkt, Wavefront *wavefront) |
void | fillKernelState (Wavefront *w, NDRange *ndr) |
void | startWavefront (Wavefront *w, int waveId, LdsChunk *ldsChunk, NDRange *ndr) |
void | StartWorkgroup (NDRange *ndr) |
int | ReadyWorkgroup (NDRange *ndr) |
bool | isVecAlu (int unitId) |
bool | isGlbMem (int unitId) |
bool | isShrMem (int unitId) |
int | GlbMemUnitId () |
int | ShrMemUnitId () |
int | nextGlbRdBus () |
int | nextLocRdBus () |
int | AllAtBarrier (uint32_t _barrier_id, uint32_t bcnt, uint32_t bslots) |
bool | cedeSIMD (int simdId, int wfSlotId) |
template<typename c0 , typename c1 > | |
void | doSmReturn (GPUDynInstPtr gpuDynInst) |
virtual void | init () override |
init() is called after all C++ SimObjects have been created and all ports are connected. More... | |
void | sendRequest (GPUDynInstPtr gpuDynInst, int index, PacketPtr pkt) |
void | sendSyncRequest (GPUDynInstPtr gpuDynInst, int index, PacketPtr pkt) |
void | injectGlobalMemFence (GPUDynInstPtr gpuDynInst, bool kernelLaunch=true, RequestPtr req=nullptr) |
void | handleMemPacket (PacketPtr pkt, int memport_index) |
bool | processTimingPacket (PacketPtr pkt) |
void | processFetchReturn (PacketPtr pkt) |
void | updatePageDivergenceDist (Addr addr) |
MasterID | masterId () |
bool | isDone () const |
bool | isSimdDone (uint32_t) const |
void | updateInstStats (GPUDynInstPtr gpuDynInst) |
void | regStats () override |
Callback to set stat parameters. More... | |
LdsState & | getLds () const |
int32_t | getRefCounter (const uint32_t dispatchId, const uint32_t wgId) const |
int | cacheLineSize () const |
bool | sendToLds (GPUDynInstPtr gpuDynInst) __attribute__((warn_unused_result)) |
Send a general request to the LDS. Make sure to check the return value here: your request might be NACK'd, and a return value of false means that you need to have some backup plan. More... | |
LDSPort * | getLdsPort () const |
Port & | getPort (const std::string &if_name, PortID idx) override |
Get a port with a given name and index. More... | |
uint64_t | getAndIncSeqNum () |
![]() | |
ClockedObject (const ClockedObjectParams *p) | |
const Params * | params () const |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
![]() | |
virtual | ~SimObject () |
virtual const std::string | name () const |
virtual void | loadState (CheckpointIn &cp) |
loadState() is called on each SimObject when restoring from a checkpoint. More... | |
virtual void | initState () |
initState() is called on each SimObject when not restoring from a checkpoint. More... | |
virtual void | regProbePoints () |
Register probe points for this object. More... | |
virtual void | regProbeListeners () |
Register probe listeners for this object. More... | |
ProbeManager * | getProbeManager () |
Get the probe manager for this object. More... | |
virtual void | startup () |
startup() is the final initialization call before simulation. More... | |
DrainState | drain () override |
Provide a default implementation of the drain interface for objects that don't need draining. More... | |
virtual void | memWriteback () |
Write back dirty buffers to memory using functional writes. More... | |
virtual void | memInvalidate () |
Invalidate the contents of memory buffers. More... | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
const Params * | params () const |
SimObject (const Params *_params) | |
![]() | |
EventQueue * | eventQueue () const |
void | schedule (Event &event, Tick when) |
void | deschedule (Event &event) |
void | reschedule (Event &event, Tick when, bool always=false) |
void | schedule (Event *event, Tick when) |
void | deschedule (Event *event) |
void | reschedule (Event *event, Tick when, bool always=false) |
void | wakeupEventQueue (Tick when=(Tick) -1) |
void | setCurTick (Tick newVal) |
EventManager (EventManager &em) | |
EventManager (EventManager *em) | |
EventManager (EventQueue *eq) | |
![]() | |
Serializable () | |
virtual | ~Serializable () |
void | serializeSection (CheckpointOut &cp, const char *name) const |
Serialize an object into a new section. More... | |
void | serializeSection (CheckpointOut &cp, const std::string &name) const |
void | unserializeSection (CheckpointIn &cp, const char *name) |
Unserialize a child object. More... | |
void | unserializeSection (CheckpointIn &cp, const std::string &name) |
![]() | |
DrainState | drainState () const |
Return the current drain state of an object. More... | |
virtual void | notifyFork () |
Notify a child process of a fork. More... | |
![]() | |
Group (Group *parent, const char *name=nullptr) | |
Construct a new statistics group. More... | |
virtual | ~Group () |
virtual void | resetStats () |
Callback to reset stats. More... | |
virtual void | preDumpStats () |
Callback before stats are dumped. More... | |
void | addStat (Stats::Info *info) |
Register a stat with this group. More... | |
const std::map< std::string, Group * > & | getStatGroups () const |
Get all child groups associated with this object. More... | |
const std::vector< Info * > & | getStats () const |
Get all stats associated with this object. More... | |
void | addStatGroup (const char *name, Group *block) |
Add a stat block as a child of this block. More... | |
const Info * | resolveStat (std::string name) const |
Resolve a stat by its name within this group. More... | |
Group ()=delete | |
Group (const Group &)=delete | |
Group & | operator= (const Group &)=delete |
![]() | |
void | updateClockPeriod () |
Update the tick to the current tick. More... | |
Tick | clockEdge (Cycles cycles=Cycles(0)) const |
Determine the tick when a cycle begins, by default the current one, but the argument also enables the caller to determine a future cycle. More... | |
Cycles | curCycle () const |
Determine the current cycle, corresponding to a tick aligned to a clock edge. More... | |
Tick | nextCycle () const |
Based on the clock of the object, determine the start tick of the first cycle that is at least one cycle in the future. More... | |
uint64_t | frequency () const |
Tick | clockPeriod () const |
double | voltage () const |
Cycles | ticksToCycles (Tick t) const |
Tick | cyclesToTicks (Cycles c) const |
Protected Attributes | |
MasterID | _masterId |
LdsState & | lds |
![]() | |
const SimObjectParams * | _params |
Cached copy of the object parameters. More... | |
![]() | |
EventQueue * | eventq |
A pointer to this object's event queue. More... | |
Private Attributes | |
const int | _cacheLineSize |
uint64_t | globalSeqNum |
int | wavefrontSize |
GPUStaticInst * | kernelLaunchInst |
Additional Inherited Members | |
![]() | |
static void | serializeAll (CheckpointOut &cp) |
Serialize all SimObjects in the system. More... | |
static SimObject * | find (const char *name) |
Find the SimObject with the given name and return a pointer to it. More... | |
![]() | |
static const std::string & | currentSection () |
Gets the fully-qualified name of the active section. More... | |
static void | serializeAll (const std::string &cpt_dir) |
static void | unserializeGlobals (CheckpointIn &cp) |
![]() | |
Drainable () | |
virtual | ~Drainable () |
virtual void | drainResume () |
Resume execution after a successful drain. More... | |
void | signalDrainDone () const |
Signal that an object is drained. More... | |
![]() | |
Clocked (ClockDomain &clk_domain) | |
Create a clocked object and set the clock domain based on the parameters. More... | |
Clocked (Clocked &)=delete | |
Clocked & | operator= (Clocked &)=delete |
virtual | ~Clocked () |
Virtual destructor due to inheritance. More... | |
void | resetClock () const |
Reset the object's clock using the current global tick value. More... | |
virtual void | clockPeriodUpdated () |
A hook subclasses can implement so they can do any extra work that's needed when the clock rate is changed. More... | |
Definition at line 91 of file compute_unit.hh.
typedef std::unordered_map<Addr, std::pair<int, int> > ComputeUnit::pageDataStruct |
Definition at line 396 of file compute_unit.hh.
typedef ComputeUnitParams ComputeUnit::Params |
Definition at line 132 of file compute_unit.hh.
ComputeUnit::ComputeUnit | ( | const Params * | p | ) |
This check is necessary because std::bitset only provides conversion to unsigned long or unsigned long long via to_ulong() or to_ullong(). There are a few places in the code where to_ullong() is used; however, if VSZ is larger than a value the host can support, then bitset will throw a runtime exception. We should remove all use of to_ulong() or to_ullong() so we can have VSZ greater than 64b; however, until that is done, this assert is required.
Definition at line 58 of file compute_unit.cc.
References coalescerToVrfBusWidth, cuExitCallback, exec_policy, fatal, fatal_if, ArmISA::i, isPowerOf2(), ArmISA::j, MipsISA::k, lastExecCycle, lastVaddrCU, lastVaddrSimd, lastVaddrWF, lds, memPort, numCyclesPerLoadTransfer, numCyclesPerStoreTransfer, numSIMDs, numVecRegsPerSimd, OLDEST, perLaneTLB, registerExitCallback(), RR, LdsState::setParent(), tlbPort, vrf, vrfToCoalescerBusWidth, wavefrontSize, wfList, wfSize(), and xactCasLoadMap.
Referenced by ComputeUnit::DataPort::processMemRespEvent().
ComputeUnit::~ComputeUnit | ( | ) |
Definition at line 159 of file compute_unit.cc.
References cuExitCallback, dispatchList, ArmISA::i, ArmISA::j, lastVaddrCU, lastVaddrSimd, ldsPort, Shader::n_wf, numSIMDs, readyList, shader, vectorAluInstAvail, waveStatusList, and wfList.
int ComputeUnit::AllAtBarrier | ( | uint32_t | _barrier_id, |
uint32_t | bcnt, | ||
uint32_t | bslots | ||
) |
Definition at line 445 of file compute_unit.cc.
References Wavefront::barrierCnt, Wavefront::barrierId, cu_id, DPRINTF, Shader::n_wf, numSIMDs, Wavefront::outstandingReqs, Wavefront::S_RUNNING, shader, Wavefront::status, MipsISA::w, and wfList.
Referenced by nextLocRdBus(), and Wavefront::ready().
|
inline |
Definition at line 391 of file compute_unit.hh.
References __attribute__(), _cacheLineSize, and sendToLds().
Referenced by FetchUnit::initiateFetch().
bool ComputeUnit::cedeSIMD | ( | int | simdId, |
int | wfSlotId | ||
) |
Definition at line 483 of file compute_unit.cc.
References ComputeUnit::waveIdentifier::simdId, ComputeUnit::waveIdentifier::wfSlotId, xact_cas_mode, and xactCasLoadMap.
Referenced by ScoreboardCheckStage::exec(), and nextLocRdBus().
void ComputeUnit::doSmReturn | ( | GPUDynInstPtr | gpuDynInst | ) |
Referenced by nextLocRdBus().
|
inline |
Definition at line 246 of file compute_unit.hh.
References dpBypassPipeLength.
Referenced by VectorRegisterFile::exec().
void ComputeUnit::exec | ( | ) |
Definition at line 531 of file compute_unit.cc.
References FetchStage::exec(), ScheduleStage::exec(), LocalMemPipeline::exec(), GlobalMemPipeline::exec(), ScoreboardCheckStage::exec(), ExecStage::exec(), execStage, fetchStage, globalMemoryPipe, localMemoryPipe, scheduleStage, scoreboardCheckStage, totalCycles, and updateEvents().
Referenced by wfSize().
Definition at line 178 of file compute_unit.cc.
References HsaQueueEntry::args, Wavefront::computeActualWgSz(), HsaQueueEntry::cRegCount, HsaQueueEntry::dRegCount, HsaQueueEntry::gdSize, Wavefront::gridSz, Wavefront::kernelArgs, HsaQueueEntry::privMemPerItem, Wavefront::privSizePerItem, NDRange::q, Wavefront::resizeRegFiles(), Wavefront::roBase, HsaQueueEntry::roMemStart, HsaQueueEntry::roMemTotal, Wavefront::roSize, HsaQueueEntry::spillMemPerItem, Wavefront::spillSizePerItem, HsaQueueEntry::sRegCount, HsaQueueEntry::wgSize, Wavefront::wgSz, and Wavefront::workGroupSz.
Referenced by StartWorkgroup(), and wfSize().
|
inline |
Definition at line 739 of file compute_unit.hh.
References globalSeqNum.
Referenced by StartWorkgroup().
|
inline |
Definition at line 383 of file compute_unit.hh.
References getRefCounter(), and lds.
Referenced by HsailISA::Ret::execute(), and Gcn3ISA::Inst_SOPP__S_ENDPGM::execute().
|
inline |
Definition at line 675 of file compute_unit.hh.
References ldsPort.
Get a port with a given name and index.
This is used at binding time and returns a reference to a protocol-agnostic port.
if_name | Port name |
idx | Index in the case of a VectorPort |
Reimplemented from SimObject.
Definition at line 692 of file compute_unit.hh.
References csprintf(), fatal, ldsPort, SimObject::name(), panic, sqcPort, and sqcTLBPort.
int32_t ComputeUnit::getRefCounter | ( | const uint32_t | dispatchId, |
const uint32_t | wgId | ||
) | const |
Definition at line 1757 of file compute_unit.cc.
References LdsState::getRefCounter(), and lds.
Referenced by getLds(), and Wavefront::ready().
|
inline |
Definition at line 266 of file compute_unit.hh.
References GLBMEM_PIPE.
Referenced by ScoreboardCheckStage::exec(), Wavefront::exec(), and Wavefront::updateResources().
void ComputeUnit::handleMemPacket | ( | PacketPtr | pkt, |
int | memport_index | ||
) |
Referenced by nextLocRdBus().
|
overridevirtual |
init() is called after all C++ SimObjects have been created and all ports are connected.
Initializations that are independent of unserialization but rely on a fully instantiated and connected SimObject graph should be done here.
Reimplemented from SimObject.
Definition at line 547 of file compute_unit.cc.
References aluPipe, BLOCKED, dispatchList, EMPTY, execStage, fatal_if, fetchStage, Shader::funcargs_size, glbMemInstAvail, glbMemToVrfBus, globalMemoryPipe, ArmISA::i, WaitClass::init(), FetchStage::init(), ScheduleStage::init(), LocalMemPipeline::init(), GlobalMemPipeline::init(), ScoreboardCheckStage::init(), ExecStage::init(), ArmISA::j, localMemoryPipe, locMemToVrfBus, Shader::n_wf, nextGlbMemBus, nextLocMemBus, numGlbMemUnits, numLocMemUnits, numSIMDs, readyList, scheduleStage, scoreboardCheckStage, shader, shrMemInstAvail, Shader::tick_cnt, Shader::ticks(), vectorAluInstAvail, vectorRegsReserved, vrfToGlobalMemPipeBus, vrfToLocalMemPipeBus, wavefrontSize, waveStatusList, wfList, and wfWait.
Referenced by nextLocRdBus().
void ComputeUnit::injectGlobalMemFence | ( | GPUDynInstPtr | gpuDynInst, |
bool | kernelLaunch = true , |
||
RequestPtr | req = nullptr |
||
) |
Definition at line 938 of file compute_unit.cc.
References Request::KERNEL, masterId(), MemCmd::MemFenceReq, and sendSyncRequest().
Referenced by HsailISA::Ret::execute(), HsailISA::MemFence::initiateAcc(), nextLocRdBus(), and StartWorkgroup().
bool ComputeUnit::isDone | ( | ) | const |
Definition at line 1728 of file compute_unit.cc.
References glbMemToVrfBus, globalMemoryPipe, ArmISA::i, GlobalMemPipeline::isGMLdRespFIFOWrRdy(), GlobalMemPipeline::isGMReqFIFOWrRdy(), GlobalMemPipeline::isGMStRespFIFOWrRdy(), LocalMemPipeline::isLMReqFIFOWrRdy(), LocalMemPipeline::isLMRespFIFOWrRdy(), isSimdDone(), ArmISA::j, localMemoryPipe, locMemToVrfBus, numGlbMemUnits, numLocMemUnits, numSIMDs, WaitClass::rdy(), vrfToGlobalMemPipeBus, and vrfToLocalMemPipeBus.
Referenced by masterId().
|
inline |
Definition at line 264 of file compute_unit.hh.
References GLBMEM_PIPE.
Referenced by ExecStage::collectStatistics().
|
inline |
Definition at line 265 of file compute_unit.hh.
References LDSMEM_PIPE.
Referenced by ExecStage::collectStatistics().
bool ComputeUnit::isSimdDone | ( | uint32_t | simdId | ) | const |
Definition at line 1763 of file compute_unit.cc.
References aluPipe, ArmISA::i, Shader::n_wf, numGlbMemUnits, numLocMemUnits, numSIMDs, Wavefront::S_STOPPED, shader, ArmISA::status, vrfToGlobalMemPipeBus, vrfToLocalMemPipeBus, and wfList.
Referenced by isDone(), and masterId().
|
inline |
Definition at line 263 of file compute_unit.hh.
Referenced by ExecStage::collectStatistics().
|
inline |
Definition at line 248 of file compute_unit.hh.
References numCyclesPerLoadTransfer.
Referenced by LdsState::processPacket().
|
inline |
Definition at line 291 of file compute_unit.hh.
References _masterId, isDone(), and isSimdDone().
Referenced by FetchUnit::initiateFetch(), and injectGlobalMemFence().
|
inline |
Definition at line 268 of file compute_unit.hh.
References numGlbMemUnits.
Referenced by Wavefront::exec(), and Wavefront::updateResources().
|
inline |
Definition at line 269 of file compute_unit.hh.
References addr, AllAtBarrier(), cedeSIMD(), doSmReturn(), handleMemPacket(), MipsISA::index, init(), injectGlobalMemFence(), numLocMemUnits, processFetchReturn(), processTimingPacket(), sendRequest(), sendSyncRequest(), and updatePageDivergenceDist().
Referenced by Wavefront::exec(), and Wavefront::updateResources().
void ComputeUnit::processFetchReturn | ( | PacketPtr | pkt | ) |
Referenced by nextLocRdBus().
bool ComputeUnit::processTimingPacket | ( | PacketPtr | pkt | ) |
Referenced by nextLocRdBus().
int ComputeUnit::ReadyWorkgroup | ( | NDRange * | ndr | ) |
Definition at line 363 of file compute_unit.cc.
References LdsState::canReserve(), ArmISA::d, DPRINTF, HsaQueueEntry::dRegCount, HsaQueueEntry::gdSize, ArmISA::i, ArmISA::j, lds, HsaQueueEntry::ldsSize, Shader::n_wf, numSIMDs, numTimesWgBlockedDueVgprAlloc, numVecRegsPerSimd, NDRange::q, Wavefront::S_STOPPED, shader, HsaQueueEntry::sRegCount, ArmISA::status, vrf, wfList, wfSize(), wgBlockedDueLdsAllocation, NDRange::wgId, and HsaQueueEntry::wgSize.
Referenced by wfSize().
|
inline |
Definition at line 219 of file compute_unit.hh.
References updateEvents().
Referenced by VectorRegisterFile::exec().
|
overridevirtual |
Callback to set stat parameters.
This callback is typically used for complex stats (e.g., distributions) that need parameters in addition to a name and a description. Stat names and descriptions should typically be set from the constructor using the ADD_STAT macro.
Reimplemented from Stats::Group.
Definition at line 1395 of file compute_unit.cc.
References activeLanesPerGMemInstrDist, activeLanesPerLMemInstrDist, completedWfs, controlFlowDivergenceDist, csprintf(), Stats::DataWrap< Derived, InfoProxyType >::desc(), dynamicGMemInstrCnt, dynamicLMemInstrCnt, execRateDist, execStage, fetchStage, flatLDSInsts, flatLDSInstsPerWF, flatVMemInsts, flatVMemInstsPerWF, globalMemoryPipe, hitsPerTLBLevel, ArmISA::i, Stats::VectorBase< Derived, Stor >::init(), Stats::Distribution::init(), instCyclesSALU, instCyclesVALU, ipc, ldsBankAccesses, ldsBankConflictDist, ldsNoFlatInsts, ldsNoFlatInstsPerWF, localMemoryPipe, SimObject::name(), Stats::DataWrap< Derived, InfoProxyType >::name(), numALUInstsExecuted, numCASOps, numFailedCASOps, numInstrExecuted, numTimesWgBlockedDueVgprAlloc, numVecOpsExecuted, pageDivergenceDist, FetchStage::regStats(), ScheduleStage::regStats(), ScoreboardCheckStage::regStats(), ExecStage::regStats(), LocalMemPipeline::regStats(), GlobalMemPipeline::regStats(), Stats::Group::regStats(), sALUInsts, sALUInstsPerWF, scalarMemReads, scalarMemReadsPerWF, scalarMemWrites, scalarMemWritesPerWF, scheduleStage, scoreboardCheckStage, Stats::DataWrapVec< Derived, InfoProxyType >::subname(), threadCyclesVALU, tlbCycles, tlbLatency, tlbRequests, totalCycles, vALUInsts, vALUInstsPerWF, vALUUtilization, vectorMemReads, vectorMemReadsPerWF, vectorMemWrites, vectorMemWritesPerWF, vpc, wfSize(), and wgBlockedDueLdsAllocation.
void ComputeUnit::resizeRegFiles | ( | int | num_cregs, |
int | num_sregs, | ||
int | num_dregs | ||
) |
Referenced by wfSize().
void ComputeUnit::sendRequest | ( | GPUDynInstPtr | gpuDynInst, |
int | index, | ||
PacketPtr | pkt | ||
) |
Definition at line 740 of file compute_unit.cc.
References Packet::cmd, cu_id, curTick(), Packet::dataStatic(), debugSegFault, DPRINTF, fatal, Process::fixupFault(), functionalTLB, Packet::getAddr(), ThreadContext::getProcessPtr(), Packet::getPtr(), Packet::getSize(), Shader::gpuTc, hitsPerTLBLevel, MipsISA::index, Packet::isRead(), Packet::isWrite(), MemCmd::MemFenceReq, memPort, MipsISA::p, panic, perLaneTLB, Process::pTable, BaseTLB::Read, Packet::req, req_tick_latency, safe_cast(), X86ISA::GpuTLB::TranslationState::saved, EventManager::schedule(), Packet::senderState, shader, Shader::timingSim, tlbCycles, X86ISA::GpuTLB::TranslationState::tlbEntry, tlbPort, tlbRequests, EmulationPageTable::translate(), updatePageDivergenceDist(), MipsISA::vaddr, and BaseTLB::Write.
Referenced by nextLocRdBus().
void ComputeUnit::sendSyncRequest | ( | GPUDynInstPtr | gpuDynInst, |
int | index, | ||
PacketPtr | pkt | ||
) |
Definition at line 920 of file compute_unit.cc.
References cu_id, curTick(), DPRINTF, MipsISA::index, memPort, Packet::req, req_tick_latency, EventManager::schedule(), and Packet::senderState.
Referenced by injectGlobalMemFence(), and nextLocRdBus().
bool ComputeUnit::sendToLds | ( | GPUDynInstPtr | gpuDynInst | ) |
Send a general request to the LDS. Make sure to check the return value here: your request might be NACK'd, and a return value of false means that you need to have some backup plan.
Definition at line 1794 of file compute_unit.cc.
References ldsPort, MemCmd::ReadReq, Packet::senderState, and ComputeUnit::LDSPort::sendTimingReq().
Referenced by cacheLineSize(), and LocalMemPipeline::exec().
|
inline |
Definition at line 267 of file compute_unit.hh.
References LDSMEM_PIPE.
Referenced by ScoreboardCheckStage::exec(), Wavefront::exec(), and Wavefront::updateResources().
|
inline |
Definition at line 245 of file compute_unit.hh.
References spBypassPipeLength.
Referenced by ConditionRegisterState::exec(), VectorRegisterFile::exec(), Wavefront::exec(), and Wavefront::updateResources().
Definition at line 225 of file compute_unit.cc.
References Wavefront::actualWgSz, Wavefront::actualWgSzTotal, Wavefront::barCnt, barrier_id, Wavefront::barrierCnt, Wavefront::barrierId, Wavefront::barrierSlots, HsaQueueEntry::code_ptr, cu_id, NDRange::dispatchId, Wavefront::dispatchId, divCeil(), DPRINTF, Wavefront::dropFetch, NDRange::globalWgId, LdsState::increaseRefCounter(), Wavefront::initMask, Wavefront::instructionBuffer, MipsISA::k, Wavefront::kernId, lds, Wavefront::ldsChunk, Wavefront::maxBarCnt, NDRange::numWg, Wavefront::oldBarrierCnt, Wavefront::pendingFetch, Wavefront::privBase, HsaQueueEntry::privMemPerItem, HsaQueueEntry::privMemStart, Wavefront::pushToReconvergenceStack(), NDRange::q, Wavefront::simdId, Wavefront::spillBase, HsaQueueEntry::spillMemPerItem, HsaQueueEntry::spillMemStart, Wavefront::spillWidth, Wavefront::stalledAtBarrier, Wavefront::start(), Wavefront::wfId, wfSize(), Wavefront::wfSlotId, Wavefront::wgId, Wavefront::workGroupId, Wavefront::workItemFlatId, and Wavefront::workItemId.
Referenced by StartWorkgroup(), and wfSize().
void ComputeUnit::StartWorkgroup | ( | NDRange * | ndr | ) |
Definition at line 309 of file compute_unit.cc.
References Wavefront::actualWgSzTotal, barrier_id, NDRange::dispatchId, HsaQueueEntry::dRegCount, fillKernelState(), getAndIncSeqNum(), NDRange::globalWgId, Shader::impl_kern_boundary_sync, injectGlobalMemFence(), kernelLaunchInst, lds, HsaQueueEntry::ldsSize, ArmISA::m, Shader::n_wf, numSIMDs, numVecRegsPerSimd, NDRange::q, Wavefront::reservedVectorRegs, LdsState::reserveSpace(), Wavefront::S_STOPPED, shader, HsaQueueEntry::sRegCount, Wavefront::startVgprIndex, startWavefront(), Wavefront::status, vectorRegsReserved, vrf, MipsISA::w, wfList, and wfSize().
Referenced by wfSize().
|
inline |
Definition at line 247 of file compute_unit.hh.
References numCyclesPerStoreTransfer.
Referenced by LdsState::processPacket().
void ComputeUnit::updateEvents | ( | ) |
Definition at line 198 of file compute_unit.cc.
References ArmISA::i, numSIMDs, regIdxVec, Sinic::regInfo(), shader, statusVec, Shader::tick_cnt, timestampVec, and vrf.
Referenced by exec(), and registerEvent().
void ComputeUnit::updateInstStats | ( | GPUDynInstPtr | gpuDynInst | ) |
Definition at line 1666 of file compute_unit.cc.
References flatLDSInsts, flatVMemInsts, instCyclesSALU, instCyclesVALU, ldsNoFlatInsts, sALUInsts, scalarMemReads, scalarMemWrites, threadCyclesVALU, vALUInsts, vectorMemReads, and vectorMemWrites.
Referenced by Wavefront::exec().
void ComputeUnit::updatePageDivergenceDist | ( | Addr | addr | ) |
Definition at line 1699 of file compute_unit.cc.
References ArmISA::PageBytes, pagesTouched, and roundDown().
Referenced by nextLocRdBus(), and sendRequest().
|
inline |
Definition at line 249 of file compute_unit.hh.
References exec(), fetch(), fillKernelState(), initiateFetch(), ReadyWorkgroup(), resizeRegFiles(), startWavefront(), StartWorkgroup(), MipsISA::w, and wavefrontSize.
Referenced by HsailISA::Call::calcAddr(), HsailISA::calcPrivAddr(), RegAddrOperand< RegOperandType >::calcVector(), NoRegAddrOperand::calcVector(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), ComputeUnit(), LdsState::countBankConflicts(), HsailISA::Call::execPseudoInst(), HsailISA::LdaInst< DestDataType, AddrOperandType >::execute(), HsailISA::CbrInstBase< SRegOperand >::execute(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Wavefront::getContext(), Wavefront::getStaticContextSize(), GPUDynInst::GPUDynInst(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicJoinWFBar(), HsailISA::Call::MagicMaskLower(), HsailISA::Call::MagicMaskUpper(), HsailISA::Call::MagicMostSigBroadcast(), HsailISA::Call::MagicMostSigThread(), HsailISA::Call::MagicPanic(), HsailISA::Call::MagicPrefixSum(), HsailISA::Call::MagicPrintLane(), HsailISA::Call::MagicPrintLane64(), HsailISA::Call::MagicPrintWF32(), HsailISA::Call::MagicPrintWF32ID(), HsailISA::Call::MagicPrintWF64(), HsailISA::Call::MagicPrintWFFloat(), HsailISA::Call::MagicPrintWFID64(), HsailISA::Call::MagicReduction(), HsailISA::Call::MagicSimBreak(), HsailISA::Call::MagicWaitWFBar(), HsailISA::Call::MagicXactCasLd(), ReadyWorkgroup(), regStats(), Wavefront::setContext(), startWavefront(), and StartWorkgroup().
|
private |
Definition at line 742 of file compute_unit.hh.
Referenced by cacheLineSize().
|
protected |
Definition at line 297 of file compute_unit.hh.
Referenced by masterId().
Stats::Distribution ComputeUnit::activeLanesPerGMemInstrDist |
Definition at line 358 of file compute_unit.hh.
Referenced by Wavefront::exec(), and regStats().
Stats::Distribution ComputeUnit::activeLanesPerLMemInstrDist |
Definition at line 359 of file compute_unit.hh.
Referenced by Wavefront::exec(), and regStats().
std::vector<WaitClass> ComputeUnit::aluPipe |
Definition at line 186 of file compute_unit.hh.
Referenced by Wavefront::exec(), init(), isSimdDone(), and Wavefront::updateResources().
uint32_t ComputeUnit::barrier_id |
Definition at line 184 of file compute_unit.hh.
Referenced by startWavefront(), and StartWorkgroup().
uint32_t ComputeUnit::coalescerToVrfBusWidth |
Definition at line 202 of file compute_unit.hh.
Referenced by ComputeUnit().
Stats::Scalar ComputeUnit::completedWfs |
Definition at line 366 of file compute_unit.hh.
Referenced by HsailISA::Ret::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), and regStats().
Stats::Distribution ComputeUnit::controlFlowDivergenceDist |
Definition at line 357 of file compute_unit.hh.
Referenced by Wavefront::exec(), and regStats().
bool ComputeUnit::countPages |
Definition at line 181 of file compute_unit.hh.
int ComputeUnit::cu_id |
Definition at line 134 of file compute_unit.hh.
Referenced by AllAtBarrier(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), GlobalMemPipeline::exec(), Wavefront::exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchUnit::fetch(), Wavefront::getContext(), Wavefront::getStaticContextSize(), GPUDynInst::initiateAcc(), FetchUnit::initiateFetch(), HsailISA::Call::MagicSimBreak(), Wavefront::popFromReconvergenceStack(), FetchUnit::processFetchReturn(), ComputeUnit::DataPort::processMemRespEvent(), Wavefront::ready(), sendRequest(), sendSyncRequest(), SRegOperand::set(), DRegOperand::set(), CRegOperand::set(), ListOperand::set(), Wavefront::setContext(), and startWavefront().
CUExitCallback* ComputeUnit::cuExitCallback |
Definition at line 416 of file compute_unit.hh.
Referenced by ComputeUnit(), and ~ComputeUnit().
bool ComputeUnit::debugSegFault |
Definition at line 169 of file compute_unit.hh.
Referenced by sendRequest().
std::vector<std::pair<Wavefront*, DISPATCH_STATUS> > ComputeUnit::dispatchList |
Definition at line 128 of file compute_unit.hh.
Referenced by ScheduleStage::init(), ExecStage::init(), init(), and ~ComputeUnit().
int ComputeUnit::dpBypassPipeLength |
Definition at line 145 of file compute_unit.hh.
Referenced by dpBypassLength().
Stats::Scalar ComputeUnit::dynamicGMemInstrCnt |
Definition at line 341 of file compute_unit.hh.
Referenced by regStats(), and GPUDynInst::updateStats().
Stats::Scalar ComputeUnit::dynamicLMemInstrCnt |
Definition at line 342 of file compute_unit.hh.
Referenced by regStats(), and GPUDynInst::updateStats().
EXEC_POLICY ComputeUnit::exec_policy |
Definition at line 166 of file compute_unit.hh.
Referenced by ComputeUnit().
Stats::Distribution ComputeUnit::execRateDist |
Definition at line 350 of file compute_unit.hh.
Referenced by Wavefront::exec(), and regStats().
ExecStage ComputeUnit::execStage |
Definition at line 97 of file compute_unit.hh.
Referenced by exec(), init(), and regStats().
FetchStage ComputeUnit::fetchStage |
Definition at line 94 of file compute_unit.hh.
Referenced by exec(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), init(), and regStats().
Stats::Scalar ComputeUnit::flatLDSInsts |
Definition at line 314 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::flatLDSInstsPerWF |
Definition at line 315 of file compute_unit.hh.
Referenced by regStats().
Stats::Scalar ComputeUnit::flatVMemInsts |
Definition at line 312 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::flatVMemInstsPerWF |
Definition at line 313 of file compute_unit.hh.
Referenced by regStats().
bool ComputeUnit::functionalTLB |
Definition at line 170 of file compute_unit.hh.
Referenced by sendRequest().
int ComputeUnit::glbMemInstAvail |
Definition at line 377 of file compute_unit.hh.
Referenced by ScoreboardCheckStage::init(), ExecStage::init(), and init().
WaitClass ComputeUnit::glbMemToVrfBus |
Definition at line 197 of file compute_unit.hh.
Referenced by GlobalMemPipeline::exec(), init(), and isDone().
GlobalMemPipeline ComputeUnit::globalMemoryPipe |
Definition at line 98 of file compute_unit.hh.
Referenced by exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::MemFence::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), init(), isDone(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), ComputeUnit::DataPort::processMemRespEvent(), Wavefront::ready(), and regStats().
uint64_t ComputeUnit::globalSeqNum |
private |
Definition at line 743 of file compute_unit.hh.
Referenced by getAndIncSeqNum().
Stats::Vector ComputeUnit::hitsPerTLBLevel |
Definition at line 333 of file compute_unit.hh.
Referenced by regStats(), and sendRequest().
Stats::Scalar ComputeUnit::instCyclesSALU |
Definition at line 307 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Scalar ComputeUnit::instCyclesVALU |
Definition at line 306 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::ipc |
Definition at line 356 of file compute_unit.hh.
Referenced by regStats().
int ComputeUnit::issuePeriod |
Definition at line 147 of file compute_unit.hh.
Referenced by Wavefront::exec(), and Wavefront::updateResources().
GPUStaticInst* ComputeUnit::kernelLaunchInst |
private |
Definition at line 745 of file compute_unit.hh.
Referenced by StartWorkgroup().
std::vector<uint64_t> ComputeUnit::lastExecCycle |
Definition at line 153 of file compute_unit.hh.
Referenced by ComputeUnit(), and Wavefront::exec().
std::vector<Addr> ComputeUnit::lastVaddrCU |
Definition at line 162 of file compute_unit.hh.
Referenced by ComputeUnit(), and ~ComputeUnit().
std::vector<std::vector<Addr> > ComputeUnit::lastVaddrSimd |
Definition at line 163 of file compute_unit.hh.
Referenced by ComputeUnit(), and ~ComputeUnit().
std::vector<std::vector<std::vector<Addr> > > ComputeUnit::lastVaddrWF |
Definition at line 164 of file compute_unit.hh.
Referenced by ComputeUnit().
LdsState& ComputeUnit::lds |
protected |
Definition at line 299 of file compute_unit.hh.
Referenced by ComputeUnit(), getLds(), getRefCounter(), ReadyWorkgroup(), startWavefront(), and StartWorkgroup().
Stats::Scalar ComputeUnit::ldsBankAccesses |
Definition at line 335 of file compute_unit.hh.
Referenced by LdsState::processPacket(), and regStats().
Stats::Distribution ComputeUnit::ldsBankConflictDist |
Definition at line 336 of file compute_unit.hh.
Referenced by LdsState::processPacket(), and regStats().
Stats::Scalar ComputeUnit::ldsNoFlatInsts |
Definition at line 310 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::ldsNoFlatInstsPerWF |
Definition at line 311 of file compute_unit.hh.
Referenced by regStats().
LDSPort* ComputeUnit::ldsPort = nullptr |
The port to access the Local Data Store. Can be connected to an LDS object.
Definition at line 672 of file compute_unit.hh.
Referenced by getLdsPort(), getPort(), sendToLds(), and ~ComputeUnit().
bool ComputeUnit::localMemBarrier |
Definition at line 171 of file compute_unit.hh.
LocalMemPipeline ComputeUnit::localMemoryPipe |
Definition at line 99 of file compute_unit.hh.
Referenced by exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), init(), isDone(), Wavefront::ready(), and regStats().
WaitClass ComputeUnit::locMemToVrfBus |
Definition at line 199 of file compute_unit.hh.
Referenced by LocalMemPipeline::exec(), init(), and isDone().
std::vector<DataPort*> ComputeUnit::memPort |
The memory port for SIMD data accesses.
Can be connected to PhysMem for Ruby for timing simulations.
Definition at line 683 of file compute_unit.hh.
Referenced by ComputeUnit(), sendRequest(), and sendSyncRequest().
int ComputeUnit::nextGlbMemBus |
Definition at line 194 of file compute_unit.hh.
Referenced by init().
int ComputeUnit::nextLocMemBus |
Definition at line 195 of file compute_unit.hh.
Referenced by init().
Stats::Formula ComputeUnit::numALUInstsExecuted |
Definition at line 361 of file compute_unit.hh.
Referenced by regStats().
Stats::Scalar ComputeUnit::numCASOps |
Definition at line 364 of file compute_unit.hh.
Referenced by AtomicOpCAS< T >::execute(), and regStats().
uint32_t ComputeUnit::numCyclesPerLoadTransfer |
Definition at line 204 of file compute_unit.hh.
Referenced by ComputeUnit(), and loadBusLength().
uint32_t ComputeUnit::numCyclesPerStoreTransfer |
Definition at line 203 of file compute_unit.hh.
Referenced by ComputeUnit(), and storeBusLength().
Stats::Scalar ComputeUnit::numFailedCASOps |
Definition at line 365 of file compute_unit.hh.
Referenced by AtomicOpCAS< T >::execute(), and regStats().
int ComputeUnit::numGlbMemUnits |
Definition at line 150 of file compute_unit.hh.
Referenced by init(), isDone(), isSimdDone(), nextGlbRdBus(), and Wavefront::ready().
Stats::Scalar ComputeUnit::numInstrExecuted |
Definition at line 347 of file compute_unit.hh.
Referenced by Wavefront::exec(), and regStats().
int ComputeUnit::numLocMemUnits |
Definition at line 151 of file compute_unit.hh.
Referenced by init(), isDone(), isSimdDone(), nextLocRdBus(), and Wavefront::ready().
int ComputeUnit::numSIMDs |
Definition at line 139 of file compute_unit.hh.
Referenced by AllAtBarrier(), ComputeUnit(), init(), isDone(), isSimdDone(), ReadyWorkgroup(), StartWorkgroup(), updateEvents(), and ~ComputeUnit().
Stats::Scalar ComputeUnit::numTimesWgBlockedDueVgprAlloc |
Definition at line 363 of file compute_unit.hh.
Referenced by ReadyWorkgroup(), and regStats().
Stats::Scalar ComputeUnit::numVecOpsExecuted |
Definition at line 352 of file compute_unit.hh.
Referenced by Wavefront::exec(), and regStats().
uint32_t ComputeUnit::numVecRegsPerSimd |
Definition at line 212 of file compute_unit.hh.
Referenced by ComputeUnit(), ReadyWorkgroup(), and StartWorkgroup().
pageDataStruct ComputeUnit::pageAccesses |
Definition at line 397 of file compute_unit.hh.
Referenced by GPUDynInst::updateStats().
Stats::Distribution ComputeUnit::pageDivergenceDist |
Definition at line 340 of file compute_unit.hh.
Referenced by regStats(), and GPUDynInst::updateStats().
std::map<Addr, int> ComputeUnit::pagesTouched |
Definition at line 241 of file compute_unit.hh.
Referenced by updatePageDivergenceDist(), and GPUDynInst::updateStats().
bool ComputeUnit::perLaneTLB |
Definition at line 156 of file compute_unit.hh.
Referenced by ComputeUnit(), and sendRequest().
int ComputeUnit::prefetchDepth |
Definition at line 158 of file compute_unit.hh.
int ComputeUnit::prefetchStride |
Definition at line 160 of file compute_unit.hh.
Enums::PrefetchType ComputeUnit::prefetchType |
Definition at line 165 of file compute_unit.hh.
std::vector<std::vector<Wavefront*> > ComputeUnit::readyList |
Definition at line 108 of file compute_unit.hh.
Referenced by ScheduleStage::exec(), ScheduleStage::init(), ScoreboardCheckStage::init(), init(), and ~ComputeUnit().
std::vector<std::pair<uint32_t, uint32_t> > ComputeUnit::regIdxVec |
Definition at line 214 of file compute_unit.hh.
Referenced by updateEvents().
Tick ComputeUnit::req_tick_latency |
Definition at line 206 of file compute_unit.hh.
Referenced by sendRequest(), and sendSyncRequest().
Tick ComputeUnit::resp_tick_latency |
Definition at line 207 of file compute_unit.hh.
int ComputeUnit::rrNextALUWp |
Definition at line 131 of file compute_unit.hh.
int ComputeUnit::rrNextMemID |
Definition at line 130 of file compute_unit.hh.
Stats::Scalar ComputeUnit::sALUInsts |
Definition at line 304 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::sALUInstsPerWF |
Definition at line 305 of file compute_unit.hh.
Referenced by regStats().
Stats::Scalar ComputeUnit::scalarMemReads |
Definition at line 322 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::scalarMemReadsPerWF |
Definition at line 323 of file compute_unit.hh.
Referenced by regStats().
Stats::Scalar ComputeUnit::scalarMemWrites |
Definition at line 320 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::scalarMemWritesPerWF |
Definition at line 321 of file compute_unit.hh.
Referenced by regStats().
ScheduleStage ComputeUnit::scheduleStage |
Definition at line 96 of file compute_unit.hh.
Referenced by exec(), init(), and regStats().
ScoreboardCheckStage ComputeUnit::scoreboardCheckStage |
Definition at line 95 of file compute_unit.hh.
Referenced by exec(), init(), and regStats().
Shader* ComputeUnit::shader |
Definition at line 183 of file compute_unit.hh.
Referenced by AllAtBarrier(), FetchUnit::exec(), LocalMemPipeline::exec(), GlobalMemPipeline::exec(), ScoreboardCheckStage::exec(), ConditionRegisterState::exec(), VectorRegisterFile::exec(), Wavefront::exec(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::execute(), HsailISA::Ret::execute(), HsailISA::StInst< MemDataType, SrcDataType, AddrOperandType >::execute(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::execute(), Gcn3ISA::Inst_SOPP__S_ENDPGM::execute(), FetchUnit::init(), GlobalMemPipeline::init(), init(), FetchUnit::initiateFetch(), isSimdDone(), HsailISA::Call::MagicAtomicNRAddGlobalU32Reg(), HsailISA::Call::MagicAtomicNRAddGroupU32Reg(), HsailISA::Call::MagicLoadGlobalU32Reg(), LdsState::processPacket(), ReadyWorkgroup(), sendRequest(), StartWorkgroup(), updateEvents(), Wavefront::updateResources(), and ~ComputeUnit().
int ComputeUnit::shrMemInstAvail |
Definition at line 374 of file compute_unit.hh.
Referenced by ScoreboardCheckStage::init(), ExecStage::init(), and init().
int ComputeUnit::spBypassPipeLength |
Definition at line 142 of file compute_unit.hh.
Referenced by spBypassLength().
SQCPort* ComputeUnit::sqcPort |
Definition at line 687 of file compute_unit.hh.
Referenced by FetchUnit::fetch(), and getPort().
ITLBPort* ComputeUnit::sqcTLBPort |
Definition at line 689 of file compute_unit.hh.
Referenced by getPort(), and FetchUnit::initiateFetch().
std::vector<uint8_t> ComputeUnit::statusVec |
Definition at line 216 of file compute_unit.hh.
Referenced by updateEvents().
Stats::Scalar ComputeUnit::threadCyclesVALU |
Definition at line 308 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
std::vector<uint64_t> ComputeUnit::timestampVec |
Definition at line 215 of file compute_unit.hh.
Referenced by updateEvents().
Stats::Scalar ComputeUnit::tlbCycles |
Definition at line 330 of file compute_unit.hh.
Referenced by regStats(), and sendRequest().
Stats::Formula ComputeUnit::tlbLatency |
Definition at line 331 of file compute_unit.hh.
Referenced by regStats().
std::vector<DTLBPort*> ComputeUnit::tlbPort |
Definition at line 685 of file compute_unit.hh.
Referenced by ComputeUnit(), and sendRequest().
Stats::Scalar ComputeUnit::tlbRequests |
Definition at line 329 of file compute_unit.hh.
Referenced by regStats(), and sendRequest().
Stats::Scalar ComputeUnit::totalCycles |
Definition at line 354 of file compute_unit.hh.
Referenced by exec(), Wavefront::exec(), and regStats().
Stats::Scalar ComputeUnit::vALUInsts |
Definition at line 302 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::vALUInstsPerWF |
Definition at line 303 of file compute_unit.hh.
Referenced by regStats().
Stats::Formula ComputeUnit::vALUUtilization |
Definition at line 309 of file compute_unit.hh.
Referenced by regStats().
std::vector<bool> ComputeUnit::vectorAluInstAvail |
Definition at line 371 of file compute_unit.hh.
Referenced by ScoreboardCheckStage::init(), ExecStage::init(), init(), and ~ComputeUnit().
Stats::Scalar ComputeUnit::vectorMemReads |
Definition at line 318 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::vectorMemReadsPerWF |
Definition at line 319 of file compute_unit.hh.
Referenced by regStats().
Stats::Scalar ComputeUnit::vectorMemWrites |
Definition at line 316 of file compute_unit.hh.
Referenced by regStats(), and updateInstStats().
Stats::Formula ComputeUnit::vectorMemWritesPerWF |
Definition at line 317 of file compute_unit.hh.
Referenced by regStats().
std::vector<int> ComputeUnit::vectorRegsReserved |
Definition at line 210 of file compute_unit.hh.
Referenced by HsailISA::Ret::execute(), init(), and StartWorkgroup().
Stats::Formula ComputeUnit::vpc |
Definition at line 355 of file compute_unit.hh.
Referenced by regStats().
std::vector<VectorRegisterFile*> ComputeUnit::vrf |
Definition at line 137 of file compute_unit.hh.
Referenced by ScheduleStage::arbitrate(), HsailISA::LdInst< MemDataType, DestDataType, AddrOperandType >::completeAcc(), HsailISA::AtomicInst< MemDataType, AddrOperandType, NumSrcOperands, HasDst >::completeAcc(), ComputeUnit(), LocalMemPipeline::exec(), GlobalMemPipeline::exec(), Wavefront::exec(), HsailISA::Ret::execute(), SRegOperand::get(), DRegOperand::get(), Wavefront::getContext(), Gcn3ISA::VecOperand< DataType, Const, NumDwords >::read(), Wavefront::ready(), ReadyWorkgroup(), Wavefront::remap(), SRegOperand::set(), DRegOperand::set(), Wavefront::setContext(), StartWorkgroup(), updateEvents(), Wavefront::updateResources(), and Gcn3ISA::VecOperand< DataType, Const, NumDwords >::write().
uint32_t ComputeUnit::vrfToCoalescerBusWidth |
Definition at line 201 of file compute_unit.hh.
Referenced by ComputeUnit().
std::vector<WaitClass> ComputeUnit::vrfToGlobalMemPipeBus |
Definition at line 191 of file compute_unit.hh.
Referenced by Wavefront::exec(), init(), isDone(), isSimdDone(), Wavefront::ready(), and Wavefront::updateResources().
std::vector<WaitClass> ComputeUnit::vrfToLocalMemPipeBus |
Definition at line 193 of file compute_unit.hh.
Referenced by Wavefront::exec(), init(), isDone(), isSimdDone(), Wavefront::ready(), and Wavefront::updateResources().
int ComputeUnit::wavefrontSize |
private |
Definition at line 744 of file compute_unit.hh.
Referenced by ComputeUnit(), init(), and wfSize().
std::vector<std::vector<std::pair<Wavefront*, WAVE_STATUS> > > ComputeUnit::waveStatusList |
Definition at line 116 of file compute_unit.hh.
Referenced by ScheduleStage::init(), ScoreboardCheckStage::init(), init(), and ~ComputeUnit().
std::vector<std::vector<Wavefront*> > ComputeUnit::wfList |
Definition at line 133 of file compute_unit.hh.
Referenced by AllAtBarrier(), ComputeUnit(), FetchStage::init(), init(), isSimdDone(), ReadyWorkgroup(), StartWorkgroup(), and ~ComputeUnit().
std::vector<WaitClass> ComputeUnit::wfWait |
Definition at line 188 of file compute_unit.hh.
Referenced by LocalMemPipeline::exec(), GlobalMemPipeline::exec(), Wavefront::exec(), init(), Wavefront::ready(), and Wavefront::updateResources().
Stats::Scalar ComputeUnit::wgBlockedDueLdsAllocation |
Definition at line 344 of file compute_unit.hh.
Referenced by ReadyWorkgroup(), and regStats().
bool ComputeUnit::xact_cas_mode |
Definition at line 168 of file compute_unit.hh.
Referenced by cedeSIMD(), and AtomicOpCAS< T >::execute().
std::map<unsigned, waveQueue> ComputeUnit::xactCasLoadMap |
Definition at line 737 of file compute_unit.hh.
Referenced by cedeSIMD(), ComputeUnit(), AtomicOpCAS< T >::execute(), and HsailISA::Call::MagicXactCasLd().