34 #ifndef __LDS_STATE_HH__ 35 #define __LDS_STATE_HH__ 40 #include <unordered_map> 44 #include "enums/MemType.hh" 47 #include "params/LdsState.hh" 73 fatal_if(!
chunk.size(),
"cannot read from an LDS chunk of size 0");
74 fatal_if(index >=
chunk.size(),
"out-of-bounds access to an LDS chunk");
75 T *p0 = (T *) (&(
chunk.at(index)));
86 fatal_if(!
chunk.size(),
"cannot write to an LDS chunk of size 0");
87 fatal_if(index >=
chunk.size(),
"out-of-bounds access to an LDS chunk");
88 T *p0 = (T *) (&(
chunk.at(index)));
153 SlavePort(_name, _ownerLds), ownerLds(_ownerLds)
214 std::unordered_map<uint32_t,
218 std::unordered_map<uint32_t,
230 bool retryResp =
false;
242 countBankConflicts(
PacketPtr packet,
unsigned *bankAccesses);
246 unsigned *numBankAccesses);
264 return dynamic_cast<const Params *
>(_params);
281 operator=(
const LdsState &) =
delete;
289 int refCount = getRefCounter(dispatchId, wgId);
291 "reference count should not be below zero");
292 return ++refCounter[dispatchId][wgId];
302 int refCount = getRefCounter(dispatchId, wgId);
305 "reference count should not be below zero or at zero to" 308 refCounter[dispatchId][wgId]--;
310 if (refCounter[dispatchId][wgId] == 0) {
311 releaseSpace(dispatchId, wgId);
314 return refCounter[dispatchId][wgId];
324 auto dispatchIter = chunkMap.find(dispatchId);
325 fatal_if(dispatchIter == chunkMap.end(),
326 "could not locate this dispatch id [%d]", dispatchId);
328 auto workgroup = dispatchIter->second.find(wgId);
329 fatal_if(workgroup == dispatchIter->second.end(),
330 "could not find this workgroup id within this dispatch id" 331 " did[%d] wgid[%d]", dispatchId, wgId);
333 auto refCountIter = refCounter.find(dispatchId);
334 if (refCountIter == refCounter.end()) {
335 fatal(
"could not locate this dispatch id [%d]", dispatchId);
337 auto workgroup = refCountIter->second.find(wgId);
338 if (workgroup == refCountIter->second.end()) {
339 fatal(
"could not find this workgroup id within this dispatch id" 340 " did[%d] wgid[%d]", dispatchId, wgId);
342 return refCounter.at(dispatchId).at(wgId);
346 fatal(
"should not reach this point");
358 if (chunkMap.find(dispatchId) != chunkMap.end()) {
360 chunkMap[dispatchId].find(wgId) != chunkMap[dispatchId].end(),
361 "duplicate workgroup ID asking for space in the LDS " 362 "did[%d] wgid[%d]", dispatchId, wgId);
365 fatal_if(bytesAllocated + size > maximumSize,
366 "request would ask for more space than is available");
368 bytesAllocated +=
size;
370 chunkMap[dispatchId].emplace(wgId,
LdsChunk(size));
372 refCounter[dispatchId][wgId] = 0;
374 return &chunkMap[dispatchId][wgId];
384 return returnQueue.empty() ?
curTick() : returnQueue.back().first;
418 return bankConflictPenalty;
427 return chunkMap[x_wgId].size();
439 if (if_name ==
"cuPort") {
443 fatal(
"cannot resolve the port name " + if_name);
453 return bytesAllocated + x_size <= maximumSize;
463 auto dispatchIter = chunkMap.find(x_dispatchId);
465 if (dispatchIter == chunkMap.end()) {
466 fatal(
"dispatch id not found [%d]", x_dispatchId);
468 auto workgroupIter = dispatchIter->second.find(x_wgId);
469 if (workgroupIter == dispatchIter->second.end()) {
470 fatal(
"workgroup id [%d] not found in dispatch id [%d]",
471 x_wgId, x_dispatchId);
475 fatal_if(bytesAllocated < chunkMap[x_dispatchId][x_wgId].
size(),
476 "releasing more space than was allocated");
478 bytesAllocated -= chunkMap[x_dispatchId][x_wgId].size();
479 chunkMap[x_dispatchId].erase(chunkMap[x_dispatchId].find(x_wgId));
491 int bytesAllocated = 0;
500 int bankConflictPenalty = 0;
506 #endif // __LDS_STATE_HH__ Ports are used to interface objects to each other.
an event to allow event-driven execution
#define fatal(...)
This implements a cprintf based fatal() function.
std::vector< uint8_t >::size_type size() const
get the size of this chunk
Tick earliestReturnTime() const
std::queue< std::pair< Tick, PacketPtr > > returnQueue
const Params * params() const
virtual AddrRangeList getAddrRanges() const
Get a list of the non-overlapping address ranges the owner is responsible for.
std::vector< uint8_t > chunk
TickEvent(LdsState *_ldsState)
vector< EventQueue * > mainEventQueue
Array for main event queues.
A SlavePort is a specialisation of a port.
this represents a slice of the overall LDS, intended to be associated with an individual workgroup ...
ComputeUnit * getParent() const
CuSidePort(const std::string &_name, LdsState *_ownerLds)
The AddrRange class encapsulates an address range, and supports a number of tests to check if two ran...
std::shared_ptr< GPUDynInst > GPUDynInstPtr
virtual void recvRangeChange()
void setRetryResp(const bool value)
Tick curTick()
The current simulated tick.
std::size_t ldsSize(const uint32_t x_wgId)
get the allocated size for this workgroup
uint64_t Tick
Tick count type.
The ClockedObject class extends the SimObject with a clock and accessor functions to relate ticks to ...
bool canReserve(uint32_t x_size) const
can this much space be reserved for a workgroup?
ClockedObject declaration and implementation.
Port & getPort(const std::string &if_name, PortID idx)
Get a port with a given name and index.
#define fatal_if(cond,...)
Conditional fatal macro that checks the supplied condition and only causes a fatal error if the condi...
std::unordered_map< uint32_t, std::unordered_map< uint32_t, int32_t > > refCounter
int increaseRefCounter(const uint32_t dispatchId, const uint32_t wgId)
use the dynamic wave id to create or just increase the reference count
int decreaseRefCounter(const uint32_t dispatchId, const uint32_t wgId)
decrease the reference count after making sure it is in the list give back this chunk if the ref coun...
T read(const uint32_t index)
a read operation
virtual Tick recvAtomic(PacketPtr pkt)
Receive an atomic request packet from the peer.
LdsChunk(const uint32_t x_size)
A Packet is used to encapsulate a transfer between two objects in the memory system (e...
std::unordered_map< uint32_t, std::unordered_map< uint32_t, LdsChunk > > chunkMap
LdsChunk * reserveSpace(const uint32_t dispatchId, const uint32_t wgId, const uint32_t size)
assign a parent and request this amount of space be set aside for this wgid
int getRefCounter(const uint32_t dispatchId, const uint32_t wgId) const
return the current reference count for this workgroup id
void write(const uint32_t index, const T value)
a write operation
int16_t PortID
Port index/ID type, and a symbolic name for an invalid port id.
int getBankConflictPenalty() const
bool releaseSpace(const uint32_t x_dispatchId, const uint32_t x_wgId)
give back the space
CuSidePort is the LDS Port closer to the CU side.
AddrRange getAddrRange() const
ComputeUnit * getComputeUnit() const