release/v20-0-0-2/GPUCoalescer_8hh_source.html

 /*
  * Copyright (c) 2013-2015 Advanced Micro Devices, Inc.
  * All rights reserved.
  *
  * For use for simulation and test purposes only
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are met:
  *
  * 1. Redistributions of source code must retain the above copyright notice,
  * this list of conditions and the following disclaimer.
  *
  * 2. Redistributions in binary form must reproduce the above copyright notice,
  * this list of conditions and the following disclaimer in the documentation
  * and/or other materials provided with the distribution.
  *
  * 3. Neither the name of the copyright holder nor the names of its
  * contributors may be used to endorse or promote products derived from this
  * software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  * POSSIBILITY OF SUCH DAMAGE.
  */

 #ifndef __MEM_RUBY_SYSTEM_GPU_COALESCER_HH__
 #define __MEM_RUBY_SYSTEM_GPU_COALESCER_HH__

 #include <cassert>
 #include <deque>
 #include <iostream>
 #include <list>
 #include <map>
 #include <sstream>
 #include <string>
 #include <unordered_map>
 #include <vector>

 #include "base/statistics.hh"
 #include "mem/request.hh"
 #include "mem/ruby/common/Address.hh"
 #include "mem/ruby/common/Consumer.hh"
 #include "mem/ruby/protocol/HSAScope.hh"
 #include "mem/ruby/protocol/HSASegment.hh"
 #include "mem/ruby/protocol/PrefetchBit.hh"
 #include "mem/ruby/protocol/RubyAccessMode.hh"
 #include "mem/ruby/protocol/RubyRequestType.hh"
 #include "mem/ruby/protocol/SequencerRequestType.hh"
 #include "mem/ruby/system/Sequencer.hh"
 #include "mem/token_port.hh"

 class DataBlock;
 class CacheMsg;
 class MachineID;
 class CacheMemory;

 class RubyGPUCoalescerParams;

 // Free helpers that take a request and return the corresponding Ruby
 // protocol enum value (HSAScope / HSASegment). Only the declarations are
 // visible in this header.
 // NOTE(review): which request attributes select which enum value is decided
 // by the out-of-line definitions -- confirm there before relying on it.
 HSAScope reqScopeToHSAScope(const RequestPtr &req);
 HSASegment reqSegmentToHSASegment(const RequestPtr &req);

 // The packets that belong to one specific instruction, kept as a list.
 using PerInstPackets = std::list<PacketPtr>;

 // UncoalescedTable only keeps a pointer to its owning coalescer, and the
 // full GPUCoalescer definition appears further down in this header.
 // Declare the name here so this class does not depend on some other header
 // having declared it first.
 class GPUCoalescer;

 /**
  * Holds packets that have not been coalesced yet, grouped by the sequence
  * number of the instruction they belong to (see instMap).
  *
  * All non-inline member functions are defined out of line; the notes on
  * them below describe only what the declarations and the existing comments
  * establish.
  */
 class UncoalescedTable
 {
   public:
     // gc: the coalescer this table belongs to.
     // NOTE(review): presumably stored in `coalescer` -- confirm in the
     // out-of-line constructor.
     UncoalescedTable(GPUCoalescer *gc);
     ~UncoalescedTable() {}

     // NOTE(review): presumably files pkt under its instruction's sequence
     // number in instMap -- confirm in the definition.
     void insertPacket(PacketPtr pkt);
     // NOTE(review): presumably reports whether instMap still holds any
     // packet -- confirm in the definition.
     bool packetAvailable();
     // Takes the stream to print into.
     // NOTE(review): output format is decided by the definition.
     void printRequestTable(std::stringstream& ss);

     // Returns a pointer to the list of packets corresponding to an
     // instruction in the instruction map or nullptr if there are no
     // instructions at the offset.
     PerInstPackets* getInstPackets(int offset);
     void updateResources();

     // Check if a packet hasn't been removed from instMap in too long.
     // Panics if a deadlock is detected and returns nothing otherwise.
     void checkDeadlock(Tick threshold);

   private:
     // Non-owning back-pointer to the coalescer that uses this table.
     GPUCoalescer *coalescer;

     // Maps an instruction's unique sequence number to a queue of packets
     // which need responses. This data structure assumes the sequence number
     // is monotonically increasing (which is true for CU class) in order to
     // issue packets in age order.
     std::map<uint64_t, PerInstPackets> instMap;
 };

 /**
  * One coalesced memory request: the packets that were merged together plus
  * the bookkeeping (instruction sequence number, issue time, Ruby request
  * type) shared by all of them.
  */
 class CoalescedRequest
 {
   public:
     // Starts with no packets, an issue time of Cycles(0) and a request
     // type of RubyRequestType_NULL; callers fill these in via the setters.
     CoalescedRequest(uint64_t _seqNum)
         : seqNum(_seqNum), issueTime(Cycles(0)),
           rubyType(RubyRequestType_NULL)
     {}
     ~CoalescedRequest() {}

     // Appends pkt to the end of this request's packet vector.
     void insertPacket(PacketPtr pkt) { pkts.push_back(pkt); }
     void setSeqNum(uint64_t _seqNum) { seqNum = _seqNum; }
     void setIssueTime(Cycles _issueTime) { issueTime = _issueTime; }
     void setRubyType(RubyRequestType type) { rubyType = type; }

     uint64_t getSeqNum() const { return seqNum; }

     // Returns the packet that was inserted first. At least one packet
     // must have been inserted: reading the front of an empty vector is
     // undefined behaviour, so that precondition is asserted here.
     PacketPtr
     getFirstPkt() const
     {
         assert(!pkts.empty());
         return pkts.front();
     }

     Cycles getIssueTime() const { return issueTime; }
     RubyRequestType getRubyType() const { return rubyType; }

     // Mutable access to every packet in this request, in insertion order.
     std::vector<PacketPtr>& getPackets() { return pkts; }

   private:
     uint64_t seqNum;
     Cycles issueTime;
     RubyRequestType rubyType;
     std::vector<PacketPtr> pkts;
 };

 /**
  * RubyPort specialization for GPU memory traffic. Incoming packets are held
  * per instruction in an UncoalescedTable and merged into CoalescedRequest
  * objects tracked per address in coalescedTable (see coalescePacket()).
  *
  * Several members are protected rather than private so that the VIPER
  * coalescer can derive from this class.
  *
  * The class is non-copyable.
  */
 class GPUCoalescer : public RubyPort
 {
   public:
     /**
      * Token port exposed through getGMTokenPort(). Its packet-receiving
      * hooks are stubs: requests are never accepted through this port and
      * no address ranges are advertised.
      */
     class GMTokenPort : public TokenSlavePort
     {
       public:
         GMTokenPort(const std::string& name, ClockedObject *owner,
                     PortID id = InvalidPortID)
             : TokenSlavePort(name, owner, id)
         { }
         ~GMTokenPort() { }

       protected:
         // Receive an atomic request packet from the peer; always reports
         // a latency of zero ticks.
         Tick recvAtomic(PacketPtr) { return Tick(0); }
         // Receive a functional request packet from the peer; ignored.
         void recvFunctional(PacketPtr) { }
         // Receive a timing request from the peer; always refused.
         bool recvTimingReq(PacketPtr) { return false; }
         // This port is responsible for no address ranges, so the list
         // returned is empty.
         AddrRangeList getAddrRanges() const
         {
             AddrRangeList ranges;
             return ranges;
         }
     };

     typedef RubyGPUCoalescerParams Params;
     GPUCoalescer(const Params *);
     ~GPUCoalescer();

     Port &getPort(const std::string &if_name,
                   PortID idx = InvalidPortID) override;

     // Public Methods
     void wakeup(); // Used only for deadlock detection
     void printRequestTable(std::stringstream& ss);

     void printProgress(std::ostream& out) const;
     void resetStats() override;
     void collateStats();
     void regStats() override;

     // Write-completion callbacks. The overloads differ only in how much
     // information the caller supplies (responding machine type, the three
     // timestamps, region flag).
     // NOTE(review): the shorter overloads presumably forward to the
     // longest one with defaults -- confirm in the definitions.
     void writeCallback(Addr address, DataBlock& data);

     void writeCallback(Addr address,
                        MachineType mach,
                        DataBlock& data);

     void writeCallback(Addr address,
                        MachineType mach,
                        DataBlock& data,
                        Cycles initialRequestTime,
                        Cycles forwardRequestTime,
                        Cycles firstResponseTime,
                        bool isRegion);

     void writeCallback(Addr address,
                        MachineType mach,
                        DataBlock& data,
                        Cycles initialRequestTime,
                        Cycles forwardRequestTime,
                        Cycles firstResponseTime);

     // Read-completion callbacks; same overload structure as writeCallback.
     void readCallback(Addr address, DataBlock& data);

     void readCallback(Addr address,
                       MachineType mach,
                       DataBlock& data);

     void readCallback(Addr address,
                       MachineType mach,
                       DataBlock& data,
                       Cycles initialRequestTime,
                       Cycles forwardRequestTime,
                       Cycles firstResponseTime);

     void readCallback(Addr address,
                       MachineType mach,
                       DataBlock& data,
                       Cycles initialRequestTime,
                       Cycles forwardRequestTime,
                       Cycles firstResponseTime,
                       bool isRegion);
     /* atomics need their own callback because the data
        might be const coming from SLICC */
     void atomicCallback(Addr address,
                         MachineType mach,
                         const DataBlock& data);

     void recordCPReadCallBack(MachineID myMachID, MachineID senderMachID);
     void recordCPWriteCallBack(MachineID myMachID, MachineID senderMachID);

     // Alternate implementations in VIPER Coalescer
     virtual RequestStatus makeRequest(PacketPtr pkt) override;

     // Current value of the global outstanding-request counter.
     int outstandingCount() const override { return m_outstanding_count; }

     // True while deadlockCheckEvent is scheduled.
     bool
     isDeadlockEventScheduled() const override
     {
         return deadlockCheckEvent.scheduled();
     }

     // Removes deadlockCheckEvent from the event queue.
     void
     descheduleDeadlockEvent() override
     {
         deschedule(deadlockCheckEvent);
     }

     bool empty() const;

     void print(std::ostream& out) const;

     void evictionCallback(Addr address);
     void completeIssue();

     void insertKernel(int wavefront_id, PacketPtr pkt);

     GMTokenPort& getGMTokenPort() { return gmTokenPort; }

     void recordRequestType(SequencerRequestType requestType);

     // Accessors for the statistics histograms declared below. The indexed
     // variants dereference the stored pointer without a bounds or null
     // check, so the index must be valid and the entry must be populated.
     Stats::Histogram& getOutstandReqHist() { return m_outstandReqHist; }

     Stats::Histogram& getLatencyHist() { return m_latencyHist; }
     Stats::Histogram& getTypeLatencyHist(uint32_t t)
     { return *m_typeLatencyHist[t]; }

     Stats::Histogram& getMissLatencyHist()
     { return m_missLatencyHist; }
     Stats::Histogram& getMissTypeLatencyHist(uint32_t t)
     { return *m_missTypeLatencyHist[t]; }

     Stats::Histogram& getMissMachLatencyHist(uint32_t t) const
     { return *m_missMachLatencyHist[t]; }

     Stats::Histogram&
     getMissTypeMachLatencyHist(uint32_t r, uint32_t t) const
     { return *m_missTypeMachLatencyHist[r][t]; }

     Stats::Histogram& getIssueToInitialDelayHist(uint32_t t) const
     { return *m_IssueToInitialDelayHist[t]; }

     Stats::Histogram&
     getInitialToForwardDelayHist(const MachineType t) const
     { return *m_InitialToForwardDelayHist[t]; }

     Stats::Histogram&
     getForwardRequestToFirstResponseHist(const MachineType t) const
     { return *m_ForwardToFirstResponseDelayHist[t]; }

     Stats::Histogram&
     getFirstResponseToCompletionDelayHist(const MachineType t) const
     { return *m_FirstResponseToCompletionDelayHist[t]; }

   // Changed to protected to enable inheritance by VIPER Coalescer
   protected:
     bool tryCacheAccess(Addr addr, RubyRequestType type,
                         Addr pc, RubyAccessMode access_mode,
                         int size, DataBlock*& data_ptr);
     // Alternate implementations in VIPER Coalescer
     virtual void issueRequest(CoalescedRequest* crequest);

     void kernelCallback(int wavfront_id);

     void hitCallback(CoalescedRequest* crequest,
                      MachineType mach,
                      DataBlock& data,
                      bool success,
                      Cycles initialRequestTime,
                      Cycles forwardRequestTime,
                      Cycles firstResponseTime,
                      bool isRegion);
     void recordMissLatency(CoalescedRequest* crequest,
                            MachineType mach,
                            Cycles initialRequestTime,
                            Cycles forwardRequestTime,
                            Cycles firstResponseTime,
                            bool success, bool isRegion);
     void completeHitCallback(std::vector<PacketPtr> & mylist);


     virtual RubyRequestType getRequestType(PacketPtr pkt);

     // Attempt to remove a packet from the uncoalescedTable and coalesce
     // with a previous request from the same instruction. If there is no
     // previous instruction and the max number of outstanding requests has
     // not been reached, a new coalesced request is created and added to
     // the "target" list of the coalescedTable.
     bool coalescePacket(PacketPtr pkt);

     EventFunctionWrapper issueEvent;


   // Changed to protected to enable inheritance by VIPER Coalescer
   protected:
     int m_max_outstanding_requests;
     Cycles m_deadlock_threshold;

     CacheMemory* m_dataCache_ptr;
     CacheMemory* m_instCache_ptr;

     // coalescingWindow is the maximum number of instructions that are
     // allowed to be coalesced in a single cycle.
     int coalescingWindow;

     // The uncoalescedTable contains several "columns" which hold memory
     // request packets for an instruction. The maximum size is the number of
     // columns * the wavefront size.
     UncoalescedTable uncoalescedTable;

     // An MSHR-like struct for holding coalesced requests. The requests in
     // this table may or may not be outstanding in the memory hierarchy. The
     // maximum size is equal to the maximum outstanding requests for a CU
     // (typically the number of blocks in TCP). If there are duplicates of
     // an address, they are serviced in age order.
     std::map<Addr, std::deque<CoalescedRequest*>> coalescedTable;

     // Global outstanding request count, across all request tables
     int m_outstanding_count;
     bool m_deadlock_check_scheduled;
     std::unordered_map<int, PacketPtr> kernelEndList;
     std::vector<int> newKernelEnds;

     int m_store_waiting_on_load_cycles;
     int m_store_waiting_on_store_cycles;
     int m_load_waiting_on_store_cycles;
     int m_load_waiting_on_load_cycles;

     bool m_runningGarnetStandalone;

     EventFunctionWrapper deadlockCheckEvent;
     bool assumingRfOCoherence;

     // m5 style stats for TCP hit/miss counts
     Stats::Scalar GPU_TCPLdHits;
     Stats::Scalar GPU_TCPLdTransfers;
     Stats::Scalar GPU_TCCLdHits;
     Stats::Scalar GPU_LdMiss;

     Stats::Scalar GPU_TCPStHits;
     Stats::Scalar GPU_TCPStTransfers;
     Stats::Scalar GPU_TCCStHits;
     Stats::Scalar GPU_StMiss;

     Stats::Scalar CP_TCPLdHits;
     Stats::Scalar CP_TCPLdTransfers;
     Stats::Scalar CP_TCCLdHits;
     Stats::Scalar CP_LdMiss;

     Stats::Scalar CP_TCPStHits;
     Stats::Scalar CP_TCPStTransfers;
     Stats::Scalar CP_TCCStHits;
     Stats::Scalar CP_StMiss;

     // Histogram for number of outstanding requests per cycle.
     Stats::Histogram m_outstandReqHist;

     // Histogram for holding latency profile of all requests.
     Stats::Histogram m_latencyHist;
     std::vector<Stats::Histogram *> m_typeLatencyHist;

     // Histogram for holding latency profile of all requests that miss in
     // the attached controller.
     Stats::Histogram m_missLatencyHist;
     std::vector<Stats::Histogram *> m_missTypeLatencyHist;

     // Histograms for profiling the latencies for requests that required
     // external messages.
     std::vector<Stats::Histogram *> m_missMachLatencyHist;
     std::vector< std::vector<Stats::Histogram *> > m_missTypeMachLatencyHist;

     // Histograms for recording the breakdown of miss latency.
     std::vector<Stats::Histogram *> m_IssueToInitialDelayHist;
     std::vector<Stats::Histogram *> m_InitialToForwardDelayHist;
     std::vector<Stats::Histogram *> m_ForwardToFirstResponseDelayHist;
     std::vector<Stats::Histogram *> m_FirstResponseToCompletionDelayHist;

   private:
     // Token port is used to send/receive tokens to/from GPU's global memory
     // pipeline across the port boundary. There is one per <wave size> data
     // ports in the CU.
     GMTokenPort gmTokenPort;

     // Copying is not supported. Deleting the operations turns any copy
     // attempt, including one made from inside the class, into a
     // compile-time error instead of a link-time one.
     GPUCoalescer(const GPUCoalescer& obj) = delete;
     GPUCoalescer& operator=(const GPUCoalescer& obj) = delete;
 };

 /**
  * Stream-insertion helper for GPUCoalescer: delegates the formatting to
  * GPUCoalescer::print() and flushes the stream before handing it back.
  */
 inline std::ostream&
 operator<<(std::ostream& out, const GPUCoalescer& obj)
 {
     obj.print(out);
     // std::flush returns the stream it was applied to.
     return std::flush(out);
 }

 #endif // __MEM_RUBY_SYSTEM_GPU_COALESCER_HH__
GPUCoalescer::getGMTokenPort
GMTokenPort & getGMTokenPort()
Definition: GPUCoalescer.hh:238

GPUCoalescer::getLatencyHist
Stats::Histogram & getLatencyHist()
Definition: GPUCoalescer.hh:243

CoalescedRequest::CoalescedRequest
CoalescedRequest(uint64_t _seqNum)
Definition: GPUCoalescer.hh:99

Port
Ports are used to interface objects to each other.
Definition: port.hh:56

GPUCoalescer::CP_TCCStHits
Stats::Scalar CP_TCCStHits
Definition: GPUCoalescer.hh:371

GPUCoalescer::issueEvent
EventFunctionWrapper issueEvent
Definition: GPUCoalescer.hh:310

GPUCoalescer::GPU_TCPStHits
Stats::Scalar GPU_TCPStHits
Definition: GPUCoalescer.hh:359

CoalescedRequest::setSeqNum
void setSeqNum(uint64_t _seqNum)
Definition: GPUCoalescer.hh:106

Consumer.hh

Cycles
Cycles is a wrapper class for representing cycle counts, i.e.
Definition: types.hh:81

GPUCoalescer::GMTokenPort::recvTimingReq
bool recvTimingReq(PacketPtr)
Receive a timing request from the peer.
Definition: GPUCoalescer.hh:138

GPUCoalescer::GMTokenPort::~GMTokenPort
~GMTokenPort()
Definition: GPUCoalescer.hh:133

UncoalescedTable::UncoalescedTable
UncoalescedTable(GPUCoalescer *gc)
Definition: GPUCoalescer.cc:116

name
const std::string & name()
Definition: trace.cc:50

GPUCoalescer::m_missLatencyHist
Stats::Histogram m_missLatencyHist
Histogram for holding latency profile of all requests that miss in the controller connected to this s...
Definition: GPUCoalescer.hh:383

CoalescedRequest
Definition: GPUCoalescer.hh:96

TokenSlavePort
Definition: token_port.hh:90

GPUCoalescer::m_ForwardToFirstResponseDelayHist
std::vector< Stats::Histogram * > m_ForwardToFirstResponseDelayHist
Definition: GPUCoalescer.hh:394

InvalidPortID
const PortID InvalidPortID
Definition: types.hh:236

GPUCoalescer::getIssueToInitialDelayHist
Stats::Histogram & getIssueToInitialDelayHist(uint32_t t) const
Definition: GPUCoalescer.hh:259

GPUCoalescer::getFirstResponseToCompletionDelayHist
Stats::Histogram & getFirstResponseToCompletionDelayHist(const MachineType t) const
Definition: GPUCoalescer.hh:271

GPUCoalescer::GMTokenPort::GMTokenPort
GMTokenPort(const std::string &name, ClockedObject *owner, PortID id=InvalidPortID)
Definition: GPUCoalescer.hh:129

request.hh
Declaration of a request, the overall memory request consisting of the parts of the request that are ...

reqSegmentToHSASegment
HSASegment reqSegmentToHSASegment(const RequestPtr &req)
Definition: GPUCoalescer.cc:91

RequestPtr
std::shared_ptr< Request > RequestPtr
Definition: request.hh:81

GPUCoalescer::GPU_TCPLdHits
Stats::Scalar GPU_TCPLdHits
Definition: GPUCoalescer.hh:354

GPUCoalescer::CP_StMiss
Stats::Scalar CP_StMiss
Definition: GPUCoalescer.hh:372

addr
ip6_addr_t addr
Definition: inet.hh:330

GPUCoalescer::GPU_TCCStHits
Stats::Scalar GPU_TCCStHits
Definition: GPUCoalescer.hh:361

GPUCoalescer::deadlockCheckEvent
EventFunctionWrapper deadlockCheckEvent
Definition: GPUCoalescer.hh:350

GPUCoalescer::getMissTypeLatencyHist
Stats::Histogram & getMissTypeLatencyHist(uint32_t t)
Definition: GPUCoalescer.hh:249

CoalescedRequest::getSeqNum
uint64_t getSeqNum() const
Definition: GPUCoalescer.hh:110

GPUCoalescer::CP_LdMiss
Stats::Scalar CP_LdMiss
Definition: GPUCoalescer.hh:367

GPUCoalescer::GPU_TCPLdTransfers
Stats::Scalar GPU_TCPLdTransfers
Definition: GPUCoalescer.hh:355

GPUCoalescer::getForwardRequestToFirstResponseHist
Stats::Histogram & getForwardRequestToFirstResponseHist(const MachineType t) const
Definition: GPUCoalescer.hh:267

ArmISA::offset
Bitfield< 23, 0 > offset
Definition: types.hh:152

GPUCoalescer::CP_TCPLdTransfers
Stats::Scalar CP_TCPLdTransfers
Definition: GPUCoalescer.hh:365

GPUCoalescer::m_missMachLatencyHist
std::vector< Stats::Histogram * > m_missMachLatencyHist
Histograms for profiling the latencies for requests that required external messages.
Definition: GPUCoalescer.hh:388

GPUCoalescer::GMTokenPort
Definition: GPUCoalescer.hh:126

GPUCoalescer::m_max_outstanding_requests
int m_max_outstanding_requests
Definition: GPUCoalescer.hh:315

GPUCoalescer::getMissTypeMachLatencyHist
Stats::Histogram & getMissTypeMachLatencyHist(uint32_t r, uint32_t t) const
Definition: GPUCoalescer.hh:256

GPUCoalescer::m_latencyHist
Stats::Histogram m_latencyHist
Histogram for holding latency profile of all requests.
Definition: GPUCoalescer.hh:378

UncoalescedTable::checkDeadlock
void checkDeadlock(Tick threshold)
Definition: GPUCoalescer.cc:176

DataBlock
Definition: DataBlock.hh:40

CoalescedRequest::getPackets
std::vector< PacketPtr > & getPackets()
Definition: GPUCoalescer.hh:114

statistics.hh
Declaration of Statistics objects.

CoalescedRequest::issueTime
Cycles issueTime
Definition: GPUCoalescer.hh:118

Stats::Scalar
This is a simple scalar statistic, like a counter.
Definition: statistics.hh:2505

std::vector
STL vector class.
Definition: stl.hh:37

ArmISA::id
Bitfield< 33 > id
Definition: miscregs_types.hh:247

GPUCoalescer::CP_TCPStTransfers
Stats::Scalar CP_TCPStTransfers
Definition: GPUCoalescer.hh:370

GPUCoalescer::Params
RubyGPUCoalescerParams Params
Definition: GPUCoalescer.hh:146

GPUCoalescer::getMissMachLatencyHist
Stats::Histogram & getMissMachLatencyHist(uint32_t t) const
Definition: GPUCoalescer.hh:252

type
uint8_t type
Definition: inet.hh:328

MipsISA::pc
Bitfield< 4 > pc
Definition: pra_constants.hh:240

CoalescedRequest::setRubyType
void setRubyType(RubyRequestType type)
Definition: GPUCoalescer.hh:108

CoalescedRequest::getIssueTime
Cycles getIssueTime() const
Definition: GPUCoalescer.hh:112

GPUCoalescer
Definition: GPUCoalescer.hh:123

UncoalescedTable::instMap
std::map< uint64_t, PerInstPackets > instMap
Definition: GPUCoalescer.hh:93

CoalescedRequest::setIssueTime
void setIssueTime(Cycles _issueTime)
Definition: GPUCoalescer.hh:107

GPUCoalescer::GPU_LdMiss
Stats::Scalar GPU_LdMiss
Definition: GPUCoalescer.hh:357

CoalescedRequest::seqNum
uint64_t seqNum
Definition: GPUCoalescer.hh:117

GPUCoalescer::m_dataCache_ptr
CacheMemory * m_dataCache_ptr
Definition: GPUCoalescer.hh:318

Tick
uint64_t Tick
Tick count type.
Definition: types.hh:61

ClockedObject
The ClockedObject class extends the SimObject with a clock and accessor functions to relate ticks to ...
Definition: clocked_object.hh:231

GPUCoalescer::assumingRfOCoherence
bool assumingRfOCoherence
Definition: GPUCoalescer.hh:351

UncoalescedTable::getInstPackets
PerInstPackets * getInstPackets(int offset)
Definition: GPUCoalescer.cc:138

GPUCoalescer::GPU_TCCLdHits
Stats::Scalar GPU_TCCLdHits
Definition: GPUCoalescer.hh:356

GPUCoalescer::GMTokenPort::recvAtomic
Tick recvAtomic(PacketPtr)
Receive an atomic request packet from the peer.
Definition: GPUCoalescer.hh:136

GPUCoalescer::descheduleDeadlockEvent
void descheduleDeadlockEvent() override
Definition: GPUCoalescer.hh:224

GPUCoalescer::m_store_waiting_on_load_cycles
int m_store_waiting_on_load_cycles
Definition: GPUCoalescer.hh:343

Stats::Histogram
A simple histogram stat.
Definition: statistics.hh:2626

UncoalescedTable::updateResources
void updateResources()
Definition: GPUCoalescer.cc:151

GPUCoalescer::m_outstandReqHist
Stats::Histogram m_outstandReqHist
Histogram for number of outstanding requests per cycle.
Definition: GPUCoalescer.hh:375

GPUCoalescer::m_missTypeMachLatencyHist
std::vector< std::vector< Stats::Histogram * > > m_missTypeMachLatencyHist
Definition: GPUCoalescer.hh:389

MipsISA::r
r
Definition: pra_constants.hh:95

ArmISA::ss
Bitfield< 21 > ss
Definition: miscregs_types.hh:56

GPUCoalescer::isDeadlockEventScheduled
bool isDeadlockEventScheduled() const override
Definition: GPUCoalescer.hh:218

std::list
STL list class.
Definition: stl.hh:51

Address.hh

GPUCoalescer::m_InitialToForwardDelayHist
std::vector< Stats::Histogram * > m_InitialToForwardDelayHist
Definition: GPUCoalescer.hh:393

CoalescedRequest::~CoalescedRequest
~CoalescedRequest()
Definition: GPUCoalescer.hh:103

token_port.hh

Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition: types.hh:140

UncoalescedTable
Definition: GPUCoalescer.hh:66

GPUCoalescer::m_load_waiting_on_load_cycles
int m_load_waiting_on_load_cycles
Definition: GPUCoalescer.hh:346

Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e...
Definition: packet.hh:249

UncoalescedTable::coalescer
GPUCoalescer * coalescer
Definition: GPUCoalescer.hh:87

GPUCoalescer::kernelEndList
std::unordered_map< int, PacketPtr > kernelEndList
Definition: GPUCoalescer.hh:340

Sequencer.hh

GPUCoalescer::GPU_StMiss
Stats::Scalar GPU_StMiss
Definition: GPUCoalescer.hh:362

GPUCoalescer::m_IssueToInitialDelayHist
std::vector< Stats::Histogram * > m_IssueToInitialDelayHist
Histograms for recording the breakdown of miss latency.
Definition: GPUCoalescer.hh:392

GPUCoalescer::getOutstandReqHist
Stats::Histogram & getOutstandReqHist()
Definition: GPUCoalescer.hh:241

GPUCoalescer::CP_TCPLdHits
Stats::Scalar CP_TCPLdHits
Definition: GPUCoalescer.hh:364

UncoalescedTable::~UncoalescedTable
~UncoalescedTable()
Definition: GPUCoalescer.hh:70

CoalescedRequest::getRubyType
RubyRequestType getRubyType() const
Definition: GPUCoalescer.hh:113

CacheMemory
Definition: CacheMemory.hh:51

CoalescedRequest::pkts
std::vector< PacketPtr > pkts
Definition: GPUCoalescer.hh:120

CoalescedRequest::insertPacket
void insertPacket(PacketPtr pkt)
Definition: GPUCoalescer.hh:105

GPUCoalescer::m_typeLatencyHist
std::vector< Stats::Histogram * > m_typeLatencyHist
Definition: GPUCoalescer.hh:379

UncoalescedTable::insertPacket
void insertPacket(PacketPtr pkt)
Definition: GPUCoalescer.cc:122

PerInstPackets
std::list< PacketPtr > PerInstPackets
Definition: GPUCoalescer.hh:64

operator<<
std::ostream & operator<<(std::ostream &out, const GPUCoalescer &obj)
Definition: GPUCoalescer.hh:409

GPUCoalescer::getMissLatencyHist
Stats::Histogram & getMissLatencyHist()
Definition: GPUCoalescer.hh:247

GPUCoalescer::getTypeLatencyHist
Stats::Histogram & getTypeLatencyHist(uint32_t t)
Definition: GPUCoalescer.hh:244

GPUCoalescer::coalescingWindow
int coalescingWindow
Definition: GPUCoalescer.hh:323

GPUCoalescer::newKernelEnds
std::vector< int > newKernelEnds
Definition: GPUCoalescer.hh:341

CoalescedRequest::getFirstPkt
PacketPtr getFirstPkt() const
Definition: GPUCoalescer.hh:111

GPUCoalescer::gmTokenPort
GMTokenPort gmTokenPort
Definition: GPUCoalescer.hh:401

reqScopeToHSAScope
HSAScope reqScopeToHSAScope(const RequestPtr &req)
Definition: GPUCoalescer.cc:71

GPUCoalescer::GMTokenPort::getAddrRanges
AddrRangeList getAddrRanges() const
Get a list of the non-overlapping address ranges the owner is responsible for.
Definition: GPUCoalescer.hh:139

GPUCoalescer::outstandingCount
int outstandingCount() const override
Definition: GPUCoalescer.hh:215

EventFunctionWrapper
Definition: eventq.hh:1091

GPUCoalescer::CP_TCPStHits
Stats::Scalar CP_TCPStHits
Definition: GPUCoalescer.hh:369

GPUCoalescer::m_load_waiting_on_store_cycles
int m_load_waiting_on_store_cycles
Definition: GPUCoalescer.hh:345

UncoalescedTable::printRequestTable
void printRequestTable(std::stringstream &ss)
Definition: GPUCoalescer.cc:164

GPUCoalescer::getInitialToForwardDelayHist
Stats::Histogram & getInitialToForwardDelayHist(const MachineType t) const
Definition: GPUCoalescer.hh:263

GPUCoalescer::GMTokenPort::recvFunctional
void recvFunctional(PacketPtr)
Receive a functional request packet from the peer.
Definition: GPUCoalescer.hh:137

CoalescedRequest::rubyType
RubyRequestType rubyType
Definition: GPUCoalescer.hh:119

GPUCoalescer::m_instCache_ptr
CacheMemory * m_instCache_ptr
Definition: GPUCoalescer.hh:319

GPUCoalescer::m_outstanding_count
int m_outstanding_count
Definition: GPUCoalescer.hh:338

GPUCoalescer::uncoalescedTable
UncoalescedTable uncoalescedTable
Definition: GPUCoalescer.hh:328

PortID
int16_t PortID
Port index/ID type, and a symbolic name for an invalid port id.
Definition: types.hh:235

GPUCoalescer::m_deadlock_threshold
Cycles m_deadlock_threshold
Definition: GPUCoalescer.hh:316

MachineID
Definition: MachineID.hh:38

ArmISA::t
Bitfield< 5 > t
Definition: miscregs_types.hh:67

GPUCoalescer::print
void print(std::ostream &out) const
Definition: GPUCoalescer.cc:755

GPUCoalescer::m_runningGarnetStandalone
bool m_runningGarnetStandalone
Definition: GPUCoalescer.hh:348

GPUCoalescer::coalescedTable
std::map< Addr, std::deque< CoalescedRequest * > > coalescedTable
Definition: GPUCoalescer.hh:335

GPUCoalescer::m_FirstResponseToCompletionDelayHist
std::vector< Stats::Histogram * > m_FirstResponseToCompletionDelayHist
Definition: GPUCoalescer.hh:395

GPUCoalescer::m_missTypeLatencyHist
std::vector< Stats::Histogram * > m_missTypeLatencyHist
Definition: GPUCoalescer.hh:384

GPUCoalescer::m_store_waiting_on_store_cycles
int m_store_waiting_on_store_cycles
Definition: GPUCoalescer.hh:344

data
const char data[]
Definition: circlebuf.test.cc:42

RubyPort
Definition: RubyPort.hh:58

GPUCoalescer::GPU_TCPStTransfers
Stats::Scalar GPU_TCPStTransfers
Definition: GPUCoalescer.hh:360

GPUCoalescer::m_deadlock_check_scheduled
bool m_deadlock_check_scheduled
Definition: GPUCoalescer.hh:339

GPUCoalescer::CP_TCCLdHits
Stats::Scalar CP_TCCLdHits
Definition: GPUCoalescer.hh:366

UncoalescedTable::packetAvailable
bool packetAvailable()
Definition: GPUCoalescer.cc:132