release/v19-0-0-0/gpu__tlb_8hh_source.html

 /*
  * Copyright (c) 2011-2015 Advanced Micro Devices, Inc.
  * All rights reserved.
  *
  * For use for simulation and test purposes only
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are met:
  *
  * 1. Redistributions of source code must retain the above copyright notice,
  * this list of conditions and the following disclaimer.
  *
  * 2. Redistributions in binary form must reproduce the above copyright notice,
  * this list of conditions and the following disclaimer in the documentation
  * and/or other materials provided with the distribution.
  *
  * 3. Neither the name of the copyright holder nor the names of its
  * contributors may be used to endorse or promote products derived from this
  * software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
  * POSSIBILITY OF SUCH DAMAGE.
  *
  * Authors: Lisa Hsu
  */

 #ifndef __GPU_TLB_HH__
 #define __GPU_TLB_HH__

 #include <deque>
 #include <fstream>
 #include <list>
 #include <queue>
 #include <string>
 #include <unordered_map>
 #include <vector>

 #include "arch/generic/tlb.hh"
 #include "arch/x86/pagetable.hh"
 #include "arch/x86/pagetable_walker.hh"
 #include "arch/x86/regs/segment.hh"
 #include "base/callback.hh"
 #include "base/logging.hh"
 #include "base/statistics.hh"
 #include "gpu-compute/compute_unit.hh"
 #include "mem/port.hh"
 #include "mem/request.hh"
 #include "params/X86GPUTLB.hh"
 #include "sim/clocked_object.hh"
 #include "sim/sim_object.hh"

 class BaseTLB;
 class Packet;
 class ThreadContext;

 namespace X86ISA
 {
     /**
      * x86 GPU TLB. A ClockedObject that holds a set-organised array of
      * TlbEntry objects, exposes one vector of CPU-side ports and one
      * vector of memory-side ports, and keeps both local (this TLB) and
      * global (CU perspective) hit/miss statistics.
      */
     class GpuTLB : public ClockedObject
     {
       protected:
         friend class Walker;

         typedef std::list<TlbEntry*> EntryList;

         uint32_t configAddress;

         // TLB clock: will inherit clock from shader's clock period in terms
         // of number of ticks of curTime (aka global simulation clock)
         // The assignment of TLB clock from shader clock is done in the python
         // config files.
         int clock;

       public:
         // clock related functions ; maps to-and-from Simulation ticks and
         // object clocks.

         /**
          * @return SimClock::Frequency (ticks per second) divided by the
          *         TLB clock period; clock must be non-zero.
          */
         Tick frequency() const { return SimClock::Frequency / clock; }

         /**
          * Convert a number of TLB cycles into simulation ticks.
          *
          * @param numCycles number of TLB cycles.
          * @return clock * numCycles, computed in the Tick type.
          */
         Tick
         ticks(int numCycles) const
         {
             // Widen the clock period to Tick before multiplying so the
             // product is evaluated in the 64-bit tick type.
             return static_cast<Tick>(clock) * numCycles;
         }

         /** @return the current tick divided by the TLB clock period. */
         Tick curCycle() const { return curTick() / clock; }
         /** @return val divided by the TLB clock period (integer division). */
         Tick tickToCycles(Tick val) const { return val / clock;}

         typedef X86GPUTLBParams Params;
         GpuTLB(const Params *p);
         ~GpuTLB();

         typedef enum BaseTLB::Mode Mode;

         /** Abstract callback interface used to report a translation. */
         class Translation
         {
           public:
             virtual ~Translation() { }

             /**
              * Signal that the translation has been delayed due to a hw page
              * table walk.
              */
             virtual void markDelayed() = 0;

             /**
              * The memory for this object may be dynamically allocated, and
              * it may be responsible for cleaning itself up.
              */
             virtual void finish(Fault fault, const RequestPtr &req,
                                 ThreadContext *tc, Mode mode) = 0;
         };

         void dumpAll();
         TlbEntry *lookup(Addr va, bool update_lru=true);
         void setConfigAddress(uint32_t addr);

       protected:
         EntryList::iterator lookupIt(Addr va, bool update_lru=true);
         Walker *walker;

       public:
         Walker *getWalker();
         void invalidateAll();
         void invalidateNonGlobal();
         void demapPage(Addr va, uint64_t asn);

       protected:
         int size;
         int assoc;
         int numSets;

         // true if this is a fully-associative TLB
         bool FA;
         Addr setMask;

         // Allocation Policy: true if we always allocate on a hit, false
         // otherwise.
         bool allocationPolicy;

         // if true, then this is not the last level TLB
         bool hasMemSidePort;

         // Print out accessDistance stats.
         bool accessDistance;

         std::vector<TlbEntry> tlb;

         /*
          * It's a per-set list. As long as we have not reached
          * the full capacity of the given set, grab an entry from
          * the freeList.
          */
         std::vector<EntryList> freeList;

         // An entryList per set is the equivalent of an LRU stack; it's used
         // to guide replacement decisions.
         std::vector<EntryList> entryList;

         Fault translateInt(const RequestPtr &req, ThreadContext *tc);

         Fault translate(const RequestPtr &req, ThreadContext *tc,
                 Translation *translation, Mode mode, bool &delayedResponse,
                 bool timing, int &latency);

       public:
         // latencies for a TLB hit, miss and page fault
         int hitLatency;
         int missLatency1;
         int missLatency2;

         // local_stats are as seen from the TLB
         // without taking into account coalescing
         Stats::Scalar localNumTLBAccesses;
         Stats::Scalar localNumTLBHits;
         Stats::Scalar localNumTLBMisses;
         Stats::Formula localTLBMissRate;

         // global_stats are as seen from the
         // CU's perspective taking into account
         // all coalesced requests.
         Stats::Scalar globalNumTLBAccesses;
         Stats::Scalar globalNumTLBHits;
         Stats::Scalar globalNumTLBMisses;
         Stats::Formula globalTLBMissRate;

         // from the CU perspective (global)
         Stats::Scalar accessCycles;
         // from the CU perspective (global)
         Stats::Scalar pageTableCycles;
         Stats::Scalar numUniquePages;
         // from the perspective of this TLB
         Stats::Scalar localCycles;
         // from the perspective of this TLB
         Stats::Formula localLatency;
         // I take the avg. per page and then
         // the avg. over all pages.
         Stats::Scalar avgReuseDistance;

         /** Callback to set stat parameters. */
         void regStats() override;
         void updatePageFootprint(Addr virt_page_addr);
         void printAccessPattern();


         Fault translateAtomic(const RequestPtr &req, ThreadContext *tc,
                               Mode mode, int &latency);

         void translateTiming(const RequestPtr &req, ThreadContext *tc,
                              Translation *translation, Mode mode,
                              int &latency);

         Tick doMmuRegRead(ThreadContext *tc, Packet *pkt);
         Tick doMmuRegWrite(ThreadContext *tc, Packet *pkt);

         TlbEntry *insert(Addr vpn, TlbEntry &entry);

         // Checkpointing
         virtual void serialize(CheckpointOut& cp) const override;
         virtual void unserialize(CheckpointIn& cp) override;
         void issueTranslation();
         enum tlbOutcome {TLB_HIT, TLB_MISS, PAGE_WALK, MISS_RETURN};

         /**
          * Only performs a TLB lookup.
          *
          * @return true on a TLB hit and false on a TLB miss.
          */
         bool tlbLookup(const RequestPtr &req,
                        ThreadContext *tc, bool update_stats);

         /**
          * Called on a TLB hit, when a TLB miss returns or when a page
          * fault returns.
          */
         void handleTranslationReturn(Addr addr, tlbOutcome outcome,
                                      PacketPtr pkt);

         /**
          * Called on a TLB hit, when a TLB miss returns or when a page
          * fault returns.
          */
         void handleFuncTranslationReturn(PacketPtr pkt, tlbOutcome outcome);

         /** Do paging protection checks. */
         void pagingProtectionChecks(ThreadContext *tc, PacketPtr pkt,
                                     TlbEntry *tlb_entry, Mode mode);

         void updatePhysAddresses(Addr virt_page_addr, TlbEntry *tlb_entry,
                                  Addr phys_page_addr);

         /**
          * Do the TLB lookup for this coalesced request and schedule
          * another event.
          */
         void issueTLBLookup(PacketPtr pkt);

         // CpuSidePort is the TLB Port closer to the CPU/CU side
         class CpuSidePort : public SlavePort
         {
           public:
             CpuSidePort(const std::string &_name, GpuTLB * gpu_TLB,
                         PortID _index)
                 : SlavePort(_name, gpu_TLB), tlb(gpu_TLB), index(_index) { }

           protected:
             GpuTLB *tlb;
             int index;

             virtual bool recvTimingReq(PacketPtr pkt);
             // Atomic requests are accepted but do nothing; latency is 0.
             virtual Tick recvAtomic(PacketPtr pkt) { return 0; }
             virtual void recvFunctional(PacketPtr pkt);
             virtual void recvRangeChange() { }
             virtual void recvReqRetry();
             // A response retry on this port is treated as a fatal error.
             virtual void recvRespRetry() { panic("recvRespRetry called"); }
             virtual AddrRangeList getAddrRanges() const;
         };

         // MemSidePort is the TLB Port closer to the memory side.
         class MemSidePort : public MasterPort
         {
           public:
             MemSidePort(const std::string &_name, GpuTLB * gpu_TLB,
                         PortID _index)
                 : MasterPort(_name, gpu_TLB), tlb(gpu_TLB), index(_index) { }

             std::deque<PacketPtr> retries;

           protected:
             GpuTLB *tlb;
             int index;

             virtual bool recvTimingResp(PacketPtr pkt);
             // Atomic, functional and range-change callbacks are no-ops.
             virtual Tick recvAtomic(PacketPtr pkt) { return 0; }
             virtual void recvFunctional(PacketPtr pkt) { }
             virtual void recvRangeChange() { }
             virtual void recvReqRetry();
         };

         // TLB ports on the cpu Side
         std::vector<CpuSidePort*> cpuSidePort;
         // TLB ports on the memory side
         std::vector<MemSidePort*> memSidePort;

         /** Get a port with a given name and index. */
         Port &getPort(const std::string &if_name,
                       PortID idx=InvalidPortID) override;

         /** Per-packet translation state carried as a Packet::SenderState. */
         struct TranslationState : public Packet::SenderState
         {
             // TLB mode, read or write
             Mode tlbMode;
             // Thread context associated with this req
             ThreadContext *tc;

             /*
             * TLB entry to be populated and passed back and filled in
             * previous TLBs.  Equivalent to the data cache concept of
             * "data return."
             */
             TlbEntry *tlbEntry;
             // Is this a TLB prefetch request?
             bool prefetch;
             // When was the req for this translation issued
             uint64_t issueTime;
             // Remember where this came from
             std::vector<SlavePort*>ports;

             // keep track of #uncoalesced reqs per packet per TLB level;
             // reqCnt per level >= reqCnt higher level
             std::vector<int> reqCnt;
             // TLB level this packet hit in; 0 if it hit in the page table
             int hitLevel;
             Packet::SenderState *saved;

             // Starts with no TLB entry, issue time 0 and hit level 0.
             TranslationState(Mode tlb_mode, ThreadContext *_tc,
                              bool _prefetch=false,
                              Packet::SenderState *_saved=nullptr)
                 : tlbMode(tlb_mode), tc(_tc), tlbEntry(nullptr),
                   prefetch(_prefetch), issueTime(0),
                   hitLevel(0),saved(_saved) { }
         };

         // maximum number of permitted coalesced requests per cycle
         int maxCoalescedReqs;

         // Current number of outstandings coalesced requests.
         // Should be <= maxCoalescedReqs
         int outstandingReqs;

         void translationReturn(Addr virtPageAddr, tlbOutcome outcome,
                                PacketPtr pkt);

         // A TLBEvent is scheduled after the TLB lookup and helps us take
         // the appropriate actions.
         class TLBEvent : public Event
         {
             private:
                 GpuTLB *tlb;
                 Addr virtPageAddr;
                 // outcome can be TLB_HIT, TLB_MISS, or PAGE_WALK
                 tlbOutcome outcome;
                 PacketPtr pkt;

             public:
                 TLBEvent(GpuTLB *_tlb, Addr _addr, tlbOutcome outcome,
                         PacketPtr _pkt);

                 // Event interface; marked override so a signature drift
                 // against the base class is caught at compile time.
                 void process() override;
                 const char *description() const override;

                 // updateOutcome updates the tlbOutcome of a TLBEvent
                 void updateOutcome(tlbOutcome _outcome);
                 Addr getTLBEventVaddr();
         };

         std::unordered_map<Addr, TLBEvent*> translationReturnEvent;

         // this FIFO queue keeps track of the virt. page addresses
         // that are pending cleanup
         std::queue<Addr> cleanupQueue;

         // the cleanupEvent is scheduled after a TLBEvent triggers in order to
         // free memory and do the required clean-up
         void cleanup();

         EventFunctionWrapper cleanupEvent;

         // Per-page access record; stored in TLBFootprint, which is keyed by
         // the virtual page address. All counters default to zero so that a
         // default-constructed record never holds indeterminate values.
         struct AccessInfo
         {
             unsigned int lastTimeAccessed = 0; // last access to this page
             unsigned int accessesPerPage = 0;
             // need to divide it by accessesPerPage at the end
             unsigned int totalReuseDistance = 0;

             // Helps compute the access distance for this page.
             std::vector<unsigned int> localTLBAccesses;
             unsigned int sumDistance = 0;
             unsigned int meanDistance = 0;
         };

         typedef std::unordered_map<Addr, AccessInfo> AccessPatternTable;
         AccessPatternTable TLBFootprint;

         // Called at the end of simulation to dump page access stats.
         void exitCallback();

         EventFunctionWrapper exitEvent;
     };
 }

 #endif // __GPU_TLB_HH__
MasterPort
A MasterPort is a specialisation of a BaseMasterPort, which implements the default protocol for the t...
Definition: port.hh:75

X86ISA::GpuTLB::assoc
int assoc
Definition: gpu_tlb.hh:136

panic
#define panic(...)
This implements a cprintf based panic() function.
Definition: logging.hh:167

X86ISA::GpuTLB::TLBFootprint
AccessPatternTable TLBFootprint
Definition: gpu_tlb.hh:443

X86ISA::GpuTLB::AccessInfo::accessesPerPage
unsigned int accessesPerPage
Definition: gpu_tlb.hh:425

X86ISA::GpuTLB::Translation
Definition: gpu_tlb.hh:100

logging.hh

X86ISA::GpuTLB::globalTLBMissRate
Stats::Formula globalTLBMissRate
Definition: gpu_tlb.hh:205

Port
Ports are used to interface objects to each other.
Definition: port.hh:60

X86ISA::GpuTLB::allocationPolicy
bool allocationPolicy
Allocation Policy: true if we always allocate on a hit, false otherwise.
Definition: gpu_tlb.hh:149

X86ISA::GpuTLB::localCycles
Stats::Scalar localCycles
Definition: gpu_tlb.hh:213

X86ISA::index
Bitfield< 5, 3 > index
Definition: types.hh:95

X86ISA::GpuTLB::TLBEvent::virtPageAddr
Addr virtPageAddr
Definition: gpu_tlb.hh:386

InvalidPortID
const PortID InvalidPortID
Definition: types.hh:238

X86ISA::GpuTLB::serialize
virtual void serialize(CheckpointOut &cp) const override
Serialize an object.
Definition: gpu_tlb.cc:935

X86ISA::GpuTLB::TranslationState
TLB TranslationState: this currently is a somewhat bastardization of the usage of SenderState...
Definition: gpu_tlb.hh:330

X86ISA::GpuTLB::avgReuseDistance
Stats::Scalar avgReuseDistance
Definition: gpu_tlb.hh:218

X86ISA::GpuTLB::translationReturn
void translationReturn(Addr virtPageAddr, tlbOutcome outcome, PacketPtr pkt)
A TLBEvent is scheduled after the TLB lookup and helps us take the appropriate actions: (e...
Definition: gpu_tlb.cc:1244

X86ISA::GpuTLB::CpuSidePort::recvRespRetry
virtual void recvRespRetry()
Called by the peer if sendTimingResp was called on this protocol (causing recvTimingResp to be called...
Definition: gpu_tlb.hh:275

X86ISA::GpuTLB::CpuSidePort::CpuSidePort
CpuSidePort(const std::string &_name, GpuTLB *gpu_TLB, PortID _index)
Definition: gpu_tlb.hh:262

X86ISA::GpuTLB::handleFuncTranslationReturn
void handleFuncTranslationReturn(PacketPtr pkt, tlbOutcome outcome)
handleFuncTranslationReturn is called on a TLB hit, when a TLB miss returns or when a page fault retu...
Definition: gpu_tlb.cc:1410

X86ISA::GpuTLB::accessCycles
Stats::Scalar accessCycles
Definition: gpu_tlb.hh:208

X86ISA::GpuTLB::localTLBMissRate
Stats::Formula localTLBMissRate
Definition: gpu_tlb.hh:197

X86ISA::GpuTLB::pagingProtectionChecks
void pagingProtectionChecks(ThreadContext *tc, PacketPtr pkt, TlbEntry *tlb_entry, Mode mode)
Do Paging protection checks.
Definition: gpu_tlb.cc:1125

request.hh
Declaration of a request, the overall memory request consisting of the parts of the request that are ...

X86ISA::GpuTLB::invalidateAll
void invalidateAll()
Definition: gpu_tlb.cc:226

RequestPtr
std::shared_ptr< Request > RequestPtr
Definition: request.hh:83

X86ISA::GpuTLB::AccessInfo::meanDistance
unsigned int meanDistance
Definition: gpu_tlb.hh:439

X86ISA::GpuTLB::exitCallback
void exitCallback()
Definition: gpu_tlb.cc:1701

X86ISA::GpuTLB::issueTranslation
void issueTranslation()

X86ISA::GpuTLB::getWalker
Walker * getWalker()
Definition: gpu_tlb.cc:928

X86ISA::GpuTLB::lookupIt
EntryList::iterator lookupIt(Addr va, bool update_lru=true)
Definition: gpu_tlb.cc:183

X86ISA::GpuTLB::numSets
int numSets
Definition: gpu_tlb.hh:137

X86ISA::GpuTLB::tlb
std::vector< TlbEntry > tlb
Definition: gpu_tlb.hh:162

X86ISA::GpuTLB::TranslationState::hitLevel
int hitLevel
Definition: gpu_tlb.hh:354

X86ISA::GpuTLB::translateAtomic
Fault translateAtomic(const RequestPtr &req, ThreadContext *tc, Mode mode, int &latency)
Definition: gpu_tlb.cc:904

X86ISA::GpuTLB::setMask
Addr setMask
Definition: gpu_tlb.hh:143

X86ISA::GpuTLB::MemSidePort
MemSidePort is the TLB Port closer to the memory side. If this is a last level TLB then this port will...
Definition: gpu_tlb.hh:286

X86ISA::GpuTLB::hasMemSidePort
bool hasMemSidePort
if true, then this is not the last level TLB
Definition: gpu_tlb.hh:154

X86ISA::GpuTLB::AccessInfo::totalReuseDistance
unsigned int totalReuseDistance
Definition: gpu_tlb.hh:427

X86ISA::GpuTLB::translate
Fault translate(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode, bool &delayedResponse, bool timing, int &latency)
Definition: gpu_tlb.cc:701

X86ISA::GpuTLB::CpuSidePort::index
int index
Definition: gpu_tlb.hh:268

X86ISA::GpuTLB::getPort
Port & getPort(const std::string &if_name, PortID idx=InvalidPortID) override
Get a port with a given name and index.
Definition: gpu_tlb.cc:135

X86ISA::GpuTLB::doMmuRegRead
Tick doMmuRegRead(ThreadContext *tc, Packet *pkt)

X86ISA::GpuTLB::AccessInfo::lastTimeAccessed
unsigned int lastTimeAccessed
Definition: gpu_tlb.hh:424

SlavePort
A SlavePort is a specialisation of a port.
Definition: port.hh:258

cp
Definition: cprintf.cc:42

X86ISA::GpuTLB::AccessInfo::sumDistance
unsigned int sumDistance
Definition: gpu_tlb.hh:438

ArmISA::mode
Bitfield< 4, 0 > mode
Definition: miscregs_types.hh:73

X86ISA::GpuTLB::translateInt
Fault translateInt(const RequestPtr &req, ThreadContext *tc)
Definition: gpu_tlb.cc:277

X86ISA::GpuTLB::localNumTLBMisses
Stats::Scalar localNumTLBMisses
Definition: gpu_tlb.hh:196

compute_unit.hh

SimClock::Frequency
Tick Frequency
The simulated frequency of curTick(). (In ticks per second)
Definition: core.cc:49

X86ISA::GpuTLB::maxCoalescedReqs
int maxCoalescedReqs
Definition: gpu_tlb.hh:366

ThreadContext
ThreadContext is the external interface to all thread state for anything outside of the CPU...
Definition: thread_context.hh:93

X86ISA::GpuTLB::TranslationState::prefetch
bool prefetch
Definition: gpu_tlb.hh:344

X86ISA::GpuTLB::CpuSidePort
Definition: gpu_tlb.hh:259

statistics.hh
Declaration of Statistics objects.

Stats::Scalar
This is a simple scalar statistic, like a counter.
Definition: statistics.hh:2508

X86ISA::GpuTLB::Mode
enum BaseTLB::Mode Mode
Definition: gpu_tlb.hh:98

std::vector
STL vector class.
Definition: stl.hh:40

X86ISA::GpuTLB::insert
TlbEntry * insert(Addr vpn, TlbEntry &entry)
Definition: gpu_tlb.cc:157

X86ISA::val
Bitfield< 63 > val
Definition: misc.hh:771

X86ISA::GpuTLB::TLBEvent::tlb
GpuTLB * tlb
Definition: gpu_tlb.hh:385

X86ISA::GpuTLB::walker
Walker * walker
Definition: gpu_tlb.hh:126

pagetable.hh

X86ISA::GpuTLB::MISS_RETURN
Definition: gpu_tlb.hh:241

segment.hh

X86ISA::GpuTLB::numUniquePages
Stats::Scalar numUniquePages
Definition: gpu_tlb.hh:211

BaseTLB
Definition: tlb.hh:52

X86ISA::GpuTLB::size
int size
Definition: gpu_tlb.hh:135

X86ISA::GpuTLB::globalNumTLBMisses
Stats::Scalar globalNumTLBMisses
Definition: gpu_tlb.hh:204

X86ISA::GpuTLB::tickToCycles
Tick tickToCycles(Tick val) const
Definition: gpu_tlb.hh:92

X86ISA::GpuTLB::cleanupQueue
std::queue< Addr > cleanupQueue
Definition: gpu_tlb.hh:409

X86ISA::GpuTLB::memSidePort
std::vector< MemSidePort * > memSidePort
Definition: gpu_tlb.hh:309

X86ISA::GpuTLB::accessDistance
bool accessDistance
Print out accessDistance stats.
Definition: gpu_tlb.hh:160

curTick
Tick curTick()
The current simulated tick.
Definition: core.hh:47

X86ISA::GpuTLB::Translation::markDelayed
virtual void markDelayed()=0
Signal that the translation has been delayed due to a hw page table walk.

X86ISA::GpuTLB::translateTiming
void translateTiming(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode, int &latency)
Definition: gpu_tlb.cc:914

X86ISA::GpuTLB::MemSidePort::retries
std::deque< PacketPtr > retries
Definition: gpu_tlb.hh:293

X86ISA::GpuTLB::MemSidePort::index
int index
Definition: gpu_tlb.hh:297

X86ISA::GpuTLB::Translation::finish
virtual void finish(Fault fault, const RequestPtr &req, ThreadContext *tc, Mode mode)=0
The memory for this object may be dynamically allocated, and it may be responsible for cleaning itself...

X86ISA::GpuTLB::exitEvent
EventFunctionWrapper exitEvent
Definition: gpu_tlb.hh:448

X86ISA::GpuTLB::localLatency
Stats::Formula localLatency
Definition: gpu_tlb.hh:215

X86ISA::GpuTLB::TranslationState::tlbMode
Mode tlbMode
Definition: gpu_tlb.hh:333

X86ISA::GpuTLB::EntryList
std::list< TlbEntry * > EntryList
Definition: gpu_tlb.hh:70

X86ISA::GpuTLB::MemSidePort::recvAtomic
virtual Tick recvAtomic(PacketPtr pkt)
Definition: gpu_tlb.hh:300

X86ISA::GpuTLB::outstandingReqs
int outstandingReqs
Definition: gpu_tlb.hh:370

X86ISA::GpuTLB::entryList
std::vector< EntryList > entryList
An entryList per set is the equivalent of an LRU stack; it's used to guide replacement decisions...
Definition: gpu_tlb.hh:178

X86ISA::GpuTLB::invalidateNonGlobal
void invalidateNonGlobal()
Definition: gpu_tlb.cc:246

X86ISA::GpuTLB::TranslationState::tlbEntry
TlbEntry * tlbEntry
Definition: gpu_tlb.hh:342

X86ISA::GpuTLB::TranslationState::tc
ThreadContext * tc
Definition: gpu_tlb.hh:335

callback.hh

X86ISA::GpuTLB::TranslationState::issueTime
uint64_t issueTime
Definition: gpu_tlb.hh:346

Tick
uint64_t Tick
Tick count type.
Definition: types.hh:63

X86ISA::TlbEntry
Definition: pagetable.hh:66

X86ISA::GpuTLB::setConfigAddress
void setConfigAddress(uint32_t addr)
Definition: gpu_tlb.cc:240

ClockedObject
The ClockedObject class extends the SimObject with a clock and accessor functions to relate ticks to ...
Definition: clocked_object.hh:237

X86ISA::GpuTLB::MemSidePort::MemSidePort
MemSidePort(const std::string &_name, GpuTLB *gpu_TLB, PortID _index)
Definition: gpu_tlb.hh:289

X86ISA::GpuTLB::cleanupEvent
EventFunctionWrapper cleanupEvent
Definition: gpu_tlb.hh:415

X86ISA::GpuTLB::MemSidePort::tlb
GpuTLB * tlb
Definition: gpu_tlb.hh:296

X86ISA::GpuTLB::AccessInfo
This hash map will use the virtual page address as a key and will keep track of total number of acces...
Definition: gpu_tlb.hh:422

clocked_object.hh
ClockedObject declaration and implementation.

X86ISA::GpuTLB::clock
int clock
Definition: gpu_tlb.hh:78

X86ISA::GpuTLB::Params
X86GPUTLBParams Params
Definition: gpu_tlb.hh:94

X86ISA::GpuTLB::demapPage
void demapPage(Addr va, uint64_t asn)
Definition: gpu_tlb.cc:264

X86ISA::GpuTLB::MemSidePort::recvRangeChange
virtual void recvRangeChange()
Called to receive an address range change from the peer slave port.
Definition: gpu_tlb.hh:302

X86ISA::GpuTLB::translationReturnEvent
std::unordered_map< Addr, TLBEvent * > translationReturnEvent
Definition: gpu_tlb.hh:405

port.hh
Port Object Declaration.

X86ISA::GpuTLB::hitLatency
int hitLatency
Definition: gpu_tlb.hh:188

X86ISA::GpuTLB::PAGE_WALK
Definition: gpu_tlb.hh:241

X86ISA::GpuTLB::handleTranslationReturn
void handleTranslationReturn(Addr addr, tlbOutcome outcome, PacketPtr pkt)
handleTranslationReturn is called on a TLB hit, when a TLB miss returns or when a page fault returns...
Definition: gpu_tlb.cc:1159

std::list< TlbEntry * >

X86ISA::GpuTLB::TLBEvent
Definition: gpu_tlb.hh:382

X86ISA::GpuTLB::MemSidePort::recvFunctional
virtual void recvFunctional(PacketPtr pkt)
Definition: gpu_tlb.hh:301

X86ISA::GpuTLB::cpuSidePort
std::vector< CpuSidePort * > cpuSidePort
Definition: gpu_tlb.hh:307

X86ISA::GpuTLB::lookup
TlbEntry * lookup(Addr va, bool update_lru=true)
Definition: gpu_tlb.cc:213

X86ISA::GpuTLB::globalNumTLBAccesses
Stats::Scalar globalNumTLBAccesses
Definition: gpu_tlb.hh:202

X86ISA::GpuTLB::TLB_MISS
Definition: gpu_tlb.hh:241

Addr
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition: types.hh:142

pagetable_walker.hh

X86ISA::GpuTLB::TranslationState::saved
Packet::SenderState * saved
Definition: gpu_tlb.hh:355

X86ISA::GpuTLB::freeList
std::vector< EntryList > freeList
Definition: gpu_tlb.hh:169

CheckpointIn
Definition: serialize.hh:72

Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e...
Definition: packet.hh:255

ArmISA::va
Bitfield< 8 > va
Definition: miscregs_types.hh:274

Packet::SenderState
A virtual base opaque structure used to hold state associated with the packet (e.g., an MSHR), specific to a SimObject that sees the packet.
Definition: packet.hh:403

std::deque
STL deque class.
Definition: stl.hh:47

X86ISA::GpuTLB::AccessPatternTable
std::unordered_map< Addr, AccessInfo > AccessPatternTable
Definition: gpu_tlb.hh:442

X86ISA::GpuTLB::regStats
void regStats() override
Callback to set stat parameters.
Definition: gpu_tlb.cc:945

Stats::Formula
A formula for statistics that is calculated when printed.
Definition: statistics.hh:3012

BaseTLB::Mode
Mode
Definition: tlb.hh:59

X86ISA::GpuTLB::unserialize
virtual void unserialize(CheckpointIn &cp) override
Unserialize an object.
Definition: gpu_tlb.cc:940

X86ISA::GpuTLB::CpuSidePort::recvAtomic
virtual Tick recvAtomic(PacketPtr pkt)
Receive an atomic request packet from the peer.
Definition: gpu_tlb.hh:271

X86ISA::GpuTLB::configAddress
uint32_t configAddress
Definition: gpu_tlb.hh:72

X86ISA::GpuTLB::CpuSidePort::tlb
GpuTLB * tlb
Definition: gpu_tlb.hh:267

X86ISA::GpuTLB::AccessInfo::localTLBAccesses
std::vector< unsigned int > localTLBAccesses
The field below will help us compute the access distance, that is the number of (coalesced) TLB acces...
Definition: gpu_tlb.hh:437

CheckpointOut
std::ostream CheckpointOut
Definition: serialize.hh:68

X86ISA
This is exposed globally, independent of the ISA.
Definition: acpi.hh:57

X86ISA::GpuTLB::missLatency2
int missLatency2
Definition: gpu_tlb.hh:190

X86ISA::GpuTLB::tlbOutcome
tlbOutcome
Definition: gpu_tlb.hh:241

X86ISA::GpuTLB::TranslationState::ports
std::vector< SlavePort * > ports
Definition: gpu_tlb.hh:348

Event
Definition: eventq.hh:189

EventFunctionWrapper
Definition: eventq.hh:819

X86ISA::GpuTLB::curCycle
Tick curCycle() const
Definition: gpu_tlb.hh:91

X86ISA::GpuTLB::cleanup
void cleanup()
Definition: gpu_tlb.cc:1642

X86ISA::GpuTLB::frequency
Tick frequency() const
Definition: gpu_tlb.hh:83

sim_object.hh

X86ISA::GpuTLB::TLB_HIT
Definition: gpu_tlb.hh:241

X86ISA::GpuTLB::missLatency1
int missLatency1
Definition: gpu_tlb.hh:189

X86ISA::GpuTLB::pageTableCycles
Stats::Scalar pageTableCycles
Definition: gpu_tlb.hh:210

X86ISA::GpuTLB::ticks
Tick ticks(int numCycles) const
Definition: gpu_tlb.hh:86

X86ISA::GpuTLB::localNumTLBHits
Stats::Scalar localNumTLBHits
Definition: gpu_tlb.hh:195

X86ISA::GpuTLB::~GpuTLB
~GpuTLB()
Definition: gpu_tlb.cc:128

X86ISA::GpuTLB::TranslationState::TranslationState
TranslationState(Mode tlb_mode, ThreadContext *_tc, bool _prefetch=false, Packet::SenderState *_saved=nullptr)
Definition: gpu_tlb.hh:357

X86ISA::GpuTLB::updatePhysAddresses
void updatePhysAddresses(Addr virt_page_addr, TlbEntry *tlb_entry, Addr phys_page_addr)

PortID
int16_t PortID
Port index/ID type, and a symbolic name for an invalid port id.
Definition: types.hh:237

X86ISA::p
Bitfield< 0 > p
Definition: pagetable.hh:152

X86ISA::GpuTLB::GpuTLB
GpuTLB(const Params *p)
Definition: gpu_tlb.cc:63

X86ISA::GpuTLB::doMmuRegWrite
Tick doMmuRegWrite(ThreadContext *tc, Packet *pkt)

tlb.hh

X86ISA::Walker
Definition: pagetable_walker.hh:58

X86ISA::GpuTLB::CpuSidePort::recvRangeChange
virtual void recvRangeChange()
Definition: gpu_tlb.hh:273

X86ISA::GpuTLB::FA
bool FA
true if this is a fully-associative TLB
Definition: gpu_tlb.hh:142

X86ISA::GpuTLB::localNumTLBAccesses
Stats::Scalar localNumTLBAccesses
Definition: gpu_tlb.hh:194

X86ISA::GpuTLB::Translation::~Translation
virtual ~Translation()
Definition: gpu_tlb.hh:103

X86ISA::GpuTLB::globalNumTLBHits
Stats::Scalar globalNumTLBHits
Definition: gpu_tlb.hh:203

Fault
std::shared_ptr< FaultBase > Fault
Definition: types.hh:240

X86ISA::addr
Bitfield< 3 > addr
Definition: types.hh:81

X86ISA::GpuTLB::TLBEvent::outcome
tlbOutcome outcome
outcome can be TLB_HIT, TLB_MISS, or PAGE_WALK
Definition: gpu_tlb.hh:390

X86ISA::GpuTLB::TranslationState::reqCnt
std::vector< int > reqCnt
Definition: gpu_tlb.hh:352

X86ISA::GpuTLB::TLBEvent::pkt
PacketPtr pkt
Definition: gpu_tlb.hh:391

X86ISA::GpuTLB::issueTLBLookup
void issueTLBLookup(PacketPtr pkt)
Do the TLB lookup for this coalesced request and schedule another event <TLB access latency> c...
Definition: gpu_tlb.cc:1033

X86ISA::GpuTLB::tlbLookup
bool tlbLookup(const RequestPtr &req, ThreadContext *tc, bool update_stats)
TLB_lookup will only perform a TLB lookup returning true on a TLB hit and false on a TLB miss...
Definition: gpu_tlb.cc:652

X86ISA::GpuTLB
Definition: gpu_tlb.hh:65

X86ISA::GpuTLB::dumpAll
void dumpAll()

X86ISA::GpuTLB::updatePageFootprint
void updatePageFootprint(Addr virt_page_addr)
Definition: gpu_tlb.cc:1666

X86ISA::GpuTLB::printAccessPattern
void printAccessPattern()