Go to the documentation of this file.
55 #include "debug/GPUPrefetch.hh"
56 #include "debug/GPUTLB.hh"
72 exitEvent([
this]{ exitCallback(); },
name()), stats(
this)
86 for (
int set = 0; set <
numSets; ++set) {
87 for (
int way = 0; way <
assoc; ++way) {
110 cprintf(
"Forcing maxCoalescedReqs to %d (TLB assoc.) \n",
assoc);
119 for (
size_t i = 0;
i <
p.port_cpu_side_ports_connection_count; ++
i) {
125 for (
size_t i = 0;
i <
p.port_mem_side_ports_connection_count; ++
i) {
141 if (if_name ==
"cpu_side_ports") {
143 panic(
"TLBCoalescer::getPort: unknown index %d\n", idx);
147 }
else if (if_name ==
"mem_side_ports") {
149 panic(
"TLBCoalescer::getPort: unknown index %d\n", idx);
156 panic(
"TLBCoalescer::getPort: unknown port %s\n", if_name);
180 newEntry->
vaddr = vpn;
186 GpuTLB::EntryList::iterator
196 for (; entry !=
entryList[set].end(); ++entry) {
197 int page_size = (*entry)->size();
199 if ((*entry)->vaddr <=
va && (*entry)->vaddr + page_size >
va) {
200 DPRINTF(GPUTLB,
"Matched vaddr %#x to entry starting at %#x "
201 "with size %#x.\n",
va, (*entry)->vaddr, page_size);
232 DPRINTF(GPUTLB,
"Invalidating all entries.\n");
252 DPRINTF(GPUTLB,
"Invalidating all non global entries.\n");
257 if (!(*entryIt)->global) {
305 DPRINTF(GPUTLB,
"Addresses references internal memory.\n");
310 panic(
"CPUID memory space not yet implemented!\n");
316 return std::make_shared<GeneralProtection>(0);
318 req->setLocalAccessor(
321 return localMiscRegAccess(read, regNum, tc, pkt);
333 assert(!(IOPort & ~0xFFFF));
334 if (IOPort == 0xCF8 && req->getSize() == 4) {
335 req->setLocalAccessor(
338 return localMiscRegAccess(
342 }
else if ((IOPort & ~
mask(2)) == 0xCFC) {
359 panic(
"Access to unrecognized internal address space %#x.\n",
375 bool tlb_hit =
false;
377 uint32_t flags = req->getFlags();
387 DPRINTF(GPUTLB,
"In protected mode.\n");
389 assert(m5Reg.mode == LongMode);
393 DPRINTF(GPUTLB,
"Paging enabled.\n");
423 bool &delayedResponse,
bool timing,
int &latency)
425 uint32_t flags = req->getFlags();
435 delayedResponse =
false;
443 DPRINTF(GPUTLB,
"In protected mode.\n");
445 if (m5Reg.mode != LongMode) {
446 DPRINTF(GPUTLB,
"Not in long mode. Checking segment "
453 return std::make_shared<GeneralProtection>(0);
462 return std::make_shared<GeneralProtection>(0);
465 return std::make_shared<GeneralProtection>(0);
479 if ((csAttr.defaultSize && sizeOverride) ||
480 (!csAttr.defaultSize && !sizeOverride)) {
488 DPRINTF(GPUTLB,
"Checking an expand down segment.\n");
489 warn_once(
"Expand down segments are untested.\n");
492 return std::make_shared<GeneralProtection>(0);
495 return std::make_shared<GeneralProtection>(0);
501 DPRINTF(GPUTLB,
"Paging enabled.\n");
513 fatal(
"GpuTLB doesn't support full-system mode\n");
515 DPRINTF(GPUTLB,
"Handling a TLB miss for address %#x "
528 pte =
p->pTable->lookup(
vaddr);
532 return std::make_shared<PageFault>(
vaddr,
true,
536 Addr alignedVaddr =
p->pTable->pageAlign(
vaddr);
538 DPRINTF(GPUTLB,
"Mapping %#x to %#x\n",
539 alignedVaddr, pte->
paddr);
541 TlbEntry gpuEntry(
p->pid(), alignedVaddr,
542 pte->
paddr,
false,
false);
543 entry =
insert(alignedVaddr, gpuEntry);
546 DPRINTF(GPUTLB,
"Miss was serviced.\n");
557 bool inUser = (m5Reg.cpl == 3 &&
561 bool badWrite = (!entry->
writable && (inUser || cr0.wp));
568 return std::make_shared<PageFault>(
vaddr,
true,
mode,
572 if (storeCheck && badWrite) {
575 return std::make_shared<PageFault>(
vaddr,
true,
581 DPRINTF(GPUTLB,
"Entry found with paddr %#x, doing protection "
582 "checks.\n", entry->
paddr);
584 int page_size = entry->
size();
586 DPRINTF(GPUTLB,
"Translated %#x -> %#x.\n",
vaddr, paddr);
587 req->setPaddr(paddr);
593 DPRINTF(GPUTLB,
"Paging disabled.\n");
595 req->setPaddr(
vaddr);
599 DPRINTF(GPUTLB,
"In real mode.\n");
601 req->setPaddr(
vaddr);
606 LocalApicBase localApicBase =
610 Addr paddr = req->getPaddr();
612 if (baseAddr <= paddr && baseAddr + PageBytes > paddr) {
627 bool delayedResponse;
637 bool delayedResponse;
641 delayedResponse,
true, latency);
643 if (!delayedResponse)
681 bool update_stats = !sender_state->
isPrefetch;
684 DPRINTF(GPUTLB,
"Translation req. for virt. page addr %#x\n",
687 int req_cnt = sender_state->
reqCnt.back();
700 bool success =
tlbLookup(tmp_req, tmp_tc, update_stats);
734 new TLBEvent(
this, virt_page_addr, lookup_outcome, pkt);
737 panic(
"Virtual Page Address %#x already has a return event\n",
744 DPRINTF(GPUTLB,
"schedule translationReturnEvent @ curTick %d\n",
752 :
Event(CPU_Tick_Pri),
tlb(_tlb), virtPageAddr(_addr),
753 outcome(tlb_outcome), pkt(_pkt)
766 uint32_t flags = pkt->
req->getFlags();
774 bool badWrite = (!tlb_entry->
writable && (inUser || cr0.wp));
776 if ((inUser && !tlb_entry->
user) ||
781 panic(
"Page fault detected");
784 if (storeCheck && badWrite) {
787 panic(
"Page fault detected");
812 DPRINTF(GPUTLB,
"Translation Done - TLB Hit for addr %#x\n",
814 local_entry = sender_state->
tlbEntry;
816 DPRINTF(GPUTLB,
"Translation Done - TLB Miss for addr %#x\n",
826 local_entry = new_entry;
829 DPRINTF(GPUTLB,
"allocating entry w/ addr %#x\n",
832 local_entry =
insert(virt_page_addr, *new_entry);
843 DPRINTF(GPUTLB,
"Entry found with vaddr %#x, doing protection checks "
844 "while paddr was %#x.\n", local_entry->
vaddr,
848 int page_size = local_entry->
size();
850 DPRINTF(GPUTLB,
"Translated %#x -> %#x.\n",
vaddr, paddr);
858 pkt->
req->setPaddr(paddr);
887 DPRINTF(GPUTLB,
"Triggered TLBEvent for addr %#x\n", virtPageAddr);
895 int req_cnt = tmp_sender_state->
reqCnt.back();
896 bool update_stats = !tmp_sender_state->
isPrefetch;
909 DPRINTF(GPUTLB,
"This is a TLB miss\n");
930 DPRINTF(GPUTLB,
"Failed sending translation request to "
931 "lower level TLB for addr %#x\n", virtPageAddr);
935 DPRINTF(GPUTLB,
"Sent translation request to lower level "
936 "TLB for addr %#x\n", virtPageAddr);
940 DPRINTF(GPUTLB,
"Last level TLB - start a page walk for "
941 "addr %#x\n", virtPageAddr);
957 DPRINTF(GPUTLB,
"Doing a page walk for address %#x\n",
966 Addr alignedVaddr =
p->pTable->pageAlign(
vaddr);
967 assert(alignedVaddr == virtPageAddr);
972 pte =
p->pTable->lookup(
vaddr);
976 DPRINTF(GPUTLB,
"Mapping %#x to %#x\n", alignedVaddr,
993 panic(
"Unexpected TLB outcome %d", outcome);
1000 tlb->translationReturn(virtPageAddr, outcome, pkt);
1006 return "trigger translationDoneEvent";
1018 return virtPageAddr;
1030 if (
tlb->outstandingReqs <
tlb->maxCoalescedReqs) {
1031 tlb->issueTLBLookup(pkt);
1033 tlb->outstandingReqs++;
1036 DPRINTF(GPUTLB,
"Reached maxCoalescedReqs number %d\n",
1037 tlb->outstandingReqs);
1063 DPRINTF(GPUTLB,
"Functional Translation Done - TLB hit for addr "
1066 local_entry = sender_state->
tlbEntry;
1068 DPRINTF(GPUTLB,
"Functional Translation Done - TLB miss for addr "
1076 new_entry = sender_state->
tlbEntry;
1078 local_entry = new_entry;
1083 DPRINTF(GPUTLB,
"allocating entry w/ addr %#x\n",
1086 local_entry =
insert(virt_page_addr, *new_entry);
1089 assert(local_entry);
1092 DPRINTF(GPUTLB,
"Entry found with vaddr %#x, doing protection checks "
1093 "while paddr was %#x.\n", local_entry->
vaddr,
1094 local_entry->
paddr);
1110 int page_size = local_entry->
size();
1112 DPRINTF(GPUTLB,
"Translated %#x -> %#x.\n",
vaddr, paddr);
1114 pkt->
req->setPaddr(paddr);
1129 bool update_stats = !sender_state->
isPrefetch;
1135 tlb->updatePageFootprint(virt_page_addr);
1138 bool success =
tlb->tlbLookup(pkt->
req, tc, update_stats);
1144 tlb->stats.globalNumTLBAccesses++;
1148 tlb->stats.globalNumTLBHits++;
1154 tlb->stats.globalNumTLBMisses++;
1155 if (
tlb->hasMemSidePort) {
1157 tlb->memSidePort[0]->sendFunctional(pkt);
1163 DPRINTF(GPUTLB,
"Doing a page walk for address %#x\n",
1170 Addr alignedVaddr =
p->pTable->pageAlign(
vaddr);
1171 assert(alignedVaddr == virt_page_addr);
1174 p->pTable->lookup(
vaddr);
1177 pte =
p->pTable->lookup(
vaddr);
1185 DPRINTF(GPUTLB,
"Mapping %#x to %#x\n", alignedVaddr,
1190 pte->
paddr,
false,
false);
1197 DPRINTF(GPUTLB,
"Mapping %#x to %#x\n", alignedVaddr,
1202 pte->
paddr,
false,
false);
1204 DPRINTF(GPUPrefetch,
"Prefetch failed %#x\n",
1214 DPRINTF(GPUPrefetch,
"Functional Hit for vaddr %#x\n",
1215 tlb->lookup(pkt->
req->getVaddr()));
1231 tlb->handleFuncTranslationReturn(pkt, tlb_outcome);
1239 panic(
"recvReqRetry called");
1262 DPRINTF(GPUTLB,
"MemSidePort recvTiming for virt_page_addr %#x\n",
1265 TLBEvent *tlb_event =
tlb->translationReturnEvent[virt_page_addr];
1280 panic(
"recvReqRetry called");
1292 delete old_tlb_event;
1321 AccessPatternTable::value_type(virt_page_addr, tmp_access_info));
1323 bool first_page_access = ret.second;
1325 if (first_page_access) {
1328 int accessed_before;
1329 accessed_before =
curTick() - ret.first->second.lastTimeAccessed;
1330 ret.first->second.totalReuseDistance += accessed_before;
1333 ret.first->second.accessesPerPage++;
1334 ret.first->second.lastTimeAccessed =
curTick();
1337 ret.first->second.localTLBAccesses
1345 std::ostream *page_stat_file =
nullptr;
1356 <<
"page,max_access_distance,mean_access_distance, "
1357 <<
"stddev_distance" << std::endl;
1361 unsigned int sum_avg_reuse_distance_per_page = 0;
1365 sum_avg_reuse_distance_per_page += iter.second.totalReuseDistance /
1366 iter.second.accessesPerPage;
1369 unsigned int tmp = iter.second.localTLBAccesses[0];
1370 unsigned int prev = tmp;
1372 for (
int i = 0;
i < iter.second.localTLBAccesses.size(); ++
i) {
1377 prev = iter.second.localTLBAccesses[
i];
1380 iter.second.localTLBAccesses[
i] -= tmp;
1383 iter.second.sumDistance +=
1384 iter.second.localTLBAccesses[
i];
1387 iter.second.meanDistance =
1388 iter.second.sumDistance / iter.second.accessesPerPage;
1392 unsigned int max_distance = 0;
1393 unsigned int stddev_distance = 0;
1395 for (
int i = 0;
i < iter.second.localTLBAccesses.size(); ++
i) {
1396 unsigned int tmp_access_distance =
1397 iter.second.localTLBAccesses[
i];
1399 if (tmp_access_distance > max_distance) {
1400 max_distance = tmp_access_distance;
1404 tmp_access_distance - iter.second.meanDistance;
1405 stddev_distance += pow(diff, 2);
1410 sqrt(stddev_distance/iter.second.accessesPerPage);
1412 if (page_stat_file) {
1413 *page_stat_file << std::hex << iter.first <<
",";
1414 *page_stat_file << std::dec << max_distance <<
",";
1415 *page_stat_file << std::dec << iter.second.meanDistance
1417 *page_stat_file << std::dec << stddev_distance;
1418 *page_stat_file << std::endl;
1422 iter.second.localTLBAccesses.clear();
1436 : statistics::
Group(parent),
1437 ADD_STAT(localNumTLBAccesses,
"Number of TLB accesses"),
1438 ADD_STAT(localNumTLBHits,
"Number of TLB hits"),
1439 ADD_STAT(localNumTLBMisses,
"Number of TLB misses"),
1440 ADD_STAT(localTLBMissRate,
"TLB miss rate"),
1441 ADD_STAT(globalNumTLBAccesses,
"Number of TLB accesses"),
1442 ADD_STAT(globalNumTLBHits,
"Number of TLB hits"),
1443 ADD_STAT(globalNumTLBMisses,
"Number of TLB misses"),
1444 ADD_STAT(globalTLBMissRate,
"TLB miss rate"),
1445 ADD_STAT(accessCycles,
"Cycles spent accessing this TLB level"),
1446 ADD_STAT(pageTableCycles,
"Cycles spent accessing the page table"),
1447 ADD_STAT(numUniquePages,
"Number of unique pages touched"),
1448 ADD_STAT(localCycles,
"Number of cycles spent in queue for all "
1450 ADD_STAT(localLatency,
"Avg. latency over incoming coalesced reqs"),
1451 ADD_STAT(avgReuseDistance,
"avg. reuse distance over all pages (in "
Tick curTick()
The universal simulation clock.
#define fatal(...)
This implements a cprintf based fatal() function.
int16_t PortID
Port index/ID type, and a symbolic name for an invalid port id.
statistics::Scalar numUniquePages
virtual RegVal readMiscReg(RegIndex misc_reg)=0
static MiscRegIndex MISCREG_SEG_SEL(int index)
constexpr decltype(nullptr) NoFault
GpuTLBStats(statistics::Group *parent)
statistics::Scalar accessCycles
@ STRICT_ORDER
The request is required to be strictly ordered by CPU models and is non-speculative.
void cprintf(const char *format, const Args &...args)
virtual void recvFunctional(PacketPtr pkt)
Receive a functional request packet from the peer.
void translationReturn(Addr virtPageAddr, tlbOutcome outcome, PacketPtr pkt)
A TLBEvent is scheduled after the TLB lookup and helps us take the appropriate actions: (e....
gem5::X86ISA::GpuTLB::GpuTLBStats stats
std::vector< MemSidePort * > memSidePort
statistics::Scalar avgReuseDistance
static Addr x86LocalAPICAddress(const uint8_t id, const uint16_t addr)
const Addr IntAddrPrefixMSR
void setData(const uint8_t *p)
Copy data into the packet from the provided pointer.
statistics::Scalar localNumTLBAccesses
static MiscRegIndex MISCREG_SEG_LIMIT(int index)
@ UNCACHEABLE
The request is to an uncacheable address.
RequestPtr req
A pointer to the original request.
static MiscRegIndex MISCREG_SEG_ATTR(int index)
unsigned int totalReuseDistance
statistics::Formula localTLBMissRate
virtual ContextID contextId() const =0
void schedule(Event &event, Tick when)
OutputStream * create(const std::string &name, bool binary=false, bool no_gz=false)
Creates a file in this directory (optionally compressed).
TlbEntry * lookup(Addr va, bool update_lru=true)
virtual Addr instAddr() const =0
std::string csprintf(const char *format, const Args &...args)
BitfieldType< SegDescriptorLimit > limit
statistics::Formula globalTLBMissRate
constexpr T mbits(T val, unsigned first, unsigned last)
Mask off the given bits in place like bits() but without shifting.
bool FA
true if this is a fully-associative TLB
TlbEntry * insert(Addr vpn, TlbEntry &entry)
statistics::Scalar globalNumTLBAccesses
EntryList::iterator lookupIt(Addr va, bool update_lru=true)
unsigned int lastTimeAccessed
bool allocationPolicy
Allocation Policy: true if we always allocate on a hit, false otherwise.
void setConfigAddress(uint32_t addr)
virtual void finish(Fault fault, const RequestPtr &req, ThreadContext *tc, Mode mode)=0
The memory for this object may be dynamically allocated, and it may be responsible for cleaning itsle...
bool hasMemSidePort
if true, then this is not the last level TLB
statistics::Formula localLatency
std::queue< Addr > cleanupQueue
Cycles is a wrapper class for representing cycle counts, i.e.
virtual AddrRangeList getAddrRanges() const
Get a list of the non-overlapping address ranges the owner is responsible for.
Fault translateAtomic(const RequestPtr &req, ThreadContext *tc, Mode mode, int &latency)
virtual void serialize(CheckpointOut &cp) const override
Serialize an object.
TLB TranslationState: this currently is a somewhat bastardization of the usage of SenderState,...
std::ostream * stream() const
Get the output underlying output stream.
Fault translate(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode, bool &delayedResponse, bool timing, int &latency)
bool accessDistance
Print out accessDistance stats.
virtual void unserialize(CheckpointIn &cp) override
Unserialize an object.
void handleFuncTranslationReturn(PacketPtr pkt, tlbOutcome outcome)
handleFuncTranslationReturn is called on a TLB hit, when a TLB miss returns or when a page fault retu...
ThreadContext is the external interface to all thread state for anything outside of the CPU.
virtual std::string name() const
void issueTLBLookup(PacketPtr pkt)
Do the TLB lookup for this coalesced request and schedule another event <TLB access latency> cycles l...
std::shared_ptr< FaultBase > Fault
Tick cyclesToTicks(Cycles c) const
#define ADD_STAT(n,...)
Convenience macro to add a stat to a statistics group.
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
void updatePageFootprint(Addr virt_page_addr)
static const Priority Maximum_Pri
Maximum priority.
Fault translateInt(bool read, const RequestPtr &req, ThreadContext *tc)
std::shared_ptr< Request > RequestPtr
const Addr IntAddrPrefixMask
bool tlbLookup(const RequestPtr &req, ThreadContext *tc, bool update_stats)
TLB_lookup will only perform a TLB lookup returning true on a TLB hit and false on a TLB miss.
@ MISCREG_PCI_CONFIG_ADDRESS
unsigned int accessesPerPage
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
const Addr IntAddrPrefixCPUID
static MiscRegIndex MISCREG_SEG_BASE(int index)
static constexpr T roundDown(const T &val, const U &align)
This function is used to align addresses in memory.
Port & getPort(const std::string &if_name, PortID idx=InvalidPortID) override
Get a port with a given name and index.
statistics::Scalar globalNumTLBMisses
std::unordered_map< Addr, TLBEvent * > translationReturnEvent
virtual RegVal readMiscRegNoEffect(RegIndex misc_reg) const =0
statistics::Scalar pageTableCycles
virtual void recvReqRetry()
std::vector< EntryList > freeList
const Addr PhysAddrPrefixPciConfig
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
SenderState * senderState
This packet's sender state.
statistics::Scalar localNumTLBHits
bool msrAddrToIndex(MiscRegIndex ®Num, Addr addr)
Find and return the misc reg corresponding to an MSR address.
std::vector< CpuSidePort * > cpuSidePort
void invalidateNonGlobal()
const std::string & name()
Bitfield< 14 > expandDown
statistics::Scalar localCycles
The ClockedObject class extends the SimObject with a clock and accessor functions to relate ticks to ...
AccessPatternTable TLBFootprint
std::vector< EntryList > entryList
An entryList per set is the equivalent of an LRU stack; it's used to guide replacement decisions.
virtual bool recvTimingResp(PacketPtr pkt)
MemSidePort receives the packet back.
virtual Process * getProcessPtr()=0
bool FullSystem
The FullSystem variable can be used to determine the current mode of simulation.
const char * description() const
Return a C string describing the event.
void makeTimingResponse()
TLBEvent(GpuTLB *_tlb, Addr _addr, tlbOutcome outcome, PacketPtr _pkt)
void updateOutcome(tlbOutcome _outcome)
Ports are used to interface objects to each other.
virtual void setMiscReg(RegIndex misc_reg, RegVal val)=0
void pagingProtectionChecks(ThreadContext *tc, PacketPtr pkt, TlbEntry *tlb_entry, Mode mode)
Do Paging protection checks.
unsigned int meanDistance
std::ostream CheckpointOut
const Addr IntAddrPrefixIO
This hash map will use the virtual page address as a key and will keep track of total number of acces...
std::vector< TlbEntry > tlb
statistics::Scalar globalNumTLBHits
virtual bool recvTimingReq(PacketPtr pkt)
recvTiming receives a coalesced timing request from a TLBCoalescer and it calls issueTLBLookup() It o...
void translateTiming(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode, int &latency)
void handleTranslationReturn(Addr addr, tlbOutcome outcome, PacketPtr pkt)
handleTranslationReturn is called on a TLB hit, when a TLB miss returns or when a page fault returns.
Reference material can be found at the JEDEC website: UFS standard http://www.jedec....
virtual void recvReqRetry()
Called by the peer if sendTimingReq was called on this peer (causing recvTimingReq to be called on th...
const GEM5_VAR_USED Request::FlagsType SegmentFlagMask
std::vector< int > reqCnt
void demapPage(Addr va, uint64_t asn)
statistics::Scalar localNumTLBMisses
const Addr PhysAddrPrefixIO
bool scheduled() const
Determine if the current event is scheduled.
#define panic(...)
This implements a cprintf based panic() function.
EventFunctionWrapper cleanupEvent
Counter value() const
Return the current value of this stat as its base type.
Generated on Wed Jul 28 2021 12:10:27 for gem5 by doxygen 1.8.17