release/current/amdgpu_2common_2tlb_8cc_source.html

/*

 * Copyright (c) 2011-2021 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 *

 */


#include "arch/amdgpu/common/tlb.hh"


#include <cmath>

#include <cstring>


#include "arch/amdgpu/common/gpu_translation_state.hh"

#include "arch/x86/faults.hh"

#include "arch/x86/insts/microldstop.hh"

#include "arch/x86/page_size.hh"

#include "arch/x86/pagetable.hh"

#include "arch/x86/pagetable_walker.hh"

#include "arch/x86/regs/misc.hh"

#include "arch/x86/regs/msr.hh"

#include "arch/x86/regs/segment.hh"

#include "arch/x86/x86_traits.hh"

#include "base/bitfield.hh"

#include "base/logging.hh"

#include "base/output.hh"

#include "base/trace.hh"

#include "cpu/base.hh"

#include "cpu/thread_context.hh"

#include "debug/GPUPrefetch.hh"

#include "debug/GPUTLB.hh"

#include "mem/packet_access.hh"

#include "mem/page_table.hh"

#include "mem/request.hh"

#include "sim/process.hh"

#include "sim/pseudo_inst.hh"


namespace gem5

{


namespace X86ISA

{


    /**
     * Build a GPU TLB from its configuration parameters.
     *
     * Sets up the set/way geometry, places every entry of the backing
     * array on the free list of its set, copies the latency and
     * coalescing parameters, and creates one port object per connected
     * CPU-side and memory-side port.
     *
     * @param p Parameter object describing this TLB instance.
     */
    GpuTLB::GpuTLB(const Params &p)
        : ClockedObject(p), configAddress(0), size(p.size),
          cleanupEvent([this]{ cleanup(); }, name(), false,
                       Event::Maximum_Pri),
          exitEvent([this]{ exitCallback(); }, name()), stats(this)
    {
        // Geometry: size entries split into numSets sets of assoc ways.
        assoc = p.assoc;
        assert(assoc <= size);
        numSets = size/assoc;
        FA = (size == assoc);
        // NOTE(review): masking with numSets - 1 presumably relies on
        // numSets being a power of two -- confirm against the config.
        setMask = numSets - 1;

        allocationPolicy = p.allocationPolicy;
        accessDistance = p.accessDistance;
        // Flipped to true by getPort() once a memory-side port is requested.
        hasMemSidePort = false;

        // Backing storage plus the per-set free and in-use lists.
        tlb.assign(size, TlbEntry());
        freeList.resize(numSets);
        entryList.resize(numSets);

        // Entries are laid out set-major, so a single running index visits
        // them in the same order as set * assoc + way.
        int entry_idx = 0;
        for (int set_idx = 0; set_idx < numSets; ++set_idx) {
            for (int way_idx = 0; way_idx < assoc; ++way_idx, ++entry_idx) {
                freeList[set_idx].push_back(&tlb.at(entry_idx));
            }
        }

        // Do not allow maxCoalescedReqs to be more than the TLB associativity
        maxCoalescedReqs = p.maxOutstandingReqs;
        if (maxCoalescedReqs > assoc) {
            maxCoalescedReqs = assoc;
            cprintf("Forcing maxCoalescedReqs to %d (TLB assoc.) \n", assoc);
        }

        outstandingReqs = 0;
        hitLatency = p.hitLatency;
        missLatency1 = p.missLatency1;
        missLatency2 = p.missLatency2;

        // One response port per connected CPU-side peer.
        for (size_t port_idx = 0;
             port_idx < p.port_cpu_side_ports_connection_count; ++port_idx) {
            cpuSidePort.push_back(
                new CpuSidePort(csprintf("%s-port%d", name(), port_idx),
                                this, port_idx));
        }

        // One request port per connected memory-side peer.
        for (size_t port_idx = 0;
             port_idx < p.port_mem_side_ports_connection_count; ++port_idx) {
            memSidePort.push_back(
                new MemSidePort(csprintf("%s-port%d", name(), port_idx),
                                this, port_idx));
        }
    }

    GpuTLB::GpuTLB(const Params &p) {…}


    // fixme: this is never called?

    /**
     * Destructor. Only checks (when assertions are enabled) that no
     * translation return events are still registered.
     */
    GpuTLB::~GpuTLB()
    {
        // make sure all the hash-maps are empty
        assert(translationReturnEvent.empty());
    }

    GpuTLB::~GpuTLB() {…}


    /**
     * Return the port identified by interface name and index.
     *
     * Requesting a "mem_side_ports" port also records that this TLB has a
     * lower level to forward misses to (hasMemSidePort).
     *
     * @param if_name Either "cpu_side_ports" or "mem_side_ports".
     * @param idx Index into the corresponding port vector.
     * @return Reference to the selected port. Panics on an unknown
     *         interface name or an index outside the port vector.
     */
    Port &
    GpuTLB::getPort(const std::string &if_name, PortID idx)
    {
        if (if_name == "cpu_side_ports") {
            // Reject negative indices as well: they would otherwise pass
            // the upper-bound comparison and index out of range.
            if (idx < 0 ||
                idx >= static_cast<PortID>(cpuSidePort.size())) {
                panic("GpuTLB::getPort: unknown index %d\n", idx);
            }

            return *cpuSidePort[idx];
        } else if (if_name == "mem_side_ports") {
            if (idx < 0 ||
                idx >= static_cast<PortID>(memSidePort.size())) {
                panic("GpuTLB::getPort: unknown index %d\n", idx);
            }

            hasMemSidePort = true;

            return *memSidePort[idx];
        } else {
            panic("GpuTLB::getPort: unknown port %s\n", if_name);
        }
    }

    GpuTLB::getPort(const std::string &if_name, PortID idx) {…}


    /**
     * Install a translation in the set selected by vpn.
     *
     * A free entry of the set is used when one exists; otherwise the entry
     * at the back of the set's in-use list is recycled. The chosen slot is
     * overwritten with a copy of entry, tagged with vpn and moved to the
     * front of the in-use list.
     *
     * @param vpn Virtual address stored as the entry's vaddr.
     * @param entry Translation to copy into the TLB.
     * @return Pointer to the slot now holding the translation.
     */
    TlbEntry*
    GpuTLB::insert(Addr vpn, TlbEntry &entry)
    {
        int set = (vpn >> PageShift) & setMask;
        auto &free_slots = freeList[set];
        auto &used_slots = entryList[set];

        TlbEntry *slot = nullptr;
        if (free_slots.empty()) {
            // No spare way: reuse the entry at the back of the list.
            slot = used_slots.back();
            used_slots.pop_back();
        } else {
            slot = free_slots.front();
            free_slots.pop_front();
        }

        *slot = entry;
        slot->vaddr = vpn;
        used_slots.push_front(slot);

        return slot;
    }

    GpuTLB::insert(Addr vpn, TlbEntry &entry) {…}


    /**
     * Search the set selected by va for an entry whose page covers va.
     *
     * @param va Virtual address to look up.
     * @param update_lru When true, a matching entry is moved to the front
     *                   of its set's list.
     * @return Iterator to the matching entry (the list head if it was
     *         moved), or the end iterator of the set's list on a miss.
     */
    GpuTLB::EntryList::iterator
    GpuTLB::lookupIt(Addr va, bool update_lru)
    {
        int set = (va >> PageShift) & setMask;

        // A fully associative TLB has a single set, so the index must be 0.
        assert(!FA || !set);

        auto &ways = entryList[set];
        for (auto it = ways.begin(); it != ways.end(); ++it) {
            TlbEntry *candidate = *it;
            int page_size = candidate->size();

            const bool covers_va = candidate->vaddr <= va &&
                                   candidate->vaddr + page_size > va;
            if (!covers_va)
                continue;

            DPRINTF(GPUTLB, "Matched vaddr %#x to entry starting at %#x "
                    "with size %#x.\n", va, candidate->vaddr, page_size);

            if (!update_lru)
                return it;

            // Re-insert the entry at the head, then drop its old position.
            ways.push_front(candidate);
            ways.erase(it);
            return ways.begin();
        }

        return ways.end();
    }

    GpuTLB::lookupIt(Addr va, bool update_lru) {…}


    /**
     * Pointer-returning wrapper around lookupIt().
     *
     * @param va Virtual address to look up.
     * @param update_lru Forwarded to lookupIt().
     * @return The matching entry, or nullptr when va misses in the TLB.
     */
    TlbEntry*
    GpuTLB::lookup(Addr va, bool update_lru)
    {
        int set = (va >> PageShift) & setMask;
        auto match = lookupIt(va, update_lru);

        return (match == entryList[set].end()) ? nullptr : *match;
    }

    GpuTLB::lookup(Addr va, bool update_lru) {…}


    void


    GpuTLB::invalidateAll()

    {

        DPRINTF(GPUTLB, "Invalidating all entries.\n");


        for (int i = 0; i < numSets; ++i) {

            while (!entryList[i].empty()) {

                TlbEntry *entry = entryList[i].front();

                entryList[i].pop_front();

                freeList[i].push_back(entry);

            }

        }

    }

    GpuTLB::invalidateAll() {…}


    /**
     * Store addr in the configAddress member.
     *
     * @param addr New value for configAddress.
     */
    void
    GpuTLB::setConfigAddress(uint32_t addr)
    {
        configAddress = addr;
    }

    GpuTLB::setConfigAddress(uint32_t addr) {…}


    void


    GpuTLB::invalidateNonGlobal()

    {

        DPRINTF(GPUTLB, "Invalidating all non global entries.\n");


        for (int i = 0; i < numSets; ++i) {

            for (auto entryIt = entryList[i].begin();

                 entryIt != entryList[i].end();) {

                if (!(*entryIt)->global) {

                    freeList[i].push_back(*entryIt);

                    entryList[i].erase(entryIt++);

                } else {

                    ++entryIt;

                }

            }

        }

    }

    GpuTLB::invalidateNonGlobal() {…}


    /**
     * Remove the translation covering va, if there is one, and return its
     * slot to the free list of its set. The LRU order is not touched.
     *
     * @param va Virtual address whose translation should be dropped.
     * @param asn Not used by this implementation.
     */
    void
    GpuTLB::demapPage(Addr va, uint64_t asn)
    {
        int set = (va >> PageShift) & setMask;
        auto victim = lookupIt(va, false);

        if (victim == entryList[set].end())
            return;

        freeList[set].push_back(*victim);
        entryList[set].erase(victim);
    }

    GpuTLB::demapPage(Addr va, uint64_t asn) {…}


    namespace

    {


    /**
     * Local accessor that services a packet against a misc register.
     *
     * On a read the register value (little-endian) is copied into the
     * packet. On a write the packet payload is copied over a buffer that is
     * pre-loaded with the current register value, so an access narrower
     * than RegVal keeps the remaining bytes, and the result is written to
     * the register.
     *
     * @param read True for a read access, false for a write.
     * @param regNum Index of the misc register being accessed.
     * @param tc Thread context owning the register.
     * @param pkt Packet carrying (write) or receiving (read) the data.
     * @return The access latency, always one cycle.
     */
    Cycles
    localMiscRegAccess(bool read, RegIndex regNum,
                       ThreadContext *tc, PacketPtr pkt)
    {
        if (read) {
            RegVal data = htole(tc->readMiscReg(regNum));
            // Make sure we don't trot off the end of data.
            assert(pkt->getSize() <= sizeof(RegVal));
            pkt->setData((uint8_t *)&data);
        } else {
            RegVal data = htole(tc->readMiscRegNoEffect(regNum));
            // Make sure the payload fits in the staging buffer.
            assert(pkt->getSize() <= sizeof(RegVal));
            // Overlay the packet payload on the current register value.
            pkt->writeData((uint8_t *)&data);
            tc->setMiscReg(regNum, letoh(data));
        }
        return Cycles(1);
    }


    } // anonymous namespace


    /**
     * Translate a request that targets an internal (non-memory) address
     * space. The space is selected by a prefix decoded from the virtual
     * address: CPUID (unimplemented, panics), MSR, or I/O port.
     *
     * @param read True when the access is a read.
     * @param req Request to translate; receives either a local accessor or
     *            a physical address plus flags.
     * @param tc Thread context used to read misc registers.
     * @return NoFault on success, or a GeneralProtection fault when the MSR
     *         address does not map to a register index. Panics on an
     *         unrecognized prefix.
     */
    Fault
    GpuTLB::translateInt(bool read, const RequestPtr &req, ThreadContext *tc)
    {
        DPRINTF(GPUTLB, "Addresses references internal memory.\n");
        Addr vaddr = req->getVaddr();
        Addr prefix = (vaddr >> 3) & IntAddrPrefixMask;

        if (prefix == IntAddrPrefixCPUID) {
            panic("CPUID memory space not yet implemented!\n");
        } else if (prefix == IntAddrPrefixMSR) {
            // Strip the prefix to recover the MSR address.
            vaddr = (vaddr >> 3) & ~IntAddrPrefixMask;

            RegIndex regNum;
            if (!msrAddrToIndex(regNum, vaddr))
                return std::make_shared<GeneralProtection>(0);

            // The access is serviced locally against the misc register
            // instead of being sent to memory.
            req->setLocalAccessor(
                [read, regNum](ThreadContext *tc, PacketPtr pkt)
                {
                    return localMiscRegAccess(read, regNum, tc, pkt);
                }
            );

            return NoFault;
        } else if (prefix == IntAddrPrefixIO) {
            // TODO If CPL > IOPL or in virtual mode, check the I/O permission
            // bitmap in the TSS.

            Addr IOPort = vaddr & ~IntAddrPrefixMask;
            // Make sure the address fits in the expected 16 bit IO address
            // space.
            assert(!(IOPort & ~0xFFFF));
            if (IOPort == 0xCF8 && req->getSize() == 4) {
                // 4-byte access to port 0xCF8: handled locally against the
                // PciConfigAddress misc register.
                req->setLocalAccessor(
                    [read](ThreadContext *tc, PacketPtr pkt)
                    {
                        return localMiscRegAccess(
                                read, misc_reg::PciConfigAddress, tc, pkt);
                    }
                );
            } else if ((IOPort & ~mask(2)) == 0xCFC) {
                // Ports 0xCFC-0xCFF.
                req->setFlags(Request::UNCACHEABLE | Request::STRICT_ORDER);
                // Note: this local shadows the configAddress member.
                Addr configAddress =
                    tc->readMiscRegNoEffect(misc_reg::PciConfigAddress);
                if (bits(configAddress, 31, 31)) {
                    // Bit 31 set: build a PCI config-space physical address
                    // from bits 30:2 of the register and the low two bits
                    // of the port number.
                    req->setPaddr(PhysAddrPrefixPciConfig |
                            mbits(configAddress, 30, 2) |
                            (IOPort & mask(2)));
                } else {
                    // Bit 31 clear: treat it as an ordinary I/O port.
                    req->setPaddr(PhysAddrPrefixIO | IOPort);
                }
            } else {
                // Any other port maps straight into the I/O physical range.
                req->setFlags(Request::UNCACHEABLE | Request::STRICT_ORDER);
                req->setPaddr(PhysAddrPrefixIO | IOPort);
            }
            return NoFault;
        } else {
            panic("Access to unrecognized internal address space %#x.\n",
                  prefix);
        }
    }

    GpuTLB::translateInt(bool read, const RequestPtr &req, ThreadContext *tc) {…}


    bool


    GpuTLB::tlbLookup(const RequestPtr &req,

                      ThreadContext *tc, bool update_stats)

    {

        bool tlb_hit = false;

    #ifndef NDEBUG

        uint32_t flags = req->getFlags();

        int seg = flags & SegmentFlagMask;

    #endif


        assert(seg != segment_idx::Ms);

        Addr vaddr = req->getVaddr();

        if (req->hasNoAddr()) {

            return true;

        } else {

            DPRINTF(GPUTLB, "TLB Lookup for vaddr %#x.\n", vaddr);

        }

        HandyM5Reg m5Reg = tc->readMiscRegNoEffect(misc_reg::M5Reg);


        if (m5Reg.prot) {

            DPRINTF(GPUTLB, "In protected mode.\n");

            // make sure we are in 64-bit mode

            assert(m5Reg.mode == LongMode);


            // If paging is enabled, do the translation.

            if (m5Reg.paging) {

                DPRINTF(GPUTLB, "Paging enabled.\n");

                //update LRU stack on a hit

                TlbEntry *entry = lookup(vaddr, true);


                if (entry)

                    tlb_hit = true;


                if (!update_stats) {

                    // functional tlb access for memory initialization

                    // i.e., memory seeding or instr. seeding -> don't update

                    // TLB and stats

                    return tlb_hit;

                }


                stats.localNumTLBAccesses++;


                if (!entry) {

                    stats.localNumTLBMisses++;

                } else {

                    stats.localNumTLBHits++;

                }

            }

        }


        return tlb_hit;

    }

    GpuTLB::tlbLookup(const RequestPtr &req, {…}


    /**
     * Translate the virtual address of req and store the physical address
     * in the request.
     *
     * Requests to the internal address space are handed to translateInt().
     * Otherwise, in protected mode outside long mode the segment checks are
     * applied; with paging enabled the TLB is consulted and, on a miss, the
     * process page table is used to fill it (full-system mode is not
     * supported and is fatal on a miss). Paging protection checks follow.
     * Without paging, or in real mode, the virtual address is used as the
     * physical address.
     *
     * @param req Request to translate.
     * @param tc Thread context of the requester.
     * @param translation Not used by this function.
     * @param mode Access mode (read, write or execute).
     * @param delayedResponse Always set to false by this function.
     * @param timing When true, latency is updated with the hit or miss
     *               latency of the access.
     * @param latency Receives hitLatency on a hit, missLatency1 on a miss,
     *                plus missLatency2 when the page table also misses.
     * @return NoFault, or a GeneralProtection / PageFault fault.
     */
    Fault
    GpuTLB::translate(const RequestPtr &req, ThreadContext *tc,
                      Translation *translation, Mode mode,
                      bool &delayedResponse, bool timing, int &latency)
    {
        uint32_t flags = req->getFlags();
        int seg = flags & SegmentFlagMask;
        bool storeCheck = flags & Request::READ_MODIFY_WRITE;

        // Set the out-parameter before any return so that callers never
        // observe an uninitialized value.
        delayedResponse = false;

        // If this is true, we're dealing with a request
        // to a non-memory address space.
        if (seg == segment_idx::Ms) {
            return translateInt(mode == Mode::Read, req, tc);
        }

        Addr vaddr = req->getVaddr();
        DPRINTF(GPUTLB, "Translating vaddr %#x.\n", vaddr);

        HandyM5Reg m5Reg = tc->readMiscRegNoEffect(misc_reg::M5Reg);

        // If protected mode has been enabled...
        if (m5Reg.prot) {
            DPRINTF(GPUTLB, "In protected mode.\n");
            // If we're not in 64-bit mode, do protection/limit checks
            if (m5Reg.mode != LongMode) {
                DPRINTF(GPUTLB, "Not in long mode. Checking segment "
                        "protection.\n");

                // Check for a null segment selector.
                if (!(seg == segment_idx::Tsg || seg == segment_idx::Idtr ||
                    seg == segment_idx::Hs || seg == segment_idx::Ls)
                    && !tc->readMiscRegNoEffect(misc_reg::segSel(seg))) {
                    return std::make_shared<GeneralProtection>(0);
                }

                bool expandDown = false;
                SegAttr attr = tc->readMiscRegNoEffect(misc_reg::segAttr(seg));

                if (seg >= segment_idx::Es && seg <= segment_idx::Hs) {
                    if (!attr.writable && (mode == BaseMMU::Write ||
                        storeCheck))
                        return std::make_shared<GeneralProtection>(0);

                    if (!attr.readable && mode == BaseMMU::Read)
                        return std::make_shared<GeneralProtection>(0);

                    expandDown = attr.expandDown;

                }

                Addr base = tc->readMiscRegNoEffect(misc_reg::segBase(seg));
                Addr limit = tc->readMiscRegNoEffect(misc_reg::segLimit(seg));
                Addr logSize = (flags >> AddrSizeFlagShift) & AddrSizeFlagMask;
                int size = 8 << logSize;

                Addr offset = (vaddr - base) & mask(size);
                Addr endOffset = offset + req->getSize() - 1;

                if (expandDown) {
                    DPRINTF(GPUTLB, "Checking an expand down segment.\n");
                    warn_once("Expand down segments are untested.\n");

                    if (offset <= limit || endOffset <= limit)
                        return std::make_shared<GeneralProtection>(0);
                } else {
                    if (offset > limit || endOffset > limit)
                        return std::make_shared<GeneralProtection>(0);
                }
            }

            // If paging is enabled, do the translation.
            if (m5Reg.paging) {
                DPRINTF(GPUTLB, "Paging enabled.\n");
                // The vaddr already has the segment base applied.
                TlbEntry *entry = lookup(vaddr);
                stats.localNumTLBAccesses++;

                if (!entry) {
                    stats.localNumTLBMisses++;
                    if (timing) {
                        latency = missLatency1;
                    }

                    if (FullSystem) {
                        fatal("GpuTLB doesn't support full-system mode\n");
                    } else {
                        DPRINTF(GPUTLB, "Handling a TLB miss for address %#x "
                                "at pc %#x.\n", vaddr,
                                tc->pcState().instAddr());

                        Process *p = tc->getProcessPtr();
                        const EmulationPageTable::Entry *pte =
                            p->pTable->lookup(vaddr);

                        if (!pte && mode != BaseMMU::Execute) {
                            // penalize a "page fault" more
                            if (timing)
                                latency += missLatency2;

                            // Let the process try to map the page, then
                            // retry the page-table lookup.
                            if (p->fixupFault(vaddr))
                                pte = p->pTable->lookup(vaddr);
                        }

                        if (!pte) {
                            return std::make_shared<PageFault>(vaddr, true,
                                                               mode, true,
                                                               false);
                        } else {
                            Addr alignedVaddr = p->pTable->pageAlign(vaddr);

                            DPRINTF(GPUTLB, "Mapping %#x to %#x\n",
                                    alignedVaddr, pte->paddr);

                            TlbEntry gpuEntry(p->pid(), alignedVaddr,
                                              pte->paddr, false, false);
                            entry = insert(alignedVaddr, gpuEntry);
                        }

                        DPRINTF(GPUTLB, "Miss was serviced.\n");
                    }
                } else {
                    stats.localNumTLBHits++;

                    if (timing) {
                        latency = hitLatency;
                    }
                }

                // Do paging protection checks.
                bool inUser = m5Reg.cpl == 3 && !(flags & CPL0FlagBit);

                CR0 cr0 = tc->readMiscRegNoEffect(misc_reg::Cr0);
                bool badWrite = (!entry->writable && (inUser || cr0.wp));

                if ((inUser && !entry->user) || (mode == BaseMMU::Write &&
                     badWrite)) {
                    // The page must have been present to get into the TLB in
                    // the first place. We'll assume the reserved bits are
                    // fine even though we're not checking them.
                    return std::make_shared<PageFault>(vaddr, true, mode,
                                                       inUser, false);
                }

                if (storeCheck && badWrite) {
                    // This would fault if this were a write, so return a page
                    // fault that reflects that happening.
                    return std::make_shared<PageFault>(vaddr, true,
                                                       BaseMMU::Write,
                                                       inUser, false);
                }

                DPRINTF(GPUTLB, "Entry found with paddr %#x, doing protection "
                        "checks.\n", entry->paddr);

                // Combine the frame address with the offset within the page.
                int page_size = entry->size();
                Addr paddr = entry->paddr | (vaddr & (page_size - 1));
                DPRINTF(GPUTLB, "Translated %#x -> %#x.\n", vaddr, paddr);
                req->setPaddr(paddr);

                if (entry->uncacheable)
                    req->setFlags(Request::UNCACHEABLE);
            } else {
                //Use the address which already has segmentation applied.
                DPRINTF(GPUTLB, "Paging disabled.\n");
                DPRINTF(GPUTLB, "Translated %#x -> %#x.\n", vaddr, vaddr);
                req->setPaddr(vaddr);
            }
        } else {
            // Real mode
            DPRINTF(GPUTLB, "In real mode.\n");
            DPRINTF(GPUTLB, "Translated %#x -> %#x.\n", vaddr, vaddr);
            req->setPaddr(vaddr);
        }

        // Check for an access to the local APIC
        if (FullSystem) {
            LocalApicBase localApicBase =
                tc->readMiscRegNoEffect(misc_reg::ApicBase);

            Addr baseAddr = localApicBase.base * PageBytes;
            Addr paddr = req->getPaddr();

            if (baseAddr <= paddr && baseAddr + PageBytes > paddr) {
                // Force the access to be uncacheable.
                req->setFlags(Request::UNCACHEABLE);
                req->setPaddr(x86LocalAPICAddress(tc->contextId(),
                                                  paddr - baseAddr));
            }
        }

        return NoFault;
    }

    GpuTLB::translate(const RequestPtr &req, ThreadContext *tc, {…}


    /**
     * Atomic-mode translation: runs translate() with timing disabled and no
     * translation object.
     *
     * @param req Request to translate.
     * @param tc Thread context of the requester.
     * @param mode Access mode.
     * @param latency Passed through to translate().
     * @return The fault reported by translate().
     */
    Fault
    GpuTLB::translateAtomic(const RequestPtr &req, ThreadContext *tc,
                            Mode mode, int &latency)
    {
        // Only needed to satisfy translate()'s signature; never read here.
        bool ignored_delay;
        Translation *const no_translation = nullptr;
        const bool use_timing = false;

        return GpuTLB::translate(req, tc, no_translation, mode,
                                 ignored_delay, use_timing, latency);
    }

    GpuTLB::translateAtomic(const RequestPtr &req, ThreadContext *tc, {…}


    /**
     * Timing-mode translation: runs translate() with timing enabled and,
     * unless the response was delayed, completes the translation object
     * immediately.
     *
     * @param req Request to translate.
     * @param tc Thread context of the requester.
     * @param translation Callback object to finish; must not be null.
     * @param mode Access mode.
     * @param latency Passed through to translate().
     */
    void
    GpuTLB::translateTiming(const RequestPtr &req, ThreadContext *tc,
            Translation *translation, Mode mode, int &latency)
    {
        // Initialize explicitly: translate() can return (internal address
        // space requests) without having written this flag.
        bool delayedResponse = false;
        assert(translation);

        Fault fault = GpuTLB::translate(req, tc, translation, mode,
                                        delayedResponse, true, latency);

        if (!delayedResponse)
            translation->finish(fault, req, tc, mode);
    }

    GpuTLB::translateTiming(const RequestPtr &req, ThreadContext *tc, {…}


    /**
     * @return The walker pointer held by this TLB.
     */
    Walker*
    GpuTLB::getWalker()
    {
        return walker;
    }

    GpuTLB::getWalker() {…}


    /**
     * Checkpoint hook. The body is empty: nothing is written to cp.
     */
    void
    GpuTLB::serialize(CheckpointOut &cp) const
    {
    }

    GpuTLB::serialize(CheckpointOut &cp) const {…}


    /**
     * Checkpoint restore hook. The body is empty: nothing is read from cp.
     */
    void
    GpuTLB::unserialize(CheckpointIn &cp)
    {
    }

    GpuTLB::unserialize(CheckpointIn &cp) {…}


    /**
     * Start a timing lookup for the translation request carried by pkt.
     *
     * The TLB is probed right away; the outcome is recorded in a new
     * TLBEvent that is registered under the page address and scheduled
     * hitLatency cycles from now. On a hit a copy of the matching entry is
     * attached to the packet's sender state.
     *
     * @param pkt Translation packet; its senderState must be a
     *            GpuTranslationState.
     */
    void
    GpuTLB::issueTLBLookup(PacketPtr pkt)
    {
        assert(pkt);
        assert(pkt->senderState);

        // Page-aligned address; used as the key for the return event.
        Addr virt_page_addr = roundDown(pkt->req->getVaddr(),
                                        X86ISA::PageBytes);

        GpuTranslationState *sender_state =
                safe_cast<GpuTranslationState*>(pkt->senderState);

        // Prefetches are not counted in the statistics.
        bool update_stats = !sender_state->isPrefetch;
        ThreadContext * tmp_tc = sender_state->tc;

        DPRINTF(GPUTLB, "Translation req. for virt. page addr %#x\n",
                virt_page_addr);

        int req_cnt = sender_state->reqCnt.back();

        if (update_stats) {
            // Subtract the start tick now; translationReturn() adds the
            // tick at which the event fires.
            stats.accessCycles -= (curTick() * req_cnt);
            stats.localCycles -= curTick();
            updatePageFootprint(virt_page_addr);
            stats.globalNumTLBAccesses += req_cnt;
        }

        tlbOutcome lookup_outcome = TLB_MISS;
        const RequestPtr &tmp_req = pkt->req;

        // Access the TLB and figure out if it's a hit or a miss.
        bool success = tlbLookup(tmp_req, tmp_tc, update_stats);

        if (success) {
            lookup_outcome = TLB_HIT;
            // Put the entry in SenderState
            auto p = sender_state->tc->getProcessPtr();
            if (pkt->req->hasNoAddr()) {
                // Address-less request: attach a placeholder entry with
                // zero virtual and physical addresses.
                sender_state->tlbEntry =
                    new TlbEntry(p->pid(), 0, 0,
                                 false, false);
            } else {
                // Second lookup fetches the entry without touching the LRU
                // order (tlbLookup() already did that).
                TlbEntry *entry = lookup(tmp_req->getVaddr(), false);
                assert(entry);

                sender_state->tlbEntry =
                    new TlbEntry(p->pid(), entry->vaddr, entry->paddr,
                                 false, false);
            }

            if (update_stats) {
                // the reqCnt has an entry per level, so its size tells us
                // which level we are in
                sender_state->hitLevel = sender_state->reqCnt.size();
                stats.globalNumTLBHits += req_cnt;
            }
        } else {
            if (update_stats)
                stats.globalNumTLBMisses += req_cnt;
        }

        /*
         * We now know the TLB lookup outcome (if it's a hit or a miss), as
         * well as the TLB access latency.
         *
         * We create and schedule a new TLBEvent which will help us take the
         * appropriate actions (e.g., update TLB on a hit, send request to
         * lower level TLB on a miss, or start a page walk if this was the
         * last-level TLB)
         */
        TLBEvent *tlb_event =
            new TLBEvent(this, virt_page_addr, lookup_outcome, pkt);

        // Only one return event may be registered per page address.
        if (translationReturnEvent.count(virt_page_addr)) {
            panic("Virtual Page Address %#x already has a return event\n",
                  virt_page_addr);
        }

        translationReturnEvent[virt_page_addr] = tlb_event;
        assert(tlb_event);

        DPRINTF(GPUTLB, "schedule translationReturnEvent @ curTick %d\n",
                curTick() + cyclesToTicks(Cycles(hitLatency)));

        // The event fires after hitLatency cycles for hits and misses alike.
        schedule(tlb_event, curTick() + cyclesToTicks(Cycles(hitLatency)));
    }

    GpuTLB::issueTLBLookup(PacketPtr pkt) {…}


    /**
     * Create a TLB event with priority CPU_Tick_Pri.
     *
     * @param _tlb TLB that owns the event.
     * @param _addr Virtual page address the event refers to.
     * @param tlb_outcome Lookup outcome recorded in the event.
     * @param _pkt Translation packet associated with the event.
     */
    GpuTLB::TLBEvent::TLBEvent(GpuTLB* _tlb, Addr _addr,
        tlbOutcome tlb_outcome, PacketPtr _pkt)
            : Event(CPU_Tick_Pri), tlb(_tlb), virtPageAddr(_addr),
              outcome(tlb_outcome), pkt(_pkt)
    {
    }

    GpuTLB::TLBEvent::TLBEvent(GpuTLB* _tlb, Addr _addr, {…}


    /**
     * Apply the paging protection checks to a translated access. Any
     * violation ends the simulation with a panic.
     *
     * @param tc Thread context used to read the M5Reg and CR0 registers.
     * @param pkt Packet whose request flags are inspected.
     * @param tlb_entry Entry providing the writable and user bits.
     * @param mode Access mode of the request.
     */
    void
    GpuTLB::pagingProtectionChecks(ThreadContext *tc, PacketPtr pkt,
            TlbEntry * tlb_entry, Mode mode)
    {
        HandyM5Reg m5Reg = tc->readMiscRegNoEffect(misc_reg::M5Reg);
        uint32_t req_flags = pkt->req->getFlags();
        CR0 cr0 = tc->readMiscRegNoEffect(misc_reg::Cr0);

        // A CPL 3 access counts as user unless the request asks for CPL 0.
        const bool user_access =
            m5Reg.cpl == 3 && !(req_flags & CPL0FlagBit);
        // Read-modify-write accesses are checked as if they were writes.
        const bool rmw_access = req_flags & Request::READ_MODIFY_WRITE;
        // A write to a read-only page is denied for user accesses, and for
        // any access when CR0.WP is set.
        const bool write_denied =
            !tlb_entry->writable && (user_access || cr0.wp);

        const bool privilege_violation = user_access && !tlb_entry->user;
        const bool write_violation =
            mode == BaseMMU::Write && write_denied;

        // The page must have been present to get into the TLB in
        // the first place. We'll assume the reserved bits are
        // fine even though we're not checking them.
        if (privilege_violation || write_violation) {
            panic("Page fault detected");
        }

        // This would fault if this were a write.
        if (rmw_access && write_denied) {
            panic("Page fault detected");
        }
    }

    GpuTLB::pagingProtectionChecks(ThreadContext *tc, PacketPtr pkt, {…}


    /**
     * Finish a translation and send the packet back on the first CPU-side
     * port.
     *
     * On a miss the entry carried in the sender state is inserted into
     * this TLB when allocationPolicy is set. The physical address is then
     * formed from the entry, the packet is turned into a response if
     * needed, and the page address is queued for cleanup.
     *
     * @param virt_page_addr Page-aligned virtual address of the request.
     * @param tlb_outcome TLB_HIT when the entry came from this TLB; any
     *                    other value is handled as a miss.
     * @param pkt Translation packet; its senderState must be a
     *            GpuTranslationState holding the entry to use.
     */
    void
    GpuTLB::handleTranslationReturn(Addr virt_page_addr,
        tlbOutcome tlb_outcome, PacketPtr pkt)
    {
        assert(pkt);
        Addr vaddr = pkt->req->getVaddr();

        GpuTranslationState *sender_state =
            safe_cast<GpuTranslationState*>(pkt->senderState);

        ThreadContext *tc = sender_state->tc;
        Mode mode = sender_state->tlbMode;

        TlbEntry *local_entry, *new_entry;

        if (tlb_outcome == TLB_HIT) {
            DPRINTF(GPUTLB, "Translation Done - TLB Hit for addr %#x\n",
                vaddr);
            // On a hit the sender state already carries the entry to use.
            local_entry = safe_cast<TlbEntry *>(sender_state->tlbEntry);
        } else {
            DPRINTF(GPUTLB, "Translation Done - TLB Miss for addr %#x\n",
                    vaddr);

            new_entry = safe_cast<TlbEntry *>(sender_state->tlbEntry);
            assert(new_entry);
            local_entry = new_entry;

            // Only cache the returned entry in this TLB when the
            // allocation policy says so.
            if (allocationPolicy) {
                DPRINTF(GPUTLB, "allocating entry w/ addr %#x\n",
                        virt_page_addr);

                local_entry = insert(virt_page_addr, *new_entry);
            }

            assert(local_entry);
        }

        DPRINTF(GPUTLB, "Entry found with vaddr %#x,  doing protection checks "
                "while paddr was %#x.\n", local_entry->vaddr,
                local_entry->paddr);

        pagingProtectionChecks(tc, pkt, local_entry, mode);
        // Combine the frame address with the offset within the page.
        int page_size = local_entry->size();
        Addr paddr = local_entry->paddr | (vaddr & (page_size - 1));
        DPRINTF(GPUTLB, "Translated %#x -> %#x.\n", vaddr, paddr);

        // Since this packet will be sent through the cpu side port,
        // it must be converted to a response pkt if it is not one already
        if (pkt->isRequest()) {
            pkt->makeTimingResponse();
        }

        pkt->req->setPaddr(paddr);

        if (local_entry->uncacheable) {
             pkt->req->setFlags(Request::UNCACHEABLE);
        }

        //send packet back to coalescer
        cpuSidePort[0]->sendTimingResp(pkt);
        //schedule cleanup event
        cleanupQueue.push(virt_page_addr);

        // schedule this only once per cycle.
        // The check is required because we might have multiple translations
        // returning the same cycle
        // this is a maximum priority event and must be on the same cycle
        // as the cleanup event in TLBCoalescer to avoid a race with
        // IssueProbeEvent caused by TLBCoalescer::MemSidePort::recvReqRetry
        if (!cleanupEvent.scheduled())
            schedule(cleanupEvent, curTick());
    }

    GpuTLB::handleTranslationReturn(Addr virt_page_addr, {…}


    /**
     * Advance a timing translation to its next stage. Invoked from
     * TLBEvent::process() with the outcome currently stored in the event.
     *
     *  - TLB_HIT:     finish the translation and account the access time.
     *  - TLB_MISS:    forward the packet to the next TLB level, or, when
     *                 there is no mem-side port, re-schedule the event as a
     *                 PAGE_WALK after missLatency2 cycles.
     *  - PAGE_WALK:   look the address up in the process page table, attach
     *                 the resulting entry (or nullptr) to the sender state
     *                 and finish the translation.
     *  - MISS_RETURN: finish the translation.
     *
     * Any other outcome is fatal.
     *
     * @param virtPageAddr virtual page address keying translationReturnEvent
     * @param outcome      stage to process
     * @param pkt          translation packet; its senderState must be a
     *                     GpuTranslationState
     */
    void
    GpuTLB::translationReturn(Addr virtPageAddr, tlbOutcome outcome,
                              PacketPtr pkt)
    {
        DPRINTF(GPUTLB, "Triggered TLBEvent for addr %#x\n", virtPageAddr);

        assert(translationReturnEvent[virtPageAddr]);
        assert(pkt);

        GpuTranslationState *state =
            safe_cast<GpuTranslationState*>(pkt->senderState);

        const int num_reqs = state->reqCnt.back();
        // Prefetches never contribute to the statistics.
        const bool count_stats = !state->isPrefetch;

        switch (outcome) {
          case TLB_HIT:
            handleTranslationReturn(virtPageAddr, TLB_HIT, pkt);

            if (count_stats) {
                stats.accessCycles += (num_reqs * curTick());
                stats.localCycles += curTick();
            }
            break;

          case TLB_MISS:
            DPRINTF(GPUTLB, "This is a TLB miss\n");

            if (count_stats) {
                stats.accessCycles += (num_reqs * curTick());
                stats.localCycles += curTick();
            }

            if (!hasMemSidePort) {
                // Nothing below us: this is the last level TLB, so the
                // same event is re-armed to perform the page walk.
                DPRINTF(GPUTLB, "Last level TLB - start a page walk for "
                        "addr %#x\n", virtPageAddr);

                if (count_stats)
                    stats.pageTableCycles -= (num_reqs * curTick());

                TLBEvent *walk_event = translationReturnEvent[virtPageAddr];
                assert(walk_event);
                walk_event->updateOutcome(PAGE_WALK);
                schedule(walk_event,
                         curTick() + cyclesToTicks(Cycles(missLatency2)));
                break;
            }

            // The extra cycle models the delay between receiving the reply
            // from below and propagating it to the coalescer above.
            if (count_stats) {
                stats.accessCycles += num_reqs;
                stats.localCycles += 1;
            }

            if (memSidePort[0]->sendTimingReq(pkt)) {
                DPRINTF(GPUTLB, "Sent translation request to lower level "
                        "TLB for addr %#x\n", virtPageAddr);
            } else {
                DPRINTF(GPUTLB, "Failed sending translation request to "
                        "lower level TLB for addr %#x\n", virtPageAddr);

                memSidePort[0]->retries.push_back(pkt);
            }
            break;

          case PAGE_WALK: {
            if (count_stats)
                stats.pageTableCycles += (num_reqs * curTick());

            // Consult the page table and build the entry for this page.
            DPRINTF(GPUTLB, "Doing a page walk for address %#x\n",
                    virtPageAddr);

            Process *proc = state->tc->getProcessPtr();
            const Addr vaddr = pkt->req->getVaddr();

            Addr aligned_vaddr = proc->pTable->pageAlign(vaddr);
            assert(aligned_vaddr == virtPageAddr);

            const EmulationPageTable::Entry *pte =
                proc->pTable->lookup(vaddr);

            // A missing mapping may be fixed up, but never for instruction
            // fetches; retry the lookup only after a successful fixup.
            const bool fixup_allowed = state->tlbMode != BaseMMU::Execute;
            if (!pte && fixup_allowed && proc->fixupFault(vaddr))
                pte = proc->pTable->lookup(vaddr);

            if (pte) {
                DPRINTF(GPUTLB, "Mapping %#x to %#x\n", aligned_vaddr,
                        pte->paddr);

                state->tlbEntry =
                    new TlbEntry(proc->pid(), virtPageAddr, pte->paddr,
                                 false, false);
            } else {
                state->tlbEntry = nullptr;
            }

            handleTranslationReturn(virtPageAddr, TLB_MISS, pkt);
            break;
          }

          case MISS_RETURN:
            handleTranslationReturn(virtPageAddr, TLB_MISS, pkt);
            break;

          default:
            panic("Unexpected TLB outcome %d", outcome);
        }
    }

    GpuTLB::translationReturn(Addr virtPageAddr, tlbOutcome outcome, {…}


    /**
     * Event callback: hand the page address, outcome and packet held by
     * this event to GpuTLB::translationReturn() on the owning TLB.
     */
    void


    GpuTLB::TLBEvent::process()

    {

        tlb->translationReturn(virtPageAddr, outcome, pkt);

    }

    GpuTLB::TLBEvent::process() {…}


    /**
     * @return a constant C string describing this event.
     */
    const char*


    GpuTLB::TLBEvent::description() const

    {

        return "trigger translationDoneEvent";

    }

    GpuTLB::TLBEvent::description() const {…}


    /**
     * Replace the outcome stored in this event. The stored value is what
     * process() passes to GpuTLB::translationReturn() when the event fires.
     *
     * @param _outcome new outcome to store
     */
    void


    GpuTLB::TLBEvent::updateOutcome(tlbOutcome _outcome)

    {

        outcome = _outcome;

    }

    GpuTLB::TLBEvent::updateOutcome(tlbOutcome _outcome) {…}


    /**
     * @return the virtual page address stored in this event.
     */
    Addr


    GpuTLB::TLBEvent::getTLBEventVaddr()

    {

        return virtPageAddr;

    }

    GpuTLB::TLBEvent::getTLBEventVaddr() {…}


    /**
     * Receive a timing translation request on the CPU-side port.
     *
     * The request is accepted only while the TLB has fewer than
     * maxCoalescedReqs translations outstanding; an accepted request is
     * handed to issueTLBLookup() and counted as outstanding.
     *
     * @param pkt translation request packet
     * @return true if the request was accepted, false if it was refused
     */
    bool
    GpuTLB::CpuSidePort::recvTimingReq(PacketPtr pkt)
    {
        // Refuse new work once the outstanding-request limit is reached.
        if (tlb->outstandingReqs >= tlb->maxCoalescedReqs) {
            DPRINTF(GPUTLB, "Reached maxCoalescedReqs number %d\n",
                    tlb->outstandingReqs);
            return false;
        }

        tlb->issueTLBLookup(pkt);
        // One more translation is now in flight.
        tlb->outstandingReqs++;
        return true;
    }

    GpuTLB::CpuSidePort::recvTimingReq(PacketPtr pkt) {…}


    /**
     * Finish a functional translation: pick the TLB entry to use, run the
     * paging protection checks and write the physical address (and the
     * UNCACHEABLE flag, if the entry is uncacheable) into the request.
     *
     * On a miss the entry attached to the sender state must be non-null;
     * when allocationPolicy is set it is inserted into this TLB and the
     * inserted copy is used for the translation.
     *
     * @param pkt         translation packet carrying a GpuTranslationState
     * @param tlb_outcome TLB_HIT, or anything else to be treated as a miss
     */
    void
    GpuTLB::handleFuncTranslationReturn(PacketPtr pkt, tlbOutcome tlb_outcome)
    {
        GpuTranslationState *state =
            safe_cast<GpuTranslationState*>(pkt->senderState);

        const Addr vaddr = pkt->req->getVaddr();

        // Entry the translation is finally performed with.
        TlbEntry *entry = nullptr;

        if (tlb_outcome != TLB_HIT) {
            DPRINTF(GPUTLB, "Functional Translation Done - TLB miss for addr "
                    "%#x\n", vaddr);

            TlbEntry *fetched = safe_cast<TlbEntry *>(state->tlbEntry);
            assert(fetched);

            if (allocationPolicy) {
                const Addr virt_page_addr =
                    roundDown(vaddr, X86ISA::PageBytes);

                DPRINTF(GPUTLB, "allocating entry w/ addr %#x\n",
                        virt_page_addr);

                entry = insert(virt_page_addr, *fetched);
            } else {
                entry = fetched;
            }

            assert(entry);
        } else {
            DPRINTF(GPUTLB, "Functional Translation Done - TLB hit for addr "
                    "%#x\n", vaddr);

            entry = safe_cast<TlbEntry *>(state->tlbEntry);
        }

        DPRINTF(GPUTLB, "Entry found with vaddr %#x, doing protection checks "
                "while paddr was %#x.\n", entry->vaddr,
                entry->paddr);

        // Protection checks are skipped for prefetches and when no entry
        // is attached to the sender state.
        const bool run_checks = !state->isPrefetch && state->tlbEntry;
        if (run_checks)
            pagingProtectionChecks(state->tc, pkt, entry, state->tlbMode);

        // Combine the entry's physical base with the in-page offset.
        const int page_bytes = entry->size();
        const Addr page_offset = vaddr & (page_bytes - 1);
        const Addr paddr = entry->paddr | page_offset;
        DPRINTF(GPUTLB, "Translated %#x -> %#x.\n", vaddr, paddr);

        pkt->req->setPaddr(paddr);

        if (entry->uncacheable)
            pkt->req->setFlags(Request::UNCACHEABLE);
    }

    GpuTLB::handleFuncTranslationReturn(PacketPtr pkt, tlbOutcome tlb_outcome) {…}


    /**
     * Functional translation entry point on the CPU-side port.
     *
     * This is used for atomic translations, so everything has to happen
     * during the same cycle: the local lookup, the propagation to the TLB
     * below (if there is one) or the page table lookup (if there is not),
     * and finally handleFuncTranslationReturn(), which writes the physical
     * address into pkt->req.
     *
     * A prefetch that finds no translation returns early and leaves the
     * request without a physical address.
     *
     * @param pkt translation packet; its senderState must be a
     *            GpuTranslationState
     */
    void
    GpuTLB::CpuSidePort::recvFunctional(PacketPtr pkt)
    {
        GpuTranslationState *sender_state =
            safe_cast<GpuTranslationState*>(pkt->senderState);

        ThreadContext *tc = sender_state->tc;
        // Prefetches do not contribute to the statistics.
        bool update_stats = !sender_state->isPrefetch;

        Addr virt_page_addr = roundDown(pkt->req->getVaddr(),
                                        X86ISA::PageBytes);

        if (update_stats)
            tlb->updatePageFootprint(virt_page_addr);

        // do the TLB lookup; stats are updated only for non-prefetches
        bool success = tlb->tlbLookup(pkt->req, tc, update_stats);
        tlbOutcome tlb_outcome = success ? TLB_HIT : TLB_MISS;

        // functional mode means no coalescing
        // global metrics are the same as the local metrics
        if (update_stats) {
            tlb->stats.globalNumTLBAccesses++;

            if (success) {
                sender_state->hitLevel = sender_state->reqCnt.size();
                tlb->stats.globalNumTLBHits++;
            }
        }

        if (!success) {
            if (update_stats)
                tlb->stats.globalNumTLBMisses++;

            if (tlb->hasMemSidePort) {
                // there is a TLB below -> propagate down the TLB hierarchy
                tlb->memSidePort[0]->sendFunctional(pkt);

                // If no valid translation from a prefetch, then just return
                if (sender_state->isPrefetch && !pkt->req->hasPaddr())
                    return;
            } else {
                // Need to access the page table and update the TLB
                DPRINTF(GPUTLB, "Doing a page walk for address %#x\n",
                        virt_page_addr);

                Process *p = tc->getProcessPtr();

                Addr vaddr = pkt->req->getVaddr();

                Addr alignedVaddr = p->pTable->pageAlign(vaddr);
                assert(alignedVaddr == virt_page_addr);

                const EmulationPageTable::Entry *pte =
                        p->pTable->lookup(vaddr);
                // Try to fix up a missing mapping (never for instruction
                // fetches) and look the address up a second time.
                if (!pte && sender_state->tlbMode != BaseMMU::Execute &&
                        p->fixupFault(vaddr)) {
                    pte = p->pTable->lookup(vaddr);
                }

                // A failed prefetch sends an empty TLB entry back so that
                // it can be figured out as empty and handled accordingly.
                if (!pte && sender_state->isPrefetch) {
                    DPRINTF(GPUPrefetch, "Prefetch failed %#x\n",
                            alignedVaddr);

                    sender_state->tlbEntry = nullptr;

                    return;
                }

                // no PageFaults are permitted after
                // the second page table lookup
                assert(pte);

                DPRINTF(GPUTLB, "Mapping %#x to %#x\n", alignedVaddr,
                        pte->paddr);

                sender_state->tlbEntry =
                    new TlbEntry(p->pid(), virt_page_addr,
                                 pte->paddr, false, false);
            }
        } else {
            // Log the address itself. Passing the result of an extra
            // tlb->lookup() here would print a TlbEntry pointer and, since
            // lookup() updates the LRU state by default, would make
            // replacement depend on whether the debug flag is enabled.
            DPRINTF(GPUPrefetch, "Functional Hit for vaddr %#x\n",
                    pkt->req->getVaddr());

            TlbEntry *entry = tlb->lookup(pkt->req->getVaddr(),
                                             update_stats);

            assert(entry);

            // Attach a freshly allocated entry built from the hit's
            // vaddr/paddr to the sender state.
            Process *p = tc->getProcessPtr();
            sender_state->tlbEntry =
                new TlbEntry(p->pid(), entry->vaddr, entry->paddr,
                             false, false);
        }

        // This is the function that would populate pkt->req with the paddr of
        // the translation. But if no translation happens (i.e Prefetch fails)
        // then the early returns in the above code will keep this function
        // from executing.
        tlb->handleFuncTranslationReturn(pkt, tlb_outcome);
    }

    GpuTLB::CpuSidePort::recvFunctional(PacketPtr pkt) {…}


    /**
     * Retry notification on the CPU-side port. Never expected: reaching
     * this function is treated as a fatal simulator error.
     */
    void


    GpuTLB::CpuSidePort::recvReqRetry()

    {

        // The CPUSidePort never sends anything but replies. No retries

        // expected.

        panic("recvReqRetry called");

    }

    GpuTLB::CpuSidePort::recvReqRetry() {…}


    /**
     * @return an empty address range list; the ranges are currently not
     *         checked by the requestor.
     */
    AddrRangeList
    GpuTLB::CpuSidePort::getAddrRanges() const
    {
        return AddrRangeList();
    }

    GpuTLB::CpuSidePort::getAddrRanges() const {…}


    /**
     * A translation response came back on the mem-side port.
     *
     * The TLBEvent registered for the packet's virtual page is marked
     * MISS_RETURN and scheduled one clock period from now.
     *
     * @param pkt response packet
     * @return always true
     */
    bool
    GpuTLB::MemSidePort::recvTimingResp(PacketPtr pkt)
    {
        const Addr page_vaddr = roundDown(pkt->req->getVaddr(),
                                          X86ISA::PageBytes);

        DPRINTF(GPUTLB, "MemSidePort recvTiming for virt_page_addr %#x\n",
                page_vaddr);

        // The event created when the lookup was issued must still exist
        // and must belong to this page.
        TLBEvent *pending = tlb->translationReturnEvent[page_vaddr];
        assert(pending);
        assert(page_vaddr == pending->getTLBEventVaddr());

        pending->updateOutcome(MISS_RETURN);

        const auto resume_tick = curTick() + tlb->clockPeriod();
        tlb->schedule(pending, resume_tick);

        return true;
    }

    GpuTLB::MemSidePort::recvTimingResp(PacketPtr pkt) {…}


    /**
     * Retry notification on the mem-side port. Never expected: reaching
     * this function is treated as a fatal simulator error.
     */
    void


    GpuTLB::MemSidePort::recvReqRetry()

    {

        // No retries should reach the TLB. The retries

        // should only reach the TLBCoalescer.

        panic("recvReqRetry called");

    }

    GpuTLB::MemSidePort::recvReqRetry() {…}


    void


    GpuTLB::cleanup()

    {

        while (!cleanupQueue.empty()) {

            Addr cleanup_addr = cleanupQueue.front();

            cleanupQueue.pop();


            // delete TLBEvent

            TLBEvent * old_tlb_event = translationReturnEvent[cleanup_addr];

            delete old_tlb_event;

            translationReturnEvent.erase(cleanup_addr);


            // update number of outstanding requests

            outstandingReqs--;

        }


        for (int i = 0; i < cpuSidePort.size(); ++i) {

            cpuSidePort[i]->sendRetryReq();

        }

    }

    GpuTLB::cleanup() {…}


    /**
     * Record one access to a page in the TLBFootprint table.
     *
     * The first access to a page creates its record and bumps
     * numUniquePages; later accesses add the ticks elapsed since the
     * previous access to the page's total reuse distance. When
     * accessDistance is enabled, the current value of localNumTLBAccesses
     * is appended to the page's access list as well.
     *
     * @param virt_page_addr key identifying the page
     */
    void
    GpuTLB::updatePageFootprint(Addr virt_page_addr)
    {
        // Zeroed record, used only if the page has not been seen before.
        AccessInfo fresh_info;
        fresh_info.lastTimeAccessed = 0;
        fresh_info.accessesPerPage = 0;
        fresh_info.totalReuseDistance = 0;
        fresh_info.sumDistance = 0;
        fresh_info.meanDistance = 0;

        std::pair<AccessPatternTable::iterator, bool> slot =
            TLBFootprint.insert(
                AccessPatternTable::value_type(virt_page_addr, fresh_info));

        AccessInfo &page_info = slot.first->second;
        const bool newly_inserted = slot.second;

        if (newly_inserted) {
            stats.numUniquePages++;
        } else {
            int ticks_since_last = curTick() - page_info.lastTimeAccessed;
            page_info.totalReuseDistance += ticks_since_last;
        }

        page_info.accessesPerPage++;
        page_info.lastTimeAccessed = curTick();

        if (accessDistance) {
            page_info.localTLBAccesses.push_back(
                stats.localNumTLBAccesses.value());
        }
    }

    GpuTLB::updatePageFootprint(Addr virt_page_addr) {…}


    /**
     * Finalize the page-footprint statistics.
     *
     * Computes the average reuse distance over all pages recorded in
     * TLBFootprint and stores it in stats.avgReuseDistance. When
     * accessDistance is enabled, it additionally writes one CSV line per
     * page (page, max, mean and standard deviation of the access distance)
     * to a file created in the simulator output directory. TLBFootprint is
     * cleared before returning.
     */
    void
    GpuTLB::exitCallback()
    {
        std::ostream *page_stat_file = nullptr;

        if (accessDistance) {
            // print per page statistics to a separate file (.csv format)
            // simout is the gem5 output directory (default is m5out or the
            // one specified with -d)
            page_stat_file = simout.create(name().c_str())->stream();

            // print header
            *page_stat_file
                << "page,max_access_distance,mean_access_distance, "
                << "stddev_distance" << std::endl;
        }

        // update avg. reuse distance footprint
        unsigned int sum_avg_reuse_distance_per_page = 0;

        // iterate through all pages seen by this TLB
        for (auto &iter : TLBFootprint) {
            auto &info = iter.second;

            sum_avg_reuse_distance_per_page +=
                info.totalReuseDistance / info.accessesPerPage;

            if (!accessDistance)
                continue;

            // First pass: turn the recorded access counters into distances
            // between consecutive accesses to this page. The first sample
            // becomes 0; sample i becomes counter[i] - counter[i-1] - 1.
            unsigned int tmp = info.localTLBAccesses[0];
            unsigned int prev = tmp;

            for (size_t i = 0; i < info.localTLBAccesses.size(); ++i) {
                if (i) {
                    tmp = prev + 1;
                }

                prev = info.localTLBAccesses[i];
                // update the localTLBAccesses value
                // with the actual difference
                info.localTLBAccesses[i] -= tmp;
                // compute the sum of AccessDistance per page
                // used later for mean
                info.sumDistance += info.localTLBAccesses[i];
            }

            info.meanDistance = info.sumDistance / info.accessesPerPage;

            // Second pass (the mean is needed first): max and std. dev.
            unsigned int max_distance = 0;
            uint64_t sum_sq_deviation = 0;
            const unsigned int mean_distance = info.meanDistance;

            for (size_t i = 0; i < info.localTLBAccesses.size(); ++i) {
                const unsigned int distance = info.localTLBAccesses[i];

                if (distance > max_distance) {
                    max_distance = distance;
                }

                // Take the magnitude of the deviation: the operands are
                // unsigned, so subtracting the mean directly would wrap
                // around for every sample that lies below the mean.
                const uint64_t deviation = distance > mean_distance ?
                    distance - mean_distance : mean_distance - distance;
                sum_sq_deviation += deviation * deviation;
            }

            const unsigned int stddev_distance = std::sqrt(
                static_cast<double>(sum_sq_deviation /
                                    info.accessesPerPage));

            if (page_stat_file) {
                *page_stat_file << std::hex << iter.first << ",";
                *page_stat_file << std::dec << max_distance << ",";
                *page_stat_file << std::dec << info.meanDistance
                                << ",";
                *page_stat_file << std::dec << stddev_distance;
                *page_stat_file << std::endl;
            }

            // erase the localTLBAccesses array
            info.localTLBAccesses.clear();
        }

        if (!TLBFootprint.empty()) {
            stats.avgReuseDistance =
                sum_avg_reuse_distance_per_page / TLBFootprint.size();
        }

        //clear the TLBFootprint map
        TLBFootprint.clear();
    }

    GpuTLB::exitCallback() {…}


    /**
     * Register every GPU TLB statistic with the given parent group and
     * define the derived statistics (latency and miss rates) in terms of
     * the raw counters.
     *
     * @param parent statistics group these stats are attached to
     */
    GpuTLB::GpuTLBStats::GpuTLBStats(statistics::Group *parent)

        : statistics::Group(parent),

          ADD_STAT(localNumTLBAccesses, "Number of TLB accesses"),

          ADD_STAT(localNumTLBHits, "Number of TLB hits"),

          ADD_STAT(localNumTLBMisses, "Number of TLB misses"),

          ADD_STAT(localTLBMissRate, "TLB miss rate"),

          ADD_STAT(globalNumTLBAccesses, "Number of TLB accesses"),

          ADD_STAT(globalNumTLBHits, "Number of TLB hits"),

          ADD_STAT(globalNumTLBMisses, "Number of TLB misses"),

          ADD_STAT(globalTLBMissRate, "TLB miss rate"),

          ADD_STAT(accessCycles, "Cycles spent accessing this TLB level"),

          ADD_STAT(pageTableCycles, "Cycles spent accessing the page table"),

          ADD_STAT(numUniquePages, "Number of unique pages touched"),

          ADD_STAT(localCycles, "Number of cycles spent in queue for all "

                   "incoming reqs"),

          ADD_STAT(localLatency, "Avg. latency over incoming coalesced reqs"),

          ADD_STAT(avgReuseDistance, "avg. reuse distance over all pages (in "

                   "ticks)")

    {

        // Average latency: queued cycles per local TLB access.
        localLatency = localCycles / localNumTLBAccesses;


        // Miss rates, expressed as percentages of the respective accesses.
        localTLBMissRate = 100 * localNumTLBMisses / localNumTLBAccesses;

        globalTLBMissRate = 100 * globalNumTLBMisses / globalNumTLBAccesses;

    }

    GpuTLB::GpuTLBStats::GpuTLBStats(statistics::Group *parent) {…}

} // namespace X86ISA

namespace X86ISA {…}

} // namespace gem5

tlb.hh

faults.hh

misc.hh

trace.hh

DPRINTF
#define DPRINTF(x,...)
Definition trace.hh:209

bitfield.hh

data
const char data[]
Definition circlebuf.test.cc:48

gem5::BaseMMU::Execute
@ Execute
Definition mmu.hh:56

gem5::BaseMMU::Write
@ Write
Definition mmu.hh:56

gem5::BaseMMU::Read
@ Read
Definition mmu.hh:56

gem5::CheckpointIn
Definition serialize.hh:69

gem5::ClockedObject
The ClockedObject class extends the SimObject with a clock and accessor functions to relate ticks to ...
Definition clocked_object.hh:235

gem5::Clocked::cyclesToTicks
Tick cyclesToTicks(Cycles c) const
Definition clocked_object.hh:227

gem5::Cycles
Cycles is a wrapper class for representing cycle counts, i.e.
Definition types.hh:79

gem5::Event
Definition eventq.hh:255

gem5::Named::name
virtual std::string name() const
Definition named.hh:47

gem5::OutputDirectory::create
OutputStream * create(const std::string &name, bool binary=false, bool no_gz=false)
Creates a file in this directory (optionally compressed).
Definition output.cc:210

gem5::OutputStream::stream
std::ostream * stream() const
Get the output underlying output stream.
Definition output.hh:62

gem5::PCStateBase::instAddr
Addr instAddr() const
Returns the memory address of the instruction this PC points to.
Definition pcstate.hh:108

gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295

gem5::Packet::makeTimingResponse
void makeTimingResponse()
Definition packet.hh:1080

gem5::Packet::senderState
SenderState * senderState
This packet's sender state.
Definition packet.hh:545

gem5::Packet::setData
void setData(const uint8_t *p)
Copy data into the packet from the provided pointer.
Definition packet.hh:1293

gem5::Packet::req
RequestPtr req
A pointer to the original request.
Definition packet.hh:377

gem5::Packet::isRequest
bool isRequest() const
Definition packet.hh:597

gem5::Port
Ports are used to interface objects to each other.
Definition port.hh:62

gem5::Process
Definition process.hh:68

gem5::Request::STRICT_ORDER
@ STRICT_ORDER
The request is required to be strictly ordered by CPU models and is non-speculative.
Definition request.hh:135

gem5::Request::UNCACHEABLE
@ UNCACHEABLE
The request is to an uncacheable address.
Definition request.hh:125

gem5::Request::READ_MODIFY_WRITE
@ READ_MODIFY_WRITE
This request is a read which will be followed by a write.
Definition request.hh:161

gem5::ThreadContext
ThreadContext is the external interface to all thread state for anything outside of the CPU.
Definition thread_context.hh:89

gem5::ThreadContext::readMiscReg
virtual RegVal readMiscReg(RegIndex misc_reg)=0

gem5::ThreadContext::setMiscReg
virtual void setMiscReg(RegIndex misc_reg, RegVal val)=0

gem5::ThreadContext::pcState
virtual const PCStateBase & pcState() const =0

gem5::ThreadContext::readMiscRegNoEffect
virtual RegVal readMiscRegNoEffect(RegIndex misc_reg) const =0

gem5::ThreadContext::getProcessPtr
virtual Process * getProcessPtr()=0

gem5::ThreadContext::contextId
virtual ContextID contextId() const =0

gem5::X86ISA::GpuTLB::CpuSidePort::recvReqRetry
virtual void recvReqRetry()
Definition tlb.cc:1235

gem5::X86ISA::GpuTLB::CpuSidePort::recvFunctional
virtual void recvFunctional(PacketPtr pkt)
Receive a functional request packet from the peer.
Definition tlb.cc:1123

gem5::X86ISA::GpuTLB::CpuSidePort::recvTimingReq
virtual bool recvTimingReq(PacketPtr pkt)
recvTiming receives a coalesced timing request from a TLBCoalescer and it calls issueTLBLookup() It o...
Definition tlb.cc:1028

gem5::X86ISA::GpuTLB::CpuSidePort::getAddrRanges
virtual AddrRangeList getAddrRanges() const
Get a list of the non-overlapping address ranges the owner is responsible for.
Definition tlb.cc:1243

gem5::X86ISA::GpuTLB::MemSidePort::recvReqRetry
virtual void recvReqRetry()
Called by the peer if sendTimingReq was called on this peer (causing recvTimingReq to be called on th...
Definition tlb.cc:1276

gem5::X86ISA::GpuTLB::MemSidePort::recvTimingResp
virtual bool recvTimingResp(PacketPtr pkt)
MemSidePort receives the packet back.
Definition tlb.cc:1257

gem5::X86ISA::GpuTLB::TLBEvent
Definition tlb.hh:286

gem5::X86ISA::GpuTLB::TLBEvent::getTLBEventVaddr
Addr getTLBEventVaddr()
Definition tlb.cc:1016

gem5::X86ISA::GpuTLB::TLBEvent::updateOutcome
void updateOutcome(tlbOutcome _outcome)
Definition tlb.cc:1010

gem5::X86ISA::GpuTLB::TLBEvent::TLBEvent
TLBEvent(GpuTLB *_tlb, Addr _addr, tlbOutcome outcome, PacketPtr _pkt)
Definition tlb.cc:751

gem5::X86ISA::GpuTLB::TLBEvent::description
const char * description() const
Return a C string describing the event.
Definition tlb.cc:1004

gem5::X86ISA::GpuTLB::TLBEvent::process
void process()
Definition tlb.cc:998

gem5::X86ISA::GpuTLB::Translation
Definition tlb.hh:82

gem5::X86ISA::GpuTLB::Translation::finish
virtual void finish(Fault fault, const RequestPtr &req, ThreadContext *tc, Mode mode)=0
The memory for this object may be dynamically allocated, and it may be responsible for cleaning itsle...

gem5::X86ISA::GpuTLB
Definition tlb.hh:66

gem5::X86ISA::GpuTLB::exitCallback
void exitCallback()
Definition tlb.cc:1343

gem5::X86ISA::GpuTLB::Params
X86GPUTLBParams Params
Definition tlb.hh:75

gem5::X86ISA::GpuTLB::maxCoalescedReqs
int maxCoalescedReqs
Definition tlb.hh:269

gem5::X86ISA::GpuTLB::issueTLBLookup
void issueTLBLookup(PacketPtr pkt)
Do the TLB lookup for this coalesced request and schedule another event <TLB access latency> cycles l...
Definition tlb.cc:665

gem5::X86ISA::GpuTLB::translationReturnEvent
std::unordered_map< Addr, TLBEvent * > translationReturnEvent
Definition tlb.hh:308

gem5::X86ISA::GpuTLB::translationReturn
void translationReturn(Addr virtPageAddr, tlbOutcome outcome, PacketPtr pkt)
A TLBEvent is scheduled after the TLB lookup and helps us take the appropriate actions: (e....
Definition tlb.cc:884

gem5::X86ISA::GpuTLB::invalidateNonGlobal
void invalidateNonGlobal()
Definition tlb.cc:249

gem5::X86ISA::GpuTLB::Mode
enum BaseMMU::Mode Mode
Definition tlb.hh:79

gem5::X86ISA::GpuTLB::cleanupEvent
EventFunctionWrapper cleanupEvent
Definition tlb.hh:318

gem5::X86ISA::GpuTLB::outstandingReqs
int outstandingReqs
Definition tlb.hh:273

gem5::X86ISA::GpuTLB::cleanup
void cleanup()
Definition tlb.cc:1284

gem5::X86ISA::GpuTLB::size
int size
Definition tlb.hh:116

gem5::X86ISA::GpuTLB::lookupIt
EntryList::iterator lookupIt(Addr va, bool update_lru=true)
Definition tlb.cc:186

gem5::X86ISA::GpuTLB::translateInt
Fault translateInt(bool read, const RequestPtr &req, ThreadContext *tc)
Definition tlb.cc:302

gem5::X86ISA::GpuTLB::GpuTLB
GpuTLB(const Params &p)
Definition tlb.cc:67

gem5::X86ISA::GpuTLB::~GpuTLB
~GpuTLB()
Definition tlb.cc:131

gem5::X86ISA::GpuTLB::translate
Fault translate(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode, bool &delayedResponse, bool timing, int &latency)
Definition tlb.cc:424

gem5::X86ISA::GpuTLB::TLBFootprint
AccessPatternTable TLBFootprint
Definition tlb.hh:346

gem5::X86ISA::GpuTLB::demapPage
void demapPage(Addr va, uint64_t asn)
Definition tlb.cc:267

gem5::X86ISA::GpuTLB::configAddress
uint32_t configAddress
Definition tlb.hh:72

gem5::X86ISA::GpuTLB::unserialize
virtual void unserialize(CheckpointIn &cp) override
Unserialize an object.
Definition tlb.cc:655

gem5::X86ISA::GpuTLB::missLatency1
int missLatency1
Definition tlb.hh:171

gem5::X86ISA::GpuTLB::setMask
Addr setMask
Definition tlb.hh:124

gem5::X86ISA::GpuTLB::lookup
TlbEntry * lookup(Addr va, bool update_lru=true)
Definition tlb.cc:216

gem5::X86ISA::GpuTLB::tlbOutcome
tlbOutcome
Definition tlb.hh:194

gem5::X86ISA::GpuTLB::TLB_MISS
@ TLB_MISS
Definition tlb.hh:194

gem5::X86ISA::GpuTLB::TLB_HIT
@ TLB_HIT
Definition tlb.hh:194

gem5::X86ISA::GpuTLB::MISS_RETURN
@ MISS_RETURN
Definition tlb.hh:194

gem5::X86ISA::GpuTLB::PAGE_WALK
@ PAGE_WALK
Definition tlb.hh:194

gem5::X86ISA::GpuTLB::tlb
std::vector< TlbEntry > tlb
Definition tlb.hh:143

gem5::X86ISA::GpuTLB::memSidePort
std::vector< MemSidePort * > memSidePort
Definition tlb.hh:262

gem5::X86ISA::GpuTLB::accessDistance
bool accessDistance
Print out accessDistance stats.
Definition tlb.hh:141

gem5::X86ISA::GpuTLB::invalidateAll
void invalidateAll()
Definition tlb.cc:229

gem5::X86ISA::GpuTLB::getPort
Port & getPort(const std::string &if_name, PortID idx=InvalidPortID) override
Get a port with a given name and index.
Definition tlb.cc:138

gem5::X86ISA::GpuTLB::walker
Walker * walker
Definition tlb.hh:107

gem5::X86ISA::GpuTLB::cleanupQueue
std::queue< Addr > cleanupQueue
Definition tlb.hh:312

gem5::X86ISA::GpuTLB::FA
bool FA
true if this is a fully-associative TLB
Definition tlb.hh:123

gem5::X86ISA::GpuTLB::insert
TlbEntry * insert(Addr vpn, TlbEntry &entry)
Definition tlb.cc:160

gem5::X86ISA::GpuTLB::numSets
int numSets
Definition tlb.hh:118

gem5::X86ISA::GpuTLB::hitLatency
int hitLatency
Definition tlb.hh:170

gem5::X86ISA::GpuTLB::stats
gem5::X86ISA::GpuTLB::GpuTLBStats stats

gem5::X86ISA::GpuTLB::translateTiming
void translateTiming(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode, int &latency)
Definition tlb.cc:629

gem5::X86ISA::GpuTLB::handleFuncTranslationReturn
void handleFuncTranslationReturn(PacketPtr pkt, tlbOutcome outcome)
handleFuncTranslationReturn is called on a TLB hit, when a TLB miss returns or when a page fault retu...
Definition tlb.cc:1051

gem5::X86ISA::GpuTLB::freeList
std::vector< EntryList > freeList
Definition tlb.hh:150

gem5::X86ISA::GpuTLB::assoc
int assoc
Definition tlb.hh:117

gem5::X86ISA::GpuTLB::entryList
std::vector< EntryList > entryList
An entryList per set is the equivalent of an LRU stack; it's used to guide replacement decisions.
Definition tlb.hh:159

gem5::X86ISA::GpuTLB::serialize
virtual void serialize(CheckpointOut &cp) const override
Serialize an object.
Definition tlb.cc:650

gem5::X86ISA::GpuTLB::setConfigAddress
void setConfigAddress(uint32_t addr)
Definition tlb.cc:243

gem5::X86ISA::GpuTLB::hasMemSidePort
bool hasMemSidePort
if true, then this is not the last level TLB
Definition tlb.hh:135

gem5::X86ISA::GpuTLB::allocationPolicy
bool allocationPolicy
Allocation Policy: true if we always allocate on a hit, false otherwise.
Definition tlb.hh:130

gem5::X86ISA::GpuTLB::handleTranslationReturn
void handleTranslationReturn(Addr addr, tlbOutcome outcome, PacketPtr pkt)
handleTranslationReturn is called on a TLB hit, when a TLB miss returns or when a page fault returns.
Definition tlb.cc:797

gem5::X86ISA::GpuTLB::updatePageFootprint
void updatePageFootprint(Addr virt_page_addr)
Definition tlb.cc:1308

gem5::X86ISA::GpuTLB::tlbLookup
bool tlbLookup(const RequestPtr &req, ThreadContext *tc, bool update_stats)
TLB_lookup will only perform a TLB lookup returning true on a TLB hit and false on a TLB miss.
Definition tlb.cc:371

gem5::X86ISA::GpuTLB::getWalker
Walker * getWalker()
Definition tlb.cc:643

gem5::X86ISA::GpuTLB::missLatency2
int missLatency2
Definition tlb.hh:172

gem5::X86ISA::GpuTLB::cpuSidePort
std::vector< CpuSidePort * > cpuSidePort
Definition tlb.hh:260

gem5::X86ISA::GpuTLB::translateAtomic
Fault translateAtomic(const RequestPtr &req, ThreadContext *tc, Mode mode, int &latency)
Definition tlb.cc:619

gem5::X86ISA::GpuTLB::pagingProtectionChecks
void pagingProtectionChecks(ThreadContext *tc, PacketPtr pkt, TlbEntry *tlb_entry, Mode mode)
Do Paging protection checks.
Definition tlb.cc:763

gem5::X86ISA::Walker
Definition pagetable_walker.hh:61

gem5::statistics::Group
Statistics container.
Definition group.hh:93

gem5::statistics::ScalarBase::size
size_type size() const
Return the number of elements, always 1 for a scalar.
Definition statistics.hh:615

gem5::statistics::ScalarBase::value
Counter value() const
Return the current value of this stat as its base type.
Definition statistics.hh:621

std::list< AddrRange >

std::pair
STL pair class.
Definition stl.hh:58

base.hh

thread_context.hh

gpu_translation_state.hh

ADD_STAT
#define ADD_STAT(n,...)
Convenience macro to add a stat to a statistics group.
Definition group.hh:75

gem5::roundDown
static constexpr T roundDown(const T &val, const U &align)
This function is used to align addresses in memory.
Definition intmath.hh:279

gem5::bits
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
Definition bitfield.hh:79

gem5::mbits
constexpr T mbits(T val, unsigned first, unsigned last)
Mask off the given bits in place like bits() but without shifting.
Definition bitfield.hh:106

gem5::EventBase::Maximum_Pri
static const Priority Maximum_Pri
Maximum priority.
Definition eventq.hh:244

gem5::Event::scheduled
bool scheduled() const
Determine if the current event is scheduled.
Definition eventq.hh:458

gem5::EventManager::schedule
void schedule(Event &event, Tick when)
Definition eventq.hh:1012

panic
#define panic(...)
This implements a cprintf based panic() function.
Definition logging.hh:188

fatal
#define fatal(...)
This implements a cprintf based fatal() function.
Definition logging.hh:200

flags
uint8_t flags
Definition helpers.cc:87

logging.hh

warn_once
#define warn_once(...)
Definition logging.hh:260

microldstop.hh

msr.hh

gem5::ArmISA::i
Bitfield< 7 > i
Definition misc_types.hh:67

gem5::ArmISA::set
Bitfield< 12, 11 > set
Definition misc_types.hh:792

gem5::ArmISA::attr
attr
Definition misc_types.hh:745

gem5::ArmISA::va
Bitfield< 8 > va
Definition misc_types.hh:357

gem5::ArmISA::tlb
Bitfield< 59, 56 > tlb
Definition misc_types.hh:119

gem5::MipsISA::vaddr
vaddr
Definition pra_constants.hh:278

gem5::X86ISA::misc_reg::segSel
static RegIndex segSel(int index)
Definition misc.hh:515

gem5::X86ISA::misc_reg::segAttr
static RegIndex segAttr(int index)
Definition misc.hh:543

gem5::X86ISA::misc_reg::segBase
static RegIndex segBase(int index)
Definition misc.hh:522

gem5::X86ISA::misc_reg::Cr0
@ Cr0
Definition misc.hh:116

gem5::X86ISA::misc_reg::ApicBase
@ ApicBase
Definition misc.hh:403

gem5::X86ISA::misc_reg::M5Reg
@ M5Reg
Definition misc.hh:148

gem5::X86ISA::misc_reg::PciConfigAddress
@ PciConfigAddress
Definition misc.hh:406

gem5::X86ISA::misc_reg::segLimit
static RegIndex segLimit(int index)
Definition misc.hh:536

gem5::X86ISA::segment_idx::Tsg
@ Tsg
Definition segment.hh:58

gem5::X86ISA::segment_idx::Ms
@ Ms
Definition segment.hh:60

gem5::X86ISA::segment_idx::Hs
@ Hs
Definition segment.hh:56

gem5::X86ISA::segment_idx::Es
@ Es
Definition segment.hh:50

gem5::X86ISA::segment_idx::Ls
@ Ls
Definition segment.hh:59

gem5::X86ISA::segment_idx::Idtr
@ Idtr
Definition segment.hh:65

gem5::X86ISA::AddrSizeFlagMask
constexpr auto AddrSizeFlagMask
Definition ldstflags.hh:58

gem5::X86ISA::PhysAddrPrefixPciConfig
const Addr PhysAddrPrefixPciConfig
Definition x86_traits.hh:69

gem5::X86ISA::base
Bitfield< 51, 12 > base
Definition pagetable.hh:141

gem5::X86ISA::expandDown
Bitfield< 14 > expandDown
Definition misc.hh:1031

gem5::X86ISA::IntAddrPrefixIO
const Addr IntAddrPrefixIO
Definition x86_traits.hh:66

gem5::X86ISA::AddrSizeFlagShift
constexpr auto AddrSizeFlagShift
Definition ldstflags.hh:57

gem5::X86ISA::SegmentFlagMask
constexpr Request::FlagsType SegmentFlagMask
Definition ldstflags.hh:54

gem5::X86ISA::limit
BitfieldType< SegDescriptorLimit > limit
Definition misc.hh:959

gem5::X86ISA::PageShift
const Addr PageShift
Definition page_size.hh:48

gem5::X86ISA::addr
Bitfield< 3 > addr
Definition types.hh:84

gem5::X86ISA::seg
Bitfield< 2, 0 > seg
Definition types.hh:87

gem5::X86ISA::PhysAddrPrefixIO
const Addr PhysAddrPrefixIO
Definition x86_traits.hh:68

gem5::X86ISA::CPL0FlagBit
constexpr auto CPL0FlagBit
Definition ldstflags.hh:56

gem5::X86ISA::mode
Bitfield< 3 > mode
Definition types.hh:192

gem5::X86ISA::p
Bitfield< 0 > p
Definition pagetable.hh:151

gem5::X86ISA::IntAddrPrefixCPUID
const Addr IntAddrPrefixCPUID
Definition x86_traits.hh:64

gem5::X86ISA::IntAddrPrefixMSR
const Addr IntAddrPrefixMSR
Definition x86_traits.hh:65

gem5::X86ISA::IntAddrPrefixMask
const Addr IntAddrPrefixMask
Definition x86_traits.hh:63

gem5::X86ISA::x
Bitfield< 1 > x
Definition types.hh:108

gem5::X86ISA::msrAddrToIndex
bool msrAddrToIndex(RegIndex &reg_num, Addr addr)
Find and return the misc reg corresponding to an MSR address.
Definition msr.cc:150

gem5::X86ISA::mask
mask
Definition misc.hh:831

gem5::X86ISA::x86LocalAPICAddress
static Addr x86LocalAPICAddress(const uint8_t id, const uint16_t addr)
Definition x86_traits.hh:92

gem5::X86ISA::offset
offset
Definition misc.hh:1059

gem5::X86ISA::PageBytes
const Addr PageBytes
Definition page_size.hh:49

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::Fault
std::shared_ptr< FaultBase > Fault
Definition types.hh:249

gem5::letoh
T letoh(T value)
Definition byteswap.hh:173

gem5::RequestPtr
std::shared_ptr< Request > RequestPtr
Definition request.hh:94

gem5::RegIndex
uint16_t RegIndex
Definition types.hh:176

gem5::cprintf
void cprintf(const char *format, const Args &...args)
Definition cprintf.hh:155

gem5::curTick
Tick curTick()
The universal simulation clock.
Definition cur_tick.hh:46

gem5::CheckpointOut
std::ostream CheckpointOut
Definition serialize.hh:66

gem5::Addr
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition types.hh:147

gem5::PortID
int16_t PortID
Port index/ID type, and a symbolic name for an invalid port id.
Definition types.hh:245

gem5::FullSystem
bool FullSystem
The FullSystem variable can be used to determine the current mode of simulation.
Definition root.cc:220

gem5::simout
OutputDirectory simout
Definition output.cc:62

gem5::htole
T htole(T value)
Definition byteswap.hh:172

gem5::RegVal
uint64_t RegVal
Definition types.hh:173

gem5::csprintf
std::string csprintf(const char *format, const Args &...args)
Definition cprintf.hh:161

gem5::NoFault
constexpr decltype(nullptr) NoFault
Definition types.hh:253

output.hh

packet_access.hh

page_table.hh
Declarations of a non-full system Page Table.

pseudo_inst.hh

request.hh
Declaration of a request, the overall memory request consisting of the parts of the request that are ...

segment.hh

process.hh

gem5::ArmISA::TlbEntry
Definition pagetable.hh:233

gem5::EmulationPageTable::Entry
Definition page_table.hh:57

gem5::EmulationPageTable::Entry::paddr
Addr paddr
Definition page_table.hh:58

gem5::GpuTranslationState
GPU TranslationState: this is currently somewhat of a bastardization of the usage of SenderState,...
Definition gpu_translation_state.hh:59

gem5::GpuTranslationState::tlbMode
BaseMMU::Mode tlbMode
Definition gpu_translation_state.hh:61

gem5::GpuTranslationState::reqCnt
std::vector< int > reqCnt
Definition gpu_translation_state.hh:83

gem5::GpuTranslationState::isPrefetch
bool isPrefetch
Definition gpu_translation_state.hh:75

gem5::GpuTranslationState::hitLevel
int hitLevel
Definition gpu_translation_state.hh:85

gem5::GpuTranslationState::tc
ThreadContext * tc
Definition gpu_translation_state.hh:63

gem5::GpuTranslationState::tlbEntry
Serializable * tlbEntry
Definition gpu_translation_state.hh:73

gem5::X86ISA::GpuTLB::AccessInfo
This hash map will use the virtual page address as a key and will keep track of total number of acces...
Definition tlb.hh:326

gem5::X86ISA::GpuTLB::AccessInfo::accessesPerPage
unsigned int accessesPerPage
Definition tlb.hh:328

gem5::X86ISA::GpuTLB::AccessInfo::sumDistance
unsigned int sumDistance
Definition tlb.hh:341

gem5::X86ISA::GpuTLB::AccessInfo::totalReuseDistance
unsigned int totalReuseDistance
Definition tlb.hh:330

gem5::X86ISA::GpuTLB::AccessInfo::lastTimeAccessed
unsigned int lastTimeAccessed
Definition tlb.hh:327

gem5::X86ISA::GpuTLB::AccessInfo::meanDistance
unsigned int meanDistance
Definition tlb.hh:342

gem5::X86ISA::GpuTLB::GpuTLBStats::GpuTLBStats
GpuTLBStats(statistics::Group *parent)
Definition tlb.cc:1435

gem5::X86ISA::GpuTLB::GpuTLBStats::localTLBMissRate
statistics::Formula localTLBMissRate
Definition tlb.hh:363

gem5::X86ISA::GpuTLB::GpuTLBStats::globalNumTLBMisses
statistics::Scalar globalNumTLBMisses
Definition tlb.hh:370

gem5::X86ISA::GpuTLB::GpuTLBStats::localCycles
statistics::Scalar localCycles
Definition tlb.hh:379

gem5::X86ISA::GpuTLB::GpuTLBStats::globalTLBMissRate
statistics::Formula globalTLBMissRate
Definition tlb.hh:371

gem5::X86ISA::GpuTLB::GpuTLBStats::localNumTLBHits
statistics::Scalar localNumTLBHits
Definition tlb.hh:361

gem5::X86ISA::GpuTLB::GpuTLBStats::numUniquePages
statistics::Scalar numUniquePages
Definition tlb.hh:377

gem5::X86ISA::GpuTLB::GpuTLBStats::avgReuseDistance
statistics::Scalar avgReuseDistance
Definition tlb.hh:384

gem5::X86ISA::GpuTLB::GpuTLBStats::globalNumTLBHits
statistics::Scalar globalNumTLBHits
Definition tlb.hh:369

gem5::X86ISA::GpuTLB::GpuTLBStats::localLatency
statistics::Formula localLatency
Definition tlb.hh:381

gem5::X86ISA::GpuTLB::GpuTLBStats::localNumTLBMisses
statistics::Scalar localNumTLBMisses
Definition tlb.hh:362

gem5::X86ISA::GpuTLB::GpuTLBStats::globalNumTLBAccesses
statistics::Scalar globalNumTLBAccesses
Definition tlb.hh:368

gem5::X86ISA::GpuTLB::GpuTLBStats::accessCycles
statistics::Scalar accessCycles
Definition tlb.hh:374

gem5::X86ISA::GpuTLB::GpuTLBStats::localNumTLBAccesses
statistics::Scalar localNumTLBAccesses
Definition tlb.hh:360

gem5::X86ISA::GpuTLB::GpuTLBStats::pageTableCycles
statistics::Scalar pageTableCycles
Definition tlb.hh:376

gem5::X86ISA::TlbEntry
Definition pagetable.hh:66

gem5::X86ISA::TlbEntry::uncacheable
bool uncacheable
Definition pagetable.hh:84

gem5::X86ISA::TlbEntry::paddr
Addr paddr
Definition pagetable.hh:68

gem5::X86ISA::TlbEntry::user
bool user
Definition pagetable.hh:79

gem5::X86ISA::TlbEntry::vaddr
Addr vaddr
Definition pagetable.hh:71

gem5::X86ISA::TlbEntry::size
int size()
Definition pagetable.hh:112

gem5::X86ISA::TlbEntry::writable
bool writable
Definition pagetable.hh:77

name
const std::string & name()
Definition trace.cc:48

page_size.hh

pagetable.hh

pagetable_walker.hh

x86_traits.hh