release/current/fetch_8cc_source.html

/*

 * Copyright (c) 2010-2014 ARM Limited

 * Copyright (c) 2012-2013 AMD

 * All rights reserved.

 *

 * The license below extends only to copyright in the software and shall

 * not be construed as granting a license to any other intellectual

 * property including but not limited to intellectual property relating

 * to a hardware implementation of the functionality of the software

 * licensed hereunder.  You may use the software subject to the license

 * terms below provided that you ensure that this notice is replicated

 * unmodified and in its entirety in all distributions of the software,

 * modified or unmodified, in source code or in binary form.

 *

 * Copyright (c) 2004-2006 The Regents of The University of Michigan

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are

 * met: redistributions of source code must retain the above copyright

 * notice, this list of conditions and the following disclaimer;

 * redistributions in binary form must reproduce the above copyright

 * notice, this list of conditions and the following disclaimer in the

 * documentation and/or other materials provided with the distribution;

 * neither the name of the copyright holders nor the names of its

 * contributors may be used to endorse or promote products derived from

 * this software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS

 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT

 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR

 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT

 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,

 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT

 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,

 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY

 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 */


#include "cpu/o3/fetch.hh"


#include <algorithm>

#include <cstring>

#include <list>

#include <map>

#include <queue>


#include "arch/generic/tlb.hh"

#include "base/types.hh"

#include "cpu/base.hh"

#include "cpu/exetrace.hh"

#include "cpu/nop_static_inst.hh"

#include "cpu/o3/cpu.hh"

#include "cpu/o3/dyn_inst.hh"

#include "cpu/o3/limits.hh"

#include "debug/Activity.hh"

#include "debug/Drain.hh"

#include "debug/Fetch.hh"

#include "debug/O3CPU.hh"

#include "debug/O3PipeView.hh"

#include "mem/packet.hh"

#include "params/BaseO3CPU.hh"

#include "sim/byteswap.hh"

#include "sim/core.hh"

#include "sim/eventq.hh"

#include "sim/full_system.hh"

#include "sim/system.hh"


namespace gem5

{


namespace o3

{


/**
 * Build the instruction-cache request port used by the fetch stage.
 *
 * @param _fetch Fetch stage that owns this port.
 * @param _cpu CPU whose name prefixes the port name (".icache_port").
 */
Fetch::IcachePort::IcachePort(Fetch *_fetch, CPU *_cpu)
    : RequestPort(_cpu->name() + ".icache_port"),
      fetch(_fetch)
{
}

Fetch::IcachePort::IcachePort(Fetch *_fetch, CPU *_cpu) : {…}


/**
 * Construct the fetch stage.
 *
 * Copies the relevant settings out of the parameter struct, validates them
 * against the compiled-in limits and the cache line size, and puts every
 * per-thread slot into a known initial state.
 *
 * @param _cpu CPU this stage belongs to.
 * @param params O3 CPU parameters the stage is configured from.
 */
Fetch::Fetch(CPU *_cpu, const BaseO3CPUParams &params)
    : fetchPolicy(params.smtFetchPolicy),
      cpu(_cpu),
      branchPred(nullptr),
      decodeToFetchDelay(params.decodeToFetchDelay),
      renameToFetchDelay(params.renameToFetchDelay),
      iewToFetchDelay(params.iewToFetchDelay),
      commitToFetchDelay(params.commitToFetchDelay),
      fetchWidth(params.fetchWidth),
      decodeWidth(params.decodeWidth),
      retryPkt(nullptr),
      retryTid(InvalidThreadID),
      cacheBlkSize(cpu->cacheLineSize()),
      fetchBufferSize(params.fetchBufferSize),
      fetchBufferMask(fetchBufferSize - 1),
      fetchQueueSize(params.fetchQueueSize),
      numThreads(params.numThreads),
      numFetchingThreads(params.smtNumFetchingThreads),
      icachePort(this, _cpu),
      finishTranslationEvent(this),
      fetchStats(_cpu, this)
{
    // Reject configurations that exceed the statically sized arrays.
    if (numThreads > MaxThreads) {
        fatal("numThreads (%d) is larger than compiled limit (%d),\n"
              "\tincrease MaxThreads in src/cpu/o3/limits.hh\n",
              numThreads, static_cast<int>(MaxThreads));
    }
    if (fetchWidth > MaxWidth) {
        fatal("fetchWidth (%d) is larger than compiled limit (%d),\n"
              "\tincrease MaxWidth in src/cpu/o3/limits.hh\n",
              fetchWidth, static_cast<int>(MaxWidth));
    }

    // The fetch buffer has to fit in, and evenly divide, a cache block.
    if (fetchBufferSize > cacheBlkSize) {
        fatal("fetch buffer size (%u bytes) is greater than the cache "
              "block size (%u bytes)\n", fetchBufferSize, cacheBlkSize);
    }
    if (cacheBlkSize % fetchBufferSize) {
        fatal("cache block (%u bytes) is not a multiple of the "
              "fetch buffer (%u bytes)\n", cacheBlkSize, fetchBufferSize);
    }

    // Initialise every slot, including those of threads that are not
    // configured, so no per-thread state is left uninitialised.
    for (int slot = 0; slot < MaxThreads; ++slot) {
        fetchStatus[slot] = Idle;
        decoder[slot] = nullptr;
        pc[slot].reset(params.isa[0]->newPCState());
        fetchOffset[slot] = 0;
        macroop[slot] = nullptr;
        delayedCommit[slot] = false;
        memReq[slot] = nullptr;
        stalls[slot] = {false, false};
        fetchBuffer[slot] = nullptr;
        fetchBufferPC[slot] = 0;
        fetchBufferValid[slot] = false;
        lastIcacheStall[slot] = 0;
        issuePipelinedIfetch[slot] = false;
    }

    branchPred = params.branchPred;

    // Configured threads get their decoder and a buffer for fetched
    // bytes; the buffer may be smaller than a full cache line.
    for (ThreadID tid = 0; tid < numThreads; ++tid) {
        decoder[tid] = params.decoder[tid];
        fetchBuffer[tid] = new uint8_t[fetchBufferSize];
    }

    // Size of one instruction chunk, as reported by thread 0's decoder.
    instSize = decoder[0]->moreBytesSize();
}

Fetch::Fetch(CPU *_cpu, const BaseO3CPUParams &params) {…}


/** @return The name of this stage: the owning CPU's name plus ".fetch". */
std::string
Fetch::name() const
{
    return cpu->name() + ".fetch";
}


/**
 * Create the probe points exposed by fetch: "Fetch" (carrying a DynInstPtr)
 * and "FetchRequest" (carrying a RequestPtr), both registered with the
 * CPU's probe manager.
 */
void
Fetch::regProbePoints()
{
    auto probe_mgr = cpu->getProbeManager();

    ppFetch = new ProbePointArg<DynInstPtr>(probe_mgr, "Fetch");
    ppFetchRequestSent =
        new ProbePointArg<RequestPtr>(probe_mgr, "FetchRequest");
}

Fetch::regProbePoints() {…}


/**
 * Register the fetch-stage statistics under the CPU's "fetch" group.
 *
 * @param cpu CPU the group is attached to; its cycle count is the
 *            denominator of idleRate.
 * @param fetch Fetch stage whose fetchWidth bounds the nisnDist buckets.
 */
Fetch::FetchStatGroup::FetchStatGroup(CPU *cpu, Fetch *fetch)
    : statistics::Group(cpu, "fetch"),
    ADD_STAT(predictedBranches, statistics::units::Count::get(),
             "Number of branches that fetch has predicted taken"),
    ADD_STAT(cycles, statistics::units::Cycle::get(),
             "Number of cycles fetch has run and was not squashing or "
             "blocked"),
    ADD_STAT(squashCycles, statistics::units::Cycle::get(),
             "Number of cycles fetch has spent squashing"),
    ADD_STAT(tlbCycles, statistics::units::Cycle::get(),
             "Number of cycles fetch has spent waiting for tlb"),
    ADD_STAT(idleCycles, statistics::units::Cycle::get(),
             "Number of cycles fetch was idle"),
    ADD_STAT(blockedCycles, statistics::units::Cycle::get(),
             "Number of cycles fetch has spent blocked"),
    ADD_STAT(miscStallCycles, statistics::units::Cycle::get(),
             "Number of cycles fetch has spent waiting on interrupts, or bad "
             "addresses, or out of MSHRs"),
    ADD_STAT(pendingDrainCycles, statistics::units::Cycle::get(),
             "Number of cycles fetch has spent waiting on pipes to drain"),
    ADD_STAT(noActiveThreadStallCycles, statistics::units::Cycle::get(),
             "Number of stall cycles due to no active thread to fetch from"),
    ADD_STAT(pendingTrapStallCycles, statistics::units::Cycle::get(),
             "Number of stall cycles due to pending traps"),
    ADD_STAT(pendingQuiesceStallCycles, statistics::units::Cycle::get(),
             "Number of stall cycles due to pending quiesce instructions"),
    ADD_STAT(icacheWaitRetryStallCycles, statistics::units::Cycle::get(),
             "Number of stall cycles due to full MSHR"),
    ADD_STAT(cacheLines, statistics::units::Count::get(),
             "Number of cache lines fetched"),
    ADD_STAT(icacheSquashes, statistics::units::Count::get(),
             "Number of outstanding Icache misses that were squashed"),
    ADD_STAT(tlbSquashes, statistics::units::Count::get(),
             "Number of outstanding ITLB misses that were squashed"),
    ADD_STAT(nisnDist, statistics::units::Count::get(),
             "Number of instructions fetched each cycle (Total)"),
    ADD_STAT(idleRate, statistics::units::Ratio::get(),
             "Ratio of cycles fetch was idle",
             idleCycles / cpu->baseStats.numCycles)
{
    // Each of these statistics names itself as its own prerequisite.
    predictedBranches.prereq(predictedBranches);
    cycles.prereq(cycles);
    squashCycles.prereq(squashCycles);
    tlbCycles.prereq(tlbCycles);
    idleCycles.prereq(idleCycles);
    blockedCycles.prereq(blockedCycles);
    cacheLines.prereq(cacheLines);
    miscStallCycles.prereq(miscStallCycles);
    pendingDrainCycles.prereq(pendingDrainCycles);
    noActiveThreadStallCycles.prereq(noActiveThreadStallCycles);
    pendingTrapStallCycles.prereq(pendingTrapStallCycles);
    pendingQuiesceStallCycles.prereq(pendingQuiesceStallCycles);
    icacheWaitRetryStallCycles.prereq(icacheWaitRetryStallCycles);
    icacheSquashes.prereq(icacheSquashes);
    tlbSquashes.prereq(tlbSquashes);

    // Distribution of instructions fetched per cycle: one bucket for each
    // value from 0 up to the fetch width, reported as a PDF.
    nisnDist
        .init(/* base value */ 0,
              /* last value */ fetch->fetchWidth,
              /* bucket size */ 1)
        .flags(statistics::pdf);

    idleRate.prereq(idleRate);
}

Fetch::FetchStatGroup::FetchStatGroup(CPU *cpu, Fetch *fetch) {…}

/**
 * Attach the backwards-communication time buffer and create the wires on
 * which fetch reads signals from decode, rename, IEW and commit. Each wire
 * is offset by the negated delay configured for that stage.
 *
 * @param time_buffer Time buffer shared with the later pipeline stages.
 */
void
Fetch::setTimeBuffer(TimeBuffer<TimeStruct> *time_buffer)
{
    timeBuffer = time_buffer;

    fromDecode = time_buffer->getWire(-decodeToFetchDelay);
    fromRename = time_buffer->getWire(-renameToFetchDelay);
    fromIEW = time_buffer->getWire(-iewToFetchDelay);
    fromCommit = time_buffer->getWire(-commitToFetchDelay);
}

Fetch::setTimeBuffer(TimeBuffer<TimeStruct> *time_buffer) {…}


/**
 * Remember the list of active thread IDs. Only the pointer is stored; the
 * list itself is not copied.
 *
 * @param at_ptr Pointer to the active-thread list.
 */
void
Fetch::setActiveThreads(std::list<ThreadID> *at_ptr)
{
    activeThreads = at_ptr;
}

Fetch::setActiveThreads(std::list<ThreadID> *at_ptr) {…}


/**
 * Hook fetch up to the fetch-to-decode time buffer by creating the wire
 * (offset 0) through which instructions are handed to decode.
 *
 * @param ftb_ptr Fetch time buffer to write into.
 */
void
Fetch::setFetchQueue(TimeBuffer<FetchStruct> *ftb_ptr)
{
    toDecode = ftb_ptr->getWire(0);
}

Fetch::setFetchQueue(TimeBuffer<FetchStruct> *ftb_ptr) {…}


/**
 * Bring the stage up at the start of simulation: the priority list must
 * still be empty, the stage state is reset, and the stage is switched to
 * active.
 */
void
Fetch::startupStage()
{
    assert(priorityList.empty());
    resetStage();

    // Fetching has to begin right away, so the stage starts out active.
    switchToActive();
}

Fetch::startupStage() {…}


/**
 * Return one thread's fetch state to its running defaults: the PC is
 * reloaded from the CPU, and any in-progress macro-op, memory request,
 * stall flags, buffered line and queued instructions are dropped.
 *
 * @param tid Thread whose state is cleared.
 */
void
Fetch::clearStates(ThreadID tid)
{
    fetchStatus[tid] = Running;

    // Restart from the CPU's current PC with no partially fetched macro-op.
    set(pc[tid], cpu->pcState(tid));
    fetchOffset[tid] = 0;
    macroop[tid] = nullptr;
    delayedCommit[tid] = false;

    // Forget any outstanding request and clear both stall sources.
    memReq[tid] = nullptr;
    stalls[tid].decode = false;
    stalls[tid].drain = false;

    // Invalidate the fetch buffer and empty the fetch queue.
    fetchBufferPC[tid] = 0;
    fetchBufferValid[tid] = false;
    fetchQueue[tid].clear();

    // TODO not sure what to do with priorityList for now
    // priorityList.push_back(tid);
}

Fetch::clearStates(ThreadID tid) {…}


void


Fetch::resetStage()

{

    numInst = 0;

    interruptPending = false;

    cacheBlocked = false;


    priorityList.clear();


    // Setup PC and nextPC with initial state.

    for (ThreadID tid = 0; tid < numThreads; ++tid) {

        fetchStatus[tid] = Running;

        set(pc[tid], cpu->pcState(tid));

        fetchOffset[tid] = 0;

        macroop[tid] = NULL;


        delayedCommit[tid] = false;

        memReq[tid] = NULL;


        stalls[tid].decode = false;

        stalls[tid].drain = false;


        fetchBufferPC[tid] = 0;

        fetchBufferValid[tid] = false;


        fetchQueue[tid].clear();


        priorityList.push_back(tid);

    }


    wroteToTimeBuffer = false;

    _status = Inactive;

}

Fetch::resetStage() {…}


/**
 * Handle an instruction-cache response packet.
 *
 * A response that no longer matches the thread's outstanding request (or
 * arrives when the thread is not waiting on the icache) is counted as an
 * icache squash and dropped. Otherwise the data is copied into the
 * thread's fetch buffer, the CPU and the stage are woken up, and the
 * thread moves on to IcacheAccessComplete (or Blocked if it is stalled).
 * The packet is deleted in both cases.
 *
 * @param pkt Response packet delivered by the icache port.
 */
void
Fetch::processCacheCompletion(PacketPtr pkt)
{
    const ThreadID tid = cpu->contextToThread(pkt->req->contextId());

    DPRINTF(Fetch, "[tid:%i] Waking up from cache miss.\n", tid);
    assert(!cpu->switchedOut());

    // The response only matters if the thread is still waiting for this
    // very request.
    const bool stale_response =
        fetchStatus[tid] != IcacheWaitResponse || pkt->req != memReq[tid];
    if (stale_response) {
        ++fetchStats.icacheSquashes;
        delete pkt;
        return;
    }

    memcpy(fetchBuffer[tid], pkt->getConstPtr<uint8_t>(), fetchBufferSize);
    fetchBufferValid[tid] = true;

    // The CPU may have gone to sleep waiting on this completion.
    cpu->wakeCPU();

    DPRINTF(Activity, "[tid:%i] Activating fetch due to cache completion\n",
            tid);

    switchToActive();

    // A stalled thread stays blocked; otherwise the access is complete.
    if (checkStall(tid)) {
        fetchStatus[tid] = Blocked;
    } else {
        fetchStatus[tid] = IcacheAccessComplete;
    }

    pkt->req->setAccessLatency();
    cpu->ppInstAccessComplete->notify(pkt);

    // Release the packet and clear the outstanding request.
    delete pkt;
    memReq[tid] = nullptr;
}

Fetch::processCacheCompletion(PacketPtr pkt) {…}


void


Fetch::drainResume()

{

    for (ThreadID i = 0; i < numThreads; ++i) {

        stalls[i].decode = false;

        stalls[i].drain = false;

    }

}

Fetch::drainResume() {…}


void


Fetch::drainSanityCheck() const

{

    assert(isDrained());

    assert(retryPkt == NULL);

    assert(retryTid == InvalidThreadID);

    assert(!cacheBlocked);

    assert(!interruptPending);


    for (ThreadID i = 0; i < numThreads; ++i) {

        assert(!memReq[i]);

        assert(fetchStatus[i] == Idle || stalls[i].drain);

    }


    branchPred->drainSanityCheck();

}

Fetch::drainSanityCheck() const {…}


bool


Fetch::isDrained() const

{

    /* Make sure that threads are either idle of that the commit stage

     * has signaled that draining has completed by setting the drain

     * stall flag. This effectively forces the pipeline to be disabled

     * until the whole system is drained (simulation may continue to

     * drain other components).

     */

    for (ThreadID i = 0; i < numThreads; ++i) {

        // Verify fetch queues are drained

        if (!fetchQueue[i].empty())

            return false;


        // Return false if not idle or drain stalled

        if (fetchStatus[i] != Idle) {

            if (fetchStatus[i] == Blocked && stalls[i].drain)

                continue;

            else

                return false;

        }

    }


    /* The pipeline might start up again in the middle of the drain

     * cycle if the finish translation event is scheduled, so make

     * sure that's not the case.

     */

    return !finishTranslationEvent.scheduled();

}

Fetch::isDrained() const {…}


/**
 * Take over from another CPU: the instruction port must already be
 * connected, after which the stage is reset to its initial state.
 */
void
Fetch::takeOverFrom()
{
    assert(cpu->getInstPort().isConnected());
    resetStage();
}

Fetch::takeOverFrom() {…}


/**
 * Mark a thread as stalled because of draining. The CPU must be draining
 * and the thread must not already carry the drain stall flag.
 *
 * @param tid Thread to stall.
 */
void
Fetch::drainStall(ThreadID tid)
{
    assert(cpu->isDraining());
    assert(!stalls[tid].drain);

    DPRINTF(Drain, "%i: Thread drained.\n", tid);

    stalls[tid].drain = true;
}

Fetch::drainStall(ThreadID tid) {…}


void


Fetch::wakeFromQuiesce()

{

    DPRINTF(Fetch, "Waking up from quiesce\n");

    // Hopefully this is safe

    // @todo: Allow other threads to wake from quiesce.

    fetchStatus[0] = Running;

}

Fetch::wakeFromQuiesce() {…}


/**
 * Move the stage from Inactive to Active and tell the CPU that the fetch
 * stage has been activated. Does nothing if the stage is not Inactive.
 */
void
Fetch::switchToActive()
{
    if (_status != Inactive) {
        return;
    }

    DPRINTF(Activity, "Activating stage.\n");
    cpu->activateStage(CPU::FetchIdx);
    _status = Active;
}

Fetch::switchToActive() {…}


/**
 * Move the stage from Active to Inactive and tell the CPU that the fetch
 * stage has been deactivated. Does nothing if the stage is not Active.
 */
void
Fetch::switchToInactive()
{
    if (_status != Active) {
        return;
    }

    DPRINTF(Activity, "Deactivating stage.\n");
    cpu->deactivateStage(CPU::FetchIdx);
    _status = Inactive;
}

Fetch::switchToInactive() {…}


/**
 * Remove a thread from the priority list, if it is present. Only the
 * first matching entry is erased.
 *
 * @param tid Thread being deactivated.
 */
void
Fetch::deactivateThread(ThreadID tid)
{
    const auto entry =
        std::find(priorityList.begin(), priorityList.end(), tid);
    if (entry == priorityList.end()) {
        return;
    }

    priorityList.erase(entry);
}

Fetch::deactivateThread(ThreadID tid) {…}


bool


Fetch::lookupAndUpdateNextPC(const DynInstPtr &inst, PCStateBase &next_pc)

{

    // Do branch prediction check here.

    // A bit of a misnomer...next_PC is actually the current PC until

    // this function updates it.

    bool predict_taken;


    if (!inst->isControl()) {

        inst->staticInst->advancePC(next_pc);

        inst->setPredTarg(next_pc);

        inst->setPredTaken(false);

        return false;

    }


    ThreadID tid = inst->threadNumber;

    predict_taken = branchPred->predict(inst->staticInst, inst->seqNum,

                                        next_pc, tid);


    if (predict_taken) {

        DPRINTF(Fetch, "[tid:%i] [sn:%llu] Branch at PC %#x "

                "predicted to be taken to %s\n",

                tid, inst->seqNum, inst->pcState().instAddr(), next_pc);

    } else {

        DPRINTF(Fetch, "[tid:%i] [sn:%llu] Branch at PC %#x "

                "predicted to be not taken\n",

                tid, inst->seqNum, inst->pcState().instAddr());

    }


    DPRINTF(Fetch, "[tid:%i] [sn:%llu] Branch at PC %#x "

            "predicted to go to %s\n",

            tid, inst->seqNum, inst->pcState().instAddr(), next_pc);

    inst->setPredTarg(next_pc);

    inst->setPredTaken(predict_taken);


    cpu->fetchStats[tid]->numBranches++;


    if (predict_taken) {

        ++fetchStats.predictedBranches;

    }


    return predict_taken;

}

Fetch::lookupAndUpdateNextPC(const DynInstPtr &inst, PCStateBase &next_pc) {…}


/**
 * Start fetching the fetch-buffer-sized block that contains an address.
 *
 * Builds an instruction-fetch request for the aligned block, records it as
 * the thread's outstanding request, puts the thread into ItlbWait and
 * starts a timing translation. Nothing is started while the cache is
 * blocked, or while an interrupt is pending and the thread is not in a
 * delayed-commit sequence.
 *
 * @param vaddr Virtual address to fetch.
 * @param tid Thread the fetch is for.
 * @param pc PC passed to the interrupt check and attached to the request.
 * @return true if a translation was started, false if the fetch was held
 *         off.
 */
bool
Fetch::fetchCacheLine(Addr vaddr, ThreadID tid, Addr pc)
{
    assert(!cpu->switchedOut());

    // @todo: not sure if these should block translation.
    //AlphaDep
    if (cacheBlocked) {
        // The icache cannot accept a request right now.
        DPRINTF(Fetch, "[tid:%i] Can't fetch cache line, cache blocked\n",
                tid);
        return false;
    }

    if (checkInterrupt(pc) && !delayedCommit[tid]) {
        // An interrupt is pending and may be taken at this point, so hold
        // off on bringing in new instructions.
        DPRINTF(Fetch, "[tid:%i] Can't fetch cache line, interrupt pending\n",
                tid);
        return false;
    }

    // Align the fetch address to the start of a fetch buffer segment.
    Addr fetchBufferBlockPC = fetchBufferAlignPC(vaddr);

    DPRINTF(Fetch, "[tid:%i] Fetching cache line %#x for addr %#x\n",
            tid, fetchBufferBlockPC, vaddr);

    // Build a request that reads one fetch buffer's worth of bytes from
    // the aligned address, flagged as an instruction fetch.
    RequestPtr mem_req = std::make_shared<Request>(
        fetchBufferBlockPC, fetchBufferSize,
        Request::INST_FETCH, cpu->instRequestorId(), pc,
        cpu->thread[tid]->contextId());

    mem_req->taskId(cpu->taskId());

    memReq[tid] = mem_req;

    // Initiate translation of the icache block.
    fetchStatus[tid] = ItlbWait;
    FetchTranslation *trans = new FetchTranslation(this);
    cpu->mmu->translateTiming(mem_req, cpu->thread[tid]->getTC(),
                              trans, BaseMMU::Execute);
    return true;
}

Fetch::fetchCacheLine(Addr vaddr, ThreadID tid, Addr pc) {…}


void


Fetch::finishTranslation(const Fault &fault, const RequestPtr &mem_req)

{

    ThreadID tid = cpu->contextToThread(mem_req->contextId());

    Addr fetchBufferBlockPC = mem_req->getVaddr();


    assert(!cpu->switchedOut());


    // Wake up CPU if it was idle

    cpu->wakeCPU();


    if (fetchStatus[tid] != ItlbWait || mem_req != memReq[tid] ||

        mem_req->getVaddr() != memReq[tid]->getVaddr()) {

        DPRINTF(Fetch, "[tid:%i] Ignoring itlb completed after squash\n",

                tid);

        ++fetchStats.tlbSquashes;

        return;

    }


    // If translation was successful, attempt to read the icache block.

    if (fault == NoFault) {

        // Check that we're not going off into random memory

        // If we have, just wait around for commit to squash something and put

        // us on the right track

        if (!cpu->system->isMemAddr(mem_req->getPaddr())) {

            warn("Address %#x is outside of physical memory, stopping fetch\n",

                    mem_req->getPaddr());

            fetchStatus[tid] = NoGoodAddr;

            memReq[tid] = NULL;

            return;

        }


        // Build packet here.

        PacketPtr data_pkt = new Packet(mem_req, MemCmd::ReadReq);

        data_pkt->dataDynamic(new uint8_t[fetchBufferSize]);


        fetchBufferPC[tid] = fetchBufferBlockPC;

        fetchBufferValid[tid] = false;

        DPRINTF(Fetch, "Fetch: Doing instruction read.\n");


        fetchStats.cacheLines++;


        // Access the cache.

        if (!icachePort.sendTimingReq(data_pkt)) {

            assert(retryPkt == NULL);

            assert(retryTid == InvalidThreadID);

            DPRINTF(Fetch, "[tid:%i] Out of MSHRs!\n", tid);


            fetchStatus[tid] = IcacheWaitRetry;

            retryPkt = data_pkt;

            retryTid = tid;

            cacheBlocked = true;

        } else {

            DPRINTF(Fetch, "[tid:%i] Doing Icache access.\n", tid);

            DPRINTF(Activity, "[tid:%i] Activity: Waiting on I-cache "

                    "response.\n", tid);

            lastIcacheStall[tid] = curTick();

            fetchStatus[tid] = IcacheWaitResponse;

            // Notify Fetch Request probe when a packet containing a fetch

            // request is successfully sent

            ppFetchRequestSent->notify(mem_req);

        }

    } else {

        // Don't send an instruction to decode if we can't handle it.

        if (!(numInst < fetchWidth) ||

                !(fetchQueue[tid].size() < fetchQueueSize)) {

            assert(!finishTranslationEvent.scheduled());

            finishTranslationEvent.setFault(fault);

            finishTranslationEvent.setReq(mem_req);

            cpu->schedule(finishTranslationEvent,

                          cpu->clockEdge(Cycles(1)));

            return;

        }

        DPRINTF(Fetch,

                "[tid:%i] Got back req with addr %#x but expected %#x\n",

                tid, mem_req->getVaddr(), memReq[tid]->getVaddr());

        // Translation faulted, icache request won't be sent.

        memReq[tid] = NULL;


        // Send the fault to commit.  This thread will not do anything

        // until commit handles the fault.  The only other way it can

        // wake up is if a squash comes along and changes the PC.

        const PCStateBase &fetch_pc = *pc[tid];


        DPRINTF(Fetch, "[tid:%i] Translation faulted, building noop.\n", tid);

        // We will use a nop in ordier to carry the fault.

        DynInstPtr instruction = buildInst(tid, nopStaticInstPtr, nullptr,

                fetch_pc, fetch_pc, false);

        instruction->setNotAnInst();


        instruction->setPredTarg(fetch_pc);

        instruction->fault = fault;

        wroteToTimeBuffer = true;


        DPRINTF(Activity, "Activity this cycle.\n");

        cpu->activityThisCycle();


        fetchStatus[tid] = TrapPending;


        DPRINTF(Fetch, "[tid:%i] Blocked, need to handle the trap.\n", tid);

        DPRINTF(Fetch, "[tid:%i] fault (%s) detected @ PC %s.\n",

                tid, fault->name(), *pc[tid]);

    }

    _status = updateFetchStatus();

}

Fetch::finishTranslation(const Fault &fault, const RequestPtr &mem_req) {…}


/**
 * Common squash handling: redirect the thread to a new PC and throw away
 * everything fetch has in flight for it.
 *
 * @param new_pc PC to resume fetching from.
 * @param squashInst Instruction that caused the squash; may be null.
 * @param tid Thread being squashed.
 */
void
Fetch::doSquash(const PCStateBase &new_pc, const DynInstPtr squashInst,
        ThreadID tid)
{
    DPRINTF(Fetch, "[tid:%i] Squashing, setting PC to: %s.\n",
            tid, new_pc);

    set(pc[tid], new_pc);
    fetchOffset[tid] = 0;

    // Keep the squashing instruction's macro-op only when we restart at
    // that instruction's own address and it is not the last micro-op.
    if (squashInst && squashInst->pcState().instAddr() == new_pc.instAddr() &&
        !squashInst->isLastMicroop()) {
        macroop[tid] = squashInst->macroop;
    } else {
        macroop[tid] = nullptr;
    }
    decoder[tid]->reset();

    // Drop whichever request is still outstanding for this thread.
    if (fetchStatus[tid] == IcacheWaitResponse) {
        DPRINTF(Fetch, "[tid:%i] Squashing outstanding Icache miss.\n",
                tid);
        memReq[tid] = nullptr;
    } else if (fetchStatus[tid] == ItlbWait) {
        DPRINTF(Fetch, "[tid:%i] Squashing outstanding ITLB miss.\n",
                tid);
        memReq[tid] = nullptr;
    }

    // Get rid of the retrying packet if it was from this thread.
    if (retryTid == tid) {
        assert(cacheBlocked);
        // Deleting a null pointer is a no-op, so no explicit check.
        delete retryPkt;
        retryPkt = nullptr;
        retryTid = InvalidThreadID;
    }

    fetchStatus[tid] = Squashing;

    // Nothing queued for decode survives the squash.
    fetchQueue[tid].clear();

    // Micro-ops are being squashed, and it is not known whether the
    // youngest non-squashed micro-op was marked delayed commit or not.
    // Setting the flag ensures interrupts are not handled when they
    // cannot be, though some opportunities to handle them may be missed.
    delayedCommit[tid] = true;

    ++fetchStats.squashCycles;
}

Fetch::doSquash(const PCStateBase &new_pc, const DynInstPtr squashInst, {…}


/**
 * Squash requested by decode: perform the common squash and then have the
 * CPU remove the instructions in flight between fetch and decode.
 *
 * @param new_pc PC to resume fetching from.
 * @param squashInst Instruction that caused the squash.
 * @param seq_num Sequence number passed to the CPU's removeInstsUntil().
 * @param tid Thread being squashed.
 */
void
Fetch::squashFromDecode(const PCStateBase &new_pc, const DynInstPtr squashInst,
        const InstSeqNum seq_num, ThreadID tid)
{
    DPRINTF(Fetch, "[tid:%i] Squashing from decode.\n", tid);

    doSquash(new_pc, squashInst, tid);

    // Instructions between fetch and decode are no longer wanted.
    cpu->removeInstsUntil(seq_num, tid);
}

Fetch::squashFromDecode(const PCStateBase &new_pc, const DynInstPtr squashInst, {…}


/**
 * Check whether a thread is stalled. Only the drain stall flag is
 * consulted here.
 *
 * @param tid Thread to check.
 * @return true if the thread's drain stall flag is set.
 */
bool
Fetch::checkStall(ThreadID tid) const
{
    if (!stalls[tid].drain) {
        return false;
    }

    // A drain stall is only expected while the CPU is draining.
    assert(cpu->isDraining());
    DPRINTF(Fetch,"[tid:%i] Drain stall detected.\n",tid);
    return true;
}

Fetch::checkStall(ThreadID tid) const {…}


/**
 * Derive the stage-wide status from the per-thread statuses, notifying the
 * CPU when that means the stage is activated or deactivated.
 *
 * @return Active if any active thread is Running, Squashing or
 *         IcacheAccessComplete; Inactive otherwise. The caller stores the
 *         result; _status itself is not modified here.
 */
Fetch::FetchStatus
Fetch::updateFetchStatus()
{
    // One thread with work to do is enough to keep the stage active.
    for (const ThreadID tid : *activeThreads) {
        const bool has_work = fetchStatus[tid] == Running ||
                              fetchStatus[tid] == Squashing ||
                              fetchStatus[tid] == IcacheAccessComplete;
        if (!has_work) {
            continue;
        }

        if (_status == Inactive) {
            DPRINTF(Activity, "[tid:%i] Activating stage.\n",tid);

            if (fetchStatus[tid] == IcacheAccessComplete) {
                DPRINTF(Activity, "[tid:%i] Activating fetch due to cache"
                        "completion\n",tid);
            }

            cpu->activateStage(CPU::FetchIdx);
        }

        return Active;
    }

    // Stage is switching from active to inactive, notify CPU of it.
    if (_status == Active) {
        DPRINTF(Activity, "Deactivating stage.\n");
        cpu->deactivateStage(CPU::FetchIdx);
    }

    return Inactive;
}

Fetch::updateFetchStatus() {…}


/**
 * Squash requested by commit: perform the common squash and then have the
 * CPU remove every instruction of the thread that is not in the ROB.
 *
 * @param new_pc PC to resume fetching from.
 * @param seq_num Sequence number supplied by commit (not used here).
 * @param squashInst Instruction that caused the squash.
 * @param tid Thread being squashed.
 */
void
Fetch::squash(const PCStateBase &new_pc, const InstSeqNum seq_num,
        DynInstPtr squashInst, ThreadID tid)
{
    DPRINTF(Fetch, "[tid:%i] Squash from commit.\n", tid);

    doSquash(new_pc, squashInst, tid);

    // Anything that has not reached the ROB is discarded.
    cpu->removeInstsNotInROB(tid);
}

Fetch::squash(const PCStateBase &new_pc, const InstSeqNum seq_num, {…}


void


Fetch::tick()

{

    std::list<ThreadID>::iterator threads = activeThreads->begin();

    std::list<ThreadID>::iterator end = activeThreads->end();

    bool status_change = false;


    wroteToTimeBuffer = false;


    for (ThreadID i = 0; i < numThreads; ++i) {

        issuePipelinedIfetch[i] = false;

    }


    while (threads != end) {

        ThreadID tid = *threads++;


        // Check the signals for each thread to determine the proper status

        // for each thread.

        bool updated_status = checkSignalsAndUpdate(tid);

        status_change =  status_change || updated_status;

    }


    DPRINTF(Fetch, "Running stage.\n");


    if (FullSystem) {

        if (fromCommit->commitInfo[0].interruptPending) {

            interruptPending = true;

        }


        if (fromCommit->commitInfo[0].clearInterrupt) {

            interruptPending = false;

        }

    }


    for (threadFetched = 0; threadFetched < numFetchingThreads;

         threadFetched++) {

        // Fetch each of the actively fetching threads.

        fetch(status_change);

    }


    // Record number of instructions fetched this cycle for distribution.

    fetchStats.nisnDist.sample(numInst);


    if (status_change) {

        // Change the fetch stage status if there was a status change.

        _status = updateFetchStatus();

    }


    // Issue the next I-cache request if possible.

    for (ThreadID i = 0; i < numThreads; ++i) {

        if (issuePipelinedIfetch[i]) {

            pipelineIcacheAccesses(i);

        }

    }


    // Send instructions enqueued into the fetch queue to decode.

    // Limit rate by fetchWidth.  Stall if decode is stalled.

    unsigned insts_to_decode = 0;

    unsigned available_insts = 0;


    for (auto tid : *activeThreads) {

        if (!stalls[tid].decode) {

            available_insts += fetchQueue[tid].size();

        }

    }


    // Pick a random thread to start trying to grab instructions from

    auto tid_itr = activeThreads->begin();

    std::advance(tid_itr,

            rng->random<uint8_t>(0, activeThreads->size() - 1));


    while (available_insts != 0 && insts_to_decode < decodeWidth) {

        ThreadID tid = *tid_itr;

        if (!stalls[tid].decode && !fetchQueue[tid].empty()) {

            const auto& inst = fetchQueue[tid].front();

            toDecode->insts[toDecode->size++] = inst;

            DPRINTF(Fetch, "[tid:%i] [sn:%llu] Sending instruction to decode "

                    "from fetch queue. Fetch queue size: %i.\n",

                    tid, inst->seqNum, fetchQueue[tid].size());


            wroteToTimeBuffer = true;

            fetchQueue[tid].pop_front();

            insts_to_decode++;

            available_insts--;

        }


        tid_itr++;

        // Wrap around if at end of active threads list

        if (tid_itr == activeThreads->end())

            tid_itr = activeThreads->begin();

    }


    // If there was activity this cycle, inform the CPU of it.

    if (wroteToTimeBuffer) {

        DPRINTF(Activity, "Activity this cycle.\n");

        cpu->activityThisCycle();

    }


    // Reset the number of the instruction we've fetched.

    numInst = 0;

}

Fetch::tick() {…}


/**
 * Reads the backwards signals from decode and commit for one thread and
 * updates that thread's decode-stall flag and fetch status.
 *
 * Signals are handled in this order: decode block/unblock, squash from
 * commit, squash from decode, stall check, and finally recovery from the
 * Blocked/Squashing states.
 *
 * @param tid Thread whose signals are examined.
 * @return true if a squash was started, or the thread's status was set to
 *         Blocked or Running by this call; false otherwise.
 */
bool
Fetch::checkSignalsAndUpdate(ThreadID tid)
{
    const auto &commit_info = fromCommit->commitInfo[tid];
    const auto &decode_info = fromDecode->decodeInfo[tid];

    // Latch decode's block/unblock requests into the per-thread stall flag.
    if (fromDecode->decodeBlock[tid])
        stalls[tid].decode = true;

    if (fromDecode->decodeUnblock[tid]) {
        assert(stalls[tid].decode);
        assert(!fromDecode->decodeBlock[tid]);
        stalls[tid].decode = false;
    }

    // A squash from commit is handled first and ends processing for this
    // thread.
    if (commit_info.squash) {
        DPRINTF(Fetch, "[tid:%i] Squashing instructions due to squash "
                "from commit.\n",tid);

        // The fetch-side squash happens unconditionally.
        squash(*commit_info.pc, commit_info.doneSeqNum,
               commit_info.squashInst, tid);

        // Only a mispredicted control instruction carries a target and
        // direction for the branch predictor; otherwise just discard the
        // predictor state younger than the given sequence number.
        const bool control_mispredict = commit_info.mispredictInst &&
            commit_info.mispredictInst->isControl();

        if (control_mispredict) {
            branchPred->squash(commit_info.doneSeqNum, *commit_info.pc,
                               commit_info.branchTaken, tid);
        } else {
            branchPred->squash(commit_info.doneSeqNum, tid);
        }

        return true;
    }

    // No squash from commit: if commit broadcast a completed sequence
    // number, let the branch predictor commit its updates up to it.
    if (commit_info.doneSeqNum) {
        branchPred->update(commit_info.doneSeqNum, tid);
    }

    // Next, look at squash requests coming from decode.
    if (decode_info.squash) {
        DPRINTF(Fetch, "[tid:%i] Squashing instructions due to squash "
                "from decode.\n",tid);

        // The branch predictor is always brought up to date.
        if (decode_info.branchMispredict) {
            branchPred->squash(decode_info.doneSeqNum, *decode_info.nextPC,
                               decode_info.branchTaken, tid);
        } else {
            branchPred->squash(decode_info.doneSeqNum, tid);
        }

        // Fetch itself is only squashed if it is not already squashing.
        if (fetchStatus[tid] != Squashing) {
            DPRINTF(Fetch, "Squashing from decode with PC = %s\n",
                *decode_info.nextPC);

            squashFromDecode(*decode_info.nextPC, decode_info.squashInst,
                             decode_info.doneSeqNum, tid);

            return true;
        }
    }

    // A stalled thread becomes Blocked, unless it is in one of the waiting
    // states below, which are left untouched.
    if (checkStall(tid)) {
        const bool in_wait_state =
            fetchStatus[tid] == IcacheWaitResponse ||
            fetchStatus[tid] == IcacheWaitRetry ||
            fetchStatus[tid] == ItlbWait ||
            fetchStatus[tid] == QuiescePending;

        if (!in_wait_state) {
            DPRINTF(Fetch, "[tid:%i] Setting to blocked\n",tid);

            fetchStatus[tid] = Blocked;

            return true;
        }
    }

    // Nothing told fetch to block or squash this cycle, so a thread that
    // was Blocked or Squashing resumes running.
    if (fetchStatus[tid] == Blocked || fetchStatus[tid] == Squashing) {
        DPRINTF(Fetch, "[tid:%i] Done squashing, switching to running.\n",
                tid);

        fetchStatus[tid] = Running;

        return true;
    }

    // No signal required a status change; fetch stays as it was.
    return false;
}

Fetch::checkSignalsAndUpdate(ThreadID tid) {…}


/**
 * Creates a DynInst for a freshly decoded static instruction, registers it
 * with the CPU's instruction list and appends it to the thread's fetch
 * queue.
 *
 * @param tid Thread the instruction belongs to.
 * @param staticInst Decoded static instruction (or micro-op).
 * @param curMacroop Macro-op passed on to the DynInst and to the tracer.
 * @param this_pc PC state of the instruction.
 * @param next_pc PC state passed to the DynInst as the following PC.
 * @param trace When TRACING_ON is set, whether to attach a trace record.
 * @return The newly created dynamic instruction.
 */
DynInstPtr
Fetch::buildInst(ThreadID tid, StaticInstPtr staticInst,
        StaticInstPtr curMacroop, const PCStateBase &this_pc,
        const PCStateBase &next_pc, bool trace)
{
    // Each dynamic instruction gets its own sequence number from the CPU.
    InstSeqNum seq_num = cpu->getAndIncrementInstSeq();

    // The register array sizes are taken from the static instruction and
    // handed both to the placement allocator and to the constructor.
    DynInst::Arrays reg_arrays;
    reg_arrays.numSrcs = staticInst->numSrcRegs();
    reg_arrays.numDests = staticInst->numDestRegs();

    DynInstPtr dyn_inst = new (reg_arrays) DynInst(
            reg_arrays, staticInst, curMacroop, this_pc, next_pc, seq_num,
            cpu);
    dyn_inst->setTid(tid);
    dyn_inst->setThreadState(cpu->thread[tid]);

    DPRINTF(Fetch, "[tid:%i] Instruction PC %s created [sn:%lli].\n",
            tid, this_pc, seq_num);

    DPRINTF(Fetch, "[tid:%i] Instruction is: %s\n", tid,
            dyn_inst->staticInst->disassemble(this_pc.instAddr()));

#if TRACING_ON
    if (trace) {
        dyn_inst->traceData =
            cpu->getTracer()->getInstRecord(curTick(), cpu->tcBase(tid),
                    dyn_inst->staticInst, this_pc, curMacroop);
    }
#else
    dyn_inst->traceData = nullptr;
#endif

    // Record the instruction in the CPU-wide instruction list and remember
    // its position there.
    dyn_inst->setInstListIt(cpu->addInst(dyn_inst));

    // Queue the instruction for decode. The caller must not exceed the
    // fetch width, and the queue must stay within its configured size.
    assert(numInst < fetchWidth);
    fetchQueue[tid].push_back(dyn_inst);
    assert(fetchQueue[tid].size() <= fetchQueueSize);
    DPRINTF(Fetch, "[tid:%i] Fetch queue entry created (%i/%i).\n",
            tid, fetchQueue[tid].size(), fetchQueueSize);

    // Remember whether an interrupt may be taken at this boundary.
    delayedCommit[tid] = dyn_inst->isDelayedCommit();

    return dyn_inst;
}

Fetch::buildInst(ThreadID tid, StaticInstPtr staticInst, {…}


/**
 * Fetches instructions for one thread this cycle and places them in that
 * thread's fetch queue.
 *
 * The thread is chosen by getFetchingThread(). If the thread's fetch buffer
 * does not hold the needed block, an I-cache access is started instead and
 * the function returns. Otherwise bytes are fed from the fetch buffer to
 * the decoder and DynInsts are built until the fetch width or fetch queue
 * limit is reached, a branch is predicted, a quiesce instruction is seen,
 * or the buffer runs out.
 *
 * @param status_change Set to true when this call changes the thread's
 *        fetch status (IcacheAccessComplete -> Running, or to
 *        QuiescePending). Never set to false here.
 */
void
Fetch::fetch(bool &status_change)
{
    // Start actual fetch
    ThreadID tid = getFetchingThread();

    assert(!cpu->switchedOut());

    if (tid == InvalidThreadID) {
        // Breaks looping condition in tick()
        threadFetched = numFetchingThreads;

        if (numThreads == 1) {  // @todo Per-thread stats
            profileStall(0);
        }

        return;
    }

    DPRINTF(Fetch, "Attempting to fetch from [tid:%i]\n", tid);

    // The current PC.
    PCStateBase &this_pc = *pc[tid];

    Addr pcOffset = fetchOffset[tid];
    Addr fetchAddr = (this_pc.instAddr() + pcOffset) & decoder[tid]->pcMask();

    bool inRom = isRomMicroPC(this_pc.microPC());

    // If returning from the delay of a cache miss, then update the status
    // to running, otherwise do the cache access.  Possibly move this up
    // to tick() function.
    if (fetchStatus[tid] == IcacheAccessComplete) {
        DPRINTF(Fetch, "[tid:%i] Icache miss is complete.\n", tid);

        fetchStatus[tid] = Running;
        status_change = true;
    } else if (fetchStatus[tid] == Running) {
        // Align the fetch PC so it's at the start of a fetch buffer segment.
        Addr fetchBufferBlockPC = fetchBufferAlignPC(fetchAddr);

        // If buffer is no longer valid or fetchAddr has moved to point
        // to the next cache block, AND we have no remaining ucode
        // from a macro-op, then start fetch from icache.
        if (!(fetchBufferValid[tid] &&
                    fetchBufferBlockPC == fetchBufferPC[tid]) && !inRom &&
                !macroop[tid]) {
            DPRINTF(Fetch, "[tid:%i] Attempting to translate and read "
                    "instruction, starting at PC %s.\n", tid, this_pc);

            fetchCacheLine(fetchAddr, tid, this_pc.instAddr());

            // Attribute this cycle to whatever fetchCacheLine() left the
            // thread waiting on.
            if (fetchStatus[tid] == IcacheWaitResponse) {
                cpu->fetchStats[tid]->icacheStallCycles++;
            }
            else if (fetchStatus[tid] == ItlbWait)
                ++fetchStats.tlbCycles;
            else
                ++fetchStats.miscStallCycles;
            return;
        } else if (checkInterrupt(this_pc.instAddr()) &&
                !delayedCommit[tid]) {
            // Stall CPU if an interrupt is posted and we're not issuing
            // a delayed commit micro-op currently (delayed commit
            // instructions are not interruptable by interrupts, only faults)
            ++fetchStats.miscStallCycles;
            DPRINTF(Fetch, "[tid:%i] Fetch is stalled!\n", tid);
            return;
        }
    } else {
        if (fetchStatus[tid] == Idle) {
            ++fetchStats.idleCycles;
            DPRINTF(Fetch, "[tid:%i] Fetch is idle!\n", tid);
        }

        // Status is neither Running nor IcacheAccessComplete, so fetch
        // should do nothing this cycle.
        return;
    }

    ++fetchStats.cycles;

    std::unique_ptr<PCStateBase> next_pc(this_pc.clone());

    StaticInstPtr staticInst = NULL;
    StaticInstPtr curMacroop = macroop[tid];

    // If the read of the first instruction was successful, then grab the
    // instructions from the rest of the cache line and put them into the
    // queue heading to decode.

    DPRINTF(Fetch, "[tid:%i] Adding instructions to queue to "
            "decode.\n", tid);

    // Need to keep track of whether or not a predicted branch
    // ended this fetch block.
    bool predictedBranch = false;

    // Need to halt fetch if quiesce instruction detected
    bool quiesce = false;

    // Both values are counted in units of instSize, not bytes.
    const unsigned numInsts = fetchBufferSize / instSize;
    unsigned blkOffset = (fetchAddr - fetchBufferPC[tid]) / instSize;

    auto *dec_ptr = decoder[tid];
    const Addr pc_mask = dec_ptr->pcMask();

    // Loop through instruction memory from the cache.
    // Keep issuing while fetchWidth is available and branch is not
    // predicted taken
    while (numInst < fetchWidth && fetchQueue[tid].size() < fetchQueueSize
           && !predictedBranch && !quiesce) {
        // We need to process more memory if we aren't going to get a
        // StaticInst from the rom, the current macroop, or what's already
        // in the decoder.
        bool needMem = !inRom && !curMacroop && !dec_ptr->instReady();
        fetchAddr = (this_pc.instAddr() + pcOffset) & pc_mask;
        Addr fetchBufferBlockPC = fetchBufferAlignPC(fetchAddr);

        if (needMem) {
            // If buffer is no longer valid or fetchAddr has moved to point
            // to the next cache block then start fetch from icache.
            if (!fetchBufferValid[tid] ||
                fetchBufferBlockPC != fetchBufferPC[tid])
                break;

            if (blkOffset >= numInsts) {
                // We need to process more memory, but we've run out of the
                // current block.
                break;
            }

            // Hand the next instSize bytes of the fetch buffer to the
            // decoder.
            memcpy(dec_ptr->moreBytesPtr(),
                    fetchBuffer[tid] + blkOffset * instSize, instSize);
            dec_ptr->moreBytes(this_pc, fetchAddr);

            if (dec_ptr->needMoreBytes()) {
                blkOffset++;
                fetchAddr += instSize;
                pcOffset += instSize;
            }
        }

        // Extract as many instructions and/or microops as we can from
        // the memory we've processed so far.
        do {
            if (!(curMacroop || inRom)) {
                if (dec_ptr->instReady()) {
                    staticInst = dec_ptr->decode(this_pc);

                    // Increment stat of fetched instructions.
                    cpu->fetchStats[tid]->numInsts++;

                    if (staticInst->isMacroop()) {
                        curMacroop = staticInst;
                    } else {
                        pcOffset = 0;
                    }
                } else {
                    // We need more bytes for this instruction so blkOffset and
                    // pcOffset will be updated
                    break;
                }
            }
            // Whether we're moving to a new macroop because we're at the
            // end of the current one, or the branch predictor incorrectly
            // thinks we are...
            bool newMacro = false;
            if (curMacroop || inRom) {
                if (inRom) {
                    staticInst = dec_ptr->fetchRomMicroop(
                            this_pc.microPC(), curMacroop);
                } else {
                    staticInst = curMacroop->fetchMicroop(this_pc.microPC());
                }
                newMacro |= staticInst->isLastMicroop();
            }

            DynInstPtr instruction = buildInst(
                    tid, staticInst, curMacroop, this_pc, *next_pc, true);

            ppFetch->notify(instruction);
            numInst++;

#if TRACING_ON
            if (debug::O3PipeView) {
                instruction->fetchTick = curTick();
            }
#endif

            set(next_pc, this_pc);

            // If we're branching after this instruction, quit fetching
            // from the same block.
            predictedBranch |= this_pc.branching();
            predictedBranch |= lookupAndUpdateNextPC(instruction, *next_pc);
            if (predictedBranch) {
                DPRINTF(Fetch, "Branch detected with PC = %s\n", this_pc);
            }

            newMacro |= this_pc.instAddr() != next_pc->instAddr();

            // Move to the next instruction, unless we have a branch.
            set(this_pc, *next_pc);
            inRom = isRomMicroPC(this_pc.microPC());

            if (newMacro) {
                fetchAddr = this_pc.instAddr() & pc_mask;
                blkOffset = (fetchAddr - fetchBufferPC[tid]) / instSize;
                pcOffset = 0;
                curMacroop = NULL;
            }

            if (instruction->isQuiesce()) {
                DPRINTF(Fetch,
                        "Quiesce instruction encountered, halting fetch!\n");
                fetchStatus[tid] = QuiescePending;
                status_change = true;
                quiesce = true;
                break;
            }
        } while ((curMacroop || dec_ptr->instReady()) &&
                 numInst < fetchWidth &&
                 fetchQueue[tid].size() < fetchQueueSize);

        // Re-evaluate whether the next instruction to fetch is in micro-op ROM
        // or not.
        inRom = isRomMicroPC(this_pc.microPC());
    }

    if (predictedBranch) {
        DPRINTF(Fetch, "[tid:%i] Done fetching, predicted branch "
                "instruction encountered.\n", tid);
    } else if (numInst >= fetchWidth) {
        DPRINTF(Fetch, "[tid:%i] Done fetching, reached fetch bandwidth "
                "for this cycle.\n", tid);
    } else if (blkOffset >= numInsts) {
        // blkOffset is counted in instSize units, so it is compared with the
        // number of instSize slots in the buffer rather than its byte size.
        DPRINTF(Fetch, "[tid:%i] Done fetching, reached the end of the "
                "fetch buffer.\n", tid);
    }

    // Save the decode progress so the next call resumes where this one
    // stopped.
    macroop[tid] = curMacroop;
    fetchOffset[tid] = pcOffset;

    if (numInst > 0) {
        wroteToTimeBuffer = true;
    }

    // pipeline a fetch if we're crossing a fetch buffer boundary and not in
    // a state that would preclude fetching
    fetchAddr = (this_pc.instAddr() + pcOffset) & pc_mask;
    Addr fetchBufferBlockPC = fetchBufferAlignPC(fetchAddr);
    issuePipelinedIfetch[tid] = fetchBufferBlockPC != fetchBufferPC[tid] &&
        fetchStatus[tid] != IcacheWaitResponse &&
        fetchStatus[tid] != ItlbWait &&
        fetchStatus[tid] != IcacheWaitRetry &&
        fetchStatus[tid] != QuiescePending &&
        !curMacroop;
}

Fetch::fetch(bool &status_change) {…}


/**
 * Handles a retry notification from the I-cache port.
 *
 * If a packet is waiting to be resent it is sent again; on success the
 * owning thread moves to IcacheWaitResponse and the retry bookkeeping is
 * cleared. If no packet is pending, only the cache-blocked flag is cleared.
 */
void
Fetch::recvReqRetry()
{
    if (retryPkt == nullptr) {
        // The access was squashed after it was sent out, so there is
        // nothing to resend; just note that the cache is no longer blocked.
        assert(retryTid == InvalidThreadID);
        cacheBlocked = false;
        return;
    }

    assert(cacheBlocked);
    assert(retryTid != InvalidThreadID);
    assert(fetchStatus[retryTid] == IcacheWaitRetry);

    // If the port rejects the packet again, keep all retry state as is.
    if (!icachePort.sendTimingReq(retryPkt))
        return;

    fetchStatus[retryTid] = IcacheWaitResponse;

    // The fetch-request probe must be notified while retryPkt is still
    // valid, i.e. before it is reset below.
    ppFetchRequestSent->notify(retryPkt->req);

    retryPkt = nullptr;
    retryTid = InvalidThreadID;
    cacheBlocked = false;
}

Fetch::recvReqRetry() {…}


//                                   //

//  SMT FETCH POLICY MAINTAINED HERE //

//                                   //

/**
 * Selects the thread to fetch from this cycle.
 *
 * With more than one thread the configured SMT fetch policy decides. With
 * a single thread, the first active thread is returned if its status is
 * Running, IcacheAccessComplete or Idle.
 *
 * @return The chosen thread, or InvalidThreadID if none can be fetched.
 */
ThreadID
Fetch::getFetchingThread()
{
    if (numThreads <= 1) {
        // Single-threaded case: only the first active thread is a candidate.
        if (activeThreads->empty()) {
            return InvalidThreadID;
        }

        const ThreadID tid = activeThreads->front();

        switch (fetchStatus[tid]) {
          case Running:
          case IcacheAccessComplete:
          case Idle:
            return tid;
          default:
            return InvalidThreadID;
        }
    }

    // SMT case: delegate to the policy-specific selector.
    switch (fetchPolicy) {
      case SMTFetchPolicy::RoundRobin:
        return roundRobin();
      case SMTFetchPolicy::IQCount:
        return iqCount();
      case SMTFetchPolicy::LSQCount:
        return lsqCount();
      case SMTFetchPolicy::Branch:
        return branchCount();
      default:
        return InvalidThreadID;
    }
}

Fetch::getFetchingThread() {…}


/**
 * Round-robin SMT fetch policy.
 *
 * Walks the priority list from the front and picks the first thread whose
 * status is Running, IcacheAccessComplete or Idle. The chosen thread is
 * moved to the back of the list so the other threads are considered before
 * it on the next call.
 *
 * @return The chosen thread, or InvalidThreadID if no thread qualifies.
 */
ThreadID
Fetch::roundRobin()
{
    for (auto pri_iter = priorityList.begin();
         pri_iter != priorityList.end(); ++pri_iter) {
        const ThreadID high_pri = *pri_iter;

        // high_pri indexes the per-thread fetchStatus array below, so it
        // must be strictly less than the thread count.
        assert(high_pri < numThreads);

        if (fetchStatus[high_pri] == Running ||
            fetchStatus[high_pri] == IcacheAccessComplete ||
            fetchStatus[high_pri] == Idle) {

            // Relink the node at the end of the list; this is equivalent to
            // erase + push_back but frees and allocates nothing.
            priorityList.splice(priorityList.end(), priorityList, pri_iter);

            return high_pri;
        }
    }

    return InvalidThreadID;
}

Fetch::roundRobin() {…}


/**
 * IQ-count SMT fetch policy.
 *
 * Among the active threads whose status is Running, IcacheAccessComplete
 * or Idle, picks the one with the smallest iqCount reported by IEW. When
 * several such threads share the smallest count, the one latest in the
 * active-thread list is chosen.
 *
 * Threads are compared directly rather than through a count-to-thread map,
 * so two threads reporting the same count can no longer hide each other.
 *
 * @return The chosen thread, or InvalidThreadID if no thread qualifies.
 */
ThreadID
Fetch::iqCount()
{
    ThreadID best_tid = InvalidThreadID;
    unsigned best_count = 0;

    for (ThreadID tid : *activeThreads) {
        const bool fetchable = fetchStatus[tid] == Running ||
            fetchStatus[tid] == IcacheAccessComplete ||
            fetchStatus[tid] == Idle;
        if (!fetchable)
            continue;

        const unsigned count = fromIEW->iewInfo[tid].iqCount;

        // "<=" lets a later thread win a tie, as the last thread written
        // into the old count-keyed map did.
        if (best_tid == InvalidThreadID || count <= best_count) {
            best_tid = tid;
            best_count = count;
        }
    }

    return best_tid;
}

Fetch::iqCount() {…}


/**
 * LSQ-count SMT fetch policy.
 *
 * Among the active threads whose status is Running, IcacheAccessComplete
 * or Idle, picks the one with the smallest ldstqCount reported by IEW.
 * When several such threads share the smallest count, the one latest in
 * the active-thread list is chosen.
 *
 * Threads are compared directly rather than through a count-to-thread map,
 * so two threads reporting the same count can no longer hide each other.
 *
 * @return The chosen thread, or InvalidThreadID if no thread qualifies.
 */
ThreadID
Fetch::lsqCount()
{
    ThreadID best_tid = InvalidThreadID;
    unsigned best_count = 0;

    for (ThreadID tid : *activeThreads) {
        const bool fetchable = fetchStatus[tid] == Running ||
            fetchStatus[tid] == IcacheAccessComplete ||
            fetchStatus[tid] == Idle;
        if (!fetchable)
            continue;

        const unsigned count = fromIEW->iewInfo[tid].ldstqCount;

        // "<=" lets a later thread win a tie, as the last thread written
        // into the old count-keyed map did.
        if (best_tid == InvalidThreadID || count <= best_count) {
            best_tid = tid;
            best_count = count;
        }
    }

    return best_tid;
}

Fetch::lsqCount() {…}


/**
 * Branch-count SMT fetch policy. Not implemented: calling it panics.
 *
 * @return InvalidThreadID (the return statement follows the panic() call).
 */
ThreadID
Fetch::branchCount()
{
    panic("Branch Count Fetch policy unimplemented\n");
    return InvalidThreadID;
}

Fetch::branchCount() {…}


/**
 * Starts an I-cache access for the thread's next fetch address when a
 * pipelined fetch was requested and the block is not already buffered.
 *
 * Nothing is done if no pipelined fetch was requested for the thread, if
 * the current micro-PC is in the micro-op ROM, or if the fetch buffer is
 * valid and already holds the needed block.
 *
 * @param tid Thread to issue the access for.
 */
void
Fetch::pipelineIcacheAccesses(ThreadID tid)
{
    if (!issuePipelinedIfetch[tid])
        return;

    // The next PC to access.
    const PCStateBase &next_fetch_pc = *pc[tid];

    if (isRomMicroPC(next_fetch_pc.microPC()))
        return;

    const Addr offset = fetchOffset[tid];
    const Addr fetch_addr =
        (next_fetch_pc.instAddr() + offset) & decoder[tid]->pcMask();

    // Address of the fetch buffer segment that contains fetch_addr.
    const Addr block_pc = fetchBufferAlignPC(fetch_addr);

    const bool already_buffered =
        fetchBufferValid[tid] && block_pc == fetchBufferPC[tid];
    if (already_buffered)
        return;

    DPRINTF(Fetch, "[tid:%i] Issuing a pipelined I-cache access, "
            "starting at PC %s.\n", tid, next_fetch_pc);

    fetchCacheLine(fetch_addr, tid, next_fetch_pc.instAddr());
}

Fetch::pipelineIcacheAccesses(ThreadID tid) {…}


/**
 * Records why no thread could be fetched from this cycle by bumping the
 * matching stall statistic and emitting a debug message.
 *
 * A pending drain is checked first, then an empty active-thread list, and
 * only then the thread's fetch status.
 *
 * @param tid Thread whose stall flags and fetch status are inspected.
 */
void
Fetch::profileStall(ThreadID tid)
{
    DPRINTF(Fetch,"There are no more threads available to fetch from.\n");

    // @todo Per-thread stats

    if (stalls[tid].drain) {
        ++fetchStats.pendingDrainCycles;
        DPRINTF(Fetch, "Fetch is waiting for a drain!\n");
        return;
    }

    if (activeThreads->empty()) {
        ++fetchStats.noActiveThreadStallCycles;
        DPRINTF(Fetch, "Fetch has no active thread!\n");
        return;
    }

    switch (fetchStatus[tid]) {
      case Blocked:
        ++fetchStats.blockedCycles;
        DPRINTF(Fetch, "[tid:%i] Fetch is blocked!\n", tid);
        break;

      case Squashing:
        ++fetchStats.squashCycles;
        DPRINTF(Fetch, "[tid:%i] Fetch is squashing!\n", tid);
        break;

      case IcacheWaitResponse:
        cpu->fetchStats[tid]->icacheStallCycles++;
        DPRINTF(Fetch, "[tid:%i] Fetch is waiting cache response!\n",
                tid);
        break;

      case ItlbWait:
        ++fetchStats.tlbCycles;
        DPRINTF(Fetch, "[tid:%i] Fetch is waiting ITLB walk to "
                "finish!\n", tid);
        break;

      case TrapPending:
        ++fetchStats.pendingTrapStallCycles;
        DPRINTF(Fetch, "[tid:%i] Fetch is waiting for a pending trap!\n",
                tid);
        break;

      case QuiescePending:
        ++fetchStats.pendingQuiesceStallCycles;
        DPRINTF(Fetch, "[tid:%i] Fetch is waiting for a pending quiesce "
                "instruction!\n", tid);
        break;

      case IcacheWaitRetry:
        ++fetchStats.icacheWaitRetryStallCycles;
        DPRINTF(Fetch, "[tid:%i] Fetch is waiting for an I-cache retry!\n",
                tid);
        break;

      case NoGoodAddr:
        // No statistic is counted for this state; it is only logged.
        DPRINTF(Fetch, "[tid:%i] Fetch predicted non-executable address\n",
                tid);
        break;

      default:
        DPRINTF(Fetch, "[tid:%i] Unexpected fetch stall reason "
            "(Status: %i)\n",
            tid, fetchStatus[tid]);
        break;
    }
}

Fetch::profileStall(ThreadID tid) {…}


/**
 * Receives a timing response on the I-cache port and hands the packet to
 * the fetch stage for completion processing.
 *
 * @param pkt Response packet.
 * @return Always true.
 */
bool
Fetch::IcachePort::recvTimingResp(PacketPtr pkt)
{
    DPRINTF(O3CPU, "Fetch unit received timing\n");

    // We shouldn't ever get a cacheable block in Modified state: a
    // cacheable response must either not come from a responding cache or
    // still have sharers.
    assert(pkt->req->isUncacheable() ||
           !pkt->cacheResponding() ||
           pkt->hasSharers());

    fetch->processCacheCompletion(pkt);

    return true;
}

Fetch::IcachePort::recvTimingResp(PacketPtr pkt) {…}


/**
 * Forwards a retry notification from the I-cache port to the owning fetch
 * stage.
 */
void
Fetch::IcachePort::recvReqRetry()
{
    fetch->recvReqRetry();
}

Fetch::IcachePort::recvReqRetry() {…}


} // namespace o3

} // namespace gem5

DPRINTF
#define DPRINTF(x,...)
Definition trace.hh:209

types.hh
Defines global host-dependent types: Counter, Tick, and (indirectly) {int,uint}{8,...

byteswap.hh

gem5::BaseCPU::instRequestorId
RequestorID instRequestorId() const
Reads this CPU's unique instruction requestor ID.
Definition base.hh:220

gem5::BaseCPU::taskId
uint32_t taskId() const
Get cpu task id.
Definition base.hh:236

gem5::BaseCPU::getTracer
trace::InstTracer * getTracer()
Provide access to the tracer pointer.
Definition base.hh:299

gem5::BaseCPU::fetchStats
std::vector< std::unique_ptr< FetchCPUStats > > fetchStats
Definition base.hh:846

gem5::BaseCPU::contextToThread
ThreadID contextToThread(ContextID cid)
Convert ContextID to threadID.
Definition base.hh:326

gem5::BaseCPU::switchedOut
bool switchedOut() const
Determine if the CPU is switched out.
Definition base.hh:400

gem5::BaseMMU::translateTiming
virtual void translateTiming(const RequestPtr &req, ThreadContext *tc, Translation *translation, Mode mode)
Definition mmu.cc:118

gem5::BaseMMU::Execute
@ Execute
Definition mmu.hh:56

gem5::Clocked::clockEdge
Tick clockEdge(Cycles cycles=Cycles(0)) const
Determine the tick when a cycle begins, by default the current one, but the argument also enables the...
Definition clocked_object.hh:177

gem5::Cycles
Cycles is a wrapper class for representing cycle counts, i.e.
Definition types.hh:79

gem5::InstDecoder::moreBytesSize
size_t moreBytesSize() const
Definition decoder.hh:96

gem5::InstDecoder::reset
virtual void reset()
Definition decoder.hh:63

gem5::InstDecoder::moreBytes
virtual void moreBytes(const PCStateBase &pc, Addr fetchPC)=0
Feed data to the decoder.

gem5::InstDecoder::pcMask
Addr pcMask() const
Definition decoder.hh:97

gem5::MemCmd::ReadReq
@ ReadReq
Definition packet.hh:87

gem5::Named::name
virtual std::string name() const
Definition named.hh:47

gem5::PCStateBase
Definition pcstate.hh:59

gem5::PCStateBase::branching
virtual bool branching() const =0

gem5::PCStateBase::microPC
MicroPC microPC() const
Returns the current micropc.
Definition pcstate.hh:119

gem5::PCStateBase::instAddr
Addr instAddr() const
Returns the memory address of the instruction this PC points to.
Definition pcstate.hh:108

gem5::PCStateBase::clone
virtual PCStateBase * clone() const =0

gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295

gem5::Packet::req
RequestPtr req
A pointer to the original request.
Definition packet.hh:377

gem5::Packet::getConstPtr
const T * getConstPtr() const
Definition packet.hh:1234

gem5::Packet::dataDynamic
void dataDynamic(T *p)
Set the data pointer to a value that should have delete [] called on it.
Definition packet.hh:1213

gem5::Packet::cacheResponding
bool cacheResponding() const
Definition packet.hh:659

gem5::Packet::hasSharers
bool hasSharers() const
Definition packet.hh:686

gem5::Port::isConnected
bool isConnected() const
Is this port currently connected to a peer?
Definition port.hh:133

gem5::ProbePointArg
ProbePointArg generates a point for the class of Arg.
Definition probe.hh:264

gem5::ProbePointArg::notify
void notify(const Arg &arg)
called at the ProbePoint call site, passes arg to each listener.
Definition probe.hh:313

gem5::RefCountingPtr< DynInst >

gem5::RequestPort
A RequestPort is a specialisation of a Port, which implements the default protocol for the three diff...
Definition port.hh:136

gem5::RequestPort::sendTimingReq
bool sendTimingReq(PacketPtr pkt)
Attempt to send a timing request to the responder port by calling its corresponding receive function.
Definition port.hh:603

gem5::Request::INST_FETCH
@ INST_FETCH
The request was an instruction fetch.
Definition request.hh:115

gem5::StaticInst::numSrcRegs
uint8_t numSrcRegs() const
Number of source registers.
Definition static_inst.hh:123

gem5::StaticInst::fetchMicroop
virtual StaticInstPtr fetchMicroop(MicroPC upc) const
Return the microop that goes with a particular micropc.
Definition static_inst.cc:39

gem5::StaticInst::numDestRegs
uint8_t numDestRegs() const
Number of destination registers.
Definition static_inst.hh:125

gem5::StaticInst::isMacroop
bool isMacroop() const
Definition static_inst.hh:187

gem5::StaticInst::isLastMicroop
bool isLastMicroop() const
Definition static_inst.hh:190

gem5::System::isMemAddr
bool isMemAddr(Addr addr) const
Check if a physical address is within a range of a memory that is part of the global address map.
Definition system.cc:288

gem5::TimeBuffer
Definition timebuf.hh:41

gem5::TimeBuffer::getWire
wire getWire(int idx)
Definition timebuf.hh:232

gem5::branch_prediction::BPredUnit::update
void update(const InstSeqNum &done_sn, ThreadID tid)
Tells the branch predictor to commit any updates until the given sequence number.
Definition bpred_unit.cc:335

gem5::branch_prediction::BPredUnit::predict
bool predict(const StaticInstPtr &inst, const InstSeqNum &seqNum, PCStateBase &pc, ThreadID tid)
Predicts whether or not the instruction is a taken branch, and the target of the branch if it is take...
Definition bpred_unit.cc:99

gem5::branch_prediction::BPredUnit::drainSanityCheck
void drainSanityCheck() const
Perform sanity checks after a drain.
Definition bpred_unit.cc:89

gem5::branch_prediction::BPredUnit::squash
void squash(const InstSeqNum &squashed_sn, ThreadID tid)
Squashes all outstanding updates until a given sequence number.
Definition bpred_unit.cc:393

gem5::o3::CPU
O3CPU class, has each of the stages (fetch through commit) within it, as well as all of the time buff...
Definition cpu.hh:94

gem5::o3::CPU::addInst
ListIt addInst(const DynInstPtr &inst)
Function to add instruction onto the head of the list of the instructions.
Definition cpu.cc:1133

gem5::o3::CPU::ppInstAccessComplete
ProbePointArg< PacketPtr > * ppInstAccessComplete
Definition cpu.hh:176

gem5::o3::CPU::thread
std::vector< ThreadState * > thread
Pointers to all of the threads in the CPU.
Definition cpu.hh:533

gem5::o3::CPU::activityThisCycle
void activityThisCycle()
Records that there was time buffer activity this cycle.
Definition cpu.hh:488

gem5::o3::CPU::getInstPort
Port & getInstPort() override
Used by the fetch unit to get a hold of the instruction port.
Definition cpu.hh:564

gem5::o3::CPU::removeInstsUntil
void removeInstsUntil(const InstSeqNum &seq_num, ThreadID tid)
Remove all instructions younger than the given sequence number.
Definition cpu.cc:1217

gem5::o3::CPU::isDraining
bool isDraining() const
Is the CPU draining?
Definition cpu.hh:238

gem5::o3::CPU::removeInstsNotInROB
void removeInstsNotInROB(ThreadID tid)
Remove all instructions that are not currently in the ROB.
Definition cpu.cc:1173

gem5::o3::CPU::FetchIdx
@ FetchIdx
Definition cpu.hh:456

gem5::o3::CPU::deactivateStage
void deactivateStage(const StageIdx idx)
Changes a stage's status to inactive within the activity recorder.
Definition cpu.hh:499

gem5::o3::CPU::mmu
BaseMMU * mmu
Definition cpu.hh:110

gem5::o3::CPU::system
System * system
Pointer to the system.
Definition cpu.hh:530

gem5::o3::CPU::getAndIncrementInstSeq
InstSeqNum getAndIncrementInstSeq()
Get the current instruction sequence number, and increment it.
Definition cpu.hh:284

gem5::o3::CPU::pcState
void pcState(const PCStateBase &new_pc_state, ThreadID tid)
Sets the commit PC state of a specific thread.
Definition cpu.cc:1120

gem5::o3::CPU::tcBase
gem5::ThreadContext * tcBase(ThreadID tid)
Returns a pointer to a thread context.
Definition cpu.hh:515

gem5::o3::CPU::activateStage
void activateStage(const StageIdx idx)
Changes a stage's status to active within the activity recorder.
Definition cpu.hh:492

gem5::o3::CPU::wakeCPU
void wakeCPU()
Wakes the CPU, rescheduling the CPU if it's not already active.
Definition cpu.cc:1316

gem5::o3::DynInst
Definition dyn_inst.hh:76

gem5::o3::Fetch::FetchTranslation
Definition fetch.hh:106

gem5::o3::Fetch::FinishTranslationEvent::setReq
void setReq(const RequestPtr &_req)
Definition fetch.hh:142

gem5::o3::Fetch::FinishTranslationEvent::setFault
void setFault(Fault _fault)
Definition fetch.hh:141

gem5::o3::Fetch::IcachePort::recvTimingResp
virtual bool recvTimingResp(PacketPtr pkt)
Timing version of receive.
Definition fetch.cc:1583

gem5::o3::Fetch::IcachePort::IcachePort
IcachePort(Fetch *_fetch, CPU *_cpu)
Default constructor.
Definition fetch.cc:77

gem5::o3::Fetch::IcachePort::recvReqRetry
virtual void recvReqRetry()
Handles doing a retry of a failed fetch.
Definition fetch.cc:1595

gem5::o3::Fetch
Fetch class handles both single threaded and SMT fetch.
Definition fetch.hh:80

gem5::o3::Fetch::fetchStats
gem5::o3::Fetch::FetchStatGroup fetchStats

gem5::o3::Fetch::wroteToTimeBuffer
bool wroteToTimeBuffer
Variable that tracks if fetch has written to the time buffer this cycle.
Definition fetch.hh:433

gem5::o3::Fetch::deactivateThread
void deactivateThread(ThreadID tid)
For priority-based fetch policies, need to keep priorityList updated.
Definition fetch.cc:475

gem5::o3::Fetch::FetchStatus
FetchStatus
Overall fetch status.
Definition fetch.hh:164

gem5::o3::Fetch::Active
@ Active
Definition fetch.hh:165

gem5::o3::Fetch::Inactive
@ Inactive
Definition fetch.hh:166

gem5::o3::Fetch::activeThreads
std::list< ThreadID > * activeThreads
List of Active Threads.
Definition fetch.hh:508

gem5::o3::Fetch::fromCommit
TimeBuffer< TimeStruct >::wire fromCommit
Wire to get commit's information from backwards time buffer.
Definition fetch.hh:409

gem5::o3::Fetch::renameToFetchDelay
Cycles renameToFetchDelay
Rename to fetch delay.
Definition fetch.hh:452

gem5::o3::Fetch::macroop
StaticInstPtr macroop[MaxThreads]
Definition fetch.hh:422

gem5::o3::Fetch::fetch
void fetch(bool &status_change)
Does the actual fetching of instructions and passing them on to the next stage.
Definition fetch.cc:1072

gem5::o3::Fetch::takeOverFrom
void takeOverFrom()
Takes over from another CPU's thread.
Definition fetch.cc:425

gem5::o3::Fetch::fetchBuffer
uint8_t * fetchBuffer[MaxThreads]
The fetch data that is being fetched and buffered.
Definition fetch.hh:487

gem5::o3::Fetch::doSquash
void doSquash(const PCStateBase &new_pc, const DynInstPtr squashInst, ThreadID tid)
Squashes a specific thread and resets the PC.
Definition fetch.cc:685

gem5::o3::Fetch::rng
Random::RandomPtr rng
Definition fetch.hh:204

gem5::o3::Fetch::toDecode
TimeBuffer< FetchStruct >::wire toDecode
Wire used to write any information heading to decode.
Definition fetch.hh:413

gem5::o3::Fetch::setActiveThreads
void setActiveThreads(std::list< ThreadID > *at_ptr)
Sets pointer to list of active threads.
Definition fetch.cc:249

gem5::o3::Fetch::lookupAndUpdateNextPC
bool lookupAndUpdateNextPC(const DynInstPtr &inst, PCStateBase &pc)
Looks up in the branch predictor to see if the next PC should be either next PC+=MachInst or a branch...
Definition fetch.cc:485

gem5::o3::Fetch::fetchStatus
ThreadStatus fetchStatus[MaxThreads]
Per-thread status.
Definition fetch.hh:191

gem5::o3::Fetch::numThreads
ThreadID numThreads
Number of threads.
Definition fetch.hh:511

gem5::o3::Fetch::fromDecode
TimeBuffer< TimeStruct >::wire fromDecode
Wire to get decode's information from backwards time buffer.
Definition fetch.hh:400

gem5::o3::Fetch::ppFetch
ProbePointArg< DynInstPtr > * ppFetch
Probe points.
Definition fetch.hh:200

gem5::o3::Fetch::fromRename
TimeBuffer< TimeStruct >::wire fromRename
Wire to get rename's information from backwards time buffer.
Definition fetch.hh:403

gem5::o3::Fetch::squash
void squash(const PCStateBase &new_pc, const InstSeqNum seq_num, DynInstPtr squashInst, ThreadID tid)
Squashes a specific thread and resets the PC.
Definition fetch.cc:803

gem5::o3::Fetch::squashFromDecode
void squashFromDecode(const PCStateBase &new_pc, const DynInstPtr squashInst, const InstSeqNum seq_num, ThreadID tid)
Squashes a specific thread and resets the PC.
Definition fetch.cc:737

gem5::o3::Fetch::updateFetchStatus
FetchStatus updateFetchStatus()
Updates overall fetch stage status; to be called at the end of each cycle.
Definition fetch.cc:764

gem5::o3::Fetch::getFetchingThread
ThreadID getFetchingThread()
Returns the appropriate thread to fetch, given the fetch policy.
Definition fetch.cc:1363

gem5::o3::Fetch::fetchBufferValid
bool fetchBufferValid[MaxThreads]
Whether or not the fetch buffer data is valid.
Definition fetch.hh:499

gem5::o3::Fetch::startupStage
void startupStage()
Initialize stage.
Definition fetch.cc:262

gem5::o3::Fetch::pipelineIcacheAccesses
void pipelineIcacheAccesses(ThreadID tid)
Pipeline the next I-cache access to the current one.
Definition fetch.cc:1505

gem5::o3::Fetch::name
std::string name() const
Returns the name of fetch.
Definition fetch.cc:147

gem5::o3::Fetch::wakeFromQuiesce
void wakeFromQuiesce()
Tells fetch to wake up from a quiesce instruction.
Definition fetch.cc:442

gem5::o3::Fetch::switchToActive
void switchToActive()
Changes the status of this stage to active, and indicates this to the CPU.
Definition fetch.cc:451

gem5::o3::Fetch::switchToInactive
void switchToInactive()
Changes the status of this stage to inactive, and indicates this to the CPU.
Definition fetch.cc:463

gem5::o3::Fetch::numInst
int numInst
Tracks how many instructions have been fetched this cycle.
Definition fetch.hh:436

gem5::o3::Fetch::fetchCacheLine
bool fetchCacheLine(Addr vaddr, ThreadID tid, Addr pc)
Fetches the cache line that contains the fetch PC.
Definition fetch.cc:529

gem5::o3::Fetch::decodeToFetchDelay
Cycles decodeToFetchDelay
Decode to fetch delay.
Definition fetch.hh:449

gem5::o3::Fetch::issuePipelinedIfetch
bool issuePipelinedIfetch[MaxThreads]
Set to true if a pipelined I-cache request should be issued.
Definition fetch.hh:528

gem5::o3::Fetch::fetchBufferAlignPC
Addr fetchBufferAlignPC(Addr addr)
Align a PC to the start of a fetch buffer block.
Definition fetch.hh:355

gem5::o3::Fetch::_status
FetchStatus _status
Fetch status.
Definition fetch.hh:188

gem5::o3::Fetch::delayedCommit
bool delayedCommit[MaxThreads]
Can the fetch stage redirect from an interrupt on this instruction?
Definition fetch.hh:425

gem5::o3::Fetch::threadFetched
ThreadID threadFetched
Thread ID being fetched.
Definition fetch.hh:517

gem5::o3::Fetch::fetchPolicy
SMTFetchPolicy fetchPolicy
Fetch policy.
Definition fetch.hh:194

gem5::o3::Fetch::cacheBlkSize
Addr cacheBlkSize
Cache block size.
Definition fetch.hh:476

gem5::o3::Fetch::branchPred
branch_prediction::BPredUnit * branchPred
BPredUnit.
Definition fetch.hh:416

gem5::o3::Fetch::drainSanityCheck
void drainSanityCheck() const
Perform sanity checks after a drain.
Definition fetch.cc:378

gem5::o3::Fetch::fetchWidth
unsigned fetchWidth
The width of fetch in instructions.
Definition fetch.hh:461

gem5::o3::Fetch::fetchQueueSize
unsigned fetchQueueSize
The size of the fetch queue in micro-ops.
Definition fetch.hh:493

gem5::o3::Fetch::decoder
InstDecoder * decoder[MaxThreads]
The decoder.
Definition fetch.hh:361

gem5::o3::Fetch::fromIEW
TimeBuffer< TimeStruct >::wire fromIEW
Wire to get iew's information from backwards time buffer.
Definition fetch.hh:406

gem5::o3::Fetch::regProbePoints
void regProbePoints()
Registers probes.
Definition fetch.cc:150

gem5::o3::Fetch::checkSignalsAndUpdate
bool checkSignalsAndUpdate(ThreadID tid)
Checks all input signals and updates the status as necessary.
Definition fetch.cc:917

gem5::o3::Fetch::checkStall
bool checkStall(ThreadID tid) const
Checks if a thread is stalled.
Definition fetch.cc:750

gem5::o3::Fetch::icachePort
IcachePort icachePort
Instruction port.
Definition fetch.hh:525

gem5::o3::Fetch::Running
@ Running
Definition fetch.hh:172

gem5::o3::Fetch::Idle
@ Idle
Definition fetch.hh:173

gem5::o3::Fetch::TrapPending
@ TrapPending
Definition fetch.hh:177

gem5::o3::Fetch::IcacheWaitRetry
@ IcacheWaitRetry
Definition fetch.hh:181

gem5::o3::Fetch::NoGoodAddr
@ NoGoodAddr
Definition fetch.hh:183

gem5::o3::Fetch::QuiescePending
@ QuiescePending
Definition fetch.hh:178

gem5::o3::Fetch::Squashing
@ Squashing
Definition fetch.hh:174

gem5::o3::Fetch::IcacheAccessComplete
@ IcacheAccessComplete
Definition fetch.hh:182

gem5::o3::Fetch::IcacheWaitResponse
@ IcacheWaitResponse
Definition fetch.hh:180

gem5::o3::Fetch::ItlbWait
@ ItlbWait
Definition fetch.hh:179

gem5::o3::Fetch::Blocked
@ Blocked
Definition fetch.hh:175

gem5::o3::Fetch::setTimeBuffer
void setTimeBuffer(TimeBuffer< TimeStruct > *time_buffer)
Sets the main backwards communication time buffer pointer.
Definition fetch.cc:237

gem5::o3::Fetch::processCacheCompletion
void processCacheCompletion(PacketPtr pkt)
Processes cache completion event.
Definition fetch.cc:326

gem5::o3::Fetch::iqCount
ThreadID iqCount()
Returns the appropriate thread to fetch using the IQ count policy.
Definition fetch.cc:1427

gem5::o3::Fetch::fetchBufferMask
Addr fetchBufferMask
Mask to align a fetch address to a fetch buffer boundary.
Definition fetch.hh:484

gem5::o3::Fetch::recvReqRetry
void recvReqRetry()
Handles retrying the fetch access.
Definition fetch.cc:1333

gem5::o3::Fetch::checkInterrupt
bool checkInterrupt(Addr pc)
Check if an interrupt is pending that we need to handle.
Definition fetch.hh:308

gem5::o3::Fetch::iewToFetchDelay
Cycles iewToFetchDelay
IEW to fetch delay.
Definition fetch.hh:455

gem5::o3::Fetch::resetStage
void resetStage()
Reset this pipeline stage.
Definition fetch.cc:292

gem5::o3::Fetch::Fetch
Fetch(CPU *_cpu, const BaseO3CPUParams &params)
Fetch constructor.
Definition fetch.cc:82

gem5::o3::Fetch::drainStall
void drainStall(ThreadID tid)
Stall the fetch stage after reaching a safe drain point.
Definition fetch.cc:433

gem5::o3::Fetch::lastIcacheStall
Counter lastIcacheStall[MaxThreads]
Icache stall statistics.
Definition fetch.hh:505

gem5::o3::Fetch::instSize
int instSize
Size of instructions.
Definition fetch.hh:502

gem5::o3::Fetch::ppFetchRequestSent
ProbePointArg< RequestPtr > * ppFetchRequestSent
To probe when a fetch request is successfully sent.
Definition fetch.hh:202

gem5::o3::Fetch::commitToFetchDelay
Cycles commitToFetchDelay
Commit to fetch delay.
Definition fetch.hh:458

gem5::o3::Fetch::memReq
RequestPtr memReq[MaxThreads]
Memory request used to access cache.
Definition fetch.hh:428

gem5::o3::Fetch::timeBuffer
TimeBuffer< TimeStruct > * timeBuffer
Time buffer interface.
Definition fetch.hh:397

gem5::o3::Fetch::profileStall
void profileStall(ThreadID tid)
Profile the reasons of fetch stall.
Definition fetch.cc:1534

gem5::o3::Fetch::roundRobin
ThreadID roundRobin()
Returns the appropriate thread to fetch using a round robin policy.
Definition fetch.cc:1398

gem5::o3::Fetch::fetchBufferPC
Addr fetchBufferPC[MaxThreads]
The PC of the first instruction loaded into the fetch buffer.
Definition fetch.hh:490

gem5::o3::Fetch::drainResume
void drainResume()
Resume after a drain.
Definition fetch.cc:369

gem5::o3::Fetch::clearStates
void clearStates(ThreadID tid)
Clear all thread-specific states.
Definition fetch.cc:273

gem5::o3::Fetch::finishTranslation
void finishTranslation(const Fault &fault, const RequestPtr &mem_req)
Definition fetch.cc:578

gem5::o3::Fetch::interruptPending
bool interruptPending
Checks if there is an interrupt pending.
Definition fetch.hh:522

gem5::o3::Fetch::pc
std::unique_ptr< PCStateBase > pc[MaxThreads]
Definition fetch.hh:418

gem5::o3::Fetch::lsqCount
ThreadID lsqCount()
Returns the appropriate thread to fetch using the LSQ count policy.
Definition fetch.cc:1463

gem5::o3::Fetch::stalls
Stalls stalls[MaxThreads]
Tracks which stages are telling fetch to stall.
Definition fetch.hh:446

gem5::o3::Fetch::buildInst
DynInstPtr buildInst(ThreadID tid, StaticInstPtr staticInst, StaticInstPtr curMacroop, const PCStateBase &this_pc, const PCStateBase &next_pc, bool trace)
Definition fetch.cc:1019

gem5::o3::Fetch::isDrained
bool isDrained() const
Has the stage drained?
Definition fetch.cc:395

gem5::o3::Fetch::fetchOffset
Addr fetchOffset[MaxThreads]
Definition fetch.hh:420

gem5::o3::Fetch::fetchQueue
std::deque< DynInstPtr > fetchQueue[MaxThreads]
Queue of fetched instructions.
Definition fetch.hh:496

gem5::o3::Fetch::retryPkt
PacketPtr retryPkt
The packet that is waiting to be retried.
Definition fetch.hh:470

gem5::o3::Fetch::priorityList
std::list< ThreadID > priorityList
List that has the threads organized by priority.
Definition fetch.hh:197

gem5::o3::Fetch::finishTranslationEvent
FinishTranslationEvent finishTranslationEvent
Event used to delay fault generation of translation faults.
Definition fetch.hh:531

gem5::o3::Fetch::retryTid
ThreadID retryTid
The thread that is waiting on the cache to tell fetch to retry.
Definition fetch.hh:473

gem5::o3::Fetch::tick
void tick()
Ticks the fetch stage, processing all input signals and fetching as many instructions as possible.
Definition fetch.cc:815

gem5::o3::Fetch::numFetchingThreads
ThreadID numFetchingThreads
Number of threads that are actively fetching.
Definition fetch.hh:514

gem5::o3::Fetch::fetchBufferSize
unsigned fetchBufferSize
The size of the fetch buffer in bytes.
Definition fetch.hh:481

gem5::o3::Fetch::setFetchQueue
void setFetchQueue(TimeBuffer< FetchStruct > *fq_ptr)
Sets pointer to time buffer used to communicate to the next stage.
Definition fetch.cc:255

gem5::o3::Fetch::cpu
CPU * cpu
Pointer to the O3CPU.
Definition fetch.hh:394

gem5::o3::Fetch::decodeWidth
unsigned decodeWidth
The width of decode in instructions.
Definition fetch.hh:464

gem5::o3::Fetch::cacheBlocked
bool cacheBlocked
Is the cache blocked? If so no threads can access it.
Definition fetch.hh:467

gem5::o3::Fetch::branchCount
ThreadID branchCount()
Returns the appropriate thread to fetch using the branch count policy.
Definition fetch.cc:1498

gem5::statistics::DataWrap::flags
Derived & flags(Flags _flags)
Set the flags and marks this stat to print at the end of simulation.
Definition statistics.hh:357

gem5::statistics::DataWrap::prereq
Derived & prereq(const Stat &prereq)
Set the prerequisite stat and marks this stat to print at the end of simulation.
Definition statistics.hh:371

gem5::statistics::DistBase::sample
void sample(const U &v, int n=1)
Add a value to the distribution n times.
Definition statistics.hh:1327

gem5::statistics::Distribution::init
Distribution & init(Counter min, Counter max, Counter bkt)
Set the parameters of this distribution.
Definition statistics.hh:2112

gem5::statistics::Group
Statistics container.
Definition group.hh:93

gem5::trace::InstTracer::getInstRecord
virtual InstRecord * getInstRecord(Tick when, ThreadContext *tc, const StaticInstPtr staticInst, const PCStateBase &pc, const StaticInstPtr macroStaticInst=nullptr)=0

std::list
STL list class.
Definition stl.hh:51

core.hh

base.hh

cpu.hh

eventq.hh

exetrace.hh

fetch.hh

full_system.hh

tlb.hh

ADD_STAT
#define ADD_STAT(n,...)
Convenience macro to add a stat to a statistics group.
Definition group.hh:75

gem5::Event::scheduled
bool scheduled() const
Determine if the current event is scheduled.
Definition eventq.hh:458

gem5::EventManager::schedule
void schedule(Event &event, Tick when)
Definition eventq.hh:1012

panic
#define panic(...)
This implements a cprintf based panic() function.
Definition logging.hh:188

fatal
#define fatal(...)
This implements a cprintf based fatal() function.
Definition logging.hh:200

gem5::SimObject::getProbeManager
ProbeManager * getProbeManager()
Get the probe manager for this object.
Definition sim_object.cc:117

limits.hh

warn
#define warn(...)
Definition logging.hh:256

gem5::ArmISA::i
Bitfield< 7 > i
Definition misc_types.hh:67

gem5::ArmISA::set
Bitfield< 12, 11 > set
Definition misc_types.hh:792

gem5::MipsISA::vaddr
vaddr
Definition pra_constants.hh:278

gem5::o3::MaxThreads
static constexpr int MaxThreads
Definition limits.hh:38

gem5::o3::MaxWidth
static constexpr int MaxWidth
Definition limits.hh:37

gem5::statistics::pdf
const FlagsType pdf
Print the percent of the total that this entry represents.
Definition info.hh:61

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::Fault
std::shared_ptr< FaultBase > Fault
Definition types.hh:249

gem5::ThreadID
int16_t ThreadID
Thread index/ID type.
Definition types.hh:235

gem5::RequestPtr
std::shared_ptr< Request > RequestPtr
Definition request.hh:94

gem5::InvalidThreadID
const ThreadID InvalidThreadID
Definition types.hh:236

gem5::curTick
Tick curTick()
The universal simulation clock.
Definition cur_tick.hh:46

gem5::Addr
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition types.hh:147

gem5::FullSystem
bool FullSystem
The FullSystem variable can be used to determine the current mode of simulation.
Definition root.cc:220

gem5::isRomMicroPC
static bool isRomMicroPC(MicroPC upc)
Definition types.hh:166

gem5::nopStaticInstPtr
StaticInstPtr nopStaticInstPtr
Pointer to a statically allocated generic "nop" instruction object.
Definition nop_static_inst.cc:67

gem5::NoFault
constexpr decltype(nullptr) NoFault
Definition types.hh:253

gem5::InstSeqNum
uint64_t InstSeqNum
Definition inst_seq.hh:40

nop_static_inst.hh

dyn_inst.hh

packet.hh
Declaration of the Packet class.

system.hh

gem5::o3::DynInst::Arrays
Definition dyn_inst.hh:86

gem5::o3::DynInst::Arrays::numDests
size_t numDests
Definition dyn_inst.hh:88

gem5::o3::DynInst::Arrays::numSrcs
size_t numSrcs
Definition dyn_inst.hh:87

gem5::o3::Fetch::FetchStatGroup::icacheSquashes
statistics::Scalar icacheSquashes
Total number of outstanding icache accesses that were dropped due to a squash.
Definition fetch.hh:572

gem5::o3::Fetch::FetchStatGroup::pendingDrainCycles
statistics::Scalar pendingDrainCycles
Total number of cycles spent in waiting for drains.
Definition fetch.hh:557

gem5::o3::Fetch::FetchStatGroup::cacheLines
statistics::Scalar cacheLines
Stat for total number of fetched cache lines.
Definition fetch.hh:568

gem5::o3::Fetch::FetchStatGroup::blockedCycles
statistics::Scalar blockedCycles
Total number of cycles spent blocked.
Definition fetch.hh:553

gem5::o3::Fetch::FetchStatGroup::idleCycles
statistics::Scalar idleCycles
Stat for total number of cycles spent blocked due to other stages in the pipeline.
Definition fetch.hh:551

gem5::o3::Fetch::FetchStatGroup::predictedBranches
statistics::Scalar predictedBranches
Stat for total number of predicted branches.
Definition fetch.hh:540

gem5::o3::Fetch::FetchStatGroup::noActiveThreadStallCycles
statistics::Scalar noActiveThreadStallCycles
Total number of stall cycles caused by no active threads to run.
Definition fetch.hh:559

gem5::o3::Fetch::FetchStatGroup::pendingQuiesceStallCycles
statistics::Scalar pendingQuiesceStallCycles
Total number of stall cycles caused by pending quiesce instructions.
Definition fetch.hh:564

gem5::o3::Fetch::FetchStatGroup::icacheWaitRetryStallCycles
statistics::Scalar icacheWaitRetryStallCycles
Total number of stall cycles caused by I-cache wait retries.
Definition fetch.hh:566

gem5::o3::Fetch::FetchStatGroup::pendingTrapStallCycles
statistics::Scalar pendingTrapStallCycles
Total number of stall cycles caused by pending traps.
Definition fetch.hh:561

gem5::o3::Fetch::FetchStatGroup::cycles
statistics::Scalar cycles
Stat for total number of cycles spent fetching.
Definition fetch.hh:542

gem5::o3::Fetch::FetchStatGroup::miscStallCycles
statistics::Scalar miscStallCycles
Total number of cycles spent in any other state.
Definition fetch.hh:555

gem5::o3::Fetch::FetchStatGroup::tlbCycles
statistics::Scalar tlbCycles
Stat for total number of cycles spent waiting for translation.
Definition fetch.hh:546

gem5::o3::Fetch::FetchStatGroup::squashCycles
statistics::Scalar squashCycles
Stat for total number of cycles spent squashing.
Definition fetch.hh:544

gem5::o3::Fetch::FetchStatGroup::FetchStatGroup
FetchStatGroup(CPU *cpu, Fetch *fetch)
Definition fetch.cc:158

gem5::o3::Fetch::FetchStatGroup::idleRate
statistics::Formula idleRate
Rate of how often fetch was idle.
Definition fetch.hh:580

gem5::o3::Fetch::FetchStatGroup::tlbSquashes
statistics::Scalar tlbSquashes
Total number of outstanding tlb accesses that were dropped due to a squash.
Definition fetch.hh:576

gem5::o3::Fetch::FetchStatGroup::nisnDist
statistics::Distribution nisnDist
Distribution of number of instructions fetched each cycle.
Definition fetch.hh:578

gem5::o3::Fetch::Stalls::decode
bool decode
Definition fetch.hh:441

gem5::o3::Fetch::Stalls::drain
bool drain
Definition fetch.hh:442

name
const std::string & name()
Definition trace.cc:48