base.cc
/*
 * Copyright (c) 2012-2013, 2018-2019, 2023-2025 Arm Limited
 * All rights reserved.
 *
 * The license below extends only to copyright in the software and shall
 * not be construed as granting a license to any other intellectual
 * property including but not limited to intellectual property relating
 * to a hardware implementation of the functionality of the software
 * licensed hereunder. You may use the software subject to the license
 * terms below provided that you ensure that this notice is replicated
 * unmodified and in its entirety in all distributions of the software,
 * modified or unmodified, in source code or in binary form.
 *
 * Copyright (c) 2003-2005 The Regents of The University of Michigan
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met: redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer;
 * redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the distribution;
 * neither the name of the copyright holders nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

/**
 * @file
 * Definition of BaseCache functions.
 */

#include "mem/cache/base.hh"

#include "base/compiler.hh"
#include "base/logging.hh"
#include "debug/Cache.hh"
#include "debug/CacheComp.hh"
#include "debug/CachePort.hh"
#include "debug/CacheRepl.hh"
#include "debug/CacheVerbose.hh"
#include "debug/HWPrefetch.hh"
#include "mem/cache/compressors/base.hh"
#include "mem/cache/mshr.hh"
#include "mem/cache/prefetch/base.hh"
#include "mem/cache/queue_entry.hh"
#include "mem/cache/tags/compressed_tags.hh"
#include "mem/cache/tags/indexing_policies/base.hh"
#include "mem/cache/tags/partitioning_policies/partition_manager.hh"
#include "mem/cache/tags/super_blk.hh"
#include "params/BaseCache.hh"
#include "params/WriteAllocator.hh"
#include "sim/cur_tick.hh"

namespace gem5
{

BaseCache::CacheResponsePort::CacheResponsePort(const std::string &_name,
                                                BaseCache& _cache,
                                                const std::string &_label)
    : QueuedResponsePort(_name, queue),
      cache{_cache},
      queue(_cache, *this, true, _label),
      blocked(false), mustSendRetry(false),
      sendRetryEvent([this] { processSendRetry(); }, _name)
{
}

BaseCache::BaseCache(const BaseCacheParams &p, unsigned blk_size)
    : ClockedObject(p),
      cpuSidePort (p.name + ".cpu_side_port", *this, "CpuSidePort"),
      memSidePort(p.name + ".mem_side_port", this, "MemSidePort"),
      accessor(*this),
      mshrQueue("MSHRs", p.mshrs, 0, p.demand_mshr_reserve, p.name),
      writeBuffer("write buffer", p.write_buffers, p.mshrs, p.name),
      tags(p.tags),
      compressor(p.compressor),
      partitionManager(p.partitioning_manager),
      prefetcher(p.prefetcher),
      writeAllocator(p.write_allocator),
      writebackClean(p.writeback_clean),
      tempBlockWriteback(nullptr),
      writebackTempBlockAtomicEvent([this]{ writebackTempBlockAtomic(); },
                                    name(), false,
                                    EventBase::Delayed_Writeback_Pri),
      blkSize(blk_size),
      lookupLatency(p.tag_latency),
      dataLatency(p.data_latency),
      forwardLatency(p.tag_latency),
      fillLatency(p.data_latency),
      responseLatency(p.response_latency),
      sequentialAccess(p.sequential_access),
      numTarget(p.tgts_per_mshr),
      forwardSnoops(true),
      clusivity(p.clusivity),
      isReadOnly(p.is_read_only),
      replaceExpansions(p.replace_expansions),
      moveContractions(p.move_contractions),
      blocked(0),
      order(0),
      noTargetMSHR(nullptr),
      missCount(p.max_miss_count),
      addrRanges(p.addr_ranges.begin(), p.addr_ranges.end()),
      system(p.system),
      stats(*this)
{
    // the MSHR queue has no reserve entries as we check the MSHR
    // queue on every single allocation, whereas the write queue has
    // as many reserve entries as we have MSHRs, since every MSHR may
    // eventually require a writeback, and we do not check the write
    // buffer before committing to an MSHR
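    //
    // As an illustration (parameter values here are hypothetical, not
    // defaults): with p.mshrs = 4 and p.write_buffers = 8, the write
    // buffer is built with 8 entries of which 4 are reserve, one per
    // MSHR, so an in-flight miss can always stage its eventual
    // writeback without deadlocking.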

    // forward snoops is overridden in init() once we can query
    // whether the connected requestor is actually snooping or not

    tempBlock = new TempCacheBlk(blkSize,
        genTagExtractor(tags->params().indexing_policy));

    tags->tagsInit();
    if (prefetcher) {
        prefetcher->setParentInfo(system, getProbeManager(), getBlockSize());
    }

    fatal_if(compressor && !dynamic_cast<CompressedTags*>(tags),
        "The tags of compressed cache %s must derive from CompressedTags",
        name());
    warn_if(!compressor && dynamic_cast<CompressedTags*>(tags),
        "Compressed cache %s does not have a compression algorithm", name());
    if (compressor)
        compressor->setCache(this);
}

BaseCache::~BaseCache()
{
    delete tempBlock;
}

void
BaseCache::CacheResponsePort::setBlocked()
{
    assert(!blocked);
    DPRINTF(CachePort, "Port is blocking new requests\n");
    blocked = true;
    // if we already scheduled a retry in this cycle, but it has not yet
    // happened, cancel it
    if (sendRetryEvent.scheduled()) {
        cache.deschedule(sendRetryEvent);
        DPRINTF(CachePort, "Port descheduled retry\n");
        mustSendRetry = true;
    }
}

void
BaseCache::CacheResponsePort::clearBlocked()
{
    assert(blocked);
    DPRINTF(CachePort, "Port is accepting new requests\n");
    blocked = false;
    if (mustSendRetry) {
        // @TODO: need to find a better time (next cycle?)
        cache.schedule(sendRetryEvent, curTick() + 1);
    }
}

void
BaseCache::CacheResponsePort::processSendRetry()
{
    DPRINTF(CachePort, "Port is sending retry\n");

    // reset the flag and call retry
    mustSendRetry = false;
    sendRetryReq();
}
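
// Illustrative timeline of the blocking/retry handshake above (tick
// values are hypothetical):
//   t=1000: resources run out -> setBlocked(), new requests are rejected
//   t=2000: an entry drains -> clearBlocked() schedules sendRetryEvent
//           for t=2001 (mustSendRetry was set)
//   t=2001: processSendRetry() -> sendRetryReq(), and the upstream port
//           resends the previously rejected request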

Addr
BaseCache::regenerateBlkAddr(CacheBlk* blk)
{
    if (blk != tempBlock) {
        return tags->regenerateBlkAddr(blk);
    } else {
        return tempBlock->getAddr();
    }
}

void
BaseCache::init()
{
    if (!cpuSidePort.isConnected() || !memSidePort.isConnected())
        fatal("Cache ports on %s are not connected\n", name());
    cpuSidePort.sendRangeChange();
    forwardSnoops = cpuSidePort.isSnooping();
}

Port &
BaseCache::getPort(const std::string &if_name, PortID idx)
{
    if (if_name == "mem_side") {
        return memSidePort;
    } else if (if_name == "cpu_side") {
        return cpuSidePort;
    } else {
        return ClockedObject::getPort(if_name, idx);
    }
}

bool
BaseCache::inRange(Addr addr) const
{
    for (const auto& r : addrRanges) {
        if (r.contains(addr)) {
            return true;
        }
    }
    return false;
}

void
BaseCache::allocateWriteBuffer(PacketPtr pkt, Tick time)
{
    // should only see writes or clean evicts here
    assert(pkt->isWrite() || pkt->cmd == MemCmd::CleanEvict);

    Addr blk_addr = pkt->getBlockAddr(blkSize);

    // If using compression, on evictions the block is decompressed and
    // the operation's latency is added to the payload delay. Consume
    // that payload delay here, meaning that the data is always stored
    // uncompressed in the write buffer
    if (compressor) {
        time += pkt->payloadDelay;
        pkt->payloadDelay = 0;
    }

    WriteQueueEntry *wq_entry =
        writeBuffer.findMatch(blk_addr, pkt->isSecure());
    if (wq_entry && !wq_entry->inService) {
        DPRINTF(Cache, "Potential to merge writeback %s", pkt->print());
    }

    writeBuffer.allocate(blk_addr, blkSize, pkt, time, order++);

    if (writeBuffer.isFull()) {
        setBlocked((BlockedCause)MSHRQueue_WriteBuffer);
    }

    // schedule the send
    schedMemSideSendEvent(time);
}
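
// Note on allocateWriteBuffer() above: when an earlier writeback to the
// same block is still queued and not yet in service, the two could in
// principle be merged; the code currently only logs that opportunity
// and allocates a separate entry, blocking the cache when the buffer
// fills up.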

void
BaseCache::markInService(WriteQueueEntry *entry)
{
    bool wasFull = writeBuffer.isFull();
    writeBuffer.markInService(entry);

    if (wasFull && !writeBuffer.isFull()) {
        clearBlocked(Blocked_NoWBBuffers);
    }
}

void
BaseCache::handleTimingReqHit(PacketPtr pkt, CacheBlk *blk, Tick request_time)
{

    // handle special cases for LockedRMW transactions
    if (pkt->isLockedRMW()) {
        Addr blk_addr = pkt->getBlockAddr(blkSize);

        if (pkt->isRead()) {
            // Read hit for LockedRMW.  Since it requires exclusive
            // permissions, there should be no outstanding access.
            assert(!mshrQueue.findMatch(blk_addr, pkt->isSecure()));
            // The keys to LockedRMW are that (1) we always have an MSHR
            // allocated during the RMW interval to catch snoops and
            // defer them until after the RMW completes, and (2) we
            // clear permissions on the block to turn any upstream
            // access other than the matching write into a miss, causing
            // it to append to the MSHR as well.

            // Because we hit in the cache, we have to fake an MSHR to
            // achieve part (1).  If the read had missed, this MSHR
            // would get allocated as part of normal miss processing.
            // Basically we need to get the MSHR in the same state as if
            // we had missed and just received the response.
            // Request *req2 = new Request(*(pkt->req));
            RequestPtr req2 = std::make_shared<Request>(*(pkt->req));
            PacketPtr pkt2 = new Packet(req2, pkt->cmd);
            MSHR *mshr = allocateMissBuffer(pkt2, curTick(), true);
            // Mark the MSHR "in service" (even though it's not) to prevent
            // the cache from sending out a request.
            mshrQueue.markInService(mshr, false);
            // Part (2): mark block inaccessible
            assert(blk);
            blk->clearCoherenceBits(CacheBlk::ReadableBit);
            blk->clearCoherenceBits(CacheBlk::WritableBit);
        } else {
            assert(pkt->isWrite());
            // All LockedRMW writes come here, as they cannot miss.
            // Need to undo the two things described above.  Block
            // permissions were already restored earlier in this
            // function, prior to the access() call.  Now we just need
            // to clear out the MSHR.

            // Read should have already allocated MSHR.
            MSHR *mshr = mshrQueue.findMatch(blk_addr, pkt->isSecure());
            assert(mshr);
            // Fake up a packet and "respond" to the still-pending
            // LockedRMWRead, to process any pending targets and clear
            // out the MSHR
            PacketPtr resp_pkt =
                new Packet(pkt->req, MemCmd::LockedRMWReadResp);
            resp_pkt->senderState = mshr;
            recvTimingResp(resp_pkt);
        }
    }

    if (pkt->needsResponse()) {
        // These delays should have been consumed by now
        assert(pkt->headerDelay == 0);
        assert(pkt->payloadDelay == 0);

        pkt->makeTimingResponse();

        // In this case we are considering request_time that takes
        // into account the delay of the xbar, if any, and just
        // lat, neglecting responseLatency, modelling hit latency
        // just as the value of lat overridden by access(), which calls
        // the calculateAccessLatency() function.
        cpuSidePort.schedTimingResp(pkt, request_time);
    } else {
        DPRINTF(Cache, "%s satisfied %s, no response needed\n", __func__,
                pkt->print());

        // queue the packet for deletion, as the sending cache is
        // still relying on it; if the block is found in access(),
        // CleanEvict and Writeback messages will be deleted
        // here as well
        pendingDelete.reset(pkt);
    }
}
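
// Sketch of the LockedRMW hit sequence handled above: (1) the
// LockedRMWReadReq hit allocates a placeholder MSHR, marked in service
// so nothing is sent downstream, and strips the block's Readable and
// Writable bits so that any intervening access misses and queues behind
// that MSHR; (2) the matching LockedRMWWriteReq later restores the
// permissions (in recvTimingReq) and a faked LockedRMWReadResp is fed
// back through recvTimingResp() to drain the deferred targets and free
// the MSHR.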

void
BaseCache::handleTimingReqMiss(PacketPtr pkt, MSHR *mshr, CacheBlk *blk,
                               Tick forward_time, Tick request_time)
{
    if (writeAllocator &&
        pkt && pkt->isWrite() && !pkt->req->isUncacheable()) {
        writeAllocator->updateMode(pkt->getAddr(), pkt->getSize(),
                                   pkt->getBlockAddr(blkSize));
    }

    if (mshr) {
        /// MSHR hit
        /// @note writebacks will be checked in getNextMSHR()
        /// for any conflicting requests to the same block

        //@todo remove hw_pf here

        // Coalesce unless it was a software prefetch (see above).
        if (pkt) {
            assert(!pkt->isWriteback());
            // CleanEvicts corresponding to blocks which have
            // outstanding requests in MSHRs are simply sunk here
            if (pkt->cmd == MemCmd::CleanEvict) {
                pendingDelete.reset(pkt);
            } else if (pkt->cmd == MemCmd::WriteClean) {
                // A WriteClean should never coalesce with any
                // outstanding cache maintenance requests.

                // We use forward_time here because there is an
                // uncached memory write, forwarded to WriteBuffer.
                allocateWriteBuffer(pkt, forward_time);
            } else {
                DPRINTF(Cache, "%s coalescing MSHR for %s\n", __func__,
                        pkt->print());

                assert(pkt->req->requestorId() < system->maxRequestors());
                stats.cmdStats(pkt).mshrHits[pkt->req->requestorId()]++;

                // We use forward_time here because it is the same
                // considering new targets. We have multiple
                // requests for the same address here. It
                // specifies the latency to allocate an internal
                // buffer and to schedule an event to the queued
                // port and also takes into account the additional
                // delay of the xbar.
                mshr->allocateTarget(pkt, forward_time, order++,
                                     allocOnFill(pkt->cmd));
                if (mshr->getNumTargets() >= numTarget) {
                    noTargetMSHR = mshr;
                    setBlocked(Blocked_NoTargets);
                    // need to be careful with this... if this mshr isn't
                    // ready yet (i.e. time > curTick()), we don't want to
                    // move it ahead of mshrs that are ready
                    // mshrQueue.moveToFront(mshr);
                }
            }
        }
    } else {
        // no MSHR
        assert(pkt->req->requestorId() < system->maxRequestors());
        stats.cmdStats(pkt).mshrMisses[pkt->req->requestorId()]++;
        if (prefetcher && pkt->isDemand())
            prefetcher->incrDemandMhsrMisses();

        if (pkt->isEviction() || pkt->cmd == MemCmd::WriteClean) {
            // We use forward_time here because there is a
            // writeback or writeclean, forwarded to WriteBuffer.
            allocateWriteBuffer(pkt, forward_time);
        } else {
            if (blk && blk->isValid()) {
                // If we have a write miss to a valid block, we
                // need to mark the block non-readable.  Otherwise
                // if we allow reads while there's an outstanding
                // write miss, the read could return stale data
                // out of the cache block... a more aggressive
                // system could detect the overlap (if any) and
                // forward data out of the MSHRs, but we don't do
                // that yet.  Note that we do need to leave the
                // block valid so that it stays in the cache, in
                // case we get an upgrade response (and hence no
                // new data) when the write miss completes.
                // As long as CPUs do proper store/load forwarding
                // internally, and have a sufficiently weak memory
                // model, this is probably unnecessary, but at some
                // point it must have seemed like we needed it...
                assert((pkt->needsWritable() &&
                    !blk->isSet(CacheBlk::WritableBit)) ||
                    pkt->req->isCacheMaintenance());
                blk->clearCoherenceBits(CacheBlk::ReadableBit);
            }
            // Here we are using forward_time, modelling the latency of
            // a miss (outbound) just as forwardLatency, neglecting the
            // lookupLatency component.
            allocateMissBuffer(pkt, forward_time);
        }
    }
}
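
// Example of the coalescing path above (addresses are illustrative):
// two timing reads to 0x1000 and 0x1020, both in the same 64-byte
// block, arrive back to back. The first misses and allocates an MSHR;
// the second finds the matching MSHR, counts as an mshrHit, and is
// appended via allocateTarget(), so a single fill response satisfies
// both requests.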

void
BaseCache::recvTimingReq(PacketPtr pkt)
{
    // anything that is merely forwarded pays for the forward latency and
    // the delay provided by the crossbar
    Tick forward_time = clockEdge(forwardLatency) + pkt->headerDelay;

    if (pkt->cmd == MemCmd::LockedRMWWriteReq) {
        // For LockedRMW accesses, we mark the block inaccessible after the
        // read (see below), to make sure no one gets in before the write.
        // Now that the write is here, mark it accessible again, so the
        // write will succeed.  LockedRMWReadReq brings the block in in
        // exclusive mode, so we know it was previously writable.
        CacheBlk *blk = tags->findBlock({pkt->getAddr(), pkt->isSecure()});
        assert(blk && blk->isValid());
        assert(!blk->isSet(CacheBlk::WritableBit) &&
               !blk->isSet(CacheBlk::ReadableBit));
        blk->setCoherenceBits(CacheBlk::ReadableBit);
        blk->setCoherenceBits(CacheBlk::WritableBit);
    }

    Cycles lat;
    CacheBlk *blk = nullptr;
    bool satisfied = false;
    {
        PacketList writebacks;
        // Note that lat is passed by reference here. The function
        // access() will set the lat value.
        satisfied = access(pkt, blk, lat, writebacks);

        // After the evicted blocks are selected, they must be forwarded
        // to the write buffer to ensure they logically precede anything
        // happening below
        doWritebacks(writebacks, clockEdge(lat + forwardLatency));
    }

    // Here we charge the headerDelay that takes into account the latencies
    // of the bus, if the packet comes from it.
    // The latency charged is just the value set by the access() function.
    // In case of a hit we are neglecting response latency.
    // In case of a miss we are neglecting forward latency.
    Tick request_time = clockEdge(lat);
    // Here we reset the timing of the packet.
    pkt->headerDelay = pkt->payloadDelay = 0;

    if (satisfied) {
        // notify before anything else as later handleTimingReqHit might turn
        // the packet into a response
        ppHit->notify(CacheAccessProbeArg(pkt, accessor));

        if (prefetcher && blk && blk->wasPrefetched()) {
            DPRINTF(Cache, "Hit on prefetch for addr %#x (%s)\n",
                    pkt->getAddr(), pkt->isSecure() ? "s" : "ns");
            blk->clearPrefetched();
        }

        handleTimingReqHit(pkt, blk, request_time);
    } else {
        handleTimingReqMiss(pkt, blk, forward_time, request_time);

        ppMiss->notify(CacheAccessProbeArg(pkt, accessor));
    }

    if (prefetcher) {
        // track time of availability of next prefetch, if any
        Tick next_pf_time = std::max(
            prefetcher->nextPrefetchReadyTime(), clockEdge());
        if (next_pf_time != MaxTick) {
            schedMemSideSendEvent(next_pf_time);
        }
    }
}
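
// Timing sketch for the two schedule points used above (numbers are
// illustrative): with forwardLatency = 2 cycles and an incoming
// headerDelay of 1000 ticks, anything forwarded downstream is scheduled
// at clockEdge(2) + 1000 ticks, while a hit response is scheduled at
// clockEdge(lat), where lat is whatever access() computed.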

void
BaseCache::handleUncacheableWriteResp(PacketPtr pkt)
{
    Tick completion_time = clockEdge(responseLatency) +
        pkt->headerDelay + pkt->payloadDelay;

    // Reset the bus additional time as it is now accounted for
    pkt->headerDelay = pkt->payloadDelay = 0;

    cpuSidePort.schedTimingResp(pkt, completion_time);
}

void
BaseCache::recvTimingResp(PacketPtr pkt)
{
    assert(pkt->isResponse());

    // all header delay should be paid for by the crossbar, unless
    // this is a prefetch response from above
    panic_if(pkt->headerDelay != 0 && pkt->cmd != MemCmd::HardPFResp,
             "%s saw a non-zero packet delay\n", name());

    const bool is_error = pkt->isError();

    if (is_error) {
        DPRINTF(Cache, "%s: Cache received %s with error\n", __func__,
                pkt->print());
    }

    DPRINTF(Cache, "%s: Handling response %s\n", __func__,
            pkt->print());

    // if this is a write, we should be looking at an uncacheable
    // write
    if (pkt->isWrite() && pkt->cmd != MemCmd::LockedRMWWriteResp) {
        assert(pkt->req->isUncacheable());
        handleUncacheableWriteResp(pkt);
        return;
    }

    // we have dealt with any (uncacheable) writes above, from here on
    // we know we are dealing with an MSHR due to a miss or a prefetch
    MSHR *mshr = dynamic_cast<MSHR*>(pkt->popSenderState());
    assert(mshr);

    if (mshr == noTargetMSHR) {
        // we always clear at least one target
        clearBlocked(Blocked_NoTargets);
        noTargetMSHR = nullptr;
    }

    // Initial target is used just for stats
    const QueueEntry::Target *initial_tgt = mshr->getTarget();
    const Tick miss_latency = curTick() - initial_tgt->recvTime;
    if (pkt->req->isUncacheable()) {
        assert(pkt->req->requestorId() < system->maxRequestors());
        stats.cmdStats(initial_tgt->pkt)
            .mshrUncacheableLatency[pkt->req->requestorId()] += miss_latency;
    } else {
        assert(pkt->req->requestorId() < system->maxRequestors());
        stats.cmdStats(initial_tgt->pkt)
            .mshrMissLatency[pkt->req->requestorId()] += miss_latency;
    }

    PacketList writebacks;

    bool is_fill = !mshr->isForward &&
        (pkt->isRead() || pkt->cmd == MemCmd::UpgradeResp ||
         mshr->wasWholeLineWrite);

    // make sure that if the mshr was due to a whole line write then
    // the response is an invalidation
    assert(!mshr->wasWholeLineWrite || pkt->isInvalidate());

    CacheBlk *blk = tags->findBlock({pkt->getAddr(), pkt->isSecure()});

    if (is_fill && !is_error) {
        DPRINTF(Cache, "Block for addr %#llx being updated in Cache\n",
                pkt->getAddr());

        const bool allocate = (writeAllocator && mshr->wasWholeLineWrite) ?
            writeAllocator->allocate() : mshr->allocOnFill();
        blk = handleFill(pkt, blk, writebacks, allocate);
        assert(blk != nullptr);
        ppFill->notify(CacheAccessProbeArg(pkt, accessor));
    }

    // Don't want to promote the Locked RMW Read until
    // the locked write comes in
    if (!mshr->hasLockedRMWReadTarget()) {
        if (blk && blk->isValid() && pkt->isClean() && !pkt->isInvalidate()) {
            // The block was marked not readable while there was a pending
            // cache maintenance operation, restore its flag.
            blk->setCoherenceBits(CacheBlk::ReadableBit);

            // This was a cache clean operation (without invalidate)
            // and we have a copy of the block already. Since there
            // is no invalidation, we can promote targets that don't
            // require a writable copy
            mshr->promoteReadable();
        }

        if (blk && blk->isSet(CacheBlk::WritableBit) &&
            !pkt->req->isCacheInvalidate()) {
            // If at this point the referenced block is writable and the
            // response is not a cache invalidate, we promote targets that
            // were deferred as we couldn't guarantee a writable copy
            mshr->promoteWritable();
        }
    }

    serviceMSHRTargets(mshr, pkt, blk);
    // We are stopping servicing targets early for the Locked RMW Read until
    // the write comes.
    if (!mshr->hasLockedRMWReadTarget()) {
        if (mshr->promoteDeferredTargets()) {
            // avoid later read getting stale data while write miss is
            // outstanding.. see comment in timingAccess()
            if (blk) {
                blk->clearCoherenceBits(CacheBlk::ReadableBit);
            }
            mshrQueue.markPending(mshr);
            schedMemSideSendEvent(clockEdge() + pkt->payloadDelay);
        } else {
            // while we deallocate an mshr from the queue we still have to
            // check the isFull condition before and after as we might
            // have been using the reserved entries already
            const bool was_full = mshrQueue.isFull();
            mshrQueue.deallocate(mshr);
            if (was_full && !mshrQueue.isFull()) {
                clearBlocked(Blocked_NoMSHRs);
            }

            // Request the bus for a prefetch if this deallocation freed enough
            // MSHRs for a prefetch to take place
            if (prefetcher && mshrQueue.canPrefetch() && !isBlocked()) {
                Tick next_pf_time = std::max(
                    prefetcher->nextPrefetchReadyTime(), clockEdge());
                if (next_pf_time != MaxTick)
                    schedMemSideSendEvent(next_pf_time);
            }
        }

        // if we used temp block, check to see if it's valid and then clear it
        if (blk == tempBlock && tempBlock->isValid()) {
            evictBlock(blk, writebacks);
        }
    }

    const Tick forward_time = clockEdge(forwardLatency) + pkt->headerDelay;
    // copy writebacks to write buffer
    doWritebacks(writebacks, forward_time);

    DPRINTF(CacheVerbose, "%s: Leaving with %s\n", __func__, pkt->print());
    delete pkt;
}


Tick
BaseCache::recvAtomic(PacketPtr pkt)
{
    // should assert here that there are no outstanding MSHRs or
    // writebacks... that would mean that someone used an atomic
    // access in timing mode

    // We use lookupLatency here because it is used to specify the latency
    // to access.
    Cycles lat = lookupLatency;

    CacheBlk *blk = nullptr;
    PacketList writebacks;
    bool satisfied = access(pkt, blk, lat, writebacks);

    if (pkt->isClean() && blk && blk->isSet(CacheBlk::DirtyBit)) {
        // A cache clean operation is looking for a dirty
        // block. If a dirty block is encountered a WriteClean
        // will update any copies to the path to the memory
        // until the point of reference.
        DPRINTF(CacheVerbose, "%s: packet %s found block: %s\n",
                __func__, pkt->print(), blk->print());
        PacketPtr wb_pkt = writecleanBlk(blk, pkt->req->getDest(), pkt->id);
        writebacks.push_back(wb_pkt);
        pkt->setSatisfied();
    }

    // handle writebacks resulting from the access here to ensure they
    // logically precede anything happening below
    doWritebacksAtomic(writebacks);
    assert(writebacks.empty());

    if (!satisfied) {
        lat += handleAtomicReqMiss(pkt, blk, writebacks);
    }

    // Note that we don't invoke the prefetcher at all in atomic mode.
    // It's not clear how to do it properly, particularly for
    // prefetchers that aggressively generate prefetch candidates and
    // rely on bandwidth contention to throttle them; these will tend
    // to pollute the cache in atomic mode since there is no bandwidth
    // contention.  If we ever do want to enable prefetching in atomic
    // mode, though, this is the place to do it... see timingAccess()
    // for an example (though we'd want to issue the prefetch(es)
    // immediately rather than calling requestMemSideBus() as we do
    // there).

    // do any writebacks resulting from the response handling
    doWritebacksAtomic(writebacks);

    // if we used temp block, check to see if it's valid and if so
    // clear it out, but only do so after the call to recvAtomic is
    // finished so that any downstream observers (such as a snoop
    // filter), first see the fill, and only then see the eviction
    if (blk == tempBlock && tempBlock->isValid()) {
        // the atomic CPU calls recvAtomic for fetch and load/store
        // sequentially, and we may already have a tempBlock
        // writeback from the fetch that we have not yet sent
        if (tempBlockWriteback) {
            // if that is the case, write the previous one back, and
            // do not schedule any new event
            writebackTempBlockAtomic();
        } else {
            // the writeback/clean eviction happens after the call to
            // recvAtomic has finished (but before any successive
            // calls), so that the response handling from the fill is
            // allowed to happen first
            schedule(writebackTempBlockAtomicEvent, curTick());
        }

        tempBlockWriteback = evictBlock(blk);
    }

    if (pkt->needsResponse()) {
        pkt->makeAtomicResponse();
    }

    return lat * clockPeriod();
}
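
// The atomic path reports latency directly as ticks: e.g. with lat = 5
// cycles and a 500-tick clock period (illustrative values), recvAtomic
// returns 2500 ticks to the caller.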

void
BaseCache::functionalAccess(PacketPtr pkt, bool from_cpu_side)
{
    Addr blk_addr = pkt->getBlockAddr(blkSize);
    bool is_secure = pkt->isSecure();
    CacheBlk *blk = tags->findBlock({pkt->getAddr(), is_secure});
    MSHR *mshr = mshrQueue.findMatch(blk_addr, is_secure);

    pkt->pushLabel(name());

    CacheBlkPrintWrapper cbpw(blk);

    // Note that just because an L2/L3 has valid data doesn't mean an
    // L1 doesn't have a more up-to-date modified copy that still
    // needs to be found.  As a result we always update the request if
    // we have it, but only declare it satisfied if we are the owner.

    // see if we have data at all (owned or otherwise)
    bool have_data = blk && blk->isValid()
        && pkt->trySatisfyFunctional(&cbpw, blk_addr, is_secure, blkSize,
                                     blk->data);

    // data we have is dirty if marked as such or if we have an
    // in-service MSHR that is pending a modified line
    bool have_dirty =
        have_data && (blk->isSet(CacheBlk::DirtyBit) ||
                      (mshr && mshr->inService && mshr->isPendingModified()));

    bool done = have_dirty ||
        cpuSidePort.trySatisfyFunctional(pkt) ||
        mshrQueue.trySatisfyFunctional(pkt) ||
        writeBuffer.trySatisfyFunctional(pkt) ||
        memSidePort.trySatisfyFunctional(pkt);

    DPRINTF(CacheVerbose, "%s: %s %s%s%s\n", __func__, pkt->print(),
            (blk && blk->isValid()) ? "valid " : "",
            have_data ? "data " : "", done ? "done " : "");

    // We're leaving the cache, so pop cache->name() label
    pkt->popLabel();

    if (done) {
        pkt->makeResponse();
    } else {
        // if it came as a request from the CPU side then make sure it
        // continues towards the memory side
        if (from_cpu_side) {
            memSidePort.sendFunctional(pkt);
        } else if (cpuSidePort.isSnooping()) {
            // if it came from the memory side, it must be a snoop request
            // and we should only forward it if we are forwarding snoops
            cpuSidePort.sendFunctionalSnoop(pkt);
        }
    }
}

void
BaseCache::updateBlockData(CacheBlk *blk, const PacketPtr cpkt,
    bool has_old_data)
{
    CacheDataUpdateProbeArg data_update(
        regenerateBlkAddr(blk), blk->isSecure(),
        blk->getSrcRequestorId(), accessor);
    if (ppDataUpdate->hasListeners()) {
        if (has_old_data) {
            data_update.oldData = std::vector<uint64_t>(blk->data,
                blk->data + (blkSize / sizeof(uint64_t)));
        }
    }

    // Actually perform the data update
    if (cpkt) {
        cpkt->writeDataToBlock(blk->data, blkSize);
    }

    if (ppDataUpdate->hasListeners()) {
        if (cpkt) {
            data_update.newData = std::vector<uint64_t>(blk->data,
                blk->data + (blkSize / sizeof(uint64_t)));
            data_update.hwPrefetched = blk->wasPrefetched();
        }
        ppDataUpdate->notify(data_update);
    }
}

void
BaseCache::cmpAndSwap(CacheBlk *blk, PacketPtr pkt)
{
    assert(pkt->isRequest());

    uint64_t overwrite_val;
    bool overwrite_mem;
    uint64_t condition_val64;
    uint32_t condition_val32;

    int offset = pkt->getOffset(blkSize);
    uint8_t *blk_data = blk->data + offset;

    assert(sizeof(uint64_t) >= pkt->getSize());

    // Get a copy of the old block's contents for the probe before the update
    CacheDataUpdateProbeArg data_update(
        regenerateBlkAddr(blk), blk->isSecure(), blk->getSrcRequestorId(),
        accessor);
    if (ppDataUpdate->hasListeners()) {
        data_update.oldData = std::vector<uint64_t>(blk->data,
            blk->data + (blkSize / sizeof(uint64_t)));
    }

    overwrite_mem = true;
    // keep a copy of our possible write value, and copy what is at the
    // memory address into the packet
    pkt->writeData((uint8_t *)&overwrite_val);
    pkt->setData(blk_data);

    if (pkt->req->isCondSwap()) {
        if (pkt->getSize() == sizeof(uint64_t)) {
            condition_val64 = pkt->req->getExtraData();
            overwrite_mem = !std::memcmp(&condition_val64, blk_data,
                                         sizeof(uint64_t));
        } else if (pkt->getSize() == sizeof(uint32_t)) {
            condition_val32 = (uint32_t)pkt->req->getExtraData();
            overwrite_mem = !std::memcmp(&condition_val32, blk_data,
                                         sizeof(uint32_t));
        } else
            panic("Invalid size for conditional read/write\n");
    }

    if (overwrite_mem) {
        std::memcpy(blk_data, &overwrite_val, pkt->getSize());
        blk->setCoherenceBits(CacheBlk::DirtyBit);

        if (ppDataUpdate->hasListeners()) {
            data_update.newData = std::vector<uint64_t>(blk->data,
                blk->data + (blkSize / sizeof(uint64_t)));
            ppDataUpdate->notify(data_update);
        }
    }
}
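
// Example of the conditional-swap path above (values are illustrative):
// a 64-bit CondSwap carrying extra data 0x42 overwrites the block only
// if the current 8 bytes at the target offset equal 0x42; in either
// case the packet carries back the old memory value via setData().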

QueueEntry*
BaseCache::getNextQueueEntry()
{
    // Check both MSHR queue and write buffer for potential requests,
    // note that null does not mean there is no request, it could
    // simply be that it is not ready
    MSHR *miss_mshr = mshrQueue.getNext();
    WriteQueueEntry *wq_entry = writeBuffer.getNext();

    // If we got a write buffer request ready, first priority is a
    // full write buffer, otherwise we favour the miss requests
    if (wq_entry && (writeBuffer.isFull() || !miss_mshr)) {
        // need to search MSHR queue for conflicting earlier miss.
        MSHR *conflict_mshr = mshrQueue.findPending(wq_entry);

        if (conflict_mshr && conflict_mshr->order < wq_entry->order) {
            // Service misses in order until conflict is cleared.
            return conflict_mshr;

            // @todo Note that we ignore the ready time of the conflict here
        }

        // No conflicts; issue write
        return wq_entry;
    } else if (miss_mshr) {
        // need to check for conflicting earlier writeback
        WriteQueueEntry *conflict_mshr = writeBuffer.findPending(miss_mshr);
        if (conflict_mshr) {
            // not sure why we don't check order here... it was in the
            // original code but commented out.

            // The only way this happens is if we are
            // doing a write and we didn't have permissions
            // then subsequently saw a writeback (owned got evicted)
            // We need to make sure to perform the writeback first
            // To preserve the dirty data, then we can issue the write

            // should we return wq_entry here instead?  I.e. do we
            // have to flush writes in order?  I don't think so... not
            // for Alpha anyway.  Maybe for x86?
            return conflict_mshr;

            // @todo Note that we ignore the ready time of the conflict here
        }

        // No conflicts; issue read
        return miss_mshr;
    }

    // fall through... no pending requests.  Try a prefetch.
    assert(!miss_mshr && !wq_entry);
    if (prefetcher && mshrQueue.canPrefetch() && !isBlocked()) {
        // If we have a miss queue slot, we can try a prefetch
        PacketPtr pkt = prefetcher->getPacket();
        if (pkt) {
            Addr pf_addr = pkt->getBlockAddr(blkSize);
            if (tags->findBlock({pf_addr, pkt->isSecure()})) {
                DPRINTF(HWPrefetch, "Prefetch %#x has hit in cache, "
                        "dropped.\n", pf_addr);
                prefetcher->pfHitInCache();
                // free the request and packet
                delete pkt;
            } else if (mshrQueue.findMatch(pf_addr, pkt->isSecure())) {
                DPRINTF(HWPrefetch, "Prefetch %#x has hit in a MSHR, "
                        "dropped.\n", pf_addr);
                prefetcher->pfHitInMSHR();
                // free the request and packet
                delete pkt;
            } else if (writeBuffer.findMatch(pf_addr, pkt->isSecure())) {
                DPRINTF(HWPrefetch, "Prefetch %#x has hit in the "
                        "Write Buffer, dropped.\n", pf_addr);
                prefetcher->pfHitInWB();
                // free the request and packet
                delete pkt;
            } else {
                // Update statistic on number of prefetches issued
                // (hwpf_mshr_misses)
                assert(pkt->req->requestorId() < system->maxRequestors());
                stats.cmdStats(pkt).mshrMisses[pkt->req->requestorId()]++;

                // allocate an MSHR and return it, note
                // that we send the packet straight away, so do not
                // schedule the send
                return allocateMissBuffer(pkt, curTick(), false);
            }
        }
    }

    return nullptr;
}
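
// Arbitration summary for getNextQueueEntry(): a ready write-buffer
// entry is chosen only when the write buffer is full or no miss is
// ready, otherwise misses win; same-block conflicts between the two
// queues are resolved by allocation order; hardware prefetches are
// considered last, and only when an MSHR slot is spare and the prefetch
// does not hit in the tags, the MSHRs, or the write buffer.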

bool
BaseCache::handleEvictions(std::vector<CacheBlk*> &evict_blks,
    PacketList &writebacks)
{
    bool replacement = false;
    for (const auto& blk : evict_blks) {
        if (blk->isValid()) {
            replacement = true;

            const MSHR* mshr =
                mshrQueue.findMatch(regenerateBlkAddr(blk), blk->isSecure());
            if (mshr) {
                // Must be an outstanding upgrade or clean request on a block
                // we're about to replace
                assert((!blk->isSet(CacheBlk::WritableBit) &&
                    mshr->needsWritable()) || mshr->isCleaning());
                return false;
            }
        }
    }

    // The victim will be replaced by a new entry, so increase the replacement
    // counter if a valid block is being replaced
    if (replacement) {
        stats.replacements++;

        // Evict valid blocks associated to this victim block
        for (auto& blk : evict_blks) {
            if (blk->isValid()) {
                evictBlock(blk, writebacks);
            }
        }
    }

    return true;
}

bool
BaseCache::updateCompressionData(CacheBlk *&blk, const uint64_t* data,
                                 PacketList &writebacks)
{
    // tempBlock does not exist in the tags, so don't do anything for it.
    if (blk == tempBlock) {
        return true;
    }

    // The compressor is called to compress the updated data, so that its
    // metadata can be updated.
    Cycles compression_lat = Cycles(0);
    Cycles decompression_lat = Cycles(0);
    const auto comp_data =
        compressor->compress(data, compression_lat, decompression_lat);
    std::size_t compression_size = comp_data->getSizeBits();

    // Get previous compressed size
    CompressionBlk* compression_blk = static_cast<CompressionBlk*>(blk);
    [[maybe_unused]] const std::size_t prev_size =
        compression_blk->getSizeBits();

    // If compressed size didn't change enough to modify its co-allocatability
    // there is nothing to do. Otherwise we may be facing a data expansion
    // (block passing from more compressed to less compressed state), or a
    // data contraction (less to more).
    bool is_data_expansion = false;
    bool is_data_contraction = false;
    const CompressionBlk::OverwriteType overwrite_type =
        compression_blk->checkExpansionContraction(compression_size);
    std::string op_name = "";
    if (overwrite_type == CompressionBlk::DATA_EXPANSION) {
        op_name = "expansion";
        is_data_expansion = true;
    } else if ((overwrite_type == CompressionBlk::DATA_CONTRACTION) &&
        moveContractions) {
        op_name = "contraction";
        is_data_contraction = true;
    }

    // If block changed compression state, it was possibly co-allocated with
    // other blocks and cannot be co-allocated anymore, so one or more blocks
    // must be evicted to make room for the expanded/contracted block
    std::vector<CacheBlk*> evict_blks;
    if (is_data_expansion || is_data_contraction) {
        bool victim_itself = false;
        CacheBlk *victim = nullptr;
        if (replaceExpansions || is_data_contraction) {
            victim = tags->findVictim(
                {regenerateBlkAddr(blk), blk->isSecure()},
                compression_size, evict_blks,
                blk->getPartitionId());

            // It is valid to return nullptr if there is no victim
            if (!victim) {
                return false;
            }

            // If the victim block is itself the block won't need to be moved,
            // and the victim should not be evicted
            if (blk == victim) {
                victim_itself = true;
                auto it = std::find_if(evict_blks.begin(), evict_blks.end(),
                    [&blk](CacheBlk* evict_blk){ return evict_blk == blk; });
                evict_blks.erase(it);
            }

            // Print victim block's information
            DPRINTF(CacheRepl, "Data %s replacement victim: %s\n",
                    op_name, victim->print());
        } else {
            // If we do not move the expanded block, we must make room for
            // the expansion to happen, so evict every co-allocated block
            const SuperBlk* superblock = static_cast<const SuperBlk*>(
                compression_blk->getSectorBlock());
            for (auto& sub_blk : superblock->blks) {
                if (sub_blk->isValid() && (blk != sub_blk)) {
                    evict_blks.push_back(sub_blk);
                }
            }
        }

        // Try to evict blocks; if it fails, give up on update
        if (!handleEvictions(evict_blks, writebacks)) {
            return false;
        }

        DPRINTF(CacheComp, "Data %s: [%s] from %d to %d bits\n",
                op_name, blk->print(), prev_size, compression_size);

        if (!victim_itself && (replaceExpansions || is_data_contraction)) {
            // Move the block's contents to the invalid block so that it now
            // co-allocates with the other existing superblock entry
            tags->moveBlock(blk, victim);
            blk = victim;
            compression_blk = static_cast<CompressionBlk*>(blk);
        }
    }

    // Update the number of data expansions/contractions
    if (is_data_expansion) {
        stats.dataExpansions++;
    } else if (is_data_contraction) {
        stats.dataContractions++;
    }

    compression_blk->setSizeBits(compression_size);
    compression_blk->setDecompressionLatency(decompression_lat);

    return true;
}
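
// Worked example for the path above (sizes are illustrative): a block
// compressed to 256 bits co-allocates with a neighbour in a 512-bit
// superblock entry. A write recompresses it to 384 bits, a data
// expansion, so either the block is moved to a newly chosen victim
// entry (replaceExpansions) or every other valid sub-block of its
// superblock is evicted so it can expand in place.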

void
BaseCache::satisfyRequest(PacketPtr pkt, CacheBlk *blk, bool, bool)
{
    assert(pkt->isRequest());

    assert(blk && blk->isValid());
    // Occasionally this is not true... if we are a lower-level cache
    // satisfying a string of Read and ReadEx requests from
    // upper-level caches, a Read will mark the block as shared but we
    // can satisfy a following ReadEx anyway since we can rely on the
    // Read requestor(s) to have buffered the ReadEx snoop and to
    // invalidate their blocks after receiving them.
    // assert(!pkt->needsWritable() || blk->isSet(CacheBlk::WritableBit));
    assert(pkt->getOffset(blkSize) + pkt->getSize() <= blkSize);

    // Check RMW operations first since both isRead() and
    // isWrite() will be true for them
    if (pkt->cmd == MemCmd::SwapReq) {
        if (pkt->isAtomicOp()) {
            // Get a copy of the old block's contents for the probe before
            // the update
            CacheDataUpdateProbeArg data_update(
                regenerateBlkAddr(blk), blk->isSecure(),
                blk->getSrcRequestorId(), accessor);
            if (ppDataUpdate->hasListeners()) {
                data_update.oldData = std::vector<uint64_t>(blk->data,
                    blk->data + (blkSize / sizeof(uint64_t)));
            }

            // extract data from cache and save it into the data field in
            // the packet as a return value from this atomic op
            int offset = tags->extractBlkOffset(pkt->getAddr());
            uint8_t *blk_data = blk->data + offset;
            pkt->setData(blk_data);

            // execute AMO operation
            (*(pkt->getAtomicOp()))(blk_data);

            // Inform of this block's data contents update
            if (ppDataUpdate->hasListeners()) {
                data_update.newData = std::vector<uint64_t>(blk->data,
                    blk->data + (blkSize / sizeof(uint64_t)));
                data_update.hwPrefetched = blk->wasPrefetched();
                ppDataUpdate->notify(data_update);
            }

            // set block status to dirty
            blk->setCoherenceBits(CacheBlk::DirtyBit);
        } else {
            cmpAndSwap(blk, pkt);
        }
    } else if (pkt->isWrite()) {
        // we have the block in a writable state and can go ahead,
        // note that the line may also be considered writable in
        // downstream caches along the path to memory, but always
        // Exclusive, and never Modified
        assert(blk->isSet(CacheBlk::WritableBit));
        // Write or WriteLine at the first cache with block in writable state
        if (blk->checkWrite(pkt)) {
            updateBlockData(blk, pkt, true);
        }
        // Always mark the line as dirty (and thus transition to the
        // Modified state) even if we are a failed StoreCond so we
        // supply data to any snoops that have appended themselves to
        // this cache before knowing the store will fail.
        blk->setCoherenceBits(CacheBlk::DirtyBit);
        DPRINTF(CacheVerbose, "%s for %s (write)\n", __func__, pkt->print());
    } else if (pkt->isRead()) {
        if (pkt->isLLSC()) {
            blk->trackLoadLocked(pkt);
        }

        // all read responses have a data payload
        assert(pkt->hasRespData());
        pkt->setDataFromBlock(blk->data, blkSize);
    } else if (pkt->isUpgrade()) {
        // sanity check
        assert(!pkt->hasSharers());

        if (blk->isSet(CacheBlk::DirtyBit)) {
            // we were in the Owned state, and a cache above us that
            // has the line in Shared state needs to be made aware
            // that the data it already has is in fact dirty
            pkt->setCacheResponding();
            blk->clearCoherenceBits(CacheBlk::DirtyBit);
        }
    } else if (pkt->isClean()) {
        blk->clearCoherenceBits(CacheBlk::DirtyBit);
    } else {
        assert(pkt->isInvalidate());
        invalidateBlock(blk);
        DPRINTF(CacheVerbose, "%s for %s (invalidation)\n", __func__,
                pkt->print());
    }
}

/////////////////////////////////////////////////////
//
// Access path: requests coming in from the CPU side
//
/////////////////////////////////////////////////////

Cycles
BaseCache::calculateTagOnlyLatency(const uint32_t delay,
                                   const Cycles lookup_lat) const
{
    // A tag-only access has to wait for the packet to arrive in order to
    // perform the tag lookup.
    return ticksToCycles(delay) + lookup_lat;
}

Cycles
BaseCache::calculateAccessLatency(const CacheBlk* blk, const uint32_t delay,
                                  const Cycles lookup_lat) const
{
    Cycles lat(0);

    if (blk != nullptr) {
        // As soon as the access arrives, for sequential accesses first access
        // tags, then the data entry. In the case of parallel accesses the
        // latency is dictated by the slowest of tag and data latencies.
        if (sequentialAccess) {
            lat = ticksToCycles(delay) + lookup_lat + dataLatency;
        } else {
            lat = ticksToCycles(delay) + std::max(lookup_lat, dataLatency);
        }

        // Check if the block to be accessed is available. If not, apply the
        // access latency on top of when the block is ready to be accessed.
        const Tick tick = curTick() + delay;
        const Tick when_ready = blk->getWhenReady();
        if (when_ready > tick &&
            ticksToCycles(when_ready - tick) > lat) {
            lat += ticksToCycles(when_ready - tick);
        }
    } else {
        // In case of a miss, we neglect the data access in a parallel
        // configuration (i.e., the data access will be stopped as soon as
        // we find out it is a miss), and use the tag-only latency.
        lat = calculateTagOnlyLatency(delay, lookup_lat);
    }

    return lat;
}
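
// Worked example (illustrative values): with lookup_lat = 2 cycles,
// dataLatency = 3 cycles and delay = 0, a hit costs 2 + 3 = 5 cycles in
// sequential mode, or max(2, 3) = 3 cycles in parallel mode; a miss pays
// only the tag-only 2 cycles. If the block becomes ready 8 cycles from
// now, those 8 cycles are added on top of the 3-cycle parallel hit,
// giving 11.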

bool
BaseCache::access(PacketPtr pkt, CacheBlk *&blk, Cycles &lat,
                  PacketList &writebacks)
{
    // sanity check
    assert(pkt->isRequest());

    gem5_assert(!(isReadOnly && pkt->isWrite()),
                "Should never see a write in a read-only cache %s\n",
                name());

    // Access block in the tags
    Cycles tag_latency(0);
    blk = tags->accessBlock(pkt, tag_latency);

    DPRINTF(Cache, "%s for %s %s\n", __func__, pkt->print(),
            blk ? "hit " + blk->print() : "miss");

    if (pkt->req->isCacheMaintenance()) {
        // A cache maintenance operation is always forwarded to the
        // memory below even if the block is found in dirty state.

        // We defer any changes to the state of the block until we
        // create and mark as in service the mshr for the downstream
        // packet.

        // Calculate access latency on top of when the packet arrives. This
        // takes into account the bus delay.
        lat = calculateTagOnlyLatency(pkt->headerDelay, tag_latency);

        return false;
    }

    if (pkt->isEviction()) {
        // We check for presence of block in above caches before issuing
        // Writeback or CleanEvict to write buffer. Therefore the only
        // possible cases can be of a CleanEvict packet coming from above
        // encountering a Writeback generated in this cache's peer cache and
        // waiting in the write buffer. Cases of upper level peer caches
        // generating CleanEvict and Writeback or simply CleanEvict and
        // CleanEvict almost simultaneously will be caught by snoops sent out
        // by crossbar.
        WriteQueueEntry *wb_entry = writeBuffer.findMatch(pkt->getAddr(),
                                                          pkt->isSecure());
        if (wb_entry) {
            assert(wb_entry->getNumTargets() == 1);
            PacketPtr wbPkt = wb_entry->getTarget()->pkt;
            assert(wbPkt->isWriteback());

            if (pkt->isCleanEviction()) {
                // The CleanEvict and WritebackClean snoops into other
                // peer caches of the same level while traversing the
                // crossbar. If a copy of the block is found, the
                // packet is deleted in the crossbar. Hence, none of
                // the other upper level caches connected to this
                // cache have the block, so we can clear the
                // BLOCK_CACHED flag in the Writeback if set and
                // discard the CleanEvict by returning true.
                wbPkt->clearBlockCached();

                // A clean evict does not need to access the data array
                lat = calculateTagOnlyLatency(pkt->headerDelay, tag_latency);

                return true;
            } else {
                assert(pkt->cmd == MemCmd::WritebackDirty);
                // Dirty writeback from above trumps our clean
                // writeback... discard here
                // Note: markInService will remove entry from writeback buffer.
                markInService(wb_entry);
                delete wbPkt;
            }
        }
    }

    // The critical latency part of a write depends only on the tag access
    if (pkt->isWrite()) {
        lat = calculateTagOnlyLatency(pkt->headerDelay, tag_latency);
    }

    // Writeback handling is a special case.  We can write the block into
    // the cache without having a writeable copy (or any copy at all).
    if (pkt->isWriteback()) {
        assert(blkSize == pkt->getSize());

        // we could get a clean writeback while we are having
        // outstanding accesses to a block, do the simple thing for
        // now and drop the clean writeback so that we do not upset
        // any ordering/decisions about ownership already taken
        if (pkt->cmd == MemCmd::WritebackClean &&
            mshrQueue.findMatch(pkt->getAddr(), pkt->isSecure())) {
            DPRINTF(Cache, "Clean writeback %#llx to block with MSHR, "
                    "dropping\n", pkt->getAddr());

            // A writeback searches for the block, then writes the data.
            // As the writeback is being dropped, the data is not touched,
            // and we just had to wait for the time to find a match in the
            // MSHR. As of now assume an MSHR queue search takes as long as
            // a tag lookup for simplicity.
            return true;
        }

        const bool has_old_data = blk && blk->isValid();
        if (!blk) {
            // need to do a replacement
            blk = allocateBlock(pkt, writebacks);
            if (!blk) {
                // no replaceable block available: give up, fwd to next level.
                incMissCount(pkt);
                return false;
            }

            blk->setCoherenceBits(CacheBlk::ReadableBit);
        } else if (compressor) {
            // This is an overwrite to an existing block, therefore we need
            // to check for data expansion (i.e., block was compressed with
            // a smaller size, and now it doesn't fit the entry anymore).
            // If that is the case we might need to evict blocks.
            if (!updateCompressionData(blk, pkt->getConstPtr<uint64_t>(),
                writebacks)) {
                invalidateBlock(blk);
                return false;
            }
        }

        // only mark the block dirty if we got a writeback command,
        // and leave it as is for a clean writeback
        if (pkt->cmd == MemCmd::WritebackDirty) {
            // TODO: the coherent cache can assert that the dirty bit is set
            blk->setCoherenceBits(CacheBlk::DirtyBit);
        }
        // if the packet does not have sharers, it is passing
        // writable, and we got the writeback in Modified or Exclusive
        // state, if not we are in the Owned or Shared state
        if (!pkt->hasSharers()) {
            blk->setCoherenceBits(CacheBlk::WritableBit);
        }
        // nothing else to do; writeback doesn't expect response
        assert(!pkt->needsResponse());

        updateBlockData(blk, pkt, has_old_data);
        DPRINTF(Cache, "%s new state is %s\n", __func__, blk->print());
        incHitCount(pkt);

        // When the packet metadata arrives, the tag lookup will be done while
        // the payload is arriving. Then the block will be ready to access as
        // soon as the fill is done
        blk->setWhenReady(clockEdge(fillLatency) + pkt->headerDelay +
            std::max(cyclesToTicks(tag_latency), (uint64_t)pkt->payloadDelay));

        return true;
    } else if (pkt->cmd == MemCmd::CleanEvict) {
        // A CleanEvict does not need to access the data array
        lat = calculateTagOnlyLatency(pkt->headerDelay, tag_latency);

        if (blk) {
            // Found the block in the tags, need to stop CleanEvict from
            // propagating further down the hierarchy. Returning true will
            // treat the CleanEvict like a satisfied write request and delete
            // it.
            return true;
        }
        // We didn't find the block here, propagate the CleanEvict further
        // down the memory hierarchy. Returning false will treat the CleanEvict
        // like a Writeback which could not find a replaceable block so has to
        // go to next level.
        return false;
    } else if (pkt->cmd == MemCmd::WriteClean) {
        // WriteClean handling is a special case. We can allocate a
        // block directly if it doesn't exist and we can update the
        // block immediately. The WriteClean transfers the ownership
        // of the block as well.
        assert(blkSize == pkt->getSize());

        const bool has_old_data = blk && blk->isValid();
        if (!blk) {
            if (pkt->writeThrough()) {
                // if this is a write through packet, we don't try to
                // allocate if the block is not present
                return false;
            } else {
                // a writeback that misses needs to allocate a new block
                blk = allocateBlock(pkt, writebacks);
                if (!blk) {
                    // no replaceable block available: give up, fwd to
                    // next level.
                    incMissCount(pkt);
                    return false;
                }

                blk->setCoherenceBits(CacheBlk::ReadableBit);
            }
        } else if (compressor) {
            // This is an overwrite to an existing block, therefore we need
            // to check for data expansion (i.e., block was compressed with
            // a smaller size, and now it doesn't fit the entry anymore).
            // If that is the case we might need to evict blocks.
            if (!updateCompressionData(blk, pkt->getConstPtr<uint64_t>(),
                writebacks)) {
                invalidateBlock(blk);
                return false;
            }
        }

        // at this point either this is a writeback or a write-through
        // write clean operation and the block is already in this
        // cache, we need to update the data and the block flags
        assert(blk);
        // TODO: the coherent cache can assert that the dirty bit is set
        if (!pkt->writeThrough()) {
            blk->setCoherenceBits(CacheBlk::DirtyBit);
        }
        // nothing else to do; writeback doesn't expect response
        assert(!pkt->needsResponse());

        updateBlockData(blk, pkt, has_old_data);
        DPRINTF(Cache, "%s new state is %s\n", __func__, blk->print());

        incHitCount(pkt);

        // When the packet metadata arrives, the tag lookup will be done while
        // the payload is arriving. Then the block will be ready to access as
        // soon as the fill is done
        blk->setWhenReady(clockEdge(fillLatency) + pkt->headerDelay +
            std::max(cyclesToTicks(tag_latency), (uint64_t)pkt->payloadDelay));

        // If this is a write-through packet it will be sent to cache below
        return !pkt->writeThrough();
    } else if (blk && (pkt->needsWritable() ?
            blk->isSet(CacheBlk::WritableBit) :
            blk->isSet(CacheBlk::ReadableBit))) {
        // OK to satisfy access
        incHitCount(pkt);

        // Calculate access latency based on the need to access the data array
        if (pkt->isRead()) {
            lat = calculateAccessLatency(blk, pkt->headerDelay, tag_latency);

            // When a block is compressed, it must first be decompressed
            // before being read. This adds to the access latency.
            if (compressor) {
                lat += compressor->getDecompressionLatency(blk);
            }
        } else {
            lat = calculateTagOnlyLatency(pkt->headerDelay, tag_latency);
        }

        satisfyRequest(pkt, blk);
        maintainClusivity(pkt->fromCache(), blk);

        return true;
    }

    // Can't satisfy access normally... either no block (blk == nullptr)
    // or have block but need writable

    incMissCount(pkt);

    lat = calculateAccessLatency(blk, pkt->headerDelay, tag_latency);

    if (!blk && pkt->isLLSC() && pkt->isWrite()) {
        // complete miss on store conditional... just give up now
        pkt->req->setExtraData(0);
        return true;
    }

    return false;
}

void
BaseCache::maintainClusivity(bool from_cache, CacheBlk *blk)
{
    if (from_cache && blk && blk->isValid() &&
        !blk->isSet(CacheBlk::DirtyBit) && clusivity == enums::mostly_excl) {
        // if we have responded to a cache, and our block is still
        // valid, but not dirty, and this cache is mostly exclusive
        // with respect to the cache above, drop the block
        invalidateBlock(blk);
    }
}
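
// Example: in a mostly-exclusive L2, an L1 read miss that is satisfied
// by a clean L2 block causes the L2 copy to be dropped afterwards,
// leaving the line only in the L1; a dirty copy is kept so ownership
// and the dirty data are not lost.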

CacheBlk*
BaseCache::handleFill(PacketPtr pkt, CacheBlk *blk, PacketList &writebacks,
                      bool allocate)
{
    assert(pkt->isResponse());
    Addr addr = pkt->getAddr();
    bool is_secure = pkt->isSecure();
    const bool has_old_data = blk && blk->isValid();
    const std::string old_state = (debug::Cache && blk) ? blk->print() : "";

    // When handling a fill, we should have no writes to this line.
    assert(addr == pkt->getBlockAddr(blkSize));
    assert(!writeBuffer.findMatch(addr, is_secure));

    if (!blk) {
        // better have read new data...
        assert(pkt->hasData() || pkt->cmd == MemCmd::InvalidateResp);

        // need to do a replacement if allocating, otherwise we stick
        // with the temporary storage
        blk = allocate ? allocateBlock(pkt, writebacks) : nullptr;

        if (!blk) {
            // No replaceable block or a mostly exclusive
            // cache... just use temporary storage to complete the
            // current request and then get rid of it
            blk = tempBlock;
            tempBlock->insert({addr, is_secure});
            DPRINTF(Cache, "using temp block for %#llx (%s)\n", addr,
                    is_secure ? "s" : "ns");
        }
    } else {
        // existing block... probably an upgrade
        // don't clear block status... if block is already dirty we
        // don't want to lose that
    }

    // Block is guaranteed to be valid at this point
    assert(blk->isValid());
    assert(blk->isSecure() == is_secure);
    assert(regenerateBlkAddr(blk) == addr);

    blk->setCoherenceBits(CacheBlk::ReadableBit);

    // sanity check for whole-line writes, which should always be
    // marked as writable as part of the fill, and then later marked
    // dirty as part of satisfyRequest
    if (pkt->cmd == MemCmd::InvalidateResp) {
        assert(!pkt->hasSharers());
    }

    // here we deal with setting the appropriate state of the line,
    // and we start by looking at the hasSharers flag, and ignore the
    // cacheResponding flag (normally signalling dirty data) if the
    // packet has sharers, thus the line is never allocated as Owned
    // (dirty but not writable), and always ends up being either
    // Shared, Exclusive or Modified, see Packet::setCacheResponding
    // for more details
    if (!pkt->hasSharers()) {
        // we could get a writable line from memory (rather than a
        // cache) even in a read-only cache, note that we set this bit
        // even for a read-only cache, possibly revisit this decision
        blk->setCoherenceBits(CacheBlk::WritableBit);

        // check if we got this via cache-to-cache transfer (i.e., from a
        // cache that had the block in Modified or Owned state)
        if (pkt->cacheResponding()) {
            // we got the block in Modified state, and invalidated the
            // owners copy
            blk->setCoherenceBits(CacheBlk::DirtyBit);

            gem5_assert(!isReadOnly, "Should never see dirty snoop response "
                        "in read-only cache %s\n", name());
        }
    }

    DPRINTF(Cache, "Block addr %#llx (%s) moving from %s to %s\n",
            addr, is_secure ? "s" : "ns", old_state, blk->print());

    // if we got new data, copy it in (checking for a read response
    // and a response that has data is the same in the end)
    if (pkt->isRead()) {
        // sanity checks
        assert(pkt->hasData());
        assert(pkt->getSize() == blkSize);

        updateBlockData(blk, pkt, has_old_data);
    }
    // The block will be ready when the payload arrives and the fill is done
    blk->setWhenReady(clockEdge(fillLatency) + pkt->headerDelay +
                      pkt->payloadDelay);

    return blk;
}
1665
1666CacheBlk*
1668{
1669 // Get address
1670 const Addr addr = pkt->getAddr();
1671
1672 // Get secure bit
1673 const bool is_secure = pkt->isSecure();
1674
1675 // Block size and compression related access latency. Only relevant if
1676 // using a compressor, otherwise there is no extra delay, and the block
1677 // is fully sized
1678 std::size_t blk_size_bits = blkSize*8;
1679 Cycles compression_lat = Cycles(0);
1680 Cycles decompression_lat = Cycles(0);
1681
1682 // If a compressor is being used, it is called to compress data before
1683 // insertion. Although in Gem5 the data is stored uncompressed, even if a
1684 // compressor is used, the compression/decompression methods are called to
1685 // calculate the amount of extra cycles needed to read or write compressed
1686 // blocks.
1687 if (compressor && pkt->hasData()) {
1688 const auto comp_data = compressor->compress(
1689 pkt->getConstPtr<uint64_t>(), compression_lat, decompression_lat);
1690 blk_size_bits = comp_data->getSizeBits();
1691 }
1692
1693 // get partitionId from Packet
1694 const auto partition_id = partitionManager ?
1695 partitionManager->readPacketPartitionID(pkt) : 0;
1696 // Find replacement victim
1697 std::vector<CacheBlk*> evict_blks;
1698 CacheBlk *victim = tags->findVictim({addr, is_secure}, blk_size_bits,
1699 evict_blks, partition_id);
1700
1701 // It is valid to return nullptr if there is no victim
1702 if (!victim)
1703 return nullptr;
1704
1705 // Print victim block's information
1706 DPRINTF(CacheRepl, "Replacement victim: %s\n", victim->print());
1707
1708 // Try to evict blocks; if it fails, give up on allocation
1709 if (!handleEvictions(evict_blks, writebacks)) {
1710 return nullptr;
1711 }
1712
1713 // Insert new block at victimized entry
1714 tags->insertBlock(pkt, victim);
1715
1716 // If using a compressor, set compression data. This must be done after
1717 // insertion, as the compression bit may be set.
1718 if (compressor) {
1719 compressor->setSizeBits(victim, blk_size_bits);
1720 compressor->setDecompressionLatency(victim, decompression_lat);
1721 }
1722
1723 return victim;
1724}
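// Editor's usage sketch (hypothetical caller, mirroring handleFill()
// above): allocateBlock() may legitimately return nullptr, so callers must
// be prepared to fall back to tempBlock and to emit any writebacks it
// gathered while evicting the victim:
//
//     PacketList writebacks;
//     CacheBlk *blk = allocateBlock(pkt, writebacks);
//     if (!blk) {
//         blk = tempBlock;
//         tempBlock->insert({addr, is_secure});
//     }
//     doWritebacks(writebacks, forward_time);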
1725
1726void
1727 BaseCache::invalidateBlock(CacheBlk *blk)
1728{
1729 // If block is still marked as prefetched, then it hasn't been used
1730 if (blk->wasPrefetched()) {
1731 prefetcher->prefetchUnused();
1732 }
1733
1734 // Notify that the data contents for this address are no longer present
1735 updateBlockData(blk, nullptr, blk->isValid());
1736
1737 // If handling a block present in the Tags, let it do its invalidation
1738 // process, which will update stats and invalidate the block itself
1739 if (blk != tempBlock) {
1740 tags->invalidate(blk);
1741 } else {
1742 tempBlock->invalidate();
1743 }
1744}
1745
1746void
1747 BaseCache::evictBlock(CacheBlk *blk, PacketList &writebacks)
1748{
1749 PacketPtr pkt = evictBlock(blk);
1750 if (pkt) {
1751 writebacks.push_back(pkt);
1752 }
1753}
1754
1755 PacketPtr
1756 BaseCache::writebackBlk(CacheBlk *blk)
1757{
1758 gem5_assert(!isReadOnly || writebackClean,
1759 "Writeback from read-only cache");
1760 assert(blk && blk->isValid() &&
1761 (blk->isSet(CacheBlk::DirtyBit) || writebackClean));
1762
1763 stats.writebacks[Request::wbRequestorId]++;
1764
1765 RequestPtr req = std::make_shared<Request>(
1766 regenerateBlkAddr(blk), blkSize, 0, Request::wbRequestorId);
1767
1768 if (blk->isSecure())
1769 req->setFlags(Request::SECURE);
1770
1771 req->taskId(blk->getTaskId());
1772
1773 PacketPtr pkt =
1774 new Packet(req, blk->isSet(CacheBlk::DirtyBit) ?
1775 MemCmd::WritebackDirty : MemCmd::WritebackClean);
1776
1777 DPRINTF(Cache, "Create Writeback %s writable: %d, dirty: %d\n",
1778 pkt->print(), blk->isSet(CacheBlk::WritableBit),
1779 blk->isSet(CacheBlk::DirtyBit));
1780
1781 if (blk->isSet(CacheBlk::WritableBit)) {
1782 // not asserting shared means we pass the block in modified
1783 // state, mark our own block non-writeable
1784 blk->clearCoherenceBits(CacheBlk::WritableBit);
1785 } else {
1786 // we are in the Owned state, tell the receiver
1787 pkt->setHasSharers();
1788 }
1789
1790 // make sure the block is not marked dirty
1791 blk->clearCoherenceBits(CacheBlk::DirtyBit);
1792
1793 pkt->allocate();
1794 pkt->setDataFromBlock(blk->data, blkSize);
1795
1796 // When a block is compressed, it must first be decompressed before being
1797 // sent for writeback.
1798 if (compressor) {
1799 pkt->payloadDelay = compressor->getDecompressionLatency(blk);
1800 }
1801
1802 return pkt;
1803}
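// Editor's note (illustrative summary, not part of the gem5 sources): the
// command and hasSharers encoding chosen above reflects the state the
// block is evicted from:
//
//     block state  command          hasSharers
//     Modified     WritebackDirty   false (receiver may mark writable)
//     Owned        WritebackDirty   true  (receiver must not mark writable)
//     Exclusive    WritebackClean   false
//     Shared       WritebackClean   true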
1804
1805 PacketPtr
1806 BaseCache::writecleanBlk(CacheBlk *blk, Request::Flags dest, PacketId id)
1807{
1808 RequestPtr req = std::make_shared<Request>(
1809 regenerateBlkAddr(blk), blkSize, 0, Request::wbRequestorId);
1810
1811 if (blk->isSecure()) {
1812 req->setFlags(Request::SECURE);
1813 }
1814 req->taskId(blk->getTaskId());
1815
1816 PacketPtr pkt = new Packet(req, MemCmd::WriteClean, blkSize, id);
1817
1818 if (dest) {
1819 req->setFlags(dest);
1820 pkt->setWriteThrough();
1821 }
1822
1823 DPRINTF(Cache, "Create %s writable: %d, dirty: %d\n", pkt->print(),
1824 blk->isSet(CacheBlk::WritableBit), blk->isSet(CacheBlk::DirtyBit));
1825
1826 if (blk->isSet(CacheBlk::WritableBit)) {
1827 // not asserting shared means we pass the block in modified
1828 // state, mark our own block non-writeable
1829 blk->clearCoherenceBits(CacheBlk::WritableBit);
1830 } else {
1831 // we are in the Owned state, tell the receiver
1832 pkt->setHasSharers();
1833 }
1834
1835 // make sure the block is not marked dirty
1836 blk->clearCoherenceBits(CacheBlk::DirtyBit);
1837
1838 pkt->allocate();
1839 pkt->setDataFromBlock(blk->data, blkSize);
1840
1841 // When a block is compressed, it must first be decompressed before being
1842 // sent for writeback.
1843 if (compressor) {
1844 pkt->payloadDelay = compressor->getDecompressionLatency(blk);
1845 }
1846
1847 return pkt;
1848}
1849
1850
1851void
1852 BaseCache::memWriteback()
1853{
1854 tags->forEachBlk([this](CacheBlk &blk) { writebackVisitor(blk); });
1855}
1856
1857void
1858 BaseCache::memInvalidate()
1859{
1860 tags->forEachBlk([this](CacheBlk &blk) { invalidateVisitor(blk); });
1861}
1862
1863bool
1864 BaseCache::isDirty() const
1865{
1866 return tags->anyBlk([](CacheBlk &blk) {
1867 return blk.isSet(CacheBlk::DirtyBit); });
1868}
1869
1870bool
1871 BaseCache::coalesce() const
1872{
1873 return writeAllocator && writeAllocator->coalesce();
1874}
1875
1876void
1877 BaseCache::writebackVisitor(CacheBlk &blk)
1878{
1879 if (blk.isSet(CacheBlk::DirtyBit)) {
1880 assert(blk.isValid());
1881
1882 RequestPtr request = std::make_shared<Request>(
1883 regenerateBlkAddr(&blk), blkSize, 0, Request::funcRequestorId);
1884
1885 request->taskId(blk.getTaskId());
1886 if (blk.isSecure()) {
1887 request->setFlags(Request::SECURE);
1888 }
1889
1890 Packet packet(request, MemCmd::WriteReq);
1891 packet.dataStatic(blk.data);
1892
1893 memSidePort.sendFunctional(&packet);
1894
1894
1895 blk.clearCoherenceBits(CacheBlk::DirtyBit);
1896 }
1897}
1898
1899void
1900 BaseCache::invalidateVisitor(CacheBlk &blk)
1901{
1902 if (blk.isSet(CacheBlk::DirtyBit))
1903 warn_once("Invalidating dirty cache lines. " \
1904 "Expect things to break.\n");
1905
1906 if (blk.isValid()) {
1907 assert(!blk.isSet(CacheBlk::DirtyBit));
1908 invalidateBlock(&blk);
1909 }
1910}
1911
1912Tick
1913 BaseCache::nextQueueReadyTime() const
1914{
1915 Tick nextReady = std::min(mshrQueue.nextReadyTime(),
1916 writeBuffer.nextReadyTime());
1917
1918 // Don't signal prefetch ready time if no MSHRs available
1919 // Will signal once enough MSHRs are deallocated
1920 if (prefetcher && mshrQueue.canPrefetch() && !isBlocked()) {
1921 nextReady = std::min(nextReady,
1922 prefetcher->nextPrefetchReadyTime());
1923 }
1924
1925 return nextReady;
1926}
1927
1928
1929bool
1930 BaseCache::sendMSHRQueuePacket(MSHR *mshr)
1931{
1932 assert(mshr);
1933
1934 // use request from 1st target
1935 PacketPtr tgt_pkt = mshr->getTarget()->pkt;
1936
1937 DPRINTF(Cache, "%s: MSHR %s\n", __func__, tgt_pkt->print());
1938
1939 // if the cache is in write coalescing mode or (additionally) in
1940 // no allocation mode, and we have a write packet with an MSHR
1941 // that is not a whole-line write (due to incompatible flags etc),
1942 // then reset the write mode
1943 if (writeAllocator && writeAllocator->coalesce() && tgt_pkt->isWrite()) {
1944 if (!mshr->isWholeLineWrite()) {
1945 // if we are currently write coalescing, hold on the
1946 // MSHR as many cycles extra as we need to completely
1947 // write a cache line
1948 if (writeAllocator->delay(mshr->blkAddr)) {
1949 Tick delay = blkSize / tgt_pkt->getSize() * clockPeriod();
1950 DPRINTF(CacheVerbose, "Delaying pkt %s %llu ticks to allow "
1951 "for write coalescing\n", tgt_pkt->print(), delay);
1952 mshrQueue.delay(mshr, delay);
1953 return false;
1954 } else {
1955 writeAllocator->reset();
1956 }
1957 } else {
1958 writeAllocator->resetDelay(mshr->blkAddr);
1959 }
1960 }
1961
1962 CacheBlk *blk = tags->findBlock({mshr->blkAddr, mshr->isSecure});
1963
1964 // either a prefetch that is not present upstream, or a normal
1965 // MSHR request, proceed to get the packet to send downstream
1966 PacketPtr pkt = createMissPacket(tgt_pkt, blk, mshr->needsWritable(),
1967 mshr->isWholeLineWrite());
1968
1969 mshr->isForward = (pkt == nullptr);
1970
1971 if (mshr->isForward) {
1972 // not a cache block request, but a response is expected
1973 // make copy of current packet to forward, keep current
1974 // copy for response handling
1975 pkt = new Packet(tgt_pkt, false, true);
1976 assert(!pkt->isWrite());
1977 }
1978
1979 // play it safe and append (rather than set) the sender state,
1980 // as forwarded packets may already have existing state
1981 pkt->pushSenderState(mshr);
1982
1983 if (pkt->isClean() && blk && blk->isSet(CacheBlk::DirtyBit)) {
1984 // A cache clean operation is looking for a dirty block. Mark
1985 // the packet so that the destination xbar can determine that
1986 // there will be a follow-up write packet as well.
1987 pkt->setSatisfied();
1988 }
1989
1990 if (!memSidePort.sendTimingReq(pkt)) {
1991 // we are awaiting a retry, but we
1992 // delete the packet and will be creating a new packet
1993 // when we get the opportunity
1994 delete pkt;
1995
1996 // note that we have now masked any requestBus and
1997 // schedSendEvent (we will wait for a retry before
1998 // doing anything), and this is so even if we do not
1999 // care about this packet and might override it before
2000 // it gets retried
2001 return true;
2002 } else {
2003 // As part of the call to sendTimingReq the packet is
2004 // forwarded to all neighbouring caches (and any caches
2005 // above them) as a snoop. Thus at this point we know if
2006 // any of the neighbouring caches are responding, and if
2007 // so, we know it is dirty, and we can determine if it is
2008 // being passed as Modified, making our MSHR the ordering
2009 // point
2010 bool pending_modified_resp = !pkt->hasSharers() &&
2011 pkt->cacheResponding();
2012 markInService(mshr, pending_modified_resp);
2013
2014 if (pkt->isClean() && blk && blk->isSet(CacheBlk::DirtyBit)) {
2015 // A cache clean operation is looking for a dirty
2016 // block. If a dirty block is encountered, a WriteClean
2017 // will update any copies on the path to memory
2018 // down to the point of reference.
2019 DPRINTF(CacheVerbose, "%s: packet %s found block: %s\n",
2020 __func__, pkt->print(), blk->print());
2021 PacketPtr wb_pkt = writecleanBlk(blk, pkt->req->getDest(),
2022 pkt->id);
2023 PacketList writebacks;
2024 writebacks.push_back(wb_pkt);
2025 doWritebacks(writebacks, 0);
2026 }
2027
2028 return false;
2029 }
2030}
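// Editor's worked example for the write-coalescing delay above
// (illustrative values, not from the sources): with blkSize = 64 bytes,
// 8-byte write targets and a 500-tick clock period,
//
//     delay = 64 / 8 * 500 = 4000 ticks
//
// i.e. the MSHR is held for the eight cycles that back-to-back 8-byte
// writes would need to cover the whole line.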
2031
2032bool
2033 BaseCache::sendWriteQueuePacket(WriteQueueEntry *wq_entry)
2034{
2035 assert(wq_entry);
2036
2037 // always a single target for write queue entries
2038 PacketPtr tgt_pkt = wq_entry->getTarget()->pkt;
2039
2040 DPRINTF(Cache, "%s: write %s\n", __func__, tgt_pkt->print());
2041
2042 // forward as is, both for evictions and uncacheable writes
2043 if (!memSidePort.sendTimingReq(tgt_pkt)) {
2044 // note that we have now masked any requestBus and
2045 // schedSendEvent (we will wait for a retry before
2046 // doing anything), and this is so even if we do not
2047 // care about this packet and might override it before
2048 // it gets retried
2049 return true;
2050 } else {
2051 markInService(wq_entry);
2052 return false;
2053 }
2054}
2055
2056void
2057 BaseCache::serialize(CheckpointOut &cp) const
2058{
2059 bool dirty(isDirty());
2060
2061 if (dirty) {
2062 warn("*** The cache still contains dirty data. ***\n");
2063 warn(" Make sure to drain the system using the correct flags.\n");
2064 warn(" This checkpoint will not restore correctly " \
2065 "and dirty data in the cache will be lost!\n");
2066 }
2067
2068 // Since we don't checkpoint the data in the cache, any dirty data
2069 // will be lost when restoring from a checkpoint of a system that
2070 // wasn't drained properly. Flag the checkpoint as invalid if the
2071 // cache contains dirty data.
2072 bool bad_checkpoint(dirty);
2073 SERIALIZE_SCALAR(bad_checkpoint);
2074}
2075
2076void
2077 BaseCache::unserialize(CheckpointIn &cp)
2078{
2079 bool bad_checkpoint;
2080 UNSERIALIZE_SCALAR(bad_checkpoint);
2081 if (bad_checkpoint) {
2082 fatal("Restoring from checkpoints with dirty caches is not "
2083 "supported in the classic memory system. Please remove any "
2084 "caches or drain them properly before taking checkpoints.\n");
2085 }
2086}
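// Editor's sketch (assumed INI-style checkpoint layout; the section name
// below is hypothetical): SERIALIZE_SCALAR above writes the flag into the
// cache's checkpoint section as
//
//     [system.l2cache]
//     bad_checkpoint=false
//
// and unserialize() refuses to restore when it reads back true.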
2087
2088
2089 BaseCache::CacheCmdStats::CacheCmdStats(BaseCache &c,
2090 const std::string &name)
2091 : statistics::Group(&c, name.c_str()), cache(c),
2092 ADD_STAT(hits, statistics::units::Count::get(),
2093 ("number of " + name + " hits").c_str()),
2094 ADD_STAT(misses, statistics::units::Count::get(),
2095 ("number of " + name + " misses").c_str()),
2096 ADD_STAT(hitLatency, statistics::units::Tick::get(),
2097 ("number of " + name + " hit ticks").c_str()),
2098 ADD_STAT(missLatency, statistics::units::Tick::get(),
2099 ("number of " + name + " miss ticks").c_str()),
2100 ADD_STAT(accesses, statistics::units::Count::get(),
2101 ("number of " + name + " accesses(hits+misses)").c_str()),
2102 ADD_STAT(missRate, statistics::units::Ratio::get(),
2103 ("miss rate for " + name + " accesses").c_str()),
2104 ADD_STAT(avgMissLatency, statistics::units::Rate<
2105 statistics::units::Tick, statistics::units::Count>::get(),
2106 ("average " + name + " miss latency").c_str()),
2107 ADD_STAT(mshrHits, statistics::units::Count::get(),
2108 ("number of " + name + " MSHR hits").c_str()),
2109 ADD_STAT(mshrMisses, statistics::units::Count::get(),
2110 ("number of " + name + " MSHR misses").c_str()),
2111 ADD_STAT(mshrUncacheable, statistics::units::Count::get(),
2112 ("number of " + name + " MSHR uncacheable").c_str()),
2113 ADD_STAT(mshrMissLatency, statistics::units::Tick::get(),
2114 ("number of " + name + " MSHR miss ticks").c_str()),
2115 ADD_STAT(mshrUncacheableLatency, statistics::units::Tick::get(),
2116 ("number of " + name + " MSHR uncacheable ticks").c_str()),
2117 ADD_STAT(mshrMissRate, statistics::units::Ratio::get(),
2118 ("mshr miss rate for " + name + " accesses").c_str()),
2119 ADD_STAT(avgMshrMissLatency, statistics::units::Rate<
2120 statistics::units::Tick, statistics::units::Count>::get(),
2121 ("average " + name + " mshr miss latency").c_str()),
2122 ADD_STAT(avgMshrUncacheableLatency, statistics::units::Rate<
2123 statistics::units::Tick, statistics::units::Count>::get(),
2124 ("average " + name + " mshr uncacheable latency").c_str())
2125{
2126}
2127
2128void
2129 BaseCache::CacheCmdStats::regStatsFromParent()
2130{
2131 using namespace statistics;
2132
2133 statistics::Group::regStats();
2134 System *system = cache.system;
2135 const auto max_requestors = system->maxRequestors();
2136
2137 hits
2138 .init(max_requestors)
2139 .flags(total | nozero | nonan)
2140 ;
2141 for (int i = 0; i < max_requestors; i++) {
2142 hits.subname(i, system->getRequestorName(i));
2143 }
2144
2145 // Miss statistics
2146 misses
2147 .init(max_requestors)
2148 .flags(total | nozero | nonan)
2149 ;
2150 for (int i = 0; i < max_requestors; i++) {
2151 misses.subname(i, system->getRequestorName(i));
2152 }
2153
2154 // Hit latency statistics
2155 hitLatency
2156 .init(max_requestors)
2157 .flags(total | nozero | nonan)
2158 ;
2159 for (int i = 0; i < max_requestors; i++) {
2160 hitLatency.subname(i, system->getRequestorName(i));
2161 }
2162
2163 // Miss latency statistics
2164 missLatency
2165 .init(max_requestors)
2166 .flags(total | nozero | nonan)
2167 ;
2168 for (int i = 0; i < max_requestors; i++) {
2169 missLatency.subname(i, system->getRequestorName(i));
2170 }
2171
2172 // access formulas
2173 accesses.flags(total | nozero | nonan);
2174 accesses = hits + misses;
2175 for (int i = 0; i < max_requestors; i++) {
2176 accesses.subname(i, system->getRequestorName(i));
2177 }
2178
2179 // miss rate formulas
2180 missRate.flags(total | nozero | nonan);
2181 missRate = misses / accesses;
2182 for (int i = 0; i < max_requestors; i++) {
2183 missRate.subname(i, system->getRequestorName(i));
2184 }
2185
2186 // miss latency formulas
2187 avgMissLatency.flags(total | nozero | nonan);
2188 avgMissLatency = missLatency / misses;
2189 for (int i = 0; i < max_requestors; i++) {
2190 avgMissLatency.subname(i, system->getRequestorName(i));
2191 }
2192
2193 // MSHR statistics
2194 // MSHR hit statistics
2195 mshrHits
2196 .init(max_requestors)
2197 .flags(total | nozero | nonan)
2198 ;
2199 for (int i = 0; i < max_requestors; i++) {
2200 mshrHits.subname(i, system->getRequestorName(i));
2201 }
2202
2203 // MSHR miss statistics
2204 mshrMisses
2205 .init(max_requestors)
2206 .flags(total | nozero | nonan)
2207 ;
2208 for (int i = 0; i < max_requestors; i++) {
2209 mshrMisses.subname(i, system->getRequestorName(i));
2210 }
2211
2212 // MSHR miss latency statistics
2213 mshrMissLatency
2214 .init(max_requestors)
2215 .flags(total | nozero | nonan)
2216 ;
2217 for (int i = 0; i < max_requestors; i++) {
2218 mshrMissLatency.subname(i, system->getRequestorName(i));
2219 }
2220
2221 // MSHR uncacheable statistics
2222 mshrUncacheable
2223 .init(max_requestors)
2224 .flags(total | nozero | nonan)
2225 ;
2226 for (int i = 0; i < max_requestors; i++) {
2227 mshrUncacheable.subname(i, system->getRequestorName(i));
2228 }
2229
2230 // MSHR uncacheable latency statistics
2231 mshrUncacheableLatency
2232 .init(max_requestors)
2233 .flags(total | nozero | nonan)
2234 ;
2235 for (int i = 0; i < max_requestors; i++) {
2236 mshrUncacheableLatency.subname(i, system->getRequestorName(i));
2237 }
2238
2239 // MSHR miss rate formulas
2240 mshrMissRate.flags(total | nozero | nonan);
2241 mshrMissRate = mshrMisses / accesses;
2242
2243 for (int i = 0; i < max_requestors; i++) {
2244 mshrMissRate.subname(i, system->getRequestorName(i));
2245 }
2246
2247 // mshrMiss latency formulas
2248 avgMshrMissLatency.flags(total | nozero | nonan);
2249 avgMshrMissLatency = mshrMissLatency / mshrMisses;
2250 for (int i = 0; i < max_requestors; i++) {
2251 avgMshrMissLatency.subname(i, system->getRequestorName(i));
2252 }
2253
2254 // mshrUncacheable latency formulas
2255 avgMshrUncacheableLatency.flags(total | nozero | nonan);
2256 avgMshrUncacheableLatency = mshrUncacheableLatency / mshrUncacheable;
2257 for (int i = 0; i < max_requestors; i++) {
2258 avgMshrUncacheableLatency.subname(i, system->getRequestorName(i));
2259 }
2260}
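// Editor's illustration (hypothetical cache path "system.l2"): since each
// CacheCmdStats group is registered per command with `name` such as
// "ReadReq", the code above yields stats like
// system.l2.ReadReq.hits::total and system.l2.ReadReq.missRate::total,
// with one subname per requestor taken from system->getRequestorName(i).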
2261
2262 BaseCache::CacheStats::CacheStats(BaseCache &c)
2263 : statistics::Group(&c), cache(c),
2264
2265 ADD_STAT(demandHits, statistics::units::Count::get(),
2266 "number of demand (read+write) hits"),
2267 ADD_STAT(overallHits, statistics::units::Count::get(),
2268 "number of overall hits"),
2269 ADD_STAT(demandHitLatency, statistics::units::Tick::get(),
2270 "number of demand (read+write) hit ticks"),
2271 ADD_STAT(overallHitLatency, statistics::units::Tick::get(),
2272 "number of overall hit ticks"),
2273 ADD_STAT(demandMisses, statistics::units::Count::get(),
2274 "number of demand (read+write) misses"),
2275 ADD_STAT(overallMisses, statistics::units::Count::get(),
2276 "number of overall misses"),
2277 ADD_STAT(demandMissLatency, statistics::units::Tick::get(),
2278 "number of demand (read+write) miss ticks"),
2279 ADD_STAT(overallMissLatency, statistics::units::Tick::get(),
2280 "number of overall miss ticks"),
2281 ADD_STAT(demandAccesses, statistics::units::Count::get(),
2282 "number of demand (read+write) accesses"),
2283 ADD_STAT(overallAccesses, statistics::units::Count::get(),
2284 "number of overall (read+write) accesses"),
2285 ADD_STAT(demandMissRate, statistics::units::Ratio::get(),
2286 "miss rate for demand accesses"),
2287 ADD_STAT(overallMissRate, statistics::units::Ratio::get(),
2288 "miss rate for overall accesses"),
2289 ADD_STAT(demandAvgMissLatency, statistics::units::Rate<
2290 statistics::units::Tick, statistics::units::Count>::get(),
2291 "average overall miss latency in ticks"),
2292 ADD_STAT(overallAvgMissLatency, statistics::units::Rate<
2293 statistics::units::Tick, statistics::units::Count>::get(),
2294 "average overall miss latency"),
2295 ADD_STAT(blockedCycles, statistics::units::Cycle::get(),
2296 "number of cycles access was blocked"),
2297 ADD_STAT(blockedCauses, statistics::units::Count::get(),
2298 "number of times access was blocked"),
2299 ADD_STAT(avgBlocked, statistics::units::Rate<
2300 statistics::units::Cycle, statistics::units::Count>::get(),
2301 "average number of cycles each access was blocked"),
2302 ADD_STAT(writebacks, statistics::units::Count::get(),
2303 "number of writebacks"),
2304 ADD_STAT(demandMshrHits, statistics::units::Count::get(),
2305 "number of demand (read+write) MSHR hits"),
2306 ADD_STAT(overallMshrHits, statistics::units::Count::get(),
2307 "number of overall MSHR hits"),
2308 ADD_STAT(demandMshrMisses, statistics::units::Count::get(),
2309 "number of demand (read+write) MSHR misses"),
2310 ADD_STAT(overallMshrMisses, statistics::units::Count::get(),
2311 "number of overall MSHR misses"),
2312 ADD_STAT(overallMshrUncacheable, statistics::units::Count::get(),
2313 "number of overall MSHR uncacheable misses"),
2314 ADD_STAT(demandMshrMissLatency, statistics::units::Tick::get(),
2315 "number of demand (read+write) MSHR miss ticks"),
2316 ADD_STAT(overallMshrMissLatency, statistics::units::Tick::get(),
2317 "number of overall MSHR miss ticks"),
2318 ADD_STAT(overallMshrUncacheableLatency, statistics::units::Tick::get(),
2319 "number of overall MSHR uncacheable ticks"),
2320 ADD_STAT(demandMshrMissRate, statistics::units::Ratio::get(),
2321 "mshr miss ratio for demand accesses"),
2322 ADD_STAT(overallMshrMissRate, statistics::units::Ratio::get(),
2323 "mshr miss ratio for overall accesses"),
2324 ADD_STAT(demandAvgMshrMissLatency, statistics::units::Rate<
2325 statistics::units::Tick, statistics::units::Count>::get(),
2326 "average overall mshr miss latency"),
2327 ADD_STAT(overallAvgMshrMissLatency, statistics::units::Rate<
2328 statistics::units::Tick, statistics::units::Count>::get(),
2329 "average overall mshr miss latency"),
2330 ADD_STAT(overallAvgMshrUncacheableLatency, statistics::units::Rate<
2331 statistics::units::Tick, statistics::units::Count>::get(),
2332 "average overall mshr uncacheable latency"),
2333 ADD_STAT(replacements, statistics::units::Count::get(),
2334 "number of replacements"),
2335 ADD_STAT(dataExpansions, statistics::units::Count::get(),
2336 "number of data expansions"),
2337 ADD_STAT(dataContractions, statistics::units::Count::get(),
2338 "number of data contractions"),
2339 cmd(MemCmd::NUM_MEM_CMDS)
2340{
2341 for (int idx = 0; idx < MemCmd::NUM_MEM_CMDS; ++idx)
2342 cmd[idx].reset(new CacheCmdStats(c, MemCmd(idx).toString()));
2343}
2344
2345void
2346 BaseCache::CacheStats::regStats()
2347{
2348 using namespace statistics;
2349
2350 statistics::Group::regStats();
2351
2352 System *system = cache.system;
2353 const auto max_requestors = system->maxRequestors();
2354
2355 for (auto &cs : cmd)
2356 cs->regStatsFromParent();
2357
2358// These macros make it easier to sum the right subset of commands and
2359// to change the subset of commands that are considered "demand" vs
2360// "non-demand"
2361#define SUM_DEMAND(s) \
2362 (cmd[MemCmd::ReadReq]->s + cmd[MemCmd::WriteReq]->s + \
2363 cmd[MemCmd::WriteLineReq]->s + cmd[MemCmd::ReadExReq]->s + \
2364 cmd[MemCmd::ReadCleanReq]->s + cmd[MemCmd::ReadSharedReq]->s)
2365
2366// should writebacks be included here? prior code was inconsistent...
2367#define SUM_NON_DEMAND(s) \
2368 (cmd[MemCmd::SoftPFReq]->s + cmd[MemCmd::HardPFReq]->s + \
2369 cmd[MemCmd::SoftPFExReq]->s)
2370
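// Editor's note: for instance, SUM_DEMAND(hits) used below expands to
//
//     (cmd[MemCmd::ReadReq]->hits + cmd[MemCmd::WriteReq]->hits +
//      cmd[MemCmd::WriteLineReq]->hits + cmd[MemCmd::ReadExReq]->hits +
//      cmd[MemCmd::ReadCleanReq]->hits + cmd[MemCmd::ReadSharedReq]->hits)
//
// which is how the demand* formulas aggregate the per-command statistics.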
2371 demandHits.flags(total | nozero | nonan);
2372 demandHits = SUM_DEMAND(hits);
2373 for (int i = 0; i < max_requestors; i++) {
2374 demandHits.subname(i, system->getRequestorName(i));
2375 }
2376
2377 overallHits.flags(total | nozero | nonan);
2378 overallHits = demandHits + SUM_NON_DEMAND(hits);
2379 for (int i = 0; i < max_requestors; i++) {
2380 overallHits.subname(i, system->getRequestorName(i));
2381 }
2382
2383 demandMisses.flags(total | nozero | nonan);
2384 demandMisses = SUM_DEMAND(misses);
2385 for (int i = 0; i < max_requestors; i++) {
2386 demandMisses.subname(i, system->getRequestorName(i));
2387 }
2388
2389 overallMisses.flags(total | nozero | nonan);
2390 overallMisses = demandMisses + SUM_NON_DEMAND(misses);
2391 for (int i = 0; i < max_requestors; i++) {
2392 overallMisses.subname(i, system->getRequestorName(i));
2393 }
2394
2395 demandMissLatency.flags(total | nozero | nonan);
2396 demandMissLatency = SUM_DEMAND(missLatency);
2397 for (int i = 0; i < max_requestors; i++) {
2398 demandMissLatency.subname(i, system->getRequestorName(i));
2399 }
2400
2401 overallMissLatency.flags(total | nozero | nonan);
2402 overallMissLatency = demandMissLatency + SUM_NON_DEMAND(missLatency);
2403 for (int i = 0; i < max_requestors; i++) {
2404 overallMissLatency.subname(i, system->getRequestorName(i));
2405 }
2406
2407 demandHitLatency.flags(total | nozero | nonan);
2408 demandHitLatency = SUM_DEMAND(hitLatency);
2409 for (int i = 0; i < max_requestors; i++) {
2410 demandHitLatency.subname(i, system->getRequestorName(i));
2411 }
2412 overallHitLatency.flags(total | nozero | nonan);
2413 overallHitLatency = demandHitLatency + SUM_NON_DEMAND(hitLatency);
2414 for (int i = 0; i < max_requestors; i++) {
2415 overallHitLatency.subname(i, system->getRequestorName(i));
2416 }
2417
2418 demandAccesses.flags(total | nozero | nonan);
2419 demandAccesses = demandHits + demandMisses;
2420 for (int i = 0; i < max_requestors; i++) {
2421 demandAccesses.subname(i, system->getRequestorName(i));
2422 }
2423
2424 overallAccesses.flags(total | nozero | nonan);
2425 overallAccesses = overallHits + overallMisses;
2426 for (int i = 0; i < max_requestors; i++) {
2427 overallAccesses.subname(i, system->getRequestorName(i));
2428 }
2429
2430 demandMissRate.flags(total | nozero | nonan);
2431 demandMissRate = demandMisses / demandAccesses;
2432 for (int i = 0; i < max_requestors; i++) {
2433 demandMissRate.subname(i, system->getRequestorName(i));
2434 }
2435
2436 overallMissRate.flags(total | nozero | nonan);
2437 overallMissRate = overallMisses / overallAccesses;
2438 for (int i = 0; i < max_requestors; i++) {
2439 overallMissRate.subname(i, system->getRequestorName(i));
2440 }
2441
2442 demandAvgMissLatency.flags(total | nozero | nonan);
2443 demandAvgMissLatency = demandMissLatency / demandMisses;
2444 for (int i = 0; i < max_requestors; i++) {
2445 demandAvgMissLatency.subname(i, system->getRequestorName(i));
2446 }
2447
2448 overallAvgMissLatency.flags(total | nozero | nonan);
2449 overallAvgMissLatency = overallMissLatency / overallMisses;
2450 for (int i = 0; i < max_requestors; i++) {
2451 overallAvgMissLatency.subname(i, system->getRequestorName(i));
2452 }
2453
2454 blockedCycles.init(NUM_BLOCKED_CAUSES);
2455 blockedCycles
2456 .subname(Blocked_NoMSHRs, "no_mshrs")
2457 .subname(Blocked_NoWBBuffers, "no_wbuffers")
2458 .subname(Blocked_NoTargets, "no_targets")
2459 ;
2460
2461
2462 blockedCauses.init(NUM_BLOCKED_CAUSES);
2463 blockedCauses
2464 .subname(Blocked_NoMSHRs, "no_mshrs")
2465 .subname(Blocked_NoWBBuffers, "no_wbuffers")
2466 .subname(Blocked_NoTargets, "no_targets")
2467 ;
2468
2469 avgBlocked
2470 .subname(Blocked_NoMSHRs, "no_mshrs")
2471 .subname(Blocked_NoWBBuffers, "no_wbuffers")
2472 .subname(Blocked_NoTargets, "no_targets")
2473 ;
2474 avgBlocked = blockedCycles / blockedCauses;
2475
2476 writebacks
2477 .init(max_requestors)
2478 .flags(total | nozero | nonan)
2479 ;
2480 for (int i = 0; i < max_requestors; i++) {
2481 writebacks.subname(i, system->getRequestorName(i));
2482 }
2483
2484 demandMshrHits.flags(total | nozero | nonan);
2485 demandMshrHits = SUM_DEMAND(mshrHits);
2486 for (int i = 0; i < max_requestors; i++) {
2487 demandMshrHits.subname(i, system->getRequestorName(i));
2488 }
2489
2490 overallMshrHits.flags(total | nozero | nonan);
2491 overallMshrHits = demandMshrHits + SUM_NON_DEMAND(mshrHits);
2492 for (int i = 0; i < max_requestors; i++) {
2493 overallMshrHits.subname(i, system->getRequestorName(i));
2494 }
2495
2496 demandMshrMisses.flags(total | nozero | nonan);
2497 demandMshrMisses = SUM_DEMAND(mshrMisses);
2498 for (int i = 0; i < max_requestors; i++) {
2499 demandMshrMisses.subname(i, system->getRequestorName(i));
2500 }
2501
2502 overallMshrMisses.flags(total | nozero | nonan);
2503 overallMshrMisses = demandMshrMisses + SUM_NON_DEMAND(mshrMisses);
2504 for (int i = 0; i < max_requestors; i++) {
2505 overallMshrMisses.subname(i, system->getRequestorName(i));
2506 }
2507
2508 demandMshrMissLatency.flags(total | nozero | nonan);
2509 demandMshrMissLatency = SUM_DEMAND(mshrMissLatency);
2510 for (int i = 0; i < max_requestors; i++) {
2511 demandMshrMissLatency.subname(i, system->getRequestorName(i));
2512 }
2513
2514 overallMshrMissLatency.flags(total | nozero | nonan);
2515 overallMshrMissLatency =
2516 demandMshrMissLatency + SUM_NON_DEMAND(mshrMissLatency);
2517 for (int i = 0; i < max_requestors; i++) {
2518 overallMshrMissLatency.subname(i, system->getRequestorName(i));
2519 }
2520
2521 overallMshrUncacheable.flags(total | nozero | nonan);
2522 overallMshrUncacheable =
2523 SUM_DEMAND(mshrUncacheable) + SUM_NON_DEMAND(mshrUncacheable);
2524 for (int i = 0; i < max_requestors; i++) {
2525 overallMshrUncacheable.subname(i, system->getRequestorName(i));
2526 }
2527
2528
2529 overallMshrUncacheableLatency.flags(total | nozero | nonan);
2530 overallMshrUncacheableLatency =
2531 SUM_DEMAND(mshrUncacheableLatency) +
2532 SUM_NON_DEMAND(mshrUncacheableLatency);
2533 for (int i = 0; i < max_requestors; i++) {
2534 overallMshrUncacheableLatency.subname(i, system->getRequestorName(i));
2535 }
2536
2537 demandMshrMissRate.flags(total | nozero | nonan);
2538 demandMshrMissRate = demandMshrMisses / demandAccesses;
2539 for (int i = 0; i < max_requestors; i++) {
2540 demandMshrMissRate.subname(i, system->getRequestorName(i));
2541 }
2542
2543 overallMshrMissRate.flags(total | nozero | nonan);
2544 overallMshrMissRate = overallMshrMisses / overallAccesses;
2545 for (int i = 0; i < max_requestors; i++) {
2546 overallMshrMissRate.subname(i, system->getRequestorName(i));
2547 }
2548
2549 demandAvgMshrMissLatency.flags(total | nozero | nonan);
2550 demandAvgMshrMissLatency = demandMshrMissLatency / demandMshrMisses;
2551 for (int i = 0; i < max_requestors; i++) {
2552 demandAvgMshrMissLatency.subname(i, system->getRequestorName(i));
2553 }
2554
2555 overallAvgMshrMissLatency.flags(total | nozero | nonan);
2556 overallAvgMshrMissLatency = overallMshrMissLatency / overallMshrMisses;
2557 for (int i = 0; i < max_requestors; i++) {
2558 overallAvgMshrMissLatency.subname(i, system->getRequestorName(i));
2559 }
2560
2561 overallAvgMshrUncacheableLatency.flags(total | nozero | nonan);
2562 overallAvgMshrUncacheableLatency =
2563 overallMshrUncacheableLatency / overallMshrUncacheable;
2564 for (int i = 0; i < max_requestors; i++) {
2565 overallAvgMshrUncacheableLatency.subname(i,
2566 system->getRequestorName(i));
2567 }
2568
2569 dataExpansions.flags(nozero | nonan);
2570 dataContractions.flags(nozero | nonan);
2571}
2572
2573void
2574 BaseCache::regProbePoints()
2575{
2576 ppHit = new ProbePointArg<CacheAccessProbeArg>(
2577 this->getProbeManager(), "Hit");
2578 ppMiss = new ProbePointArg<CacheAccessProbeArg>(
2579 this->getProbeManager(), "Miss");
2580 ppFill = new ProbePointArg<CacheAccessProbeArg>(
2581 this->getProbeManager(), "Fill");
2582 ppDataUpdate =
2583 new ProbePointArg<CacheDataUpdateProbeArg>(
2584 this->getProbeManager(), "Data Update");
2585}
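// Editor's sketch (hypothetical observer class; the exact listener API
// lives in sim/probe/probe.hh): other SimObjects can attach to these
// probe points by name, e.g.
//
//     // in MyObserver::regProbeListeners(), assuming MyObserver defines
//     // void notifyMiss(const CacheAccessProbeArg &arg)
//     listeners.push_back(new ProbeListenerArg<MyObserver,
//         CacheAccessProbeArg>(this, "Miss", &MyObserver::notifyMiss));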
2586
2588//
2589// CpuSidePort
2590//
2592bool
2593 BaseCache::CpuSidePort::recvTimingSnoopResp(PacketPtr pkt)
2594{
2595 // Snoops shouldn't happen when bypassing caches
2596 assert(!cache.system->bypassCaches());
2597
2598 assert(pkt->isResponse());
2599
2600 // Express snoop responses from requestor to responder, e.g., from L1 to L2
2601 cache.recvTimingSnoopResp(pkt);
2602 return true;
2603}
2604
2605
2606bool
2607 BaseCache::CpuSidePort::tryTiming(PacketPtr pkt)
2608{
2609 if (cache.system->bypassCaches() || pkt->isExpressSnoop()) {
2610 // always let express snoop packets through even if blocked
2611 return true;
2612 } else if (blocked || mustSendRetry) {
2613 // either already committed to send a retry, or blocked
2614 mustSendRetry = true;
2615 return false;
2616 }
2617 mustSendRetry = false;
2618 return true;
2619}
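// Editor's note on the retry handshake above (step-by-step sketch):
//
//     1. peer calls sendTimingReq() -> recvTimingReq() -> tryTiming() fails
//     2. mustSendRetry is latched; the peer must wait rather than retry
//     3. when the cache unblocks, clearBlocked() schedules sendRetryEvent,
//        which issues sendRetryReq() to the peer (see base.hh)
//     4. the peer re-issues the rejected packet with sendTimingReq()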
2620
2621bool
2622 BaseCache::CpuSidePort::recvTimingReq(PacketPtr pkt)
2623{
2624 assert(pkt->isRequest());
2625
2626 if (cache.system->bypassCaches()) {
2627 // Just forward the packet if caches are disabled.
2628 // @todo This should really enqueue the packet rather
2629 [[maybe_unused]] bool success = cache.memSidePort.sendTimingReq(pkt);
2630 assert(success);
2631 return true;
2632 } else if (tryTiming(pkt)) {
2633 cache.recvTimingReq(pkt);
2634 return true;
2635 }
2636 return false;
2637}
2638
2639Tick
2640 BaseCache::CpuSidePort::recvAtomic(PacketPtr pkt)
2641{
2642 if (cache.system->bypassCaches()) {
2643 // Forward the request if the system is in cache bypass mode.
2644 return cache.memSidePort.sendAtomic(pkt);
2645 } else {
2646 return cache.recvAtomic(pkt);
2647 }
2648}
2649
2650void
2651 BaseCache::CpuSidePort::recvFunctional(PacketPtr pkt)
2652{
2653 if (cache.system->bypassCaches()) {
2654 // The cache should be flushed if we are in cache bypass mode,
2655 // so we don't need to check if we need to update anything.
2656 cache.memSidePort.sendFunctional(pkt);
2657 return;
2658 }
2659
2660 // functional request
2661 cache.functionalAccess(pkt, true);
2662}
2663
2664 AddrRangeList
2665 BaseCache::CpuSidePort::getAddrRanges() const
2666{
2667 return cache.getAddrRanges();
2668}
2669
2670
2671 BaseCache::
2672 CpuSidePort::CpuSidePort(const std::string &_name, BaseCache& _cache,
2673 const std::string &_label)
2674 : CacheResponsePort(_name, _cache, _label)
2675{
2676}
2677
2679//
2680// MemSidePort
2681//
2683bool
2684 BaseCache::MemSidePort::recvTimingResp(PacketPtr pkt)
2685{
2686 cache->recvTimingResp(pkt);
2687 return true;
2688}
2689
2690// Express snooping requests to memside port
2691void
2692 BaseCache::MemSidePort::recvTimingSnoopReq(PacketPtr pkt)
2693{
2694 // Snoops shouldn't happen when bypassing caches
2695 assert(!cache->system->bypassCaches());
2696
2697 // handle snooping requests
2698 cache->recvTimingSnoopReq(pkt);
2699}
2700
2701Tick
2702 BaseCache::MemSidePort::recvAtomicSnoop(PacketPtr pkt)
2703{
2704 // Snoops shouldn't happen when bypassing caches
2705 assert(!cache->system->bypassCaches());
2706
2707 return cache->recvAtomicSnoop(pkt);
2708}
2709
2710void
2711 BaseCache::MemSidePort::recvFunctionalSnoop(PacketPtr pkt)
2712{
2713 // Snoops shouldn't happen when bypassing caches
2714 assert(!cache->system->bypassCaches());
2715
2716 // functional snoop (note that in contrast to atomic we don't have
2717 // a specific functionalSnoop method, as they have the same
2718 // behaviour regardless)
2719 cache->functionalAccess(pkt, false);
2720}
2721
2722void
2723 BaseCache::CacheReqPacketQueue::sendDeferredPacket()
2724{
2725 // sanity check
2726 assert(!waitingOnRetry);
2727
2728 // there should never be any deferred request packets in the
2729 // queue, instead we rely on the cache to provide the packets
2730 // from the MSHR queue or write queue
2731 assert(deferredPacketReadyTime() == MaxTick);
2732
2733 // check for request packets (requests & writebacks)
2734 QueueEntry* entry = cache.getNextQueueEntry();
2735
2736 if (!entry) {
2737 // can happen if e.g. we attempt a writeback and fail, but
2738 // before the retry, the writeback is eliminated because
2739 // we snoop another cache's ReadEx.
2740 } else {
2741 // let our snoop responses go first if there are responses to
2742 // the same addresses
2743 if (checkConflictingSnoop(entry->getTarget()->pkt)) {
2744 return;
2745 }
2746 waitingOnRetry = entry->sendPacket(cache);
2747 }
2748
2749 // if we succeeded and are not waiting for a retry, schedule the
2750 // next send considering when the next queue is ready, note that
2751 // snoop responses have their own packet queue and thus schedule
2752 // their own events
2753 if (!waitingOnRetry) {
2754 schedSendEvent(cache.nextQueueReadyTime());
2755 }
2756}
2757
2758 BaseCache::MemSidePort::MemSidePort(const std::string &_name,
2759 BaseCache *_cache,
2760 const std::string &_label)
2761 : CacheRequestPort(_name, _reqQueue, _snoopRespQueue),
2762 _reqQueue(*_cache, *this, _snoopRespQueue, _label),
2763 _snoopRespQueue(*_cache, *this, true, _label), cache(_cache)
2764{
2765}
2766
2767void
2768WriteAllocator::updateMode(Addr write_addr, unsigned write_size,
2769 Addr blk_addr)
2770{
2771 // check if we are continuing where the last write ended
2772 if (nextAddr == write_addr) {
2773 delayCtr[blk_addr] = delayThreshold;
2774 // stop if we have already saturated
2775 if (mode != WriteMode::NO_ALLOCATE) {
2776 byteCount += write_size;
2777 // switch to streaming mode if we have passed the lower
2778 // threshold
2779 if (mode == WriteMode::ALLOCATE &&
2780 byteCount > coalesceLimit) {
2781 mode = WriteMode::COALESCE;
2782 DPRINTF(Cache, "Switched to write coalescing\n");
2783 } else if (mode == WriteMode::COALESCE &&
2784 byteCount > noAllocateLimit) {
2785 // and continue and switch to non-allocating mode if we
2786 // pass the upper threshold
2787 mode = WriteMode::NO_ALLOCATE;
2788 DPRINTF(Cache, "Switched to write-no-allocate\n");
2789 }
2790 }
2791 } else {
2792 // we did not see a write matching the previous one, start
2793 // over again
2794 byteCount = write_size;
2795 mode = WriteMode::ALLOCATE;
2796 resetDelay(blk_addr);
2797 }
2798 nextAddr = write_addr + write_size;
2799}
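// Editor's worked example for the mode switching above (illustrative
// values for coalesceLimit = 16 bytes and noAllocateLimit = 48 bytes):
// a stream of contiguous 8-byte writes evolves as follows:
//
//     write #   byteCount   mode after updateMode()
//     1..2      8..16       ALLOCATE    (byteCount not yet > 16)
//     3         24          COALESCE    (lower threshold passed)
//     4..6      32..48      COALESCE
//     7         56          NO_ALLOCATE (upper threshold passed)
//
// A write that does not start at nextAddr resets byteCount and returns
// the allocator to ALLOCATE.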
2800
2801} // namespace gem5
#define DPRINTF(x,...)
Definition trace.hh:209
const char data[]
bool checkConflictingSnoop(const PacketPtr pkt)
Check if there is a conflicting snoop response about to be send out, and if so simply stall any reque...
Definition base.hh:206
virtual void sendDeferredPacket()
Override the normal sendDeferredPacket and do not only consider the transmit list (used for responses...
Definition base.cc:2723
CacheRequestPort(const std::string &_name, ReqPacketQueue &_reqQueue, SnoopRespPacketQueue &_snoopRespQueue)
Definition base.hh:155
CacheResponsePort(const std::string &_name, BaseCache &_cache, const std::string &_label)
Definition base.cc:71
void clearBlocked()
Return to normal operation and accept new requests.
Definition base.cc:167
EventFunctionWrapper sendRetryEvent
Definition base.hh:291
void setBlocked()
Do not accept any new requests.
Definition base.cc:152
RespPacketQueue queue
A normal packet queue used to store responses.
Definition base.hh:281
virtual bool recvTimingSnoopResp(PacketPtr pkt) override
Receive a timing snoop response from the peer.
Definition base.cc:2593
virtual Tick recvAtomic(PacketPtr pkt) override
Receive an atomic request packet from the peer.
Definition base.cc:2640
CpuSidePort(const std::string &_name, BaseCache &_cache, const std::string &_label)
Definition base.cc:2672
virtual bool recvTimingReq(PacketPtr pkt) override
Receive a timing request from the peer.
Definition base.cc:2622
virtual bool tryTiming(PacketPtr pkt) override
Availability request from the peer.
Definition base.cc:2607
virtual void recvFunctional(PacketPtr pkt) override
Receive a functional request packet from the peer.
Definition base.cc:2651
virtual AddrRangeList getAddrRanges() const override
Get a list of the non-overlapping address ranges the owner is responsible for.
Definition base.cc:2665
virtual Tick recvAtomicSnoop(PacketPtr pkt)
Receive an atomic snoop request packet from our peer.
Definition base.cc:2702
virtual void recvFunctionalSnoop(PacketPtr pkt)
Receive a functional snoop request packet from the peer.
Definition base.cc:2711
virtual bool recvTimingResp(PacketPtr pkt)
Receive a timing response from the peer.
Definition base.cc:2684
virtual void recvTimingSnoopReq(PacketPtr pkt)
Receive a timing snoop request from the peer.
Definition base.cc:2692
CacheReqPacketQueue _reqQueue
The cache-specific queue.
Definition base.hh:229
SnoopRespPacketQueue _snoopRespQueue
Definition base.hh:231
MemSidePort(const std::string &_name, BaseCache *_cache, const std::string &_label)
Definition base.cc:2758
virtual void serviceMSHRTargets(MSHR *mshr, const PacketPtr pkt, CacheBlk *blk)=0
Service non-deferred MSHR targets using the received response.
virtual void functionalAccess(PacketPtr pkt, bool from_cpu_side)
Performs the access specified by the request.
Definition base.cc:765
const bool isReadOnly
Is this cache read only, for example the instruction cache, or table-walker cache.
Definition base.hh:945
virtual void recvTimingReq(PacketPtr pkt)
Performs the access specified by the request.
Definition base.cc:454
gem5::BaseCache::CacheAccessorImpl accessor
virtual void doWritebacks(PacketList &writebacks, Tick forward_time)=0
Insert writebacks into the write buffer.
const Cycles fillLatency
The latency to fill a cache block.
Definition base.hh:912
const Cycles dataLatency
The latency of data access of a cache.
Definition base.hh:902
void invalidateVisitor(CacheBlk &blk)
Cache block visitor that invalidates all blocks in the cache.
Definition base.cc:1900
virtual Cycles handleAtomicReqMiss(PacketPtr pkt, CacheBlk *&blk, PacketList &writebacks)=0
Handle a request in atomic mode that missed in this cache.
virtual void doWritebacksAtomic(PacketList &writebacks)=0
Send writebacks down the memory hierarchy in atomic mode.
void updateBlockData(CacheBlk *blk, const PacketPtr cpkt, bool has_old_data)
Update the data contents of a block.
Definition base.cc:821
PacketPtr tempBlockWriteback
Writebacks from the tempBlock, resulting on the response path in atomic mode, must happen after the c...
Definition base.hh:686
MSHR * allocateMissBuffer(PacketPtr pkt, Tick time, bool sched_send=true)
Definition base.hh:1175
CpuSidePort cpuSidePort
Definition base.hh:321
bool isDirty() const
Determine if there are any dirty blocks in the cache.
Definition base.cc:1864
void invalidateBlock(CacheBlk *blk)
Invalidate a cache block.
Definition base.cc:1727
MSHR * noTargetMSHR
Pointer to the MSHR that has no targets.
Definition base.hh:976
const bool writebackClean
Determine if clean lines should be written back or not.
Definition base.hh:677
bool sendWriteQueuePacket(WriteQueueEntry *wq_entry)
Similar to sendMSHR, but for a write-queue entry instead.
Definition base.cc:2033
bool inRange(Addr addr) const
Determine if an address is in the ranges covered by this cache.
Definition base.cc:220
virtual void handleTimingReqMiss(PacketPtr pkt, CacheBlk *blk, Tick forward_time, Tick request_time)=0
bool allocOnFill(MemCmd cmd) const
Determine whether we should allocate on a fill or not.
Definition base.hh:443
bool forwardSnoops
Do we forward snoops from mem side port through to cpu side port?
Definition base.hh:930
uint64_t order
Increasing order number assigned to each incoming request.
Definition base.hh:970
void incHitCount(PacketPtr pkt)
Definition base.hh:1282
@ MSHRQueue_WriteBuffer
Definition base.hh:112
virtual void satisfyRequest(PacketPtr pkt, CacheBlk *blk, bool deferred_response=false, bool pending_downgrade=false)
Perform any necessary updates to the block and perform any data exchange between the packet and the b...
Definition base.cc:1146
virtual void memWriteback() override
Write back dirty blocks in the cache using functional accesses.
Definition base.cc:1852
bool updateCompressionData(CacheBlk *&blk, const uint64_t *data, PacketList &writebacks)
When a block is overwriten, its compression information must be updated, and it may need to be recomp...
Definition base.cc:1033
bool isBlocked() const
Returns true if the cache is blocked for accesses.
Definition base.hh:1198
gem5::BaseCache::CacheStats stats
const Cycles lookupLatency
The latency of tag lookup of a cache.
Definition base.hh:896
Cycles calculateAccessLatency(const CacheBlk *blk, const uint32_t delay, const Cycles lookup_lat) const
Calculate access latency in ticks given a tag lookup latency, and whether access was a hit or miss.
Definition base.cc:1256
Tick nextQueueReadyTime() const
Find next request ready time from among possible sources.
Definition base.cc:1913
void regProbePoints() override
Registers probes.
Definition base.cc:2574
virtual void memInvalidate() override
Invalidates all blocks in the cache.
Definition base.cc:1858
MSHRQueue mshrQueue
Miss status registers.
Definition base.hh:351
virtual PacketPtr createMissPacket(PacketPtr cpu_pkt, CacheBlk *blk, bool needs_writable, bool is_whole_line_write) const =0
Create an appropriate downstream bus request packet.
ProbePointArg< CacheAccessProbeArg > * ppFill
To probe when a cache fill occurs.
Definition base.hh:375
Port & getPort(const std::string &if_name, PortID idx=InvalidPortID) override
Get a port with a given name and index.
Definition base.cc:208
QueueEntry * getNextQueueEntry()
Return the next queue entry to service, either a pending miss from the MSHR queue,...
Definition base.cc:905
void handleUncacheableWriteResp(PacketPtr pkt)
Handling the special case of uncacheable write responses to make recvTimingResp less cluttered.
Definition base.cc:527
const unsigned blkSize
Block size of this cache.
Definition base.hh:890
void writebackTempBlockAtomic()
Send the outstanding tempBlock writeback.
Definition base.hh:693
BlockedCause
Reasons for caches to be blocked.
Definition base.hh:120
@ NUM_BLOCKED_CAUSES
Definition base.hh:124
@ Blocked_NoTargets
Definition base.hh:123
@ Blocked_NoWBBuffers
Definition base.hh:122
const Cycles forwardLatency
This is the forward latency of the cache.
Definition base.hh:909
compression::Base * compressor
Compression method being used.
Definition base.hh:360
const Cycles responseLatency
The latency of sending reponse to its upper level cache/core on a linefill.
Definition base.hh:919
PacketPtr writecleanBlk(CacheBlk *blk, Request::Flags dest, PacketId id)
Create a writeclean request for the given block.
Definition base.cc:1806
void schedMemSideSendEvent(Tick time)
Schedule a send event for the memory-side port.
Definition base.hh:1246
MemSidePort memSidePort
Definition base.hh:322
virtual void handleTimingReqHit(PacketPtr pkt, CacheBlk *blk, Tick request_time)
Definition base.cc:275
virtual Tick recvAtomic(PacketPtr pkt)
Performs the access specified by the request.
Definition base.cc:685
void unserialize(CheckpointIn &cp) override
Unserialize an object.
Definition base.cc:2077
void cmpAndSwap(CacheBlk *blk, PacketPtr pkt)
Handle doing the Compare and Swap function for SPARC.
Definition base.cc:850
virtual void recvTimingResp(PacketPtr pkt)
Handles a response (cache line fill/write ack) from the bus.
Definition base.cc:539
virtual bool access(PacketPtr pkt, CacheBlk *&blk, Cycles &lat, PacketList &writebacks)
Does all the processing necessary to perform the provided request.
Definition base.cc:1290
void setBlocked(BlockedCause cause)
Marks the access path of the cache as blocked for the given cause.
Definition base.hh:1208
BaseCache(const BaseCacheParams &p, unsigned blk_size)
Definition base.cc:82
Addr regenerateBlkAddr(CacheBlk *blk)
Regenerate block address using tags.
Definition base.cc:189
std::unique_ptr< Packet > pendingDelete
Upstream caches need this packet until true is returned, so hold it for deletion until a subsequent c...
Definition base.hh:412
CacheBlk * allocateBlock(const PacketPtr pkt, PacketList &writebacks)
Allocate a new block and perform any necessary writebacks.
Definition base.cc:1667
ProbePointArg< CacheDataUpdateProbeArg > * ppDataUpdate
To probe when the contents of a block are updated.
Definition base.hh:382
prefetch::Base * prefetcher
Prefetcher.
Definition base.hh:366
TempCacheBlk * tempBlock
Temporary cache block for occasional transitory use.
Definition base.hh:406
const AddrRangeList addrRanges
The address range to which the cache responds on the CPU side.
Definition base.hh:984
ProbePointArg< CacheAccessProbeArg > * ppHit
To probe when a cache hit occurs.
Definition base.hh:369
const int numTarget
The number of targets for each MSHR.
Definition base.hh:927
const bool moveContractions
Similar to data expansions, after a block improves its compression, it may need to be moved elsewhere...
Definition base.hh:961
WriteAllocator *const writeAllocator
The writeAllocator drive optimizations for streaming writes.
Definition base.hh:398
void markInService(MSHR *mshr, bool pending_modified_resp)
Mark a request as in service (sent downstream in the memory system), effectively making this MSHR the...
Definition base.hh:418
void allocateWriteBuffer(PacketPtr pkt, Tick time)
Definition base.cc:231
Cycles calculateTagOnlyLatency(const uint32_t delay, const Cycles lookup_lat) const
Calculate latency of accesses that only touch the tag array.
Definition base.cc:1247
CacheBlk * handleFill(PacketPtr pkt, CacheBlk *blk, PacketList &writebacks, bool allocate)
Handle a fill operation caused by a received packet.
Definition base.cc:1571
void incMissCount(PacketPtr pkt)
Definition base.hh:1271
WriteQueue writeBuffer
Write/writeback buffer.
Definition base.hh:354
const bool replaceExpansions
when a data expansion of a compressed block happens it will not be able to co-allocate where it is at...
Definition base.hh:953
void serialize(CheckpointOut &cp) const override
Serialize the state of the caches.
Definition base.cc:2057
bool coalesce() const
Checks if the cache is coalescing writes.
Definition base.cc:1871
const bool sequentialAccess
Whether tags and data are accessed sequentially.
Definition base.hh:924
bool handleEvictions(std::vector< CacheBlk * > &evict_blks, PacketList &writebacks)
Try to evict the given blocks.
Definition base.cc:996
void init() override
init() is called after all C++ SimObjects have been created and all ports are connected.
Definition base.cc:199
PacketPtr writebackBlk(CacheBlk *blk)
Create a writeback request for the given block.
Definition base.cc:1756
void clearBlocked(BlockedCause cause)
Marks the cache as unblocked for the given cause.
Definition base.hh:1227
virtual PacketPtr evictBlock(CacheBlk *blk)=0
Evict a cache block.
void writebackVisitor(CacheBlk &blk)
Cache block visitor that writes back dirty cache blocks using functional writes.
Definition base.cc:1877
EventFunctionWrapper writebackTempBlockAtomicEvent
An event to writeback the tempBlock after recvAtomic finishes.
Definition base.hh:705
BaseTags * tags
Tag and data Storage.
Definition base.hh:357
const enums::Clusivity clusivity
Clusivity with respect to the upstream cache, determining if we fill into both this cache and the cac...
Definition base.hh:937
ProbePointArg< CacheAccessProbeArg > * ppMiss
To probe when a cache miss occurs.
Definition base.hh:372
virtual bool sendMSHRQueuePacket(MSHR *mshr)
Take an MSHR, turn it into a suitable downstream packet, and send it out.
Definition base.cc:1930
void maintainClusivity(bool from_cache, CacheBlk *blk)
Maintain the clusivity of this cache by potentially invalidating a block.
Definition base.cc:1559
System * system
System we are currently operating in.
Definition base.hh:988
partitioning_policy::PartitionManager * partitionManager
Partitioning manager.
Definition base.hh:363
Information provided to probes on a cache event.
Simple class to provide virtual print() method on cache blocks without allocating a vtable pointer fo...
Definition cache_blk.hh:573
A Basic Cache block.
Definition cache_blk.hh:72
void setWhenReady(const Tick tick)
Set tick at which block's data will be available for access.
Definition cache_blk.hh:281
@ ReadableBit
Read permission.
Definition cache_blk.hh:86
@ WritableBit
write permission
Definition cache_blk.hh:81
@ DirtyBit
dirty (modified)
Definition cache_blk.hh:88
uint32_t getSrcRequestorId() const
Get the requestor id associated to this block.
Definition cache_blk.hh:291
Tick getWhenReady() const
Get tick at which block's data will be available for access.
Definition cache_blk.hh:268
void clearPrefetched()
Clear the prefetching bit.
Definition cache_blk.hh:258
uint64_t getPartitionId() const
Getter for _partitionId.
Definition cache_blk.hh:294
std::string print() const override
Pretty-print tag, set and way, and interpret state bits to readable form including mapping to a MOESI...
Definition cache_blk.hh:372
bool isSet(unsigned bits) const
Checks the given coherence bits are set.
Definition cache_blk.hh:242
bool checkWrite(PacketPtr pkt)
Handle interaction of load-locked operations and stores.
Definition cache_blk.hh:420
void clearCoherenceBits(unsigned bits)
Clear the corresponding coherence bits.
Definition cache_blk.hh:234
uint32_t getTaskId() const
Get the task id associated to this block.
Definition cache_blk.hh:288
void trackLoadLocked(PacketPtr pkt)
Track the fact that a local locked was issued to the block.
Definition cache_blk.hh:335
bool wasPrefetched() const
Check if this block was the result of a hardware prefetch, yet to be touched.
Definition cache_blk.hh:252
uint8_t * data
Contains a copy of the data in this block for easy access.
Definition cache_blk.hh:104
void setCoherenceBits(unsigned bits)
Sets the corresponding coherence bits.
Definition cache_blk.hh:223
A coherent cache that can be arranged in flexible topologies.
Definition cache.hh:68
ClockedObject(const ClockedObjectParams &p)
Tick clockEdge(Cycles cycles=Cycles(0)) const
Determine the tick when a cycle begins, by default the current one, but the argument also enables the...
Tick cyclesToTicks(Cycles c) const
Tick clockPeriod() const
Cycles ticksToCycles(Tick t) const
A superblock is composed of sub-blocks, and each sub-block has information regarding its superblock a...
Definition super_blk.hh:52
std::size_t getSizeBits() const
Definition super_blk.cc:93
void setSizeBits(const std::size_t size)
Set size, in bits, of this compressed block's data.
Definition super_blk.cc:99
void setDecompressionLatency(const Cycles lat)
Set number of cycles needed to decompress this block.
Definition super_blk.cc:135
OverwriteType
When an overwrite happens, the data size may change an not fit in its current container any longer.
Definition super_blk.hh:75
@ DATA_EXPANSION
New data contents are considered larger than previous contents.
Definition super_blk.hh:81
@ DATA_CONTRACTION
New data contents are considered smaller than previous contents.
Definition super_blk.hh:77
OverwriteType checkExpansionContraction(const std::size_t size) const
Determines if changing the size of the block will cause a data expansion (new size is bigger) or cont...
Definition super_blk.cc:148
Cycles is a wrapper class for representing cycle counts, i.e.
Definition types.hh:79
Miss Status and handling Register.
Definition mshr.hh:75
bool wasWholeLineWrite
Track if we sent this as a whole line write or not.
Definition mshr.hh:124
bool isPendingModified() const
Definition mshr.hh:326
void promoteReadable()
Promotes deferred targets that do not require writable.
Definition mshr.cc:655
bool isCleaning() const
Definition mshr.hh:321
int getNumTargets() const
Returns the current number of allocated targets.
Definition mshr.hh:446
QueueEntry::Target * getTarget() override
Returns a reference to the first target.
Definition mshr.hh:473
bool needsWritable() const
The pending* and post* flags are only valid if inService is true.
Definition mshr.hh:319
bool isForward
True if the entry is just a simple forward from an upper level.
Definition mshr.hh:127
bool hasLockedRMWReadTarget()
Determine if there are any LockedRMWReads in the Targets list.
Definition mshr.cc:790
bool promoteDeferredTargets()
Definition mshr.cc:593
bool isWholeLineWrite() const
Check if this MSHR contains only compatible writes, and if they span the entire cache line.
Definition mshr.hh:406
void allocateTarget(PacketPtr target, Tick when, Counter order, bool alloc_on_fill)
Add a request to the list of targets.
Definition mshr.cc:373
void promoteWritable()
Promotes deferred targets that do not require writable.
Definition mshr.cc:676
bool allocOnFill() const
Definition mshr.hh:340
@ WritebackDirty
Definition packet.hh:93
@ LockedRMWWriteReq
Definition packet.hh:118
@ WritebackClean
Definition packet.hh:94
@ LockedRMWWriteResp
Definition packet.hh:119
const std::string _name
Definition named.hh:54
virtual std::string name() const
Definition named.hh:60
bool waitingOnRetry
Remember whether we're awaiting a retry.
void schedSendEvent(Tick when)
Schedule a send event if we are not already waiting for a retry.
Tick deferredPacketReadyTime() const
Get the next packet ready time.
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295
bool isUpgrade() const
Definition packet.hh:596
bool isRead() const
Definition packet.hh:593
bool isSecure() const
Definition packet.hh:836
const PacketId id
Definition packet.hh:374
void writeDataToBlock(uint8_t *blk_data, int blkSize) const
Copy data from the packet to the provided block pointer, which is aligned to the given block size.
Definition packet.hh:1346
Addr getAddr() const
Definition packet.hh:807
void pushLabel(const std::string &lbl)
Push label for PrintReq (safe to call unconditionally).
Definition packet.hh:1470
bool isError() const
Definition packet.hh:622
bool isLockedRMW() const
Definition packet.hh:621
void setWriteThrough()
A writeback/writeclean cmd gets propagated further downstream by the receiver when the flag is set.
Definition packet.hh:735
bool isAtomicOp() const
Definition packet.hh:846
bool isResponse() const
Definition packet.hh:598
void makeTimingResponse()
Definition packet.hh:1080
bool needsWritable() const
Definition packet.hh:599
void print(std::ostream &o, int verbosity=0, const std::string &prefix="") const
Definition packet.cc:368
bool isDemand() const
Definition packet.hh:595
bool isCleanEviction() const
Is this packet a clean eviction, including both actual clean evict packets, but also clean writebacks...
Definition packet.hh:1435
bool needsResponse() const
Definition packet.hh:608
void dataStatic(T *p)
Set the data pointer to the following value that should not be freed.
Definition packet.hh:1175
SenderState * senderState
This packet's sender state.
Definition packet.hh:545
uint32_t payloadDelay
The extra pipelining delay from seeing the packet until the end of payload is transmitted by the comp...
Definition packet.hh:449
void makeResponse()
Take a request packet and modify it in place to be suitable for returning as a response to that reque...
Definition packet.hh:1062
uint32_t headerDelay
The extra delay from seeing the packet until the header is transmitted.
Definition packet.hh:431
Addr getOffset(unsigned int blk_size) const
Definition packet.hh:826
void clearBlockCached()
Definition packet.hh:761
void pushSenderState(SenderState *sender_state)
Push a new sender state to the packet and make the current sender state the predecessor of the new on...
Definition packet.cc:334
bool hasData() const
Definition packet.hh:614
SenderState * popSenderState()
Pop the top of the state stack and return a pointer to it.
Definition packet.cc:342
bool hasRespData() const
Definition packet.hh:615
bool writeThrough() const
Definition packet.hh:742
bool fromCache() const
Definition packet.hh:612
void setData(const uint8_t *p)
Copy data into the packet from the provided pointer.
Definition packet.hh:1293
bool isWrite() const
Definition packet.hh:594
void setDataFromBlock(const uint8_t *blk_data, int blkSize)
Copy data into the packet from the provided block pointer, which is aligned to the given block size.
Definition packet.hh:1312
bool trySatisfyFunctional(PacketPtr other)
Check a functional request against a memory value stored in another packet (i.e.
Definition packet.hh:1399
Addr getBlockAddr(unsigned int blk_size) const
Definition packet.hh:831
RequestPtr req
A pointer to the original request.
Definition packet.hh:377
unsigned getSize() const
Definition packet.hh:817
AtomicOpFunctor * getAtomicOp() const
Accessor function to atomic op.
Definition packet.hh:845
void setCacheResponding()
Snoop flags.
Definition packet.hh:653
bool isClean() const
Definition packet.hh:611
void popLabel()
Pop label for PrintReq (safe to call unconditionally).
Definition packet.hh:1480
bool isExpressSnoop() const
Definition packet.hh:702
bool isWriteback() const
Definition packet.hh:613
const T * getConstPtr() const
Definition packet.hh:1234
void setHasSharers()
On fills, the hasSharers flag is used by the caches in combination with the cacheResponding flag,...
Definition packet.hh:685
bool isLLSC() const
Definition packet.hh:620
bool cacheResponding() const
Definition packet.hh:659
void makeAtomicResponse()
Definition packet.hh:1074
void setSatisfied()
Set when a request hits in a cache and the cache is not going to respond.
Definition packet.hh:749
MemCmd cmd
The command field of the packet.
Definition packet.hh:372
bool isInvalidate() const
Definition packet.hh:609
void writeData(uint8_t *p) const
Copy data from the packet to the memory at the provided pointer.
Definition packet.hh:1322
bool hasSharers() const
Definition packet.hh:686
void allocate()
Allocate memory for the packet.
Definition packet.hh:1367
bool isEviction() const
Definition packet.hh:610
bool isRequest() const
Definition packet.hh:597
Ports are used to interface objects to each other.
Definition port.hh:62
ProbePointArg generates a point for the class of Arg.
Definition probe.hh:273
A queue entry is holding packets that will be serviced as soon as resources are available.
const Tick recvTime
Time when request was received (for stats)
PacketPtr pkt
Pending request packet.
A queue entry base class, to be used by both the MSHRs and write-queue entries.
virtual bool sendPacket(BaseCache &cache)=0
Send this queue entry as a downstream packet, with the exact behaviour depending on the specific entr...
virtual Target * getTarget()=0
Returns a pointer to the first target.
Addr blkAddr
Block aligned address.
Counter order
Order number assigned to disambiguate writes and misses.
bool inService
True if the entry has been sent downstream.
bool isSecure
True if the entry targets the secure memory space.
QueuedResponsePort(const std::string &name, RespPacketQueue &resp_queue, PortID id=InvalidPortID)
Create a QueuedPort with a given name, owner, and a supplied implementation of a packet queue.
Definition qport.hh:80
@ SECURE
The request targets the secure memory space.
Definition request.hh:186
@ funcRequestorId
This requestor id is used for functional requests that don't come from a particular device.
Definition request.hh:282
@ wbRequestorId
This requestor id is used for writeback requests by the caches.
Definition request.hh:277
gem5::Flags< FlagsType > Flags
Definition request.hh:102
void sendRetryReq()
Send a retry to the request port that previously attempted a sendTimingReq to this response port and ...
Definition port.hh:489
std::vector< SectorSubBlk * > blks
List of blocks associated to this sector.
SectorBlk * getSectorBlock() const
Get sector block associated to this block.
Definition sector_blk.cc:52
A basic compression superblock.
Definition super_blk.hh:171
virtual bool isValid() const
Checks if the entry is valid.
bool isSecure() const
Check if this block holds data from the secure memory space.
Special instance of CacheBlk for use with tempBlk that deals with its block address regeneration.
Definition cache_blk.hh:517
const uint32_t noAllocateLimit
Definition base.hh:1459
const uint32_t delayThreshold
The number of times the allocator will delay an WriteReq MSHR.
Definition base.hh:1463
std::unordered_map< Addr, Counter > delayCtr
Keep track of the number of times the allocator has delayed an WriteReq MSHR.
Definition base.hh:1469
void updateMode(Addr write_addr, unsigned write_size, Addr blk_addr)
Update the write mode based on the current write packet.
Definition base.cc:2768
const uint32_t coalesceLimit
Limits for when to switch between the different write modes.
Definition base.hh:1458
uint32_t byteCount
Bytes written contiguously.
Definition base.hh:1453
void resetDelay(Addr blk_addr)
Clear delay counter for the input block.
Definition base.hh:1416
Addr nextAddr
Address to match writes against to detect streams.
Definition base.hh:1447
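Together, nextAddr and byteCount implement the stream detector behind updateMode(); a condensed sketch of the idea (simplified, not the exact gem5 code):

// A write that lands exactly at nextAddr extends the current run;
// anything else restarts the count. byteCount is later compared
// against coalesceLimit and noAllocateLimit to pick the write mode.
void
updateModeSketch(gem5::Addr write_addr, unsigned write_size)
{
    if (write_addr == nextAddr)
        byteCount += write_size;   // contiguous stream continues
    else
        byteCount = write_size;    // stream broken: start a new run
    nextAddr = write_addr + write_size;
}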
int getNumTargets() const
Returns the current number of allocated targets.
Target * getTarget() override
Returns a pointer to the first target.
STL vector class.
Definition stl.hh:37
Declaration of a compressed set associative tag store using superblocks.
#define ADD_STAT(n,...)
Convenience macro to add a stat to a statistics group.
Definition group.hh:75
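ADD_STAT is used in the member-initialiser list of a statistics::Group constructor; a minimal example with a hypothetical ExampleStats group:

#include "base/stats/group.hh"
#include "base/statistics.hh"

ExampleStats::ExampleStats(gem5::statistics::Group *parent)
    : gem5::statistics::Group(parent),
      // ADD_STAT(hits, ...) expands to hits(this, "hits", ...).
      ADD_STAT(hits, gem5::statistics::units::Count::get(),
               "Number of hits"),
      ADD_STAT(misses, gem5::statistics::units::Count::get(),
               "Number of misses")
{
}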
std::list< AddrRange > AddrRangeList
Convenience typedef for a collection of address ranges.
Definition addr_range.hh:64
static const Priority Delayed_Writeback_Pri
For some reason "delayed" inter-cluster writebacks are scheduled before regular writebacks (which have default priority).
Definition eventq.hh:175
void schedule(Event &event, Tick when)
Definition eventq.hh:1012
#define panic(...)
This implements a cprintf based panic() function.
Definition logging.hh:220
#define fatal_if(cond,...)
Conditional fatal macro that checks the supplied condition and only causes a fatal error if the condition is true.
Definition logging.hh:268
#define gem5_assert(cond,...)
The assert macro will function like a normal assert, but will use panic instead of straight abort().
Definition logging.hh:349
#define fatal(...)
This implements a cprintf based fatal() function.
Definition logging.hh:232
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
Definition logging.hh:246
ProbeManager * getProbeManager()
Get the probe manager for this object.
virtual Port & getPort(const std::string &if_name, PortID idx=InvalidPortID)
Get a port with a given name and index.
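A getPort() override conventionally dispatches on the port name and defers to the base class otherwise; a sketch with hypothetical member names (BaseCache::getPort in this file has the same shape):

gem5::Port &
ExampleObject::getPort(const std::string &if_name, gem5::PortID idx)
{
    if (if_name == "mem_side_port")
        return memSidePort;   // illustrative member ports
    else if (if_name == "cpu_side_port")
        return cpuSidePort;
    // Unknown name: let the base class handle (or fault on) it.
    return SimObject::getPort(if_name, idx);
}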
virtual void regStats()
Callback to set stat parameters.
Definition group.cc:68
#define warn(...)
Definition logging.hh:288
#define warn_once(...)
Definition logging.hh:292
#define warn_if(cond,...)
Conditional warning macro that checks the supplied condition and only prints a warning if the condition is true.
Definition logging.hh:315
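The logging macros above all take a cprintf-style format string; an illustrative use in a hypothetical helper:

#include "base/logging.hh"

void
checkBlockSize(unsigned blk_size)
{
    // Unrecoverable configuration error: print and exit.
    fatal_if(blk_size == 0, "Block size must be non-zero");
    // Logic error in the simulator itself: panic instead.
    panic_if(blk_size & (blk_size - 1),
             "Block size %u is not a power of two", blk_size);
    // Non-fatal diagnostic.
    warn_if(blk_size > 256, "Unusually large block size: %u", blk_size);
}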
#define SUM_DEMAND(s)
#define SUM_NON_DEMAND(s)
Declares a basic cache interface BaseCache.
Definition of a basic cache compressor.
Miss and writeback queue declarations.
Miss Status and Handling Register (MSHR) declaration.
Declaration of a structure to manage MSHRs.
Bitfield< 7 > i
Definition misc_types.hh:67
Bitfield< 23, 0 > offset
Definition types.hh:144
Bitfield< 29 > c
Definition misc_types.hh:53
Bitfield< 0 > p
Bitfield< 15 > system
Definition misc.hh:1032
Bitfield< 3 > addr
Definition types.hh:84
Units for Stats.
Definition units.hh:113
const FlagsType nonan
Don't print if this is NAN.
Definition info.hh:69
const FlagsType nozero
Don't print if this is zero.
Definition info.hh:67
const FlagsType total
Print the total.
Definition info.hh:59
std::shared_ptr< Request > RequestPtr
Definition request.hh:94
Tick curTick()
The universal simulation clock.
Definition cur_tick.hh:46
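curTick() is the usual anchor when scheduling events (see the schedule() entry above); for example, from inside a SimObject, where sendRetryEvent is a hypothetical member Event:

#include "sim/cur_tick.hh"

void
ExampleObject::requestRetryLater()
{
    // schedule() takes an absolute tick, so offsets are added to
    // the current simulated time.
    schedule(sendRetryEvent, gem5::curTick() + 1000);
}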
std::ostream CheckpointOut
Definition serialize.hh:66
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition types.hh:147
int16_t PortID
Port index/ID type, and a symbolic name for an invalid port id.
Definition types.hh:245
uint64_t Tick
Tick count type.
Definition types.hh:58
uint64_t PacketId
Definition packet.hh:74
const Tick MaxTick
Definition types.hh:60
Packet * PacketPtr
std::list< PacketPtr > PacketList
Definition packet.hh:73
static constexpr auto genTagExtractor(BTBIndexingPolicy *ip)
This helper generates a tag extractor function object which will typically be used by Replaceable entries.
Definition btb_entry.hh:281
Generic queue entry.
#define UNSERIALIZE_SCALAR(scalar)
Definition serialize.hh:575
#define SERIALIZE_SCALAR(scalar)
Definition serialize.hh:568
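SERIALIZE_SCALAR and UNSERIALIZE_SCALAR store and restore a member under its own name in a checkpoint section; a minimal sketch with a hypothetical ExampleObject and member counter:

#include "sim/serialize.hh"

void
ExampleObject::serialize(gem5::CheckpointOut &cp) const
{
    SERIALIZE_SCALAR(counter);    // writes "counter=<value>"
}

void
ExampleObject::unserialize(gem5::CheckpointIn &cp)
{
    UNSERIALIZE_SCALAR(counter);  // reads it back; errors if missing
}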
statistics::Formula accesses
The number of accesses per command and thread.
Definition base.hh:1021
statistics::Formula avgMshrMissLatency
The average latency of an MSHR miss, per command and thread.
Definition base.hh:1039
void regStatsFromParent()
Callback to register stats from parent CacheStats::regStats().
Definition base.cc:2129
statistics::Formula avgMshrUncacheableLatency
The average latency of an uncacheable MSHR access, per command and thread.
Definition base.hh:1041
statistics::Vector misses
Number of misses per thread for each type of command.
Definition base.hh:1009
statistics::Formula missRate
The miss rate per command and thread.
Definition base.hh:1023
statistics::Vector missLatency
Total number of ticks per thread/command spent waiting for a miss.
Definition base.hh:1019
statistics::Formula mshrMissRate
The miss rate in the MSHRs per command and thread.
Definition base.hh:1037
const BaseCache & cache
Definition base.hh:1002
statistics::Vector mshrUncacheableLatency
Total tick latency of uncacheable MSHR accesses, per command and thread.
Definition base.hh:1035
statistics::Vector hitLatency
Total number of ticks per thread/command spent waiting for a hit.
Definition base.hh:1014
statistics::Vector mshrHits
Number of misses that hit in the MSHRs per command and thread.
Definition base.hh:1027
statistics::Vector mshrUncacheable
Number of uncacheable accesses, per command and thread.
Definition base.hh:1031
CacheCmdStats(BaseCache &c, const std::string &name)
Definition base.cc:2089
statistics::Formula avgMissLatency
The average miss latency per command and thread.
Definition base.hh:1025
statistics::Vector mshrMisses
Number of misses that miss in the MSHRs, per command and thread.
Definition base.hh:1029
statistics::Vector mshrMissLatency
Total tick latency of each MSHR miss, per command and thread.
Definition base.hh:1033
statistics::Vector hits
Number of hits per thread for each type of command.
Definition base.hh:1006
statistics::Formula overallMshrMissLatency
Total tick latency of overall MSHR misses.
Definition base.hh:1117
statistics::Formula demandMshrMissLatency
Total tick latency of demand MSHR misses.
Definition base.hh:1115
statistics::Formula overallAvgMshrUncacheableLatency
The average overall latency of an uncacheable MSHR access.
Definition base.hh:1133
const BaseCache & cache
Definition base.hh:1054
statistics::Formula demandHits
Number of hits for demand accesses.
Definition base.hh:1057
statistics::Formula demandHitLatency
Total number of ticks spent waiting for demand hits.
Definition base.hh:1061
statistics::Formula demandAccesses
The number of demand accesses.
Definition base.hh:1076
statistics::Scalar replacements
Number of replacements of valid blocks.
Definition base.hh:1136
statistics::Formula overallAvgMshrMissLatency
The average overall latency of an MSHR miss.
Definition base.hh:1130
statistics::Formula demandMissRate
The miss rate of all demand accesses.
Definition base.hh:1081
statistics::Formula overallMissRate
The miss rate for all accesses.
Definition base.hh:1083
statistics::Formula demandAvgMshrMissLatency
The average latency of a demand MSHR miss.
Definition base.hh:1128
statistics::Formula demandMshrMisses
Demand misses that miss in the MSHRs.
Definition base.hh:1107
statistics::Formula overallMshrMisses
Total number of misses that miss in the MSHRs.
Definition base.hh:1109
statistics::Formula overallMshrHits
Total number of misses that hit in the MSHRs.
Definition base.hh:1104
statistics::Formula overallHitLatency
Total number of ticks spent waiting for all hits.
Definition base.hh:1063
statistics::Scalar dataContractions
Number of data contractions (blocks that had their compression factor improved).
Definition base.hh:1145
CacheStats(BaseCache &c)
Definition base.cc:2262
void regStats() override
Callback to set stat parameters.
Definition base.cc:2346
statistics::Scalar dataExpansions
Number of data expansions.
Definition base.hh:1139
statistics::Formula overallMshrUncacheable
Total number of uncacheable MSHR accesses.
Definition base.hh:1112
statistics::Formula demandMissLatency
Total number of ticks spent waiting for demand misses.
Definition base.hh:1071
statistics::Formula overallMisses
Number of misses for all accesses.
Definition base.hh:1068
statistics::Formula overallMshrMissRate
The overall miss rate in the MSHRs.
Definition base.hh:1125
statistics::Formula overallAccesses
The number of overall accesses.
Definition base.hh:1078
std::vector< std::unique_ptr< CacheCmdStats > > cmd
Per-command statistics.
Definition base.hh:1148
statistics::Formula demandMshrMissRate
The demand miss rate in the MSHRs.
Definition base.hh:1123
statistics::Formula avgBlocked
The average number of cycles blocked for each blocked cause.
Definition base.hh:1096
statistics::Formula overallMshrUncacheableLatency
Total tick latency of overall uncacheable MSHR accesses.
Definition base.hh:1120
statistics::Formula demandMisses
Number of misses for demand accesses.
Definition base.hh:1066
statistics::Formula demandAvgMissLatency
The average miss latency for demand misses.
Definition base.hh:1086
statistics::Formula overallMissLatency
Total number of ticks spent waiting for all misses.
Definition base.hh:1073
statistics::Formula demandMshrHits
Demand misses that hit in the MSHRs.
Definition base.hh:1102
statistics::Formula overallAvgMissLatency
The average miss latency for all misses.
Definition base.hh:1088
statistics::Vector blockedCauses
The number of times this cache blocked for each blocked cause.
Definition base.hh:1093
statistics::Vector writebacks
Number of blocks written back per thread.
Definition base.hh:1099
statistics::Vector blockedCycles
The total number of cycles blocked for each blocked cause.
Definition base.hh:1091
statistics::Formula overallHits
Number of hits for all accesses.
Definition base.hh:1059
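These Formula members are wired together in CacheStats::regStats(); the derived rates and averages follow the pattern below (a simplified excerpt of the shape used in base.cc, not the full list):

// Inside CacheStats::regStats(): ratios are defined once as
// formulas and evaluated lazily when statistics are dumped.
demandMissRate = demandMisses / demandAccesses;
overallMissRate = overallMisses / overallAccesses;
demandAvgMissLatency = demandMissLatency / demandMisses;
demandMshrMissRate = demandMshrMisses / demandAccesses;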
A data contents update is composed of the updated block's address, the old contents, and the new contents.
bool hwPrefetched
Set if the update is from a prefetch or from evicting a prefetched block that was never used.
std::vector< uint64_t > newData
The new data contents.
std::vector< uint64_t > oldData
The stale data contents.
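A DataUpdate record is populated and handed to the cache's data-update probe point roughly as follows. A sketch: the two-argument constructor and the ppDataUpdate notify call mirror this file's usage, while blk_addr, blk_is_secure, old_begin/old_end, new_begin/new_end, and blk_was_prefetched are illustrative placeholders:

// Capture the old and new contents of a block for probe listeners.
gem5::BaseCache::DataUpdate update(blk_addr, blk_is_secure);
update.oldData = std::vector<uint64_t>(old_begin, old_end);
// ... block data is modified here ...
update.newData = std::vector<uint64_t>(new_begin, new_end);
update.hwPrefetched = blk_was_prefetched;
ppDataUpdate->notify(update);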
const std::string & name()
Definition trace.cc:48

Generated on Mon Oct 27 2025 04:13:00 for gem5 by doxygen 1.14.0