gem5
v19.0.0.0
|
#include <bop.hh>
Classes | |
struct | DelayQueueEntry |
In a first implementation of the BO prefetcher, both banks of the RR were written simultaneously when a prefetched line was inserted into the cache. More... | |
Public Member Functions | |
BOPPrefetcher (const BOPPrefetcherParams *p) | |
Copyright (c) 2018 Metempsy Technology Consulting All rights reserved. More... | |
~BOPPrefetcher () | |
void | calculatePrefetch (const PrefetchInfo &pfi, std::vector< AddrPriority > &addresses) override |
![]() | |
QueuedPrefetcher (const QueuedPrefetcherParams *p) | |
virtual | ~QueuedPrefetcher () |
void | notify (const PacketPtr &pkt, const PrefetchInfo &pfi) override |
Notify prefetcher of cache access (may be any access or just misses, depending on cache parameters.) More... | |
void | insert (const PacketPtr &pkt, PrefetchInfo &new_pfi, int32_t priority) |
PacketPtr | getPacket () override |
Tick | nextPrefetchReadyTime () const override |
void | regStats () override |
Register local statistics. More... | |
![]() | |
BasePrefetcher (const BasePrefetcherParams *p) | |
virtual | ~BasePrefetcher () |
virtual void | setCache (BaseCache *_cache) |
void | regProbeListeners () override |
Register probe points for this object. More... | |
void | probeNotify (const PacketPtr &pkt, bool miss) |
Process a notification event from the ProbeListener. More... | |
void | addEventProbe (SimObject *obj, const char *name) |
Add a SimObject and a probe name to listen events from. More... | |
void | addTLB (BaseTLB *tlb) |
Add a BaseTLB object to be used whenever a translation is needed. More... | |
![]() | |
ClockedObject (const ClockedObjectParams *p) | |
const Params * | params () const |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
Enums::PwrState | pwrState () const |
std::string | pwrStateName () const |
std::vector< double > | pwrStateWeights () const |
Returns the percentage residency for each power state. More... | |
void | computeStats () |
Record stats values like state residency by computing the time difference from previous update. More... | |
void | pwrState (Enums::PwrState) |
![]() | |
const Params * | params () const |
SimObject (const Params *_params) | |
virtual | ~SimObject () |
virtual const std::string | name () const |
virtual void | init () |
init() is called after all C++ SimObjects have been created and all ports are connected. More... | |
virtual void | loadState (CheckpointIn &cp) |
loadState() is called on each SimObject when restoring from a checkpoint. More... | |
virtual void | initState () |
initState() is called on each SimObject when not restoring from a checkpoint. More... | |
virtual void | regProbePoints () |
Register probe points for this object. More... | |
ProbeManager * | getProbeManager () |
Get the probe manager for this object. More... | |
virtual Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) |
Get a port with a given name and index. More... | |
virtual void | startup () |
startup() is the final initialization call before simulation. More... | |
DrainState | drain () override |
Provide a default implementation of the drain interface for objects that don't need draining. More... | |
virtual void | memWriteback () |
Write back dirty buffers to memory using functional writes. More... | |
virtual void | memInvalidate () |
Invalidate the contents of memory buffers. More... | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
![]() | |
EventManager (EventManager &em) | |
EventManager (EventManager *em) | |
EventManager (EventQueue *eq) | |
EventQueue * | eventQueue () const |
void | schedule (Event &event, Tick when) |
void | deschedule (Event &event) |
void | reschedule (Event &event, Tick when, bool always=false) |
void | schedule (Event *event, Tick when) |
void | deschedule (Event *event) |
void | reschedule (Event *event, Tick when, bool always=false) |
void | wakeupEventQueue (Tick when=(Tick) -1) |
void | setCurTick (Tick newVal) |
![]() | |
Serializable () | |
virtual | ~Serializable () |
void | serializeSection (CheckpointOut &cp, const char *name) const |
Serialize an object into a new section. More... | |
void | serializeSection (CheckpointOut &cp, const std::string &name) const |
void | unserializeSection (CheckpointIn &cp, const char *name) |
Unserialize a child object. More... | |
void | unserializeSection (CheckpointIn &cp, const std::string &name) |
![]() | |
DrainState | drainState () const |
Return the current drain state of an object. More... | |
virtual void | notifyFork () |
Notify a child process of a fork. More... | |
![]() | |
Group ()=delete | |
Group (const Group &)=delete | |
Group & | operator= (const Group &)=delete |
Group (Group *parent, const char *name=nullptr) | |
Construct a new statistics group. More... | |
virtual | ~Group () |
virtual void | resetStats () |
Callback to reset stats. More... | |
virtual void | preDumpStats () |
Callback before stats are dumped. More... | |
void | addStat (Stats::Info *info) |
Register a stat with this group. More... | |
const std::map< std::string, Group * > & | getStatGroups () const |
Get all child groups associated with this object. More... | |
const std::vector< Info * > & | getStats () const |
Get all stats associated with this object. More... | |
void | addStatGroup (const char *name, Group *block) |
Add a stat block as a child of this block. More... | |
![]() | |
void | updateClockPeriod () |
Update the tick to the current tick. More... | |
Tick | clockEdge (Cycles cycles=Cycles(0)) const |
Determine the tick when a cycle begins, by default the current one, but the argument also enables the caller to determine a future cycle. More... | |
Cycles | curCycle () const |
Determine the current cycle, corresponding to a tick aligned to a clock edge. More... | |
Tick | nextCycle () const |
Based on the clock of the object, determine the start tick of the first cycle that is at least one cycle in the future. More... | |
uint64_t | frequency () const |
Tick | clockPeriod () const |
double | voltage () const |
Cycles | ticksToCycles (Tick t) const |
Tick | cyclesToTicks (Cycles c) const |
Private Types | |
enum | RRWay { Left, Right } |
typedef std::pair< int16_t, uint8_t > | OffsetListEntry |
Structure to save the offset and the score. More... | |
Private Member Functions | |
void | delayQueueEventWrapper () |
Event to handle the delay queue processing. More... | |
unsigned int | hash (Addr addr, unsigned int way) const |
Generate a hash for the specified address to index the RR table. More... | |
void | insertIntoRR (Addr addr, unsigned int way) |
Insert the specified address into the RR table. More... | |
void | insertIntoDelayQueue (Addr addr) |
Insert the specified address into the delay queue. More... | |
void | resetScores () |
Reset all the scores from the offset list. More... | |
Addr | tag (Addr addr) const |
Generate the tag for the specified address based on the tag bits and the block size. More... | |
bool | testRR (Addr) const |
Test if -O is hitting in the RR table to update the offset score. More... | |
void | bestOffsetLearning (Addr) |
Learning phase of the BOP. More... | |
void | notifyFill (const PacketPtr &pkt) override |
Update the RR right table after a prefetch fill. More... | |
Private Attributes | |
const unsigned int | scoreMax |
Learning phase parameters. More... | |
const unsigned int | roundMax |
const unsigned int | badScore |
const unsigned int | rrEntries |
Recent requests table parameters. More... | |
const unsigned int | tagMask |
const bool | delayQueueEnabled |
Delay queue parameters. More... | |
const unsigned int | delayQueueSize |
const unsigned int | delayTicks |
std::vector< Addr > | rrLeft |
std::vector< Addr > | rrRight |
std::vector< OffsetListEntry > | offsetsList |
std::deque< DelayQueueEntry > | delayQueue |
EventFunctionWrapper | delayQueueEvent |
bool | issuePrefetchRequests |
Hardware prefetcher enabled. More... | |
Addr | bestOffset |
Current best offset to issue prefetches. More... | |
Addr | phaseBestOffset |
Current best offset found in the learning phase. More... | |
std::vector< OffsetListEntry >::iterator | offsetsListIterator |
Current test offset index. More... | |
unsigned int | bestScore |
Max score found so far. More... | |
unsigned int | round |
Current round. More... | |
Additional Inherited Members | |
![]() | |
using | AddrPriority = std::pair< Addr, int32_t > |
![]() | |
typedef ClockedObjectParams | Params |
Parameters of ClockedObject. More... | |
![]() | |
typedef SimObjectParams | Params |
![]() | |
static void | serializeAll (CheckpointOut &cp) |
Serialize all SimObjects in the system. More... | |
static SimObject * | find (const char *name) |
Find the SimObject with the given name and return a pointer to it. More... | |
![]() | |
static const std::string & | currentSection () |
Get the fully-qualified name of the active section. More... | |
static void | serializeAll (const std::string &cpt_dir) |
static void | unserializeGlobals (CheckpointIn &cp) |
![]() | |
static int | ckptCount = 0 |
static int | ckptMaxCount = 0 |
static int | ckptPrevCount = -1 |
![]() | |
using | const_iterator = std::list< DeferredPacket >::const_iterator |
using | iterator = std::list< DeferredPacket >::iterator |
![]() | |
bool | observeAccess (const PacketPtr &pkt, bool miss) const |
Determine if this access should be observed. More... | |
bool | inCache (Addr addr, bool is_secure) const |
Determine if address is in cache. More... | |
bool | inMissQueue (Addr addr, bool is_secure) const |
Determine if address is in cache miss queue. More... | |
bool | hasBeenPrefetched (Addr addr, bool is_secure) const |
bool | samePage (Addr a, Addr b) const |
Determine if addresses are on the same page. More... | |
Addr | blockAddress (Addr a) const |
Determine the address of the block in which a lies. More... | |
Addr | blockIndex (Addr a) const |
Determine the address of a at block granularity. More... | |
Addr | pageAddress (Addr a) const |
Determine the address of the page in which a lies. More... | |
Addr | pageOffset (Addr a) const |
Determine the page-offset of a. More... | |
Addr | pageIthBlockAddress (Addr page, uint32_t i) const |
Build the address of the i-th block inside the page. More... | |
![]() | |
Drainable () | |
virtual | ~Drainable () |
virtual void | drainResume () |
Resume execution after a successful drain. More... | |
void | signalDrainDone () const |
Signal that an object is drained. More... | |
![]() | |
Clocked (ClockDomain &clk_domain) | |
Create a clocked object and set the clock domain based on the parameters. More... | |
Clocked (Clocked &)=delete | |
Clocked & | operator= (Clocked &)=delete |
virtual | ~Clocked () |
Virtual destructor due to inheritance. More... | |
void | resetClock () const |
Reset the object's clock using the current global tick value. More... | |
virtual void | clockPeriodUpdated () |
A hook subclasses can implement so they can do any extra work that's needed when the clock rate is changed. More... | |
![]() | |
std::list< DeferredPacket > | pfq |
std::list< DeferredPacket > | pfqMissingTranslation |
const unsigned | queueSize |
Maximum size of the prefetch queue. More... | |
const unsigned | missingTranslationQueueSize |
Maximum size of the queue holding prefetch requests with missing address translations. More... | |
const Cycles | latency |
Cycles after generation when a prefetch can first be issued. More... | |
const bool | queueSquash |
Squash queued prefetch if demand access observed. More... | |
const bool | queueFilter |
Filter prefetches if already queued. More... | |
const bool | cacheSnoop |
Snoop the cache before generating prefetch (cheating basically) More... | |
const bool | tagPrefetch |
Tag prefetch with PC of generating access? More... | |
const unsigned int | throttleControlPct |
Percentage of requests that can be throttled. More... | |
Stats::Scalar | pfIdentified |
Stats::Scalar | pfBufferHit |
Stats::Scalar | pfInCache |
Stats::Scalar | pfRemovedFull |
Stats::Scalar | pfSpanPage |
![]() | |
BaseCache * | cache |
Pointer to the parent cache. More... | |
unsigned | blkSize |
The block size of the parent cache. More... | |
unsigned | lBlkSize |
log_2(block size of the parent cache). More... | |
const bool | onMiss |
Only consult prefetcher on cache misses? More... | |
const bool | onRead |
Consult prefetcher on reads? More... | |
const bool | onWrite |
Consult prefetcher on writes? More... | |
const bool | onData |
Consult prefetcher on data accesses? More... | |
const bool | onInst |
Consult prefetcher on instruction accesses? More... | |
const MasterID | masterId |
Request id for prefetches. More... | |
const Addr | pageBytes |
const bool | prefetchOnAccess |
Prefetch on every access, not just misses. More... | |
const bool | useVirtualAddresses |
Use Virtual Addresses for prefetching. More... | |
Stats::Scalar | pfIssued |
uint64_t | issuedPrefetches |
Total prefetches issued. More... | |
uint64_t | usefulPrefetches |
Total prefetches that have been useful. More... | |
BaseTLB * | tlb |
Registered tlb for address translations. More... | |
![]() | |
Enums::PwrState | _currPwrState |
To keep track of the current power state. More... | |
Tick | prvEvalTick |
ClockedObject::ClockedObjectStats | stats |
![]() | |
const SimObjectParams * | _params |
Cached copy of the object parameters. More... | |
![]() | |
EventQueue * | eventq |
A pointer to this object's event queue. More... | |
|
private |
|
private |
BOPPrefetcher::BOPPrefetcher | ( | const BOPPrefetcherParams * | p | ) |
Copyright (c) 2018 Metempsy Technology Consulting All rights reserved.
Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: redistributions of source code must retain the above copyright notice, this list of conditions and the following disclaimer; redistributions in binary form must reproduce the above copyright notice, this list of conditions and the following disclaimer in the documentation and/or other materials provided with the distribution; neither the name of the copyright holders nor the names of its contributors may be used to endorse or promote products derived from this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
Authors: Ivan Pizarro
Definition at line 36 of file bop.cc.
References bestOffset, bestScore, BasePrefetcher::blkSize, delayQueueEventWrapper(), fatal, ArmISA::i, isPowerOf2(), issuePrefetchRequests, ArmISA::n, SimObject::name(), ArmISA::offset, offsetsList, offsetsListIterator, MipsISA::p, phaseBestOffset, round, rrEntries, rrLeft, and rrRight.
Referenced by notifyFill().
|
inline |
Definition at line 151 of file bop.hh.
References calculatePrefetch().
|
private |
Learning phase of the BOP.
Update the intermediate values of the round and update the best offset if found
Definition at line 184 of file bop.cc.
References badScore, bestOffset, bestScore, DPRINTF, issuePrefetchRequests, offsetsList, offsetsListIterator, phaseBestOffset, resetScores(), round, roundMax, scoreMax, and testRR().
Referenced by calculatePrefetch().
|
overridevirtual |
Implements QueuedPrefetcher.
Definition at line 225 of file bop.cc.
References addr, bestOffset, bestOffsetLearning(), delayQueueEnabled, DPRINTF, BasePrefetcher::PrefetchInfo::getAddr(), insertIntoDelayQueue(), insertIntoRR(), issuePrefetchRequests, BasePrefetcher::lBlkSize, and tag().
Referenced by ~BOPPrefetcher().
|
private |
Event to handle the delay queue processing.
Definition at line 96 of file bop.cc.
References curTick(), delayQueue, delayQueueEvent, insertIntoRR(), and EventManager::schedule().
Referenced by BOPPrefetcher().
|
private |
Generate a hash for the specified address to index the RR table.
addr | address to hash |
way | RR table being addressed (left/right) |
Definition at line 113 of file bop.cc.
References floorLog2(), and rrEntries.
Referenced by insertIntoRR().
|
private |
Insert the specified address into the delay queue.
This will trigger an event after the delay cycles pass
addr | address to insert into the delay queue |
Definition at line 134 of file bop.cc.
References curTick(), delayQueue, delayQueueEvent, delayQueueSize, delayTicks, EventManager::schedule(), and Event::scheduled().
Referenced by calculatePrefetch().
|
private |
Insert the specified address into the RR table.
addr | address to insert |
way | RR table to which the address will be inserted |
Definition at line 121 of file bop.cc.
References addr, hash(), rrLeft, and rrRight.
Referenced by calculatePrefetch(), delayQueueEventWrapper(), and notifyFill().
|
overrideprivatevirtual |
Update the RR right table after a prefetch fill.
Reimplemented from BasePrefetcher.
Definition at line 251 of file bop.cc.
References bestOffset, BOPPrefetcher(), Packet::cmd, Packet::getAddr(), insertIntoRR(), MemCmd::isHWPrefetch(), issuePrefetchRequests, and tag().
|
private |
Reset all the scores from the offset list.
Definition at line 152 of file bop.cc.
References offsetsList.
Referenced by bestOffsetLearning().
Generate the tag for the specified address based on the tag bits and the block size.
addr | address to get the tag from |
Definition at line 160 of file bop.cc.
References BasePrefetcher::blkSize, and tagMask.
Referenced by calculatePrefetch(), and notifyFill().
|
private |
Test if -O is hitting in the RR table to update the offset score.
Definition at line 166 of file bop.cc.
References rrLeft, and rrRight.
Referenced by bestOffsetLearning().
|
private |
Definition at line 60 of file bop.hh.
Referenced by bestOffsetLearning().
|
private |
Current best offset to issue prefetches.
Definition at line 100 of file bop.hh.
Referenced by bestOffsetLearning(), BOPPrefetcher(), calculatePrefetch(), and notifyFill().
|
private |
Max score found so far.
Definition at line 106 of file bop.hh.
Referenced by bestOffsetLearning(), and BOPPrefetcher().
|
private |
Definition at line 91 of file bop.hh.
Referenced by delayQueueEventWrapper(), and insertIntoDelayQueue().
|
private |
|
private |
Definition at line 95 of file bop.hh.
Referenced by delayQueueEventWrapper(), and insertIntoDelayQueue().
|
private |
Definition at line 66 of file bop.hh.
Referenced by insertIntoDelayQueue().
|
private |
Definition at line 67 of file bop.hh.
Referenced by insertIntoDelayQueue().
|
private |
Hardware prefetcher enabled.
Definition at line 98 of file bop.hh.
Referenced by bestOffsetLearning(), BOPPrefetcher(), calculatePrefetch(), and notifyFill().
|
private |
Definition at line 74 of file bop.hh.
Referenced by bestOffsetLearning(), BOPPrefetcher(), and resetScores().
|
private |
Current test offset index.
Definition at line 104 of file bop.hh.
Referenced by bestOffsetLearning(), and BOPPrefetcher().
|
private |
Current best offset found in the learning phase.
Definition at line 102 of file bop.hh.
Referenced by bestOffsetLearning(), and BOPPrefetcher().
|
private |
Current round.
Definition at line 108 of file bop.hh.
Referenced by bestOffsetLearning(), and BOPPrefetcher().
|
private |
Definition at line 59 of file bop.hh.
Referenced by bestOffsetLearning().
|
private |
Recent requests table parameters.
Definition at line 62 of file bop.hh.
Referenced by BOPPrefetcher(), and hash().
|
private |
Definition at line 69 of file bop.hh.
Referenced by BOPPrefetcher(), insertIntoRR(), and testRR().
|
private |
Definition at line 70 of file bop.hh.
Referenced by BOPPrefetcher(), insertIntoRR(), and testRR().
|
private |
Learning phase parameters.
Definition at line 58 of file bop.hh.
Referenced by bestOffsetLearning().
|
private |