gem5  v20.0.0.3
lsq.hh
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2011-2012, 2014, 2018-2019 ARM Limited
3  * Copyright (c) 2013 Advanced Micro Devices, Inc.
4  * All rights reserved
5  *
6  * The license below extends only to copyright in the software and shall
7  * not be construed as granting a license to any other intellectual
8  * property including but not limited to intellectual property relating
9  * to a hardware implementation of the functionality of the software
10  * licensed hereunder. You may use the software subject to the license
11  * terms below provided that you ensure that this notice is replicated
12  * unmodified and in its entirety in all distributions of the software,
13  * modified or unmodified, in source code or in binary form.
14  *
15  * Copyright (c) 2004-2006 The Regents of The University of Michigan
16  * All rights reserved.
17  *
18  * Redistribution and use in source and binary forms, with or without
19  * modification, are permitted provided that the following conditions are
20  * met: redistributions of source code must retain the above copyright
21  * notice, this list of conditions and the following disclaimer;
22  * redistributions in binary form must reproduce the above copyright
23  * notice, this list of conditions and the following disclaimer in the
24  * documentation and/or other materials provided with the distribution;
25  * neither the name of the copyright holders nor the names of its
26  * contributors may be used to endorse or promote products derived from
27  * this software without specific prior written permission.
28  *
29  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
30  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
31  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
32  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
33  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
34  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
35  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
36  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
37  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
38  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
39  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
40  */
41 
42 #ifndef __CPU_O3_LSQ_HH__
43 #define __CPU_O3_LSQ_HH__
44 
45 #include <map>
46 #include <queue>
47 
48 #include "arch/generic/tlb.hh"
49 #include "cpu/inst_seq.hh"
50 #include "cpu/o3/lsq_unit.hh"
51 #include "cpu/utils.hh"
52 #include "enums/SMTQueuePolicy.hh"
53 #include "mem/port.hh"
54 #include "sim/sim_object.hh"
55 
56 struct DerivO3CPUParams;
57 
58 template <class Impl>
59 class FullO3CPU;
60 
61 template <class Impl>
62 class LSQ
63 
64 {
65  public:
66  typedef typename Impl::O3CPU O3CPU;
67  typedef typename Impl::DynInstPtr DynInstPtr;
68  typedef typename Impl::CPUPol::IEW IEW;
69  typedef typename Impl::CPUPol::LSQUnit LSQUnit;
70 
71  class LSQRequest;
74  {
75  protected:
78 
81  : _request(request), mainPkt(nullptr), pendingPacket(nullptr),
82  outstanding(0), isLoad(isLoad_), needWB(isLoad_), isSplit(false),
83  pktToSend(false), deleted(false)
84  { }
85  public:
86 
88  DynInstPtr inst;
94  uint8_t outstanding;
96  bool isLoad;
98  bool needWB;
100  bool isSplit;
102  bool pktToSend;
107  bool deleted;
108  ContextID contextId() { return inst->contextId(); }
109 
111  inline bool isComplete() { return outstanding == 0; }
112  inline void deleteRequest() { deleted = true; }
113  inline bool alive() { return !deleted; }
114  LSQRequest* request() { return _request; }
115  virtual void complete() = 0;
116  void writebackDone() { _request->writebackDone(); }
117  };
118 
122  class DcachePort : public MasterPort
123  {
124  protected:
125 
129 
130  public:
133  : MasterPort(_cpu->name() + ".dcache_port", _cpu), lsq(_lsq),
134  cpu(_cpu)
135  { }
136 
137  protected:
138 
142  virtual bool recvTimingResp(PacketPtr pkt);
143  virtual void recvTimingSnoopReq(PacketPtr pkt);
144 
145  virtual void recvFunctionalSnoop(PacketPtr pkt)
146  {
147  // @todo: Is there a need for potential invalidation here?
148  }
149 
151  virtual void recvReqRetry();
152 
159  virtual bool isSnooping() const { return true; }
160  };
161 
231  {
232  protected:
233  typedef uint32_t FlagsStorage;
234  typedef ::Flags<FlagsStorage> FlagsType;
235 
236  enum Flag : FlagsStorage
237  {
238  IsLoad = 0x00000001,
240  WbStore = 0x00000002,
241  Delayed = 0x00000004,
242  IsSplit = 0x00000008,
244  TranslationStarted = 0x00000010,
246  TranslationFinished = 0x00000020,
247  Sent = 0x00000040,
248  Retry = 0x00000080,
249  Complete = 0x00000100,
252  TranslationSquashed = 0x00000200,
254  Discarded = 0x00000400,
256  LSQEntryFreed = 0x00000800,
258  WritebackScheduled = 0x00001000,
259  WritebackDone = 0x00002000,
261  IsAtomic = 0x00004000
262  };
263  FlagsType flags;
264 
265  enum class State
266  {
267  NotIssued,
268  Translation,
269  Request,
270  Fault,
271  PartialFault,
272  };
275  void setState(const State& newState) { _state = newState; }
276 
279 
281  uint32_t _entryIdx;
282 
283  void markDelayed() override { flags.set(Flag::Delayed); }
284  bool isDelayed() { return flags.isSet(Flag::Delayed); }
285 
286  public:
287  LSQUnit& _port;
288  const DynInstPtr _inst;
289  uint32_t _taskId;
294  uint64_t* _res;
295  const Addr _addr;
296  const uint32_t _size;
301  protected:
302  LSQUnit* lsqUnit() { return &_port; }
303  LSQRequest(LSQUnit* port, const DynInstPtr& inst, bool isLoad) :
304  _state(State::NotIssued), _senderState(nullptr),
305  _port(*port), _inst(inst), _data(nullptr),
306  _res(nullptr), _addr(0), _size(0), _flags(0),
307  _numOutstandingPackets(0), _amo_op(nullptr)
308  {
309  flags.set(Flag::IsLoad, isLoad);
310  flags.set(Flag::WbStore,
311  _inst->isStoreConditional() || _inst->isAtomic());
312  flags.set(Flag::IsAtomic, _inst->isAtomic());
313  install();
314  }
315  LSQRequest(LSQUnit* port, const DynInstPtr& inst, bool isLoad,
316  const Addr& addr, const uint32_t& size,
317  const Request::Flags& flags_,
318  PacketDataPtr data = nullptr, uint64_t* res = nullptr,
319  AtomicOpFunctorPtr amo_op = nullptr)
320  : _state(State::NotIssued), _senderState(nullptr),
321  numTranslatedFragments(0),
322  numInTranslationFragments(0),
323  _port(*port), _inst(inst), _data(data),
324  _res(res), _addr(addr), _size(size),
325  _flags(flags_),
326  _numOutstandingPackets(0),
327  _amo_op(std::move(amo_op))
328  {
329  flags.set(Flag::IsLoad, isLoad);
330  flags.set(Flag::WbStore,
331  _inst->isStoreConditional() || _inst->isAtomic());
332  flags.set(Flag::IsAtomic, _inst->isAtomic());
333  install();
334  }
335 
336  bool
337  isLoad() const
338  {
339  return flags.isSet(Flag::IsLoad);
340  }
341 
342  bool
343  isAtomic() const
344  {
345  return flags.isSet(Flag::IsAtomic);
346  }
347 
349  void install()
350  {
351  if (isLoad()) {
352  _port.loadQueue[_inst->lqIdx].setRequest(this);
353  } else {
354  // Store, StoreConditional, and Atomic requests are pushed
355  // to this storeQueue
356  _port.storeQueue[_inst->sqIdx].setRequest(this);
357  }
358  }
359  virtual bool
360  squashed() const override
361  {
362  return _inst->isSquashed();
363  }
364 
370  bool
372  {
373  return flags.isSet(Flag::LSQEntryFreed) ||
374  flags.isSet(Flag::Discarded);
375  }
376 
386  void release(Flag reason)
387  {
388  assert(reason == Flag::LSQEntryFreed || reason == Flag::Discarded);
389  if (!isAnyOutstandingRequest()) {
390  delete this;
391  } else {
392  if (_senderState) {
393  _senderState->deleteRequest();
394  }
395  flags.set(reason);
396  }
397  }
398 
405  void
406  addRequest(Addr addr, unsigned size,
407  const std::vector<bool>& byte_enable)
408  {
409  if (byte_enable.empty() ||
410  isAnyActiveElement(byte_enable.begin(), byte_enable.end())) {
411  auto request = std::make_shared<Request>(
412  addr, size, _flags, _inst->masterId(),
413  _inst->instAddr(), _inst->contextId(),
414  std::move(_amo_op));
415  if (!byte_enable.empty()) {
416  request->setByteEnable(byte_enable);
417  }
418  _requests.push_back(request);
419  }
420  }
421 
426  virtual ~LSQRequest()
427  {
428  assert(!isAnyOutstandingRequest());
429  _inst->savedReq = nullptr;
430  if (_senderState)
431  delete _senderState;
432 
433  for (auto r: _packets)
434  delete r;
435  };
436 
437 
438  public:
442  void
443  setContext(const ContextID& context_id)
444  {
445  request()->setContext(context_id);
446  }
447 
448  const DynInstPtr&
450  {
451  return _inst;
452  }
453 
457  void
458  setVirt(Addr vaddr, unsigned size, Request::Flags flags_,
459  MasterID mid, Addr pc)
460  {
461  request()->setVirt(vaddr, size, flags_, mid, pc);
462  }
463 
464  void
465  taskId(const uint32_t& v)
466  {
467  _taskId = v;
468  for (auto& r: _requests)
469  r->taskId(v);
470  }
471 
472  uint32_t taskId() const { return _taskId; }
473  RequestPtr request(int idx = 0) { return _requests.at(idx); }
474 
475  const RequestPtr
476  request(int idx = 0) const
477  {
478  return _requests.at(idx);
479  }
480 
481  Addr getVaddr(int idx = 0) const { return request(idx)->getVaddr(); }
482  virtual void initiateTranslation() = 0;
483 
484  PacketPtr packet(int idx = 0) { return _packets.at(idx); }
485 
486  virtual PacketPtr
488  {
489  assert (_packets.size() == 1);
490  return packet();
491  }
492 
493  virtual RequestPtr
495  {
496  assert (_requests.size() == 1);
497  return request();
498  }
499 
500  void
502  {
503  _senderState = st;
504  for (auto& pkt: _packets) {
505  if (pkt)
506  pkt->senderState = st;
507  }
508  }
509 
510  const LSQSenderState*
511  senderState() const
512  {
513  return _senderState;
514  }
515 
520  void
522  {
523  assert(_senderState);
524  _senderState->deleteRequest();
525  }
526 
530  bool
532  {
533  return numInTranslationFragments > 0 ||
534  _numOutstandingPackets > 0 ||
535  (flags.isSet(Flag::WritebackScheduled) &&
536  !flags.isSet(Flag::WritebackDone));
537  }
538 
539  bool
540  isSplit() const
541  {
542  return flags.isSet(Flag::IsSplit);
543  }
545  virtual bool recvTimingResp(PacketPtr pkt) = 0;
546  virtual void sendPacketToCache() = 0;
547  virtual void buildPackets() = 0;
548 
552  virtual Cycles handleLocalAccess(
553  ThreadContext *thread, PacketPtr pkt) = 0;
554 
558  virtual bool isCacheBlockHit(Addr blockAddr, Addr cacheBlockMask) = 0;
559 
561  void
563  {
564  flags.set(Flag::Sent);
565  }
570  void
572  {
573  flags.set(Flag::Retry);
574  flags.clear(Flag::Sent);
575  }
576 
577  void sendFragmentToTranslation(int i);
578  bool
580  {
581  return flags.isSet(Flag::Complete);
582  }
583 
584  bool
586  {
587  return _state == State::Translation;
588  }
589 
590  bool
592  {
593  return flags.isSet(Flag::TranslationStarted) &&
594  !isInTranslation();
595  }
596 
597  bool
599  {
600  return _state == State::Translation &&
601  flags.isSet(Flag::TranslationStarted) &&
602  !flags.isSet(Flag::TranslationFinished);
603  }
604 
605  bool
607  {
608  return flags.isSet(Flag::Sent);
609  }
610 
611  bool
613  {
614  return _state == State::PartialFault;
615  }
616 
617  bool
619  {
620  return (_state == State::Request ||
621  (isPartialFault() && isLoad()));
622  }
623 
624  void
626  {
627  setState(State::Fault);
628  }
629 
633  void
635  {
636  release(Flag::LSQEntryFreed);
637  }
638 
642  void
644  {
645  release(Flag::Discarded);
646  }
647 
648  void
650  {
651  assert(_numOutstandingPackets > 0);
652  _numOutstandingPackets--;
653  if (_numOutstandingPackets == 0 && isReleased())
654  delete this;
655  }
656 
657  void
659  {
660  assert(!flags.isSet(Flag::WritebackScheduled));
661  flags.set(Flag::WritebackScheduled);
662  }
663 
664  void
666  {
667  flags.set(Flag::WritebackDone);
668  /* If the lsq resources are already free */
669  if (isReleased()) {
670  delete this;
671  }
672  }
673 
674  void
676  {
677  assert(numInTranslationFragments == 0);
678  flags.set(Flag::TranslationSquashed);
679  /* If we are on our own, self-destruct. */
680  if (isReleased()) {
681  delete this;
682  }
683  }
684 
685  void
687  {
688  flags.set(Flag::Complete);
689  }
690  };
691 
693  {
694  protected:
695  /* Given that we are inside templates, children need explicit
696  * declaration of the names in the parent class. */
697  using Flag = typename LSQRequest::Flag;
698  using State = typename LSQRequest::State;
699  using LSQRequest::_addr;
700  using LSQRequest::_fault;
701  using LSQRequest::_flags;
702  using LSQRequest::_size;
704  using LSQRequest::_requests;
705  using LSQRequest::_inst;
706  using LSQRequest::_packets;
707  using LSQRequest::_port;
708  using LSQRequest::_res;
709  using LSQRequest::_taskId;
711  using LSQRequest::_state;
712  using LSQRequest::flags;
713  using LSQRequest::isLoad;
715  using LSQRequest::lsqUnit;
716  using LSQRequest::request;
718  using LSQRequest::setState;
722  using LSQRequest::_amo_op;
723  public:
724  SingleDataRequest(LSQUnit* port, const DynInstPtr& inst, bool isLoad,
725  const Addr& addr, const uint32_t& size,
726  const Request::Flags& flags_,
727  PacketDataPtr data = nullptr,
728  uint64_t* res = nullptr,
729  AtomicOpFunctorPtr amo_op = nullptr) :
730  LSQRequest(port, inst, isLoad, addr, size, flags_, data, res,
731  std::move(amo_op)) {}
732 
733  inline virtual ~SingleDataRequest() {}
734  virtual void initiateTranslation();
735  virtual void finish(const Fault &fault, const RequestPtr &req,
737  virtual bool recvTimingResp(PacketPtr pkt);
738  virtual void sendPacketToCache();
739  virtual void buildPackets();
740  virtual Cycles handleLocalAccess(ThreadContext *thread, PacketPtr pkt);
741  virtual bool isCacheBlockHit(Addr blockAddr, Addr cacheBlockMask);
742  };
743 
745  {
746  protected:
747  /* Given that we are inside templates, children need explicit
748  * declaration of the names in the parent class. */
749  using Flag = typename LSQRequest::Flag;
750  using State = typename LSQRequest::State;
751  using LSQRequest::_addr;
752  using LSQRequest::_data;
753  using LSQRequest::_fault;
754  using LSQRequest::_flags;
755  using LSQRequest::_inst;
756  using LSQRequest::_packets;
757  using LSQRequest::_port;
758  using LSQRequest::_requests;
759  using LSQRequest::_res;
762  using LSQRequest::_size;
763  using LSQRequest::_state;
764  using LSQRequest::_taskId;
765  using LSQRequest::flags;
766  using LSQRequest::isLoad;
768  using LSQRequest::lsqUnit;
771  using LSQRequest::request;
773  using LSQRequest::setState;
775 
776  uint32_t numFragments;
780 
781  public:
782  SplitDataRequest(LSQUnit* port, const DynInstPtr& inst, bool isLoad,
783  const Addr& addr, const uint32_t& size,
784  const Request::Flags & flags_,
785  PacketDataPtr data = nullptr,
786  uint64_t* res = nullptr) :
787  LSQRequest(port, inst, isLoad, addr, size, flags_, data, res,
788  nullptr),
789  numFragments(0),
790  numReceivedPackets(0),
791  mainReq(nullptr),
792  _mainPacket(nullptr)
793  {
794  flags.set(Flag::IsSplit);
795  }
797  {
798  if (mainReq) {
799  mainReq = nullptr;
800  }
801  if (_mainPacket) {
802  delete _mainPacket;
803  _mainPacket = nullptr;
804  }
805  }
806  virtual void finish(const Fault &fault, const RequestPtr &req,
808  virtual bool recvTimingResp(PacketPtr pkt);
809  virtual void initiateTranslation();
810  virtual void sendPacketToCache();
811  virtual void buildPackets();
812 
813  virtual Cycles handleLocalAccess(ThreadContext *thread, PacketPtr pkt);
814  virtual bool isCacheBlockHit(Addr blockAddr, Addr cacheBlockMask);
815 
816  virtual RequestPtr mainRequest();
817  virtual PacketPtr mainPacket();
818  };
819 
821  LSQ(O3CPU *cpu_ptr, IEW *iew_ptr, DerivO3CPUParams *params);
822  ~LSQ() { }
823 
825  std::string name() const;
826 
828  void regStats();
829 
832 
834  void drainSanityCheck() const;
836  bool isDrained() const;
838  void takeOverFrom();
839 
841  int entryAmount(ThreadID num_threads);
842 
844  void tick();
845 
847  void insertLoad(const DynInstPtr &load_inst);
849  void insertStore(const DynInstPtr &store_inst);
850 
852  Fault executeLoad(const DynInstPtr &inst);
853 
855  Fault executeStore(const DynInstPtr &inst);
856 
860  void commitLoads(InstSeqNum &youngest_inst, ThreadID tid)
861  { thread.at(tid).commitLoads(youngest_inst); }
862 
866  void commitStores(InstSeqNum &youngest_inst, ThreadID tid)
867  { thread.at(tid).commitStores(youngest_inst); }
868 
873  void writebackStores();
875  void writebackStores(ThreadID tid);
876 
880  void
881  squash(const InstSeqNum &squashed_num, ThreadID tid)
882  {
883  thread.at(tid).squash(squashed_num);
884  }
885 
887  bool violation();
892  bool violation(ThreadID tid) { return thread.at(tid).violation(); }
893 
895  DynInstPtr
897  {
898  return thread.at(tid).getMemDepViolator();
899  }
900 
902  int getLoadHead(ThreadID tid) { return thread.at(tid).getLoadHead(); }
903 
905  InstSeqNum
907  {
908  return thread.at(tid).getLoadHeadSeqNum();
909  }
910 
912  int getStoreHead(ThreadID tid) { return thread.at(tid).getStoreHead(); }
913 
915  InstSeqNum
917  {
918  return thread.at(tid).getStoreHeadSeqNum();
919  }
920 
922  int getCount();
924  int getCount(ThreadID tid) { return thread.at(tid).getCount(); }
925 
927  int numLoads();
929  int numLoads(ThreadID tid) { return thread.at(tid).numLoads(); }
930 
932  int numStores();
934  int numStores(ThreadID tid) { return thread.at(tid).numStores(); }
935 
937  unsigned numFreeLoadEntries();
938 
940  unsigned numFreeStoreEntries();
941 
943  unsigned numFreeEntries(ThreadID tid);
944 
946  unsigned numFreeLoadEntries(ThreadID tid);
947 
949  unsigned numFreeStoreEntries(ThreadID tid);
950 
952  bool isFull();
957  bool isFull(ThreadID tid);
958 
960  bool isEmpty() const;
962  bool lqEmpty() const;
964  bool sqEmpty() const;
965 
967  bool lqFull();
969  bool lqFull(ThreadID tid);
970 
972  bool sqFull();
974  bool sqFull(ThreadID tid);
975 
980  bool isStalled();
985  bool isStalled(ThreadID tid);
986 
988  bool hasStoresToWB();
989 
993  bool hasStoresToWB(ThreadID tid) { return thread.at(tid).hasStoresToWB(); }
994 
996  int numStoresToWB(ThreadID tid) { return thread.at(tid).numStoresToWB(); }
997 
999  bool willWB();
1003  bool willWB(ThreadID tid) { return thread.at(tid).willWB(); }
1004 
1006  void dumpInsts() const;
1008  void dumpInsts(ThreadID tid) const { thread.at(tid).dumpInsts(); }
1009 
1013  Fault read(LSQRequest* req, int load_idx);
1014 
1018  Fault write(LSQRequest* req, uint8_t *data, int store_idx);
1019 
1023  void recvReqRetry();
1024 
1025  void completeDataAccess(PacketPtr pkt);
1032  bool recvTimingResp(PacketPtr pkt);
1033 
1034  void recvTimingSnoopReq(PacketPtr pkt);
1035 
1036  Fault pushRequest(const DynInstPtr& inst, bool isLoad, uint8_t *data,
1037  unsigned int size, Addr addr, Request::Flags flags,
1038  uint64_t *res, AtomicOpFunctorPtr amo_op,
1039  const std::vector<bool>& byte_enable);
1040 
1042  O3CPU *cpu;
1043 
1045  IEW *iewStage;
1046 
1048  bool cacheBlocked() const;
1050  void cacheBlocked(bool v);
1052  bool cachePortAvailable(bool is_load) const;
1054  void cachePortBusy(bool is_load);
1055 
1057 
1058  protected:
1069 
1070 
1072  SMTQueuePolicy lsqPolicy;
1073 
1079  static uint32_t
1080  maxLSQAllocation(SMTQueuePolicy pol, uint32_t entries,
1081  uint32_t numThreads, uint32_t SMTThreshold)
1082  {
1083  if (pol == SMTQueuePolicy::Dynamic) {
1084  return entries;
1085  } else if (pol == SMTQueuePolicy::Partitioned) {
1086  //@todo:make work if part_amt doesnt divide evenly.
1087  return entries / numThreads;
1088  } else if (pol == SMTQueuePolicy::Threshold) {
1089  //Divide up by threshold amount
1090  //@todo: Should threads check the max and the total
1091  //amount of the LSQ
1092  return SMTThreshold;
1093  }
1094  return 0;
1095  }
1096 
1099 
1101  unsigned LQEntries;
1103  unsigned SQEntries;
1104 
1106  unsigned maxLQEntries;
1107 
1109  unsigned maxSQEntries;
1110 
1113 
1116 
1119 };
1120 
1121 template <class Impl>
1122 Fault
1123 LSQ<Impl>::read(LSQRequest* req, int load_idx)
1124 {
1125  ThreadID tid = cpu->contextToThread(req->request()->contextId());
1126 
1127  return thread.at(tid).read(req, load_idx);
1128 }
1129 
1130 template <class Impl>
1131 Fault
1132 LSQ<Impl>::write(LSQRequest* req, uint8_t *data, int store_idx)
1133 {
1134  ThreadID tid = cpu->contextToThread(req->request()->contextId());
1135 
1136  return thread.at(tid).write(req, data, store_idx);
1137 }
1138 
1139 #endif // __CPU_O3_LSQ_HH__
A MasterPort is a specialisation of a BaseMasterPort, which implements the default protocol for the t...
Definition: port.hh:71
IEW * iewStage
The IEW stage pointer.
Definition: lsq.hh:1045
unsigned SQEntries
Total Size of SQ Entries.
Definition: lsq.hh:1103
void takeOverFrom()
Takes over execution from another CPU&#39;s thread.
Definition: lsq_impl.hh:167
FlagsType flags
Definition: lsq.hh:263
void set(T v, ByteOrder endian)
Set the value in the data pointer to v using the specified endianness.
ThreadID numThreads
Number of Threads.
Definition: lsq.hh:1118
DynInstPtr inst
Instruction which initiated the access to memory.
Definition: lsq.hh:88
Impl::DynInstPtr DynInstPtr
Definition: lsq.hh:67
Bitfield< 28 > v
uint32_t _numOutstandingPackets
Definition: lsq.hh:299
Fault pushRequest(const DynInstPtr &inst, bool isLoad, uint8_t *data, unsigned int size, Addr addr, Request::Flags flags, uint64_t *res, AtomicOpFunctorPtr amo_op, const std::vector< bool > &byte_enable)
Definition: lsq_impl.hh:686
Cycles is a wrapper class for representing cycle counts, i.e.
Definition: types.hh:81
PacketPtr mainPkt
The main packet from a split load, used during writeback.
Definition: lsq.hh:90
int getCount(ThreadID tid)
Returns the number of instructions in the queues of one thread.
Definition: lsq.hh:924
void taskId(const uint32_t &v)
Definition: lsq.hh:465
LSQSenderState * _senderState
Definition: lsq.hh:274
const uint32_t _size
Definition: lsq.hh:296
PacketDataPtr _data
Definition: lsq.hh:290
unsigned LQEntries
Total Size of LQ Entries.
Definition: lsq.hh:1101
bool willWB()
Returns if the LSQ will write back to memory this cycle.
Definition: lsq_impl.hh:655
Bitfield< 7 > i
LSQUnit * lsqUnit()
Definition: lsq.hh:302
std::vector< RequestPtr > _requests
Definition: lsq.hh:292
unsigned maxSQEntries
Max SQ Size - Used to Enforce Sharing Policies.
Definition: lsq.hh:1109
SMTQueuePolicy lsqPolicy
The LSQ policy for SMT mode.
Definition: lsq.hh:1072
void dumpInsts(ThreadID tid) const
Debugging function to print out instructions from a specific thread.
Definition: lsq.hh:1008
std::vector< LSQUnit > thread
The LSQ units for individual threads.
Definition: lsq.hh:1115
std::vector< bool > _byteEnable
Definition: lsq.hh:298
uint32_t _taskId
Definition: lsq.hh:289
std::string name() const
Returns the name of the LSQ.
Definition: lsq_impl.hh:113
State _state
Definition: lsq.hh:273
void tick()
Ticks the LSQ.
Definition: lsq_impl.hh:179
bool isInTranslation()
Definition: lsq.hh:585
std::shared_ptr< Request > RequestPtr
Definition: request.hh:81
bool isSet() const
Definition: flags.hh:60
uint8_t * PacketDataPtr
Definition: packet.hh:66
void packetSent()
Update the status to reflect that a packet was sent.
Definition: lsq.hh:562
bool sqFull()
Returns if any of the SQs are full.
Definition: lsq_impl.hh:582
void clear()
Definition: flags.hh:66
void packetNotSent()
Update the status to reflect that a packet was not sent.
Definition: lsq.hh:571
ip6_addr_t addr
Definition: inet.hh:330
bool isComplete()
Completes a packet and returns whether the access is finished.
Definition: lsq.hh:111
std::unique_ptr< AtomicOpFunctor > AtomicOpFunctorPtr
Definition: amo.hh:228
const Request::Flags _flags
Definition: lsq.hh:297
LSQ< Impl > * lsq
Pointer to LSQ.
Definition: lsq.hh:127
LSQRequest * _request
The senderState needs to know the LSQRequest who owns it.
Definition: lsq.hh:77
FullO3CPU< Impl > * cpu
Definition: lsq.hh:128
bool violation()
Returns whether or not there was a memory ordering violation.
Definition: lsq_impl.hh:285
bool hasStoresToWB()
Returns whether or not there are any stores to write back to memory.
Definition: lsq_impl.hh:638
bool isPartialFault()
Definition: lsq.hh:612
Overload hash function for BasicBlockRange type.
Definition: vec_reg.hh:587
Derived class to hold any sender state the LSQ needs.
Definition: lsq.hh:73
Fault executeLoad(const DynInstPtr &inst)
Executes a load.
Definition: lsq_impl.hh:248
bool isComplete()
Definition: lsq.hh:579
LSQSenderState(LSQRequest *request, bool isLoad_)
Default constructor.
Definition: lsq.hh:80
Bitfield< 4, 0 > mode
bool isTranslationComplete()
Definition: lsq.hh:591
int usedStorePorts
The number of used cache ports in this cycle by stores.
Definition: lsq.hh:1064
virtual ~LSQRequest()
Destructor.
Definition: lsq.hh:426
bool isFull()
Returns if the LSQ is full (either LQ or SQ is full).
Definition: lsq_impl.hh:483
Definition: lsq.hh:62
int getLoadHead(ThreadID tid)
Returns the head index of the load queue for a specific thread.
Definition: lsq.hh:902
bool lqEmpty() const
Returns if all of the LQs are empty.
Definition: lsq_impl.hh:519
void packetReplied()
Definition: lsq.hh:649
ThreadContext is the external interface to all thread state for anything outside of the CPU...
bool hasStoresToWB(ThreadID tid)
Returns whether or not a specific thread has any stores to write back to memory.
Definition: lsq.hh:993
void writebackStores()
Attempts to write back stores until all cache ports are used or the interface becomes blocked...
Definition: lsq_impl.hh:266
bool needWB
Whether or not the instruction will need to writeback.
Definition: lsq.hh:98
std::vector< PacketPtr > _packets
Definition: lsq.hh:291
void dumpInsts() const
Debugging function to print out all instructions.
Definition: lsq_impl.hh:672
STL vector class.
Definition: stl.hh:37
AtomicOpFunctorPtr _amo_op
Definition: lsq.hh:300
bool violation(ThreadID tid)
Returns whether or not there was a memory ordering violation for a specific thread.
Definition: lsq.hh:892
uint32_t numFragments
Definition: lsq.hh:776
LSQRequest(LSQUnit *port, const DynInstPtr &inst, bool isLoad)
Definition: lsq.hh:303
bool willWB(ThreadID tid)
Returns if the LSQ of a specific thread will write back to memory this cycle.
Definition: lsq.hh:1003
::Flags< FlagsStorage > FlagsType
Definition: lsq.hh:234
bool isSplit
Whether or not this access is split in two.
Definition: lsq.hh:100
uint32_t numInTranslationFragments
Definition: lsq.hh:278
void writebackScheduled()
Definition: lsq.hh:658
virtual bool squashed() const override
This function is used by the page table walker to determine if it should translate the a pending requ...
Definition: lsq.hh:360
Impl::CPUPol::LSQUnit LSQUnit
Definition: lsq.hh:69
void release(Flag reason)
Release the LSQRequest.
Definition: lsq.hh:386
bool isMemAccessRequired()
Definition: lsq.hh:618
bool _cacheBlocked
D-cache is blocked.
Definition: lsq.hh:1060
Bitfield< 4 > pc
void writebackDone()
Definition: lsq.hh:116
void senderState(LSQSenderState *st)
Definition: lsq.hh:501
LSQUnit & _port
Definition: lsq.hh:287
void insertLoad(const DynInstPtr &load_inst)
Inserts a load into the LSQ.
Definition: lsq_impl.hh:230
bool isDrained() const
Has the LSQ drained?
Definition: lsq_impl.hh:148
bool isDelayed()
Definition: lsq.hh:284
Addr getVaddr(int idx=0) const
Definition: lsq.hh:481
void setState(const State &newState)
Definition: lsq.hh:275
LSQRequest * request()
Definition: lsq.hh:114
void cachePortBusy(bool is_load)
Another store port is in use.
Definition: lsq_impl.hh:218
unsigned numFreeStoreEntries()
Returns the number of free store entries.
Definition: lsq_impl.hh:451
InstSeqNum getLoadHeadSeqNum(ThreadID tid)
Returns the sequence number of the head of the load queue.
Definition: lsq.hh:906
DcachePort dcachePort
Data port.
Definition: lsq.hh:1112
std::vector< Fault > _fault
Definition: lsq.hh:293
void setContext(const ContextID &context_id)
Convenience getters/setters.
Definition: lsq.hh:443
int numStores(ThreadID tid)
Returns the total number of stores for a single thread.
Definition: lsq.hh:934
int usedLoadPorts
The number of used cache ports in this cycle by loads.
Definition: lsq.hh:1068
void drainSanityCheck() const
Perform sanity checks after a drain.
Definition: lsq_impl.hh:138
int numLoads()
Returns the total number of loads in the load queue.
Definition: lsq_impl.hh:397
DcachePort(LSQ< Impl > *_lsq, FullO3CPU< Impl > *_cpu)
Default constructor.
Definition: lsq.hh:132
unsigned maxLQEntries
Max LQ Size - Used to Enforce Sharing Policies.
Definition: lsq.hh:1106
void sendFragmentToTranslation(int i)
Definition: lsq_impl.hh:973
bool isSplit() const
Definition: lsq.hh:540
void setVirt(Addr vaddr, unsigned size, Request::Flags flags_, MasterID mid, Addr pc)
Set up virtual request.
Definition: lsq.hh:458
int numStoresToWB(ThreadID tid)
Returns the number of stores a specific thread has to write back.
Definition: lsq.hh:996
Fault executeStore(const DynInstPtr &inst)
Executes a store.
Definition: lsq_impl.hh:257
Fault write(LSQRequest *req, uint8_t *data, int store_idx)
Executes a store operation, using the store specified at the store index.
Definition: lsq.hh:1132
uint64_t InstSeqNum
Definition: inst_seq.hh:37
void addRequest(Addr addr, unsigned size, const std::vector< bool > &byte_enable)
Helper function used to add a (sub)request, given its address addr, size size and byte-enable mask by...
Definition: lsq.hh:406
Port Object Declaration.
virtual bool isSnooping() const
As this CPU requires snooping to maintain the load store queue change the behaviour from the base CPU...
Definition: lsq.hh:159
void squashTranslation()
Definition: lsq.hh:675
bool isLoad() const
Definition: lsq.hh:337
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition: types.hh:140
void writebackDone()
Definition: lsq.hh:665
void complete()
Definition: lsq.hh:686
bool deleted
Has the request been deleted? LSQ entries can be squashed before the response comes back...
Definition: lsq.hh:107
uint16_t MasterID
Definition: request.hh:84
A Packet is used to encapsulate a transfer between two objects in the memory system (e...
Definition: packet.hh:249
InstSeqNum getStoreHeadSeqNum(ThreadID tid)
Returns the sequence number of the head of the store queue.
Definition: lsq.hh:916
void deleteRequest()
Definition: lsq.hh:112
void markDelayed() override
Signal that the translation has been delayed due to a hw page table walk.
Definition: lsq.hh:283
bool isSent()
Definition: lsq.hh:606
uint32_t numTranslatedFragments
Definition: lsq.hh:277
uint64_t * _res
Definition: lsq.hh:294
bool isLoad
Whether or not it is a load.
Definition: lsq.hh:96
A virtual base opaque structure used to hold state associated with the packet (e.g., an MSHR), specific to a SimObject that sees the packet.
Definition: packet.hh:397
void insertStore(const DynInstPtr &store_inst)
Inserts a store into the LSQ.
Definition: lsq_impl.hh:239
bool isReleased()
Test if the LSQRequest has been released, i.e.
Definition: lsq.hh:371
uint32_t _entryIdx
LQ/SQ entry idx.
Definition: lsq.hh:281
bool isEmpty() const
Returns if the LSQ is empty (both LQ and SQ are empty).
Definition: lsq_impl.hh:512
PacketPtr pendingPacket
A second packet from a split store that needs sending.
Definition: lsq.hh:92
virtual void complete()=0
const DynInstPtr _inst
Definition: lsq.hh:288
void discardSenderState()
Mark senderState as discarded.
Definition: lsq.hh:521
int getCount()
Returns the number of instructions in all of the queues.
Definition: lsq_impl.hh:379
Mode
Definition: tlb.hh:57
bool isTranslationBlocked()
Definition: lsq.hh:598
int16_t ThreadID
Thread index/ID type.
Definition: types.hh:225
bool alive()
Definition: lsq.hh:113
SingleDataRequest(LSQUnit *port, const DynInstPtr &inst, bool isLoad, const Addr &addr, const uint32_t &size, const Request::Flags &flags_, PacketDataPtr data=nullptr, uint64_t *res=nullptr, AtomicOpFunctorPtr amo_op=nullptr)
Definition: lsq.hh:724
Impl::O3CPU O3CPU
Definition: lsq.hh:66
void commitStores(InstSeqNum &youngest_inst, ThreadID tid)
Commits stores up until the given sequence number for a specific thread.
Definition: lsq.hh:866
const LSQSenderState * senderState() const
Definition: lsq.hh:511
uint8_t outstanding
Number of outstanding packets to complete.
Definition: lsq.hh:94
virtual void recvFunctionalSnoop(PacketPtr pkt)
Receive a functional snoop request packet from the peer.
Definition: lsq.hh:145
unsigned numFreeLoadEntries()
Returns the number of free load entries.
Definition: lsq_impl.hh:433
int entryAmount(ThreadID num_threads)
Number of entries needed for the given amount of threads.
void setStateToFault()
Definition: lsq.hh:625
virtual PacketPtr mainPacket()
Definition: lsq.hh:487
LSQRequest(LSQUnit *port, const DynInstPtr &inst, bool isLoad, const Addr &addr, const uint32_t &size, const Request::Flags &flags_, PacketDataPtr data=nullptr, uint64_t *res=nullptr, AtomicOpFunctorPtr amo_op=nullptr)
Definition: lsq.hh:315
RequestPtr request(int idx=0)
Definition: lsq.hh:473
Fault read(LSQRequest *req, int load_idx)
Executes a read operation, using the load specified at the load index.
Definition: lsq.hh:1123
void recvReqRetry()
Retry the previous send that failed.
Definition: lsq_impl.hh:303
Bitfield< 31, 28 > st
DcachePort class for the load/store queue.
Definition: lsq.hh:122
const DynInstPtr & instruction()
Definition: lsq.hh:449
void setActiveThreads(std::list< ThreadID > *at_ptr)
Sets the pointer to the list of active threads.
Definition: lsq_impl.hh:130
uint32_t numReceivedPackets
Definition: lsq.hh:777
int cacheStorePorts
The number of cache ports available each cycle (stores only).
Definition: lsq.hh:1062
RequestPtr mainReq
Definition: lsq.hh:778
uint32_t taskId() const
Definition: lsq.hh:472
virtual RequestPtr mainRequest()
Definition: lsq.hh:494
LSQ(O3CPU *cpu_ptr, IEW *iew_ptr, DerivO3CPUParams *params)
Constructs an LSQ with the given parameters.
Definition: lsq_impl.hh:61
int numStores()
Returns the total number of stores in the store queue.
Definition: lsq_impl.hh:415
bool isAnyOutstandingRequest()
Test if there is any in-flight translation or mem access request.
Definition: lsq.hh:531
void install()
Install the request in the LQ/SQ.
Definition: lsq.hh:349
ContextID contextId()
Definition: lsq.hh:108
bool isAnyActiveElement(const std::vector< bool >::const_iterator &it_start, const std::vector< bool >::const_iterator &it_end)
Test if there is any active element in an enablement range.
Definition: utils.hh:86
bool cachePortAvailable(bool is_load) const
Is any store port available to use?
Definition: lsq_impl.hh:205
PacketPtr _mainPacket
Definition: lsq.hh:779
SplitDataRequest(LSQUnit *port, const DynInstPtr &inst, bool isLoad, const Addr &addr, const uint32_t &size, const Request::Flags &flags_, PacketDataPtr data=nullptr, uint64_t *res=nullptr)
Definition: lsq.hh:782
virtual ~SingleDataRequest()
Definition: lsq.hh:733
void discard()
The request is discarded (e.g.
Definition: lsq.hh:643
Memory operation metadata.
Definition: lsq.hh:230
void completeDataAccess(PacketPtr pkt)
Definition: lsq_impl.hh:315
int cacheLoadPorts
The number of cache ports available each cycle (loads only).
Definition: lsq.hh:1066
void regStats()
Registers statistics of each LSQ unit.
Definition: lsq_impl.hh:120
bool recvTimingResp(PacketPtr pkt)
Handles writing back and completing the load or store that has returned from memory.
Definition: lsq_impl.hh:324
LoadQueue loadQueue
The load queue.
Definition: lsq_unit.hh:482
virtual ~SplitDataRequest()
Definition: lsq.hh:796
bool pktToSend
Whether or not there is a packet that needs sending.
Definition: lsq.hh:102
void squash(const InstSeqNum &squashed_num, ThreadID tid)
Squash instructions from a thread until the specified sequence number.
Definition: lsq.hh:881
CircularQueue< SQEntry > storeQueue
The store queue.
Definition: lsq_unit.hh:479
static uint32_t maxLSQAllocation(SMTQueuePolicy pol, uint32_t entries, uint32_t numThreads, uint32_t SMTThreshold)
Auxiliary function to calculate per-thread max LSQ allocation limit.
Definition: lsq.hh:1080
bool cacheBlocked() const
Is D-cache blocked?
Definition: lsq_impl.hh:191
PacketPtr packet(int idx=0)
Definition: lsq.hh:484
Impl::CPUPol::IEW IEW
Definition: lsq.hh:68
MasterPort & getDataPort()
Definition: lsq.hh:1056
O3CPU * cpu
The CPU pointer.
Definition: lsq.hh:1042
std::list< ThreadID > * activeThreads
List of Active Threads in System.
Definition: lsq.hh:1098
bool isStalled()
Returns if the LSQ is stalled due to a memory operation that must be replayed.
Definition: lsq_impl.hh:611
void freeLSQEntry()
The LSQ entry is cleared.
Definition: lsq.hh:634
DynInstPtr getMemDepViolator(ThreadID tid)
Gets the instruction that caused the memory ordering violation.
Definition: lsq.hh:896
void recvTimingSnoopReq(PacketPtr pkt)
Definition: lsq_impl.hh:362
const char data[]
std::shared_ptr< FaultBase > Fault
Definition: types.hh:238
unsigned numFreeEntries(ThreadID tid)
Returns the number of free entries for a specific thread.
int getStoreHead(ThreadID tid)
Returns the head index of the store queue.
Definition: lsq.hh:912
void set(Type flags)
Definition: flags.hh:68
int ContextID
Globally unique thread context ID.
Definition: types.hh:229
int numLoads(ThreadID tid)
Returns the total number of loads for a single thread.
Definition: lsq.hh:929
void commitLoads(InstSeqNum &youngest_inst, ThreadID tid)
Commits loads up until the given sequence number for a specific thread.
Definition: lsq.hh:860
bool sqEmpty() const
Returns if all of the SQs are empty.
Definition: lsq_impl.hh:536
~LSQ()
Definition: lsq.hh:822
const RequestPtr request(int idx=0) const
Definition: lsq.hh:476
bool lqFull()
Returns if any of the LQs are full.
Definition: lsq_impl.hh:553
FullO3CPU class, has each of the stages (fetch through commit) within it, as well as all of the time ...
Definition: cpu.hh:94
const Addr _addr
Definition: lsq.hh:295
uint32_t FlagsStorage
Definition: lsq.hh:233
bool isAtomic() const
Definition: lsq.hh:343

Generated on Fri Jul 3 2020 15:53:00 for gem5 by doxygen 1.8.13