gem5  v21.0.0.0
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
wavefront.cc
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2011-2017 Advanced Micro Devices, Inc.
3  * All rights reserved.
4  *
5  * For use for simulation and test purposes only
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions are met:
9  *
10  * 1. Redistributions of source code must retain the above copyright notice,
11  * this list of conditions and the following disclaimer.
12  *
13  * 2. Redistributions in binary form must reproduce the above copyright notice,
14  * this list of conditions and the following disclaimer in the documentation
15  * and/or other materials provided with the distribution.
16  *
17  * 3. Neither the name of the copyright holder nor the names of its
18  * contributors may be used to endorse or promote products derived from this
19  * software without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31  * POSSIBILITY OF SUCH DAMAGE.
32  */
33 
34 #include "gpu-compute/wavefront.hh"
35 
36 #include "base/bitfield.hh"
37 #include "debug/GPUExec.hh"
38 #include "debug/GPUInitAbi.hh"
39 #include "debug/WavefrontStack.hh"
43 #include "gpu-compute/shader.hh"
46 
48  : SimObject(p), wfSlotId(p.wf_slot_id), simdId(p.simdId),
49  maxIbSize(p.max_ib_size), _gpuISA(*this),
50  vmWaitCnt(-1), expWaitCnt(-1), lgkmWaitCnt(-1),
51  vmemInstsIssued(0), expInstsIssued(0), lgkmInstsIssued(0),
52  sleepCnt(0), barId(WFBarrier::InvalidID), stats(this)
53 {
54  lastTrace = 0;
55  execUnitId = -1;
56  status = S_STOPPED;
59  startVgprIndex = 0;
60  startSgprIndex = 0;
61  outstandingReqs = 0;
66  rdLmReqsInPipe = 0;
67  rdGmReqsInPipe = 0;
68  wrLmReqsInPipe = 0;
69  wrGmReqsInPipe = 0;
74  lastNonIdleTick = 0;
75  ldsChunk = nullptr;
76 
77  memTraceBusy = 0;
78  oldVgprTcnt = 0xffffffffffffffffll;
79  oldDgprTcnt = 0xffffffffffffffffll;
80  oldVgpr.resize(p.wf_size);
81 
82  pendingFetch = false;
83  dropFetch = false;
84  maxVgprs = 0;
85  maxSgprs = 0;
86 
87  lastAddr.resize(p.wf_size);
88  workItemFlatId.resize(p.wf_size);
89  oldDgpr.resize(p.wf_size);
90  for (int i = 0; i < 3; ++i) {
91  workItemId[i].resize(p.wf_size);
92  }
93 
94  _execMask.set();
95  rawDist.clear();
96  lastInstExec = 0;
97  vecReads.clear();
98 }
99 
100 void
102 {
103  reservedVectorRegs = 0;
104  reservedScalarRegs = 0;
105  startVgprIndex = 0;
106  startSgprIndex = 0;
107 
113 }
114 
115 void
116 Wavefront::initRegState(HSAQueueEntry *task, int wgSizeInWorkItems)
117 {
118  int regInitIdx = 0;
119 
120  // iterate over all the init fields and check which
121  // bits are enabled
122  for (int en_bit = 0; en_bit < NumScalarInitFields; ++en_bit) {
123 
124  if (task->sgprBitEnabled(en_bit)) {
125  int physSgprIdx = 0;
126  uint32_t wiCount = 0;
127  uint32_t firstWave = 0;
128  int orderedAppendTerm = 0;
129  int numWfsInWg = 0;
130  uint32_t finalValue = 0;
131  Addr host_disp_pkt_addr = task->hostDispPktAddr();
132  Addr kernarg_addr = task->kernargAddr();
133  Addr hidden_priv_base(0);
134 
135  switch (en_bit) {
136  case PrivateSegBuf:
137  physSgprIdx =
138  computeUnit->registerManager->mapSgpr(this, regInitIdx);
139  computeUnit->srf[simdId]->write(physSgprIdx,
141  ++regInitIdx;
142  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
143  "Setting PrivateSegBuffer: s[%d] = %x\n",
145  wfSlotId, wfDynId, physSgprIdx,
147 
148  physSgprIdx =
149  computeUnit->registerManager->mapSgpr(this, regInitIdx);
150  computeUnit->srf[simdId]->write(physSgprIdx,
152  ++regInitIdx;
153  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
154  "Setting PrivateSegBuffer: s[%d] = %x\n",
156  wfSlotId, wfDynId, physSgprIdx,
158 
159  physSgprIdx =
160  computeUnit->registerManager->mapSgpr(this, regInitIdx);
161  computeUnit->srf[simdId]->write(physSgprIdx,
163  ++regInitIdx;
164  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
165  "Setting PrivateSegBuffer: s[%d] = %x\n",
167  wfSlotId, wfDynId, physSgprIdx,
169 
170  physSgprIdx =
171  computeUnit->registerManager->mapSgpr(this, regInitIdx);
172  computeUnit->srf[simdId]->write(physSgprIdx,
174 
175  ++regInitIdx;
176  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
177  "Setting PrivateSegBuffer: s[%d] = %x\n",
179  wfSlotId, wfDynId, physSgprIdx,
181  break;
182  case DispatchPtr:
183  physSgprIdx =
184  computeUnit->registerManager->mapSgpr(this, regInitIdx);
185  computeUnit->srf[simdId]->write(physSgprIdx,
186  bits(host_disp_pkt_addr, 31, 0));
187  ++regInitIdx;
188  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
189  "Setting DispatchPtr: s[%d] = %x\n",
191  wfSlotId, wfDynId, physSgprIdx,
192  bits(host_disp_pkt_addr, 31, 0));
193 
194  physSgprIdx =
195  computeUnit->registerManager->mapSgpr(this, regInitIdx);
196  computeUnit->srf[simdId]->write(physSgprIdx,
197  bits(host_disp_pkt_addr, 63, 32));
198  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
199  "Setting DispatchPtr: s[%d] = %x\n",
201  wfSlotId, wfDynId, physSgprIdx,
202  bits(host_disp_pkt_addr, 63, 32));
203 
204  ++regInitIdx;
205  break;
206  case QueuePtr:
207  physSgprIdx =
208  computeUnit->registerManager->mapSgpr(this, regInitIdx);
209  computeUnit->srf[simdId]->write(physSgprIdx,
210  bits(task->hostAMDQueueAddr, 31, 0));
211  ++regInitIdx;
212  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
213  "Setting QueuePtr: s[%d] = %x\n",
215  wfSlotId, wfDynId, physSgprIdx,
216  bits(task->hostAMDQueueAddr, 31, 0));
217 
218  physSgprIdx =
219  computeUnit->registerManager->mapSgpr(this, regInitIdx);
220  computeUnit->srf[simdId]->write(physSgprIdx,
221  bits(task->hostAMDQueueAddr, 63, 32));
222  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
223  "Setting QueuePtr: s[%d] = %x\n",
225  wfSlotId, wfDynId, physSgprIdx,
226  bits(task->hostAMDQueueAddr, 63, 32));
227 
228  ++regInitIdx;
229  break;
230  case KernargSegPtr:
231  physSgprIdx =
232  computeUnit->registerManager->mapSgpr(this, regInitIdx);
233  computeUnit->srf[simdId]->write(physSgprIdx,
234  bits(kernarg_addr, 31, 0));
235  ++regInitIdx;
236  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
237  "Setting KernargSegPtr: s[%d] = %x\n",
239  wfSlotId, wfDynId, physSgprIdx,
240  bits(kernarg_addr, 31, 0));
241 
242  physSgprIdx =
243  computeUnit->registerManager->mapSgpr(this, regInitIdx);
244  computeUnit->srf[simdId]->write(physSgprIdx,
245  bits(kernarg_addr, 63, 32));
246  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
247  "Setting KernargSegPtr: s[%d] = %x\n",
249  wfSlotId, wfDynId, physSgprIdx,
250  bits(kernarg_addr, 63, 32));
251 
252  ++regInitIdx;
253  break;
254  case FlatScratchInit:
255  physSgprIdx
256  = computeUnit->registerManager->mapSgpr(this, regInitIdx);
257  computeUnit->srf[simdId]->write(physSgprIdx,
259  .scratch_backing_memory_location & 0xffffffff));
260  ++regInitIdx;
261  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
262  "Setting FlatScratch Addr: s[%d] = %x\n",
264  wfSlotId, wfDynId, physSgprIdx,
266  .scratch_backing_memory_location & 0xffffffff));
267 
268  physSgprIdx =
269  computeUnit->registerManager->mapSgpr(this, regInitIdx);
270  // This vallue should be sizeof(DWORD) aligned, that is
271  // 4 byte aligned
272  computeUnit->srf[simdId]->write(physSgprIdx,
274  ++regInitIdx;
275  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
276  "Setting FlatScratch size: s[%d] = %x\n",
278  wfSlotId, wfDynId, physSgprIdx,
303  hidden_priv_base =
304  (uint64_t)task->amdQueue.scratch_resource_descriptor[0] |
305  (((uint64_t)task->amdQueue.scratch_resource_descriptor[1]
306  & 0x000000000000ffff) << 32);
308  hidden_priv_base,
310  break;
311  case GridWorkgroupCountX:
312  physSgprIdx =
313  computeUnit->registerManager->mapSgpr(this, regInitIdx);
314  wiCount = ((task->gridSize(0) +
315  task->wgSize(0) - 1) /
316  task->wgSize(0));
317  computeUnit->srf[simdId]->write(physSgprIdx, wiCount);
318 
319  ++regInitIdx;
320  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
321  "Setting num WG X: s[%d] = %x\n",
323  wfSlotId, wfDynId, physSgprIdx, wiCount);
324  break;
325  case GridWorkgroupCountY:
326  physSgprIdx =
327  computeUnit->registerManager->mapSgpr(this, regInitIdx);
328  wiCount = ((task->gridSize(1) +
329  task->wgSize(1) - 1) /
330  task->wgSize(1));
331  computeUnit->srf[simdId]->write(physSgprIdx, wiCount);
332 
333  ++regInitIdx;
334  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
335  "Setting num WG Y: s[%d] = %x\n",
337  wfSlotId, wfDynId, physSgprIdx, wiCount);
338  break;
339  case GridWorkgroupCountZ:
340  physSgprIdx =
341  computeUnit->registerManager->mapSgpr(this, regInitIdx);
342  wiCount = ((task->gridSize(2) +
343  task->wgSize(2) - 1) /
344  task->wgSize(2));
345  computeUnit->srf[simdId]->write(physSgprIdx, wiCount);
346 
347  ++regInitIdx;
348  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
349  "Setting num WG Z: s[%d] = %x\n",
351  wfSlotId, wfDynId, physSgprIdx, wiCount);
352  break;
353  case WorkgroupIdX:
354  physSgprIdx =
355  computeUnit->registerManager->mapSgpr(this, regInitIdx);
356  computeUnit->srf[simdId]->write(physSgprIdx,
357  workGroupId[0]);
358 
359  ++regInitIdx;
360  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
361  "Setting WG ID X: s[%d] = %x\n",
363  wfSlotId, wfDynId, physSgprIdx, workGroupId[0]);
364  break;
365  case WorkgroupIdY:
366  physSgprIdx =
367  computeUnit->registerManager->mapSgpr(this, regInitIdx);
368  computeUnit->srf[simdId]->write(physSgprIdx,
369  workGroupId[1]);
370 
371  ++regInitIdx;
372  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
373  "Setting WG ID Y: s[%d] = %x\n",
375  wfSlotId, wfDynId, physSgprIdx, workGroupId[1]);
376  break;
377  case WorkgroupIdZ:
378  physSgprIdx =
379  computeUnit->registerManager->mapSgpr(this, regInitIdx);
380  computeUnit->srf[simdId]->write(physSgprIdx,
381  workGroupId[2]);
382 
383  ++regInitIdx;
384  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
385  "Setting WG ID Z: s[%d] = %x\n",
387  wfSlotId, wfDynId, physSgprIdx, workGroupId[2]);
388  break;
390  physSgprIdx =
391  computeUnit->registerManager->mapSgpr(this, regInitIdx);
405  computeUnit->srf[simdId]->write(physSgprIdx, 1024 *
406  (wgId * (wgSz / 64) + wfId) *
408 
409  ++regInitIdx;
410  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
411  "Setting Private Seg Offset: s[%d] = %x\n",
413  wfSlotId, wfDynId, physSgprIdx,
414  1024 * (wgId * (wgSz / 64) + wfId) *
416  break;
417  case WorkgroupInfo:
418  firstWave = (wfId == 0) ? 1 : 0;
419  numWfsInWg = divCeil(wgSizeInWorkItems,
420  computeUnit->wfSize());
421  finalValue = firstWave << ((sizeof(uint32_t) * 8) - 1);
422  finalValue |= (orderedAppendTerm << 6);
423  finalValue |= numWfsInWg;
424  physSgprIdx =
425  computeUnit->registerManager->mapSgpr(this, regInitIdx);
427  write(physSgprIdx, finalValue);
428 
429  ++regInitIdx;
430  DPRINTF(GPUInitAbi, "CU%d: WF[%d][%d]: wave[%d] "
431  "Setting WG Info: s[%d] = %x\n",
433  wfSlotId, wfDynId, physSgprIdx, finalValue);
434  break;
435  default:
436  fatal("SGPR enable bit %i not supported\n", en_bit);
437  break;
438  }
439  }
440  }
441 
442  regInitIdx = 0;
443 
444  // iterate over all the init fields and check which
445  // bits are enabled
446  for (int en_bit = 0; en_bit < NumVectorInitFields; ++en_bit) {
447  if (task->vgprBitEnabled(en_bit)) {
448  uint32_t physVgprIdx = 0;
450 
451  switch (en_bit) {
452  case WorkitemIdX:
453  {
454  physVgprIdx = computeUnit->registerManager
455  ->mapVgpr(this, regInitIdx);
456  TheGpuISA::VecRegU32 vgpr_x
457  = raw_vgpr.as<TheGpuISA::VecElemU32>();
458 
459  for (int lane = 0; lane < workItemId[0].size(); ++lane) {
460  vgpr_x[lane] = workItemId[0][lane];
461  }
462 
463  computeUnit->vrf[simdId]->write(physVgprIdx, raw_vgpr);
464  rawDist[regInitIdx] = 0;
465  ++regInitIdx;
466  }
467  break;
468  case WorkitemIdY:
469  {
470  physVgprIdx = computeUnit->registerManager
471  ->mapVgpr(this, regInitIdx);
472  TheGpuISA::VecRegU32 vgpr_y
473  = raw_vgpr.as<TheGpuISA::VecElemU32>();
474 
475  for (int lane = 0; lane < workItemId[1].size(); ++lane) {
476  vgpr_y[lane] = workItemId[1][lane];
477  }
478 
479  computeUnit->vrf[simdId]->write(physVgprIdx, raw_vgpr);
480  rawDist[regInitIdx] = 0;
481  ++regInitIdx;
482  }
483  break;
484  case WorkitemIdZ:
485  {
486  physVgprIdx = computeUnit->registerManager->
487  mapVgpr(this, regInitIdx);
488  TheGpuISA::VecRegU32 vgpr_z
489  = raw_vgpr.as<TheGpuISA::VecElemU32>();
490 
491  for (int lane = 0; lane < workItemId[2].size(); ++lane) {
492  vgpr_z[lane] = workItemId[2][lane];
493  }
494 
495  computeUnit->vrf[simdId]->write(physVgprIdx, raw_vgpr);
496  rawDist[regInitIdx] = 0;
497  ++regInitIdx;
498  }
499  break;
500  }
501  }
502  }
503 }
504 
505 void
506 Wavefront::resizeRegFiles(int num_vregs, int num_sregs)
507 {
508  maxVgprs = num_vregs;
509  maxSgprs = num_sregs;
510 }
511 
513 {
514 }
515 
516 void
518 {
519  if (computeUnit->idleCUTimeout > 0) {
520  // Wavefront's status transitions to stalled or stopped
521  if ((newStatus == S_STOPPED || newStatus == S_STALLED ||
522  newStatus == S_WAITCNT || newStatus == S_BARRIER) &&
523  (status != newStatus)) {
524  computeUnit->idleWfs++;
525  assert(computeUnit->idleWfs <=
527  if (computeUnit->idleWfs ==
530  }
531  // Wavefront's status transitions to an active state (from
532  // a stopped or stalled state)
533  } else if ((status == S_STOPPED || status == S_STALLED ||
534  status == S_WAITCNT || status == S_BARRIER) &&
535  (status != newStatus)) {
536  // if all WFs in the CU were idle then check if the idleness
537  // period exceeded the timeout threshold
538  if (computeUnit->idleWfs ==
542  "CU%d has been idle for %d ticks at tick %d",
544  curTick());
545  }
546  computeUnit->idleWfs--;
547  assert(computeUnit->idleWfs >= 0);
548  }
549  }
550  status = newStatus;
551 }
552 
553 void
554 Wavefront::start(uint64_t _wf_dyn_id, Addr init_pc)
555 {
556  wfDynId = _wf_dyn_id;
557  _pc = init_pc;
558 
559  status = S_RUNNING;
560 
561  vecReads.resize(maxVgprs, 0);
562 }
563 
564 bool
566 {
567  if (ii->isGlobalMem() ||
568  (ii->isFlat() && ii->executedAs() == Enums::SC_GLOBAL)) {
569  return true;
570  }
571 
572  return false;
573 }
574 
575 bool
577 {
578  if (ii->isLocalMem() ||
579  (ii->isFlat() && ii->executedAs() == Enums::SC_GROUP)) {
580  return true;
581  }
582 
583  return false;
584 }
585 
586 bool
588 {
589  if (instructionBuffer.empty())
590  return false;
591 
592  GPUDynInstPtr ii = instructionBuffer.front();
593 
594  if (ii->isSleep()) {
595  return true;
596  }
597  return false;
598 }
599 
600 bool
602 {
603  if (instructionBuffer.empty())
604  return false;
605 
606  GPUDynInstPtr ii = instructionBuffer.front();
607 
608  if (ii->isWaitcnt()) {
609  // waitcnt is a scalar
610  assert(ii->isScalar());
611  return true;
612  }
613 
614  return false;
615 }
616 
617 bool
619 {
620  assert(!instructionBuffer.empty());
621  GPUDynInstPtr ii = instructionBuffer.front();
622 
623  if (status != S_STOPPED && ii->isScalar() && (ii->isNop() || ii->isReturn()
624  || ii->isEndOfKernel() || ii->isBranch() || ii->isALU() ||
625  (ii->isKernArgSeg() && ii->isLoad()))) {
626  return true;
627  }
628 
629  return false;
630 }
631 
632 bool
634 {
635  assert(!instructionBuffer.empty());
636  GPUDynInstPtr ii = instructionBuffer.front();
637 
638  if (status != S_STOPPED && !ii->isScalar() && (ii->isNop() ||
639  ii->isReturn() || ii->isBranch() || ii->isALU() || ii->isEndOfKernel()
640  || (ii->isKernArgSeg() && ii->isLoad()))) {
641  return true;
642  }
643 
644  return false;
645 }
646 
647 bool
649 {
650  assert(!instructionBuffer.empty());
651  GPUDynInstPtr ii = instructionBuffer.front();
652 
653  if (status != S_STOPPED && ii->isBarrier()) {
654  return true;
655  }
656 
657  return false;
658 }
659 
660 bool
662 {
663  assert(!instructionBuffer.empty());
664  GPUDynInstPtr ii = instructionBuffer.front();
665 
666  if (status != S_STOPPED && !ii->isScalar() && ii->isGlobalMem()) {
667  return true;
668  }
669 
670  return false;
671 }
672 
673 bool
675 {
676  assert(!instructionBuffer.empty());
677  GPUDynInstPtr ii = instructionBuffer.front();
678 
679  if (status != S_STOPPED && ii->isScalar() && ii->isGlobalMem()) {
680  return true;
681  }
682 
683  return false;
684 }
685 
686 bool
688 {
689  assert(!instructionBuffer.empty());
690  GPUDynInstPtr ii = instructionBuffer.front();
691 
692  if (status != S_STOPPED && ii->isLocalMem()) {
693  return true;
694  }
695 
696  return false;
697 }
698 
699 bool
701 {
702  assert(!instructionBuffer.empty());
703  GPUDynInstPtr ii = instructionBuffer.front();
704 
705  if (status != S_STOPPED && ii->isPrivateSeg()) {
706  return true;
707  }
708 
709  return false;
710 }
711 
712 bool
714 {
715  assert(!instructionBuffer.empty());
716  GPUDynInstPtr ii = instructionBuffer.front();
717 
718  if (status != S_STOPPED && ii->isFlat()) {
719  return true;
720  }
721 
722  return false;
723 }
724 
725 bool
727 {
728  for (auto it : instructionBuffer) {
729  GPUDynInstPtr ii = it;
730  if (ii->isReturn() || ii->isBranch() ||
731  ii->isEndOfKernel()) {
732  return true;
733  }
734  }
735 
736  return false;
737 }
738 
739 void
741 {
742  execUnitId = -1;
743 }
744 
746 {
748  wrLmReqsInPipe < 0 || rdLmReqsInPipe < 0 ||
749  outstandingReqs < 0,
750  "Negative requests in pipe for WF%d for slot%d"
751  " and SIMD%d: Rd GlobalMem Reqs=%d, Wr GlobalMem Reqs=%d,"
752  " Rd LocalMem Reqs=%d, Wr LocalMem Reqs=%d,"
753  " Outstanding Reqs=%d\n",
756 }
757 
758 void
760 {
761  if (!ii->isScalar()) {
762  if (ii->isLoad()) {
763  rdGmReqsInPipe++;
764  } else if (ii->isStore()) {
765  wrGmReqsInPipe++;
766  } else if (ii->isAtomic() || ii->isMemSync()) {
767  rdGmReqsInPipe++;
768  wrGmReqsInPipe++;
769  } else {
770  panic("Invalid memory operation!\n");
771  }
773  } else {
774  if (ii->isLoad()) {
776  } else if (ii->isStore()) {
778  } else if (ii->isAtomic() || ii->isMemSync()) {
781  } else {
782  panic("Invalid memory operation!\n");
783  }
785  }
786 }
787 
788 void
790 {
791  fatal_if(ii->isScalar(),
792  "Scalar instructions can not access Shared memory!!!");
793  if (ii->isLoad()) {
794  rdLmReqsInPipe++;
795  } else if (ii->isStore()) {
796  wrLmReqsInPipe++;
797  } else if (ii->isAtomic() || ii->isMemSync()) {
798  wrLmReqsInPipe++;
799  rdLmReqsInPipe++;
800  } else {
801  panic("Invalid memory operation!\n");
802  }
804 }
805 
808 {
809  // vector of execution unit IDs to return to schedule stage
810  // this return is only used for debugging and an assertion...
811  std::vector<int> execUnitIds;
812 
813  // Get current instruction
814  GPUDynInstPtr ii = instructionBuffer.front();
815  assert(ii);
816 
817  // Single precision ALU or Branch or Return or Special instruction
818  if (ii->isALU() || ii->isSpecialOp() ||
819  ii->isBranch() || ii->isNop() ||
820  (ii->isKernArgSeg() && ii->isLoad()) || ii->isArgSeg() ||
821  ii->isReturn() || ii->isEndOfKernel()) {
822  if (!ii->isScalar()) {
823  execUnitId = simdId;
824  } else {
826  }
827  // this is to enforce a fixed number of cycles per issue slot per SIMD
828  } else if (ii->isBarrier()) {
829  execUnitId = ii->isScalar() ? scalarAluGlobalIdx : simdId;
830  } else if (ii->isFlat()) {
831  assert(!ii->isScalar());
832  reserveLmResource(ii);
833  // add execUnitId, reserved by reserveLmResource, list before it is
834  // overwriten by reserveGmResource
835  execUnitIds.push_back(execUnitId);
837  reserveGmResource(ii);
839  execUnitIds.push_back(flatGmUnitId);
840  execUnitId = -1;
841  } else if (ii->isGlobalMem()) {
842  reserveGmResource(ii);
843  } else if (ii->isLocalMem()) {
844  reserveLmResource(ii);
845  } else if (ii->isPrivateSeg()) {
846  fatal_if(ii->isScalar(),
847  "Scalar instructions can not access Private memory!!!");
848  reserveGmResource(ii);
849  } else {
850  panic("reserveResources -> Couldn't process op!\n");
851  }
852 
853  if (execUnitId != -1) {
854  execUnitIds.push_back(execUnitId);
855  }
856  assert(execUnitIds.size());
857  return execUnitIds;
858 }
859 
860 void
862 {
863  // ---- Exit if wavefront is inactive ----------------------------- //
864 
865  if (status == S_STOPPED || status == S_RETURNING ||
866  status==S_STALLED || instructionBuffer.empty()) {
867  return;
868  }
869 
870  if (status == S_WAITCNT) {
882  assert(isOldestInstWaitcnt());
883  }
884 
885  // Get current instruction
886 
887  GPUDynInstPtr ii = instructionBuffer.front();
888 
889  const Addr old_pc = pc();
890  DPRINTF(GPUExec, "CU%d: WF[%d][%d]: wave[%d] Executing inst: %s "
891  "(pc: %#x; seqNum: %d)\n", computeUnit->cu_id, simdId, wfSlotId,
892  wfDynId, ii->disassemble(), old_pc, ii->seqNum());
893 
894  ii->execute(ii);
895  // delete the dynamic instruction from the pipeline map
897  // update the instruction stats in the CU
899 
900  // inform VRF of instruction execution to schedule write-back
901  // and scoreboard ready for registers
902  if (!ii->isScalar()) {
903  computeUnit->vrf[simdId]->waveExecuteInst(this, ii);
904  }
905  computeUnit->srf[simdId]->waveExecuteInst(this, ii);
906 
907  computeUnit->shader->incVectorInstSrcOperand(ii->numSrcVecOperands());
908  computeUnit->shader->incVectorInstDstOperand(ii->numDstVecOperands());
917 
918  if (lastInstExec) {
921  }
923 
924  // want to track:
925  // number of reads that occur per value written
926 
927  // vector RAW dependency tracking
928  for (int i = 0; i < ii->getNumOperands(); i++) {
929  if (ii->isVectorRegister(i)) {
930  int vgpr = ii->getRegisterIndex(i, ii);
931  int nReg = ii->getOperandSize(i) <= 4 ? 1 :
932  ii->getOperandSize(i) / 4;
933  for (int n = 0; n < nReg; n++) {
934  if (ii->isSrcOperand(i)) {
935  // This check should never fail, but to be safe we check
936  if (rawDist.find(vgpr+n) != rawDist.end()) {
938  stats.numInstrExecuted.value() - rawDist[vgpr+n]);
939  }
940  // increment number of reads to this register
941  vecReads[vgpr+n]++;
942  } else if (ii->isDstOperand(i)) {
943  // rawDist is set on writes, but will not be set
944  // for the first write to each physical register
945  if (rawDist.find(vgpr+n) != rawDist.end()) {
946  // sample the number of reads that were performed
948  }
949  // on a write, reset count of reads to 0
950  vecReads[vgpr+n] = 0;
951 
953  }
954  }
955  }
956  }
957 
958  if (pc() == old_pc) {
959  // PC not modified by instruction, proceed to next
960  _gpuISA.advancePC(ii);
961  instructionBuffer.pop_front();
962  } else {
963  DPRINTF(GPUExec, "CU%d: WF[%d][%d]: wave%d %s taken branch\n",
965  ii->disassemble());
966  discardFetch();
967  }
968  DPRINTF(GPUExec, "CU%d: WF[%d][%d]: wave[%d] (pc: %#x)\n",
970 
972  const int num_active_lanes = execMask().count();
974  computeUnit->stats.numVecOpsExecuted += num_active_lanes;
975 
976  if (ii->isF16() && ii->isALU()) {
977  if (ii->isF32() || ii->isF64()) {
978  fatal("Instruction is tagged as both (1) F16, and (2)"
979  "either F32 or F64.");
980  }
981  computeUnit->stats.numVecOpsExecutedF16 += num_active_lanes;
982  if (ii->isFMA()) {
983  computeUnit->stats.numVecOpsExecutedFMA16 += num_active_lanes;
985  += num_active_lanes;
986  }
987  else if (ii->isMAC()) {
988  computeUnit->stats.numVecOpsExecutedMAC16 += num_active_lanes;
990  += num_active_lanes;
991  }
992  else if (ii->isMAD()) {
993  computeUnit->stats.numVecOpsExecutedMAD16 += num_active_lanes;
995  += num_active_lanes;
996  }
997  }
998  if (ii->isF32() && ii->isALU()) {
999  if (ii->isF16() || ii->isF64()) {
1000  fatal("Instruction is tagged as both (1) F32, and (2)"
1001  "either F16 or F64.");
1002  }
1003  computeUnit->stats.numVecOpsExecutedF32 += num_active_lanes;
1004  if (ii->isFMA()) {
1005  computeUnit->stats.numVecOpsExecutedFMA32 += num_active_lanes;
1007  += num_active_lanes;
1008  }
1009  else if (ii->isMAC()) {
1010  computeUnit->stats.numVecOpsExecutedMAC32 += num_active_lanes;
1012  += num_active_lanes;
1013  }
1014  else if (ii->isMAD()) {
1015  computeUnit->stats.numVecOpsExecutedMAD32 += num_active_lanes;
1017  += num_active_lanes;
1018  }
1019  }
1020  if (ii->isF64() && ii->isALU()) {
1021  if (ii->isF16() || ii->isF32()) {
1022  fatal("Instruction is tagged as both (1) F64, and (2)"
1023  "either F16 or F32.");
1024  }
1025  computeUnit->stats.numVecOpsExecutedF64 += num_active_lanes;
1026  if (ii->isFMA()) {
1027  computeUnit->stats.numVecOpsExecutedFMA64 += num_active_lanes;
1029  += num_active_lanes;
1030  }
1031  else if (ii->isMAC()) {
1032  computeUnit->stats.numVecOpsExecutedMAC64 += num_active_lanes;
1034  += num_active_lanes;
1035  }
1036  else if (ii->isMAD()) {
1037  computeUnit->stats.numVecOpsExecutedMAD64 += num_active_lanes;
1039  += num_active_lanes;
1040  }
1041  }
1042  if (isGmInstruction(ii)) {
1044  num_active_lanes);
1045  } else if (isLmInstruction(ii)) {
1047  num_active_lanes);
1048  }
1049  }
1050 
1055  if (execMask().none() && ii->isFlat()) {
1057  return;
1058  }
1059 
1060  // Update Vector ALU pipeline and other resources
1061  bool flat_as_gm = false;
1062  bool flat_as_lm = false;
1063  if (ii->isFlat()) {
1064  flat_as_gm = (ii->executedAs() == Enums::SC_GLOBAL) ||
1065  (ii->executedAs() == Enums::SC_PRIVATE);
1066  flat_as_lm = (ii->executedAs() == Enums::SC_GROUP);
1067  }
1068 
1069  // Single precision ALU or Branch or Return or Special instruction
1070  // Note, we use the same timing regardless of SP or DP ALU operation.
1071  if (ii->isALU() || ii->isSpecialOp() ||
1072  ii->isBranch() || ii->isNop() ||
1073  (ii->isKernArgSeg() && ii->isLoad()) ||
1074  ii->isArgSeg() || ii->isEndOfKernel() || ii->isReturn()) {
1075  // this is to enforce a fixed number of cycles per issue slot per SIMD
1076  if (!ii->isScalar()) {
1078  cyclesToTicks(computeUnit->issuePeriod));
1079  } else {
1081  cyclesToTicks(computeUnit->issuePeriod));
1082  }
1083  // Barrier on Scalar ALU
1084  } else if (ii->isBarrier()) {
1086  cyclesToTicks(computeUnit->issuePeriod));
1087  // GM or Flat as GM Load
1088  } else if (ii->isLoad() && (ii->isGlobalMem() || flat_as_gm)) {
1089  if (!ii->isScalar()) {
1096  } else {
1098  cyclesToTicks(computeUnit->srf_scm_bus_latency));
1103  }
1104  // GM or Flat as GM Store
1105  } else if (ii->isStore() && (ii->isGlobalMem() || flat_as_gm)) {
1106  if (!ii->isScalar()) {
1108  cyclesToTicks(Cycles(2 * computeUnit->vrf_gm_bus_latency)));
1113  } else {
1115  cyclesToTicks(Cycles(2 * computeUnit->srf_scm_bus_latency)));
1120  }
1121  } else if ((ii->isAtomic() || ii->isMemSync()) &&
1122  (ii->isGlobalMem() || flat_as_gm)) {
1123  if (!ii->isScalar()) {
1125  cyclesToTicks(Cycles(2 * computeUnit->vrf_gm_bus_latency)));
1130  } else {
1132  cyclesToTicks(Cycles(2 * computeUnit->srf_scm_bus_latency)));
1137  }
1138  // LM or Flat as LM Load
1139  } else if (ii->isLoad() && (ii->isLocalMem() || flat_as_lm)) {
1141  cyclesToTicks(computeUnit->vrf_lm_bus_latency));
1146  // LM or Flat as LM Store
1147  } else if (ii->isStore() && (ii->isLocalMem() || flat_as_lm)) {
1149  cyclesToTicks(Cycles(2 * computeUnit->vrf_lm_bus_latency)));
1154  // LM or Flat as LM, Atomic or MemFence
1155  } else if ((ii->isAtomic() || ii->isMemSync()) &&
1156  (ii->isLocalMem() || flat_as_lm)) {
1158  cyclesToTicks(Cycles(2 * computeUnit->vrf_lm_bus_latency)));
1163  } else {
1164  panic("Bad instruction type!\n");
1165  }
1166 }
1167 
1170 {
1171  // Read next instruction from instruction buffer
1172  GPUDynInstPtr ii = instructionBuffer.front();
1173  // if the WF has been dispatched in the schedule stage then
1174  // check the next oldest instruction for readiness
1175  if (computeUnit->pipeMap.find(ii->seqNum()) !=
1176  computeUnit->pipeMap.end()) {
1177  if (instructionBuffer.size() > 1) {
1178  auto it = instructionBuffer.begin() + 1;
1179  return *it;
1180  } else { // No new instructions to check
1181  return nullptr;
1182  }
1183  }
1184  return ii;
1185 }
1186 
1187 void
1189 {
1190  instructionBuffer.clear();
1192 
1198 }
1199 
1200 bool
1202 {
1203  // Both vmWaitCnt && lgkmWaitCnt uninitialized means
1204  // waitCnt instruction has been dispatched but not executed yet: next
1205  // instruction should be blocked until waitCnt is executed.
1206  if (vmWaitCnt == -1 && expWaitCnt == -1 && lgkmWaitCnt == -1) {
1207  return false;
1208  }
1209 
1215  if (vmWaitCnt != -1) {
1216  if (vmemInstsIssued > vmWaitCnt) {
1217  // vmWaitCnt not satisfied
1218  return false;
1219  }
1220  }
1221 
1222  if (expWaitCnt != -1) {
1223  if (expInstsIssued > expWaitCnt) {
1224  // expWaitCnt not satisfied
1225  return false;
1226  }
1227  }
1228 
1229  if (lgkmWaitCnt != -1) {
1230  if (lgkmInstsIssued > lgkmWaitCnt) {
1231  // lgkmWaitCnt not satisfied
1232  return false;
1233  }
1234  }
1235 
1236  // if we get here all outstanding waitcnts must
1237  // be satisfied, so we resume normal operation
1238  clearWaitCnts();
1239 
1240  return true;
1241 }
1242 
1243 bool
1245 {
1246  assert(status == S_STALLED_SLEEP);
1247 
1248  // if the sleep count has not been set, then the sleep instruction has not
1249  // been executed yet, so we will return true without setting the wavefront
1250  // status
1251  if (sleepCnt == 0)
1252  return false;
1253 
1254  sleepCnt--;
1255  if (sleepCnt != 0)
1256  return false;
1257 
1258  status = S_RUNNING;
1259  return true;
1260 }
1261 
1262 void
1264 {
1265  assert(sleepCnt == 0);
1266  sleepCnt = sleep_time;
1267 }
1268 
1269 void
1270 Wavefront::setWaitCnts(int vm_wait_cnt, int exp_wait_cnt, int lgkm_wait_cnt)
1271 {
1272  // the scoreboard should have set the status
1273  // to S_WAITCNT once a waitcnt instruction
1274  // was marked as ready
1275  assert(status == S_WAITCNT);
1276 
1277  // waitcnt instruction shouldn't be sending
1278  // negative counts
1279  assert(vm_wait_cnt >= 0);
1280  assert(exp_wait_cnt >= 0);
1281  assert(lgkm_wait_cnt >= 0);
1282  // waitcnts are a max of 15 because we have
1283  // only 1 nibble (4 bits) to set the counts
1284  assert(vm_wait_cnt <= 0xf);
1285  assert(exp_wait_cnt <= 0x7);
1286  assert(lgkm_wait_cnt <= 0x1f);
1287 
1294  assert(vmWaitCnt == -1);
1295  assert(expWaitCnt == -1);
1296  assert(lgkmWaitCnt == -1);
1297 
1304  if (vm_wait_cnt != 0xf)
1305  vmWaitCnt = vm_wait_cnt;
1306 
1307  if (exp_wait_cnt != 0x7)
1308  expWaitCnt = exp_wait_cnt;
1309 
1310  if (lgkm_wait_cnt != 0x1f)
1311  lgkmWaitCnt = lgkm_wait_cnt;
1312 }
1313 
1314 void
1316 {
1317  // reset the waitcnts back to
1318  // -1, indicating they are no
1319  // longer valid
1320  vmWaitCnt = -1;
1321  expWaitCnt = -1;
1322  lgkmWaitCnt = -1;
1323 
1324  // resume running normally
1325  status = S_RUNNING;
1326 }
1327 
1328 void
1330 {
1331  ++vmemInstsIssued;
1332 }
1333 
1334 void
1336 {
1337  ++expInstsIssued;
1338 }
1339 
1340 void
1342 {
1343  ++lgkmInstsIssued;
1344 }
1345 
1346 void
1348 {
1349  --vmemInstsIssued;
1350 }
1351 
1352 void
1354 {
1355  --expInstsIssued;
1356 }
1357 
1358 void
1360 {
1361  --lgkmInstsIssued;
1362 }
1363 
1364 Addr
1366 {
1367  return _pc;
1368 }
1369 
1370 void
1372 {
1373  _pc = new_pc;
1374 }
1375 
1376 VectorMask&
1378 {
1379  return _execMask;
1380 }
1381 
1382 bool
1383 Wavefront::execMask(int lane) const
1384 {
1385  return _execMask[lane];
1386 }
1387 
1388 void
1390 {
1391  /* clear busy registers */
1392  for (int i=0; i < maxVgprs; i++) {
1393  int vgprIdx = computeUnit->registerManager->mapVgpr(this, i);
1394  computeUnit->vrf[simdId]->markReg(vgprIdx, false);
1395  }
1396 
1397  /* Free registers used by this wavefront */
1398  uint32_t endIndex = (startVgprIndex + reservedVectorRegs - 1) %
1399  computeUnit->vrf[simdId]->numRegs();
1401  freeRegion(startVgprIndex, endIndex);
1402 }
1403 
1404 void
1406 {
1407  actualWgSzTotal = 1;
1408  for (int d = 0; d < HSAQueueEntry::MAX_DIM; ++d) {
1409  actualWgSz[d] = std::min(workGroupSz[d], gridSz[d]
1410  - task->wgId(d) * workGroupSz[d]);
1412  }
1413 }
1414 
1415 void
1417 {
1418  assert(bar_id >= WFBarrier::InvalidID);
1419  assert(bar_id < computeUnit->numBarrierSlots());
1420  barId = bar_id;
1421 }
1422 
1423 int
1425 {
1426  return barId;
1427 }
1428 
1429 bool
1431 {
1432  return barId > WFBarrier::InvalidID;
1433 }
1434 
1435 void
1437 {
1439 }
1440 
1442  : Stats::Group(parent),
1443  ADD_STAT(numInstrExecuted,
1444  "number of instructions executed by this WF slot"),
1445  ADD_STAT(schCycles, "number of cycles spent in schedule stage"),
1446  ADD_STAT(schStalls, "number of cycles WF is stalled in SCH stage"),
1447  ADD_STAT(schRfAccessStalls, "number of cycles wave selected in SCH but "
1448  "RF denied adding instruction"),
1449  ADD_STAT(schResourceStalls, "number of cycles stalled in sch by resource"
1450  " not available"),
1451  ADD_STAT(schOpdNrdyStalls, "number of cycles stalled in sch waiting for "
1452  "RF reads to complete"),
1453  ADD_STAT(schLdsArbStalls,
1454  "number of cycles wave stalled due to LDS-VRF arbitration"),
1455  // FIXME: the name of the WF needs to be unique
1456  ADD_STAT(numTimesBlockedDueWAXDependencies, "number of times the wf's "
1457  "instructions are blocked due to WAW or WAR dependencies"),
1458  // FIXME: the name of the WF needs to be unique
1459  ADD_STAT(numTimesBlockedDueRAWDependencies, "number of times the wf's "
1460  "instructions are blocked due to RAW dependencies"),
1461  ADD_STAT(vecRawDistance,
1462  "Count of RAW distance in dynamic instructions for this WF"),
1463  ADD_STAT(readsPerWrite, "Count of Vector reads per write for this WF")
1464 {
1465  vecRawDistance.init(0, 20, 1);
1466  readsPerWrite.init(0, 4, 1);
1467 }
ComputeUnit::vectorALUs
std::vector< WaitClass > vectorALUs
Definition: compute_unit.hh:244
Wavefront::isOldestInstScalarALU
bool isOldestInstScalarALU()
Definition: wavefront.cc:618
WorkgroupIdX
@ WorkgroupIdX
Definition: kernel_code.hh:65
_amd_queue_s::scratch_resource_descriptor
uint32_t scratch_resource_descriptor[4]
Definition: hsa_queue.hh:80
fatal
#define fatal(...)
This implements a cprintf based fatal() function.
Definition: logging.hh:183
ComputeUnit::vectorSharedMemUnit
WaitClass vectorSharedMemUnit
Definition: compute_unit.hh:232
PrivSegWaveByteOffset
@ PrivSegWaveByteOffset
Definition: kernel_code.hh:69
Wavefront::barId
int barId
Definition: wavefront.hh:329
Wavefront::isOldestInstFlatMem
bool isOldestInstFlatMem()
Definition: wavefront.cc:713
Wavefront::wrGmReqsInPipe
int wrGmReqsInPipe
Definition: wavefront.hh:185
TokenManager::recvTokens
void recvTokens(int num_tokens)
Increment the number of available tokens by num_tokens.
Definition: token_port.cc:154
Wavefront::clearWaitCnts
void clearWaitCnts()
Definition: wavefront.cc:1315
Wavefront::lgkmInstsIssued
int lgkmInstsIssued
Definition: wavefront.hh:324
Wavefront::scalarMem
int scalarMem
Definition: wavefront.hh:126
simple_pool_manager.hh
Wavefront::startVgprIndex
uint32_t startVgprIndex
Definition: wavefront.hh:197
ComputeUnit::deleteFromPipeMap
void deleteFromPipeMap(Wavefront *w)
Definition: compute_unit.cc:505
Wavefront::barrierId
int barrierId() const
Definition: wavefront.cc:1424
ComputeUnit::vrfToGlobalMemPipeBus
WaitClass vrfToGlobalMemPipeBus
Definition: compute_unit.hh:222
ComputeUnit::mapWaveToScalarAluGlobalIdx
int mapWaveToScalarAluGlobalIdx(Wavefront *w) const
Definition: compute_unit.cc:262
ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAC64
Stats::Scalar numVecOpsExecutedMAC64
Definition: compute_unit.hh:1051
_amd_queue_s::scratch_workitem_byte_size
uint32_t scratch_workitem_byte_size
Definition: hsa_queue.hh:83
HSAQueueEntry::hostDispPktAddr
Addr hostDispPktAddr() const
Definition: hsa_queue_entry.hh:164
shader.hh
PrivateSegBuf
@ PrivateSegBuf
Definition: kernel_code.hh:55
HSAQueueEntry::MAX_DIM
const static int MAX_DIM
Definition: hsa_queue_entry.hh:309
Wavefront::resizeRegFiles
void resizeRegFiles(int num_vregs, int num_sregs)
Definition: wavefront.cc:506
Wavefront::vecReads
std::vector< int > vecReads
Definition: wavefront.hh:235
HSAQueueEntry::vgprBitEnabled
bool vgprBitEnabled(int bit) const
Definition: hsa_queue_entry.hh:285
Wavefront::oldVgprTcnt
uint64_t oldVgprTcnt
Definition: wavefront.hh:207
ArmISA::i
Bitfield< 7 > i
Definition: miscregs_types.hh:63
Wavefront::globalMem
int globalMem
Definition: wavefront.hh:124
ComputeUnit::mapWaveToGlobalMem
int mapWaveToGlobalMem(Wavefront *w) const
Definition: compute_unit.cc:269
Gcn3ISA::VecRegU32
::VecRegT< VecElemU32, NumVecElemPerVecReg, false > VecRegU32
Definition: registers.hh:176
ComputeUnit::srf_scm_bus_latency
Cycles srf_scm_bus_latency
Definition: compute_unit.hh:317
Wavefront::_execMask
VectorMask _execMask
Definition: wavefront.hh:328
Shader::initShHiddenPrivateBase
void initShHiddenPrivateBase(Addr queueBase, uint32_t offset)
Definition: shader.hh:172
ComputeUnit::vrf_gm_bus_latency
Cycles vrf_gm_bus_latency
Definition: compute_unit.hh:315
ComputeUnit::ComputeUnitStats::numVecOpsExecutedTwoOpFP
Stats::Scalar numVecOpsExecutedTwoOpFP
Definition: compute_unit.hh:1057
Wavefront::oldVgpr
std::vector< uint32_t > oldVgpr
Definition: wavefront.hh:203
ComputeUnit::mapWaveToScalarMem
int mapWaveToScalarMem(Wavefront *w) const
Definition: compute_unit.cc:285
Wavefront::vmemInstsIssued
int vmemInstsIssued
Definition: wavefront.hh:322
ComputeUnit::mapWaveToLocalMem
int mapWaveToLocalMem(Wavefront *w) const
Definition: compute_unit.cc:277
ComputeUnit::ComputeUnitStats::numVecOpsExecutedF64
Stats::Scalar numVecOpsExecutedF64
Definition: compute_unit.hh:1043
Wavefront::S_RUNNING
@ S_RUNNING
Definition: wavefront.hh:68
WorkitemIdZ
@ WorkitemIdZ
Definition: kernel_code.hh:77
Wavefront::start
void start(uint64_t _wfDynId, uint64_t _base_ptr)
Definition: wavefront.cc:554
HSAQueueEntry::wgSize
int wgSize(int dim) const
Definition: hsa_queue_entry.hh:120
compute_unit.hh
Wavefront::WavefrontStats::vecRawDistance
Stats::Distribution vecRawDistance
Definition: wavefront.hh:370
Wavefront::wgSz
uint32_t wgSz
Definition: wavefront.hh:159
Wavefront::lastAddr
std::vector< Addr > lastAddr
Definition: wavefront.hh:151
NumScalarInitFields
@ NumScalarInitFields
Definition: kernel_code.hh:70
ComputeUnit::ComputeUnitStats::numVecOpsExecutedFMA64
Stats::Scalar numVecOpsExecutedFMA64
Definition: compute_unit.hh:1047
Wavefront::Params
WavefrontParams Params
Definition: wavefront.hh:242
Wavefront::scalarRdGmReqsInPipe
int scalarRdGmReqsInPipe
Definition: wavefront.hh:186
Wavefront::decVMemInstsIssued
void decVMemInstsIssued()
Definition: wavefront.cc:1347
Shader::n_wf
int n_wf
Definition: shader.hh:208
Wavefront::isOldestInstPrivMem
bool isOldestInstPrivMem()
Definition: wavefront.cc:700
ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAD64
Stats::Scalar numVecOpsExecutedMAD64
Definition: compute_unit.hh:1055
RegisterManager::mapSgpr
int mapSgpr(Wavefront *w, int sgprIndex)
Definition: register_manager.cc:101
Wavefront::S_STALLED_SLEEP
@ S_STALLED_SLEEP
Definition: wavefront.hh:72
ComputeUnit::cu_id
int cu_id
Definition: compute_unit.hh:291
Wavefront::isOldestInstScalarMem
bool isOldestInstScalarMem()
Definition: wavefront.cc:674
Wavefront::isOldestInstSleep
bool isOldestInstSleep()
Definition: wavefront.cc:587
ComputeUnit::stats
ComputeUnit::ComputeUnitStats stats
ComputeUnit::vectorGlobalMemUnit
WaitClass vectorGlobalMemUnit
Definition: compute_unit.hh:224
Wavefront::status
status_e status
Definition: wavefront.hh:326
Wavefront::WavefrontStats::numInstrExecuted
Stats::Scalar numInstrExecuted
Definition: wavefront.hh:338
ComputeUnit::registerManager
RegisterManager * registerManager
Definition: compute_unit.hh:277
Wavefront::pc
Addr pc() const
Definition: wavefront.cc:1365
std::vector< int >
Wavefront::reserveGmResource
void reserveGmResource(GPUDynInstPtr ii)
Definition: wavefront.cc:759
QueuePtr
@ QueuePtr
Definition: kernel_code.hh:57
ComputeUnit::vrf_lm_bus_latency
Cycles vrf_lm_bus_latency
Definition: compute_unit.hh:319
Wavefront::scalarWrGmReqsInPipe
int scalarWrGmReqsInPipe
Definition: wavefront.hh:187
KernargSegPtr
@ KernargSegPtr
Definition: kernel_code.hh:58
Wavefront::wfId
uint32_t wfId
Definition: wavefront.hh:165
ComputeUnit::ComputeUnitStats::numVecOpsExecutedF32
Stats::Scalar numVecOpsExecutedF32
Definition: compute_unit.hh:1041
Wavefront::scalarAluGlobalIdx
int scalarAluGlobalIdx
Definition: wavefront.hh:123
Gcn3ISA::VecElemU32
uint32_t VecElemU32
Definition: registers.hh:164
Wavefront::S_BARRIER
@ S_BARRIER
WF is stalled at a barrier.
Definition: wavefront.hh:90
Wavefront::workItemId
std::vector< uint32_t > workItemId[3]
Definition: wavefront.hh:152
Wavefront::dropFetch
bool dropFetch
Definition: wavefront.hh:110
HSAQueueEntry
Definition: hsa_queue_entry.hh:58
WorkgroupIdZ
@ WorkgroupIdZ
Definition: kernel_code.hh:67
HSAQueueEntry::sgprBitEnabled
bool sgprBitEnabled(int bit) const
Definition: hsa_queue_entry.hh:290
Wavefront::stats
Wavefront::WavefrontStats stats
Wavefront::actualWgSz
uint32_t actualWgSz[3]
Definition: wavefront.hh:161
Stats::none
const FlagsType none
Nothing extra to print.
Definition: info.hh:44
Wavefront::incExpInstsIssued
void incExpInstsIssued()
Definition: wavefront.cc:1335
ComputeUnit::ComputeUnitStats::numVecOpsExecutedF16
Stats::Scalar numVecOpsExecutedF16
Definition: compute_unit.hh:1039
Wavefront::scalarOutstandingReqsWrGm
int scalarOutstandingReqsWrGm
Definition: wavefront.hh:181
wavefront.hh
ComputeUnit::ComputeUnitStats::instCyclesLdsPerSimd
Stats::Vector instCyclesLdsPerSimd
Definition: compute_unit.hh:980
ComputeUnit::scalarALUs
std::vector< WaitClass > scalarALUs
Definition: compute_unit.hh:248
Wavefront::sleepCnt
int sleepCnt
Definition: wavefront.hh:325
Wavefront::wfSlotId
const int wfSlotId
Definition: wavefront.hh:94
Wavefront::vmWaitCnt
int vmWaitCnt
the following are used for waitcnt instructions vmWaitCnt: once set, we wait for the oustanding numbe...
Definition: wavefront.hh:319
HSAQueueEntry::amdQueue
_amd_queue_t amdQueue
Keep a copy of the AMD HSA queue because we need info from some of its fields to initialize register ...
Definition: hsa_queue_entry.hh:306
Wavefront::setStatus
void setStatus(status_e newStatus)
Definition: wavefront.cc:517
Wavefront::actualWgSzTotal
uint32_t actualWgSzTotal
Definition: wavefront.hh:162
Wavefront::wrLmReqsInPipe
int wrLmReqsInPipe
Definition: wavefront.hh:184
ArmISA::n
Bitfield< 31 > n
Definition: miscregs_types.hh:450
Wavefront::S_STALLED
@ S_STALLED
Definition: wavefront.hh:70
Wavefront::ldsChunk
LdsChunk * ldsChunk
Definition: wavefront.hh:221
FlatScratchInit
@ FlatScratchInit
Definition: kernel_code.hh:60
FetchUnit::flushBuf
void flushBuf(int wfSlotId)
Definition: fetch_unit.cc:308
Wavefront::outstandingReqs
int outstandingReqs
Definition: wavefront.hh:169
Wavefront::computeUnit
ComputeUnit * computeUnit
Definition: wavefront.hh:104
divCeil
T divCeil(const T &a, const U &b)
Definition: intmath.hh:114
ComputeUnit::srf
std::vector< ScalarRegisterFile * > srf
Definition: compute_unit.hh:296
Wavefront::S_RETURNING
@ S_RETURNING
Definition: wavefront.hh:66
vector_register_file.hh
Clocked::cyclesToTicks
Tick cyclesToTicks(Cycles c) const
Definition: clocked_object.hh:224
Wavefront::discardFetch
void discardFetch()
Definition: wavefront.cc:1188
Wavefront::scalarOutstandingReqsRdGm
int scalarOutstandingReqsRdGm
Definition: wavefront.hh:179
Wavefront::exec
void exec()
Definition: wavefront.cc:861
Shader::hsail_mode
hsail_mode_e hsail_mode
Definition: shader.hh:195
ComputeUnit::ComputeUnitStats::totalCycles
Stats::Scalar totalCycles
Definition: compute_unit.hh:1059
Stats::ScalarBase::value
Counter value() const
Return the current value of this stat as its base type.
Definition: statistics.hh:603
bitfield.hh
Wavefront::isOldestInstVectorALU
bool isOldestInstVectorALU()
Definition: wavefront.cc:633
HSAQueueEntry::hostAMDQueueAddr
Addr hostAMDQueueAddr
Host-side addr of the amd_queue_t on which this task was queued.
Definition: hsa_queue_entry.hh:299
Wavefront::localMem
int localMem
Definition: wavefront.hh:125
Wavefront::isOldestInstWaitcnt
bool isOldestInstWaitcnt()
Definition: wavefront.cc:601
Wavefront::releaseBarrier
void releaseBarrier()
Definition: wavefront.cc:1436
DPRINTF
#define DPRINTF(x,...)
Definition: trace.hh:237
Wavefront::freeResources
void freeResources()
Definition: wavefront.cc:740
Wavefront::setWaitCnts
void setWaitCnts(int vm_wait_cnt, int exp_wait_cnt, int lgkm_wait_cnt)
Definition: wavefront.cc:1270
ADD_STAT
#define ADD_STAT(n,...)
Convenience macro to add a stat to a statistics group.
Definition: group.hh:71
RegisterManager::vrfPoolMgrs
std::vector< PoolManager * > vrfPoolMgrs
Definition: register_manager.hh:79
HSAQueueEntry::wgId
int wgId(int dim) const
Definition: hsa_queue_entry.hh:208
ComputeUnit::idleCUTimeout
Tick idleCUTimeout
Definition: compute_unit.hh:342
ComputeUnit::idleWfs
int idleWfs
Definition: compute_unit.hh:343
ArmISA::d
Bitfield< 9 > d
Definition: miscregs_types.hh:60
Wavefront::startSgprIndex
uint32_t startSgprIndex
Definition: wavefront.hh:200
Wavefront::lastNonIdleTick
Tick lastNonIdleTick
Definition: wavefront.hh:112
ComputeUnit::vrf
std::vector< VectorRegisterFile * > vrf
Definition: compute_unit.hh:294
WaitClass::set
void set(uint64_t i)
Definition: misc.hh:79
ComputeUnit::instExecPerSimd
std::vector< uint64_t > instExecPerSimd
Definition: compute_unit.hh:325
Wavefront::S_WAITCNT
@ S_WAITCNT
wavefront has unsatisfied wait counts
Definition: wavefront.hh:86
ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAC16
Stats::Scalar numVecOpsExecutedMAC16
Definition: compute_unit.hh:1049
Wavefront::freeRegisterFile
void freeRegisterFile()
Freeing VRF space.
Definition: wavefront.cc:1389
scalar_register_file.hh
Wavefront::outstandingReqsRdGm
int outstandingReqsRdGm
Definition: wavefront.hh:175
HSAQueueEntry::gridSize
int gridSize(int dim) const
Definition: hsa_queue_entry.hh:127
gpu_dyn_inst.hh
WFBarrier
WF barrier slots.
Definition: compute_unit.hh:89
Wavefront::sleepDone
bool sleepDone()
Definition: wavefront.cc:1244
Wavefront::flatGmUnitId
int flatGmUnitId
Definition: wavefront.hh:102
GridWorkgroupCountX
@ GridWorkgroupCountX
Definition: kernel_code.hh:62
FetchStage::fetchUnit
FetchUnit & fetchUnit(int simdId)
Definition: fetch_stage.hh:65
ComputeUnit::ComputeUnitStats::controlFlowDivergenceDist
Stats::Distribution controlFlowDivergenceDist
Definition: compute_unit.hh:1065
Wavefront::validateRequestCounters
void validateRequestCounters()
Definition: wavefront.cc:745
Wavefront::expInstsIssued
int expInstsIssued
Definition: wavefront.hh:323
ComputeUnit::vrfToLocalMemPipeBus
WaitClass vrfToLocalMemPipeBus
Definition: compute_unit.hh:230
ComputeUnit::fetchStage
FetchStage fetchStage
Definition: compute_unit.hh:279
Wavefront::isLmInstruction
bool isLmInstruction(GPUDynInstPtr ii)
Definition: wavefront.cc:576
Wavefront::maxSgprs
uint32_t maxSgprs
Definition: wavefront.hh:131
WorkitemIdX
@ WorkitemIdX
Definition: kernel_code.hh:75
NumVectorInitFields
@ NumVectorInitFields
Definition: kernel_code.hh:78
ComputeUnit::scalarMemUnit
WaitClass scalarMemUnit
Definition: compute_unit.hh:240
ComputeUnit::issuePeriod
Cycles issuePeriod
Definition: compute_unit.hh:312
ComputeUnit::ComputeUnitStats::instCyclesVMemPerSimd
Stats::Vector instCyclesVMemPerSimd
Definition: compute_unit.hh:978
Wavefront::isOldestInstLMem
bool isOldestInstLMem()
Definition: wavefront.cc:687
ComputeUnit::lastExecCycle
std::vector< uint64_t > lastExecCycle
Definition: compute_unit.hh:322
Wavefront::simdId
const int simdId
Definition: wavefront.hh:97
ComputeUnit::ComputeUnitStats::numVecOpsExecutedFMA16
Stats::Scalar numVecOpsExecutedFMA16
Definition: compute_unit.hh:1045
ComputeUnit::ComputeUnitStats::activeLanesPerLMemInstrDist
Stats::Distribution activeLanesPerLMemInstrDist
Definition: compute_unit.hh:1067
ComputeUnit::srfToScalarMemPipeBus
WaitClass srfToScalarMemPipeBus
Definition: compute_unit.hh:238
ComputeUnit::ComputeUnitStats::numVecOpsExecutedFMA32
Stats::Scalar numVecOpsExecutedFMA32
Definition: compute_unit.hh:1046
Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition: types.hh:148
Wavefront::lastInstExec
uint64_t lastInstExec
Definition: wavefront.hh:227
Wavefront::isOldestInstGMem
bool isOldestInstGMem()
Definition: wavefront.cc:661
Wavefront::rdLmReqsInPipe
int rdLmReqsInPipe
Definition: wavefront.hh:182
Wavefront::S_STOPPED
@ S_STOPPED
Definition: wavefront.hh:64
Wavefront::lgkmWaitCnt
int lgkmWaitCnt
Definition: wavefront.hh:321
Wavefront::hasBarrier
bool hasBarrier() const
Definition: wavefront.cc:1430
HSAQueueEntry::kernargAddr
Addr kernargAddr() const
Definition: hsa_queue_entry.hh:182
Wavefront::computeActualWgSz
void computeActualWgSz(HSAQueueEntry *task)
Definition: wavefront.cc:1405
Wavefront::nextInstr
GPUDynInstPtr nextInstr()
Definition: wavefront.cc:1169
Wavefront::rawDist
std::unordered_map< int, uint64_t > rawDist
Definition: wavefront.hh:231
Wavefront::decLGKMInstsIssued
void decLGKMInstsIssued()
Definition: wavefront.cc:1359
Wavefront::decExpInstsIssued
void decExpInstsIssued()
Definition: wavefront.cc:1353
Shader::incVectorInstDstOperand
void incVectorInstDstOperand(int num_operands)
Definition: shader.hh:284
Wavefront::pendingFetch
bool pendingFetch
Definition: wavefront.hh:109
Wavefront::outstandingReqsRdLm
int outstandingReqsRdLm
Definition: wavefront.hh:177
Wavefront::waitCntsSatisfied
bool waitCntsSatisfied()
Definition: wavefront.cc:1201
ComputeUnit::getTokenManager
TokenManager * getTokenManager()
Definition: compute_unit.hh:836
Wavefront::Wavefront
Wavefront(const Params &p)
Definition: wavefront.cc:47
Wavefront::execUnitId
int execUnitId
Definition: wavefront.hh:100
panic_if
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
Definition: logging.hh:197
Wavefront::isGmInstruction
bool isGmInstruction(GPUDynInstPtr ii)
Definition: wavefront.cc:565
Wavefront::reserveLmResource
void reserveLmResource(GPUDynInstPtr ii)
Definition: wavefront.cc:789
Wavefront::memTraceBusy
int memTraceBusy
Definition: wavefront.hh:189
_amd_queue_s::scratch_backing_memory_location
uint64_t scratch_backing_memory_location
Definition: hsa_queue.hh:81
Wavefront::isOldestInstBarrier
bool isOldestInstBarrier()
Definition: wavefront.cc:648
Wavefront::WavefrontStats::readsPerWrite
Stats::Distribution readsPerWrite
Definition: wavefront.hh:374
WorkitemIdY
@ WorkitemIdY
Definition: kernel_code.hh:76
ComputeUnit::updateInstStats
void updateInstStats(GPUDynInstPtr gpuDynInst)
Definition: compute_unit.cc:1793
Stats::Distribution::init
Distribution & init(Counter min, Counter max, Counter bkt)
Set the parameters of this distribution.
Definition: statistics.hh:2113
Wavefront::_pc
Addr _pc
Definition: wavefront.hh:327
Shader::incVectorInstSrcOperand
void incVectorInstSrcOperand(int num_operands)
Definition: shader.hh:278
Shader::SIMT
@ SIMT
Definition: shader.hh:103
ComputeUnit::ComputeUnitStats::activeLanesPerGMemInstrDist
Stats::Distribution activeLanesPerGMemInstrDist
Definition: compute_unit.hh:1066
Wavefront::initRegState
void initRegState(HSAQueueEntry *task, int wgSizeInWorkItems)
Definition: wavefront.cc:116
Stats::Group
Statistics container.
Definition: group.hh:87
Wavefront::execMask
VectorMask & execMask()
Definition: wavefront.cc:1377
Wavefront::wgId
uint32_t wgId
Definition: wavefront.hh:158
ComputeUnit::wfSize
int wfSize() const
Definition: compute_unit.hh:393
GPUDynInstPtr
std::shared_ptr< GPUDynInst > GPUDynInstPtr
Definition: misc.hh:48
Wavefront::workGroupId
uint32_t workGroupId[3]
Definition: wavefront.hh:155
Stats::DistBase::sample
void sample(const U &v, int n=1)
Add a value to the distribtion n times.
Definition: statistics.hh:1323
Cycles
Cycles is a wrapper class for representing cycle counts, i.e.
Definition: types.hh:79
Gcn3ISA::ScalarRegU32
uint32_t ScalarRegU32
Definition: registers.hh:152
WorkgroupIdY
@ WorkgroupIdY
Definition: kernel_code.hh:66
_amd_queue_s::compute_tmpring_size_wavesize
uint32_t compute_tmpring_size_wavesize
Definition: hsa_queue.hh:78
Wavefront::init
virtual void init()
init() is called after all C++ SimObjects have been created and all ports are connected.
Definition: wavefront.cc:101
Wavefront::instructionBuffer
std::deque< GPUDynInstPtr > instructionBuffer
Definition: wavefront.hh:107
bits
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
Definition: bitfield.hh:73
RegisterManager::mapVgpr
int mapVgpr(Wavefront *w, int vgprIndex)
Definition: register_manager.cc:94
Wavefront::~Wavefront
~Wavefront()
Definition: wavefront.cc:512
Stats
Definition: statistics.cc:53
Wavefront::oldDgprTcnt
uint64_t oldDgprTcnt
Definition: wavefront.hh:214
ComputeUnit::ComputeUnitStats::execRateDist
Stats::Distribution execRateDist
Definition: compute_unit.hh:1035
Wavefront::setSleepTime
void setSleepTime(int sleep_time)
Definition: wavefront.cc:1263
ComputeUnit::ComputeUnitStats::instCyclesScMemPerSimd
Stats::Vector instCyclesScMemPerSimd
Definition: compute_unit.hh:979
Wavefront::expWaitCnt
int expWaitCnt
Definition: wavefront.hh:320
curTick
Tick curTick()
The universal simulation clock.
Definition: cur_tick.hh:43
Wavefront::incVMemInstsIssued
void incVMemInstsIssued()
Definition: wavefront.cc:1329
Wavefront::outstandingReqsWrLm
int outstandingReqsWrLm
Definition: wavefront.hh:173
Wavefront::_gpuISA
TheGpuISA::GPUISA _gpuISA
Definition: wavefront.hh:298
Gcn3ISA::VecRegContainerU32
VecRegU32::Container VecRegContainerU32
Definition: registers.hh:196
Wavefront::scalarAlu
int scalarAlu
Definition: wavefront.hh:119
Wavefront::workItemFlatId
std::vector< uint32_t > workItemFlatId
Definition: wavefront.hh:153
Wavefront::reservedVectorRegs
int reservedVectorRegs
Definition: wavefront.hh:192
ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAD16
Stats::Scalar numVecOpsExecutedMAD16
Definition: compute_unit.hh:1053
MipsISA::p
Bitfield< 0 > p
Definition: pra_constants.hh:323
Wavefront::rdGmReqsInPipe
int rdGmReqsInPipe
Definition: wavefront.hh:183
Wavefront::flatLmUnitId
int flatLmUnitId
Definition: wavefront.hh:101
Wavefront::oldDgpr
std::vector< uint64_t > oldDgpr
Definition: wavefront.hh:210
GridWorkgroupCountY
@ GridWorkgroupCountY
Definition: kernel_code.hh:63
VectorMask
std::bitset< std::numeric_limits< unsigned long long >::digits > VectorMask
Definition: misc.hh:44
Wavefront::stopFetch
bool stopFetch()
Definition: wavefront.cc:726
Wavefront::WavefrontStats::WavefrontStats
WavefrontStats(Stats::Group *parent)
Definition: wavefront.cc:1441
Wavefront::workGroupSz
uint32_t workGroupSz[3]
Definition: wavefront.hh:156
ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAC32
Stats::Scalar numVecOpsExecutedMAC32
Definition: compute_unit.hh:1050
fatal_if
#define fatal_if(cond,...)
Conditional fatal macro that checks the supplied condition and only causes a fatal error if the condi...
Definition: logging.hh:219
ComputeUnit::ComputeUnitStats::numVecOpsExecuted
Stats::Scalar numVecOpsExecuted
Definition: compute_unit.hh:1037
ComputeUnit::ComputeUnitStats::numVecOpsExecutedMAD32
Stats::Scalar numVecOpsExecutedMAD32
Definition: compute_unit.hh:1054
Wavefront::reservedScalarRegs
int reservedScalarRegs
Definition: wavefront.hh:194
ComputeUnit::pipeMap
std::unordered_set< uint64_t > pipeMap
Definition: compute_unit.hh:275
ComputeUnit::ComputeUnitStats::numInstrExecuted
Stats::Scalar numInstrExecuted
Definition: compute_unit.hh:1032
ComputeUnit::ComputeUnitStats::instInterleave
Stats::VectorDistribution instInterleave
Definition: compute_unit.hh:1087
ComputeUnit::mapWaveToScalarAlu
int mapWaveToScalarAlu(Wavefront *w) const
Definition: compute_unit.cc:251
GridWorkgroupCountZ
@ GridWorkgroupCountZ
Definition: kernel_code.hh:64
ComputeUnit::shader
Shader * shader
Definition: compute_unit.hh:352
WFBarrier::InvalidID
static const int InvalidID
Definition: compute_unit.hh:96
Wavefront::status_e
status_e
Definition: wavefront.hh:62
Wavefront::gridSz
uint32_t gridSz[3]
Definition: wavefront.hh:157
Wavefront::lastTrace
uint64_t lastTrace
Definition: wavefront.hh:190
Wavefront::outstandingReqsWrGm
int outstandingReqsWrGm
Definition: wavefront.hh:171
Wavefront::wfDynId
uint64_t wfDynId
Definition: wavefront.hh:224
Wavefront::reserveResources
std::vector< int > reserveResources()
Definition: wavefront.cc:807
Wavefront::maxVgprs
uint32_t maxVgprs
Definition: wavefront.hh:129
panic
#define panic(...)
This implements a cprintf based panic() function.
Definition: logging.hh:171
Wavefront::incLGKMInstsIssued
void incLGKMInstsIssued()
Definition: wavefront.cc:1341
ComputeUnit::numVectorALUs
int numVectorALUs
Definition: compute_unit.hh:243
WorkgroupInfo
@ WorkgroupInfo
Definition: kernel_code.hh:68
DispatchPtr
@ DispatchPtr
Definition: kernel_code.hh:56
SimObject
Abstract superclass for simulation objects.
Definition: sim_object.hh:141

Generated on Tue Mar 23 2021 19:41:27 for gem5 by doxygen 1.8.17