gem5  v21.0.1.0
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
operand.hh
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2017-2018 Advanced Micro Devices, Inc.
3  * All rights reserved.
4  *
5  * For use for simulation and test purposes only
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions are met:
9  *
10  * 1. Redistributions of source code must retain the above copyright notice,
11  * this list of conditions and the following disclaimer.
12  *
13  * 2. Redistributions in binary form must reproduce the above copyright notice,
14  * this list of conditions and the following disclaimer in the documentation
15  * and/or other materials provided with the distribution.
16  *
17  * 3. Neither the name of the copyright holder nor the names of its
18  * contributors may be used to endorse or promote products derived from this
19  * software without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31  * POSSIBILITY OF SUCH DAMAGE.
32  */
33 
34 #ifndef __ARCH_GCN3_OPERAND_HH__
35 #define __ARCH_GCN3_OPERAND_HH__
36 
37 #include <array>
38 
39 #include "arch/gcn3/registers.hh"
40 #include "arch/generic/vec_reg.hh"
43 #include "gpu-compute/wavefront.hh"
44 
51 namespace Gcn3ISA
52 {
58  template<typename T> struct OpTraits { typedef float FloatT; };
59  template<> struct OpTraits<ScalarRegF64> { typedef double FloatT; };
60  template<> struct OpTraits<ScalarRegU64> { typedef double FloatT; };
61 
62  class Operand
63  {
64  public:
65  Operand() = delete;
66 
67  Operand(GPUDynInstPtr gpuDynInst, int opIdx)
68  : _gpuDynInst(gpuDynInst), _opIdx(opIdx)
69  {
70  assert(_gpuDynInst);
71  assert(_opIdx >= 0);
72  }
73 
78  virtual void read() = 0;
79  virtual void write() = 0;
80 
81  protected:
92  int _opIdx;
93  };
94 
95  template<typename DataType, bool Const, size_t NumDwords>
97 
98  template<typename DataType, bool Const,
99  size_t NumDwords = sizeof(DataType) / sizeof(VecElemU32)>
100  class VecOperand final : public Operand
101  {
102  static_assert(NumDwords >= 1 && NumDwords <= MaxOperandDwords,
103  "Incorrect number of DWORDS for GCN3 operand.");
104 
105  public:
106  VecOperand() = delete;
107 
108  VecOperand(GPUDynInstPtr gpuDynInst, int opIdx)
109  : Operand(gpuDynInst, opIdx), scalar(false), absMod(false),
110  negMod(false), scRegData(gpuDynInst, _opIdx),
111  vrfData{{ nullptr }}
112  {
113  vecReg.zero();
114  }
115 
117  {
118  }
119 
128  void
130  {
131  if (isVectorReg(_opIdx)) {
133  ->reservedScalarRegs);
134  read();
135  } else {
136  readScalar();
137  }
138  }
139 
144  void
145  read() override
146  {
147  assert(_gpuDynInst);
148  assert(_gpuDynInst->wavefront());
149  assert(_gpuDynInst->computeUnit());
150  Wavefront *wf = _gpuDynInst->wavefront();
151  ComputeUnit *cu = _gpuDynInst->computeUnit();
152 
153  for (auto i = 0; i < NumDwords; ++i) {
154  int vgprIdx = cu->registerManager->mapVgpr(wf, _opIdx + i);
155  vrfData[i] = &cu->vrf[wf->simdId]->readWriteable(vgprIdx);
156 
157  DPRINTF(GPUVRF, "Read v[%d]\n", vgprIdx);
158  cu->vrf[wf->simdId]->printReg(wf, vgprIdx);
159  }
160 
161  if (NumDwords == 1) {
162  assert(vrfData[0]);
163  auto vgpr = vecReg.template as<DataType>();
164  auto reg_file_vgpr = vrfData[0]->template as<VecElemU32>();
165  for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
166  std::memcpy((void*)&vgpr[lane],
167  (void*)&reg_file_vgpr[lane], sizeof(DataType));
168  }
169  } else if (NumDwords == 2) {
170  assert(vrfData[0]);
171  assert(vrfData[1]);
172  auto vgpr = vecReg.template as<VecElemU64>();
173  auto reg_file_vgpr0 = vrfData[0]->template as<VecElemU32>();
174  auto reg_file_vgpr1 = vrfData[1]->template as<VecElemU32>();
175 
176  for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
177  VecElemU64 tmp_val(0);
178  ((VecElemU32*)&tmp_val)[0] = reg_file_vgpr0[lane];
179  ((VecElemU32*)&tmp_val)[1] = reg_file_vgpr1[lane];
180  vgpr[lane] = tmp_val;
181  }
182  }
183  }
184 
196  void
197  write() override
198  {
199  assert(_gpuDynInst);
200  assert(_gpuDynInst->wavefront());
201  assert(_gpuDynInst->computeUnit());
202  Wavefront *wf = _gpuDynInst->wavefront();
203  ComputeUnit *cu = _gpuDynInst->computeUnit();
204  VectorMask &exec_mask = _gpuDynInst->isLoad()
205  ? _gpuDynInst->exec_mask : wf->execMask();
206 
207  if (NumDwords == 1) {
208  int vgprIdx = cu->registerManager->mapVgpr(wf, _opIdx);
209  vrfData[0] = &cu->vrf[wf->simdId]->readWriteable(vgprIdx);
210  assert(vrfData[0]);
211  auto reg_file_vgpr = vrfData[0]->template as<VecElemU32>();
212  auto vgpr = vecReg.template as<DataType>();
213 
214  for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
215  if (exec_mask[lane] || _gpuDynInst->ignoreExec()) {
216  std::memcpy((void*)&reg_file_vgpr[lane],
217  (void*)&vgpr[lane], sizeof(DataType));
218  }
219  }
220 
221  DPRINTF(GPUVRF, "Write v[%d]\n", vgprIdx);
222  cu->vrf[wf->simdId]->printReg(wf, vgprIdx);
223  } else if (NumDwords == 2) {
224  int vgprIdx0 = cu->registerManager->mapVgpr(wf, _opIdx);
225  int vgprIdx1 = cu->registerManager->mapVgpr(wf, _opIdx + 1);
226  vrfData[0] = &cu->vrf[wf->simdId]->readWriteable(vgprIdx0);
227  vrfData[1] = &cu->vrf[wf->simdId]->readWriteable(vgprIdx1);
228  assert(vrfData[0]);
229  assert(vrfData[1]);
230  auto reg_file_vgpr0 = vrfData[0]->template as<VecElemU32>();
231  auto reg_file_vgpr1 = vrfData[1]->template as<VecElemU32>();
232  auto vgpr = vecReg.template as<VecElemU64>();
233 
234  for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
235  if (exec_mask[lane] || _gpuDynInst->ignoreExec()) {
236  reg_file_vgpr0[lane] = ((VecElemU32*)&vgpr[lane])[0];
237  reg_file_vgpr1[lane] = ((VecElemU32*)&vgpr[lane])[1];
238  }
239  }
240 
241  DPRINTF(GPUVRF, "Write v[%d:%d]\n", vgprIdx0, vgprIdx1);
242  cu->vrf[wf->simdId]->printReg(wf, vgprIdx0);
243  cu->vrf[wf->simdId]->printReg(wf, vgprIdx1);
244  }
245  }
246 
247  void
249  {
250  negMod = true;
251  }
252 
253  void
255  {
256  absMod = true;
257  }
258 
264  template<bool Condition = (NumDwords == 1 || NumDwords == 2) && Const>
265  typename std::enable_if_t<Condition, const DataType>
266  operator[](size_t idx) const
267  {
268  assert(idx < NumVecElemPerVecReg);
269 
270  if (scalar) {
271  DataType ret_val = scRegData.rawData();
272 
273  if (absMod) {
274  assert(std::is_floating_point<DataType>::value);
275  ret_val = std::fabs(ret_val);
276  }
277 
278  if (negMod) {
279  assert(std::is_floating_point<DataType>::value);
280  ret_val = -ret_val;
281  }
282 
283  return ret_val;
284  } else {
285  auto vgpr = vecReg.template as<DataType>();
286  DataType ret_val = vgpr[idx];
287 
288  if (absMod) {
289  assert(std::is_floating_point<DataType>::value);
290  ret_val = std::fabs(ret_val);
291  }
292 
293  if (negMod) {
294  assert(std::is_floating_point<DataType>::value);
295  ret_val = -ret_val;
296  }
297 
298  return ret_val;
299  }
300  }
301 
307  template<bool Condition = (NumDwords == 1 || NumDwords == 2) && !Const>
308  typename std::enable_if_t<Condition, DataType&>
309  operator[](size_t idx)
310  {
311  assert(!scalar);
312  assert(idx < NumVecElemPerVecReg);
313 
314  return vecReg.template as<DataType>()[idx];
315  }
316 
317  private:
322  void
324  {
325  scalar = true;
326  scRegData.read();
327  }
328 
329  using VecRegCont = typename std::conditional<NumDwords == 2,
330  VecRegContainerU64, typename std::conditional<sizeof(DataType)
331  == sizeof(VecElemU16), VecRegContainerU16,
332  typename std::conditional<sizeof(DataType)
333  == sizeof(VecElemU8), VecRegContainerU8,
335 
339  bool scalar;
346  bool absMod;
347  bool negMod;
363  std::array<VecRegContainerU32*, NumDwords> vrfData;
364  };
365 
366  template<typename DataType, bool Const,
367  size_t NumDwords = sizeof(DataType) / sizeof(ScalarRegU32)>
368  class ScalarOperand final : public Operand
369  {
370  static_assert(NumDwords >= 1 && NumDwords <= MaxOperandDwords,
371  "Incorrect number of DWORDS for GCN3 operand.");
372  public:
373  ScalarOperand() = delete;
374 
375  ScalarOperand(GPUDynInstPtr gpuDynInst, int opIdx)
376  : Operand(gpuDynInst, opIdx)
377  {
378  std::memset(srfData.data(), 0, NumDwords * sizeof(ScalarRegU32));
379  }
380 
382  {
383  }
384 
392  template<bool Condition = NumDwords == 1 || NumDwords == 2>
393  typename std::enable_if_t<Condition, DataType>
394  rawData() const
395  {
396  assert(sizeof(DataType) <= sizeof(srfData));
397  DataType raw_data((DataType)0);
398  std::memcpy((void*)&raw_data, (void*)srfData.data(),
399  sizeof(DataType));
400 
401  return raw_data;
402  }
403 
404  void*
406  {
407  return (void*)srfData.data();
408  }
409 
410  void
411  read() override
412  {
413  Wavefront *wf = _gpuDynInst->wavefront();
414  ComputeUnit *cu = _gpuDynInst->computeUnit();
415 
416  if (!isScalarReg(_opIdx)) {
417  readSpecialVal();
418  } else {
419  for (auto i = 0; i < NumDwords; ++i) {
420  int sgprIdx = regIdx(i);
421  srfData[i] = cu->srf[wf->simdId]->read(sgprIdx);
422  DPRINTF(GPUSRF, "Read s[%d]\n", sgprIdx);
423  cu->srf[wf->simdId]->printReg(wf, sgprIdx);
424  }
425  }
426  }
427 
428  void
429  write() override
430  {
431  Wavefront *wf = _gpuDynInst->wavefront();
432  ComputeUnit *cu = _gpuDynInst->computeUnit();
433 
434  if (!isScalarReg(_opIdx)) {
435  if (_opIdx == REG_EXEC_LO) {
436  ScalarRegU64 new_exec_mask_val
437  = wf->execMask().to_ullong();
438  if (NumDwords == 1) {
439  std::memcpy((void*)&new_exec_mask_val,
440  (void*)srfData.data(), sizeof(VecElemU32));
441  } else if (NumDwords == 2) {
442  std::memcpy((void*)&new_exec_mask_val,
443  (void*)srfData.data(), sizeof(VecElemU64));
444  } else {
445  panic("Trying to write more than 2 DWORDS to EXEC\n");
446  }
447  VectorMask new_exec_mask(new_exec_mask_val);
448  wf->execMask() = new_exec_mask;
449  DPRINTF(GPUSRF, "Write EXEC\n");
450  DPRINTF(GPUSRF, "EXEC = %#x\n", new_exec_mask_val);
451  } else if (_opIdx == REG_EXEC_HI) {
456  assert(NumDwords == 1);
457  ScalarRegU32 new_exec_mask_hi_val(0);
458  ScalarRegU64 new_exec_mask_val
459  = wf->execMask().to_ullong();
460  std::memcpy((void*)&new_exec_mask_hi_val,
461  (void*)srfData.data(), sizeof(new_exec_mask_hi_val));
462  replaceBits(new_exec_mask_val, 63, 32,
463  new_exec_mask_hi_val);
464  VectorMask new_exec_mask(new_exec_mask_val);
465  wf->execMask() = new_exec_mask;
466  DPRINTF(GPUSRF, "Write EXEC\n");
467  DPRINTF(GPUSRF, "EXEC = %#x\n", new_exec_mask_val);
468  } else {
469  _gpuDynInst->writeMiscReg(_opIdx, srfData[0]);
470  }
471  } else {
472  for (auto i = 0; i < NumDwords; ++i) {
473  int sgprIdx = regIdx(i);
474  auto &sgpr = cu->srf[wf->simdId]->readWriteable(sgprIdx);
475  if (_gpuDynInst->isLoad()) {
476  assert(sizeof(DataType) <= sizeof(ScalarRegU64));
477  sgpr = reinterpret_cast<ScalarRegU32*>(
478  _gpuDynInst->scalar_data)[i];
479  } else {
480  sgpr = srfData[i];
481  }
482  DPRINTF(GPUSRF, "Write s[%d]\n", sgprIdx);
483  cu->srf[wf->simdId]->printReg(wf, sgprIdx);
484  }
485  }
486  }
487 
491  template<bool Condition = NumDwords == 1 || NumDwords == 2>
492  typename std::enable_if_t<Condition, void>
493  setBit(int bit, int bit_val)
494  {
495  DataType &sgpr = *((DataType*)srfData.data());
496  replaceBits(sgpr, bit, bit_val);
497  }
498 
499  template<bool Condition = (NumDwords == 1 || NumDwords == 2) && !Const>
500  typename std::enable_if_t<Condition, ScalarOperand&>
501  operator=(DataType rhs)
502  {
503  std::memcpy((void*)srfData.data(), (void*)&rhs, sizeof(DataType));
504  return *this;
505  }
506 
507  private:
514  void
516  {
517  assert(NumDwords == 1 || NumDwords == 2);
518 
519  switch(_opIdx) {
520  case REG_EXEC_LO:
521  {
522  if (NumDwords == 1) {
523  ScalarRegU32 exec_mask = _gpuDynInst->wavefront()->
524  execMask().to_ulong();
525  std::memcpy((void*)srfData.data(), (void*)&exec_mask,
526  sizeof(exec_mask));
527  DPRINTF(GPUSRF, "Read EXEC\n");
528  DPRINTF(GPUSRF, "EXEC = %#x\n", exec_mask);
529  } else {
530  assert(NumDwords == 2);
531  ScalarRegU64 exec_mask = _gpuDynInst->wavefront()->
532  execMask().to_ullong();
533  std::memcpy((void*)srfData.data(), (void*)&exec_mask,
534  sizeof(exec_mask));
535  DPRINTF(GPUSRF, "Read EXEC\n");
536  DPRINTF(GPUSRF, "EXEC = %#x\n", exec_mask);
537  }
538  }
539  break;
540  case REG_EXEC_HI:
541  {
546  assert(NumDwords == 1);
547  ScalarRegU64 exec_mask = _gpuDynInst->wavefront()
548  ->execMask().to_ullong();
549 
550  ScalarRegU32 exec_mask_hi = bits(exec_mask, 63, 32);
551  std::memcpy((void*)srfData.data(), (void*)&exec_mask_hi,
552  sizeof(exec_mask_hi));
553  DPRINTF(GPUSRF, "Read EXEC_HI\n");
554  DPRINTF(GPUSRF, "EXEC_HI = %#x\n", exec_mask_hi);
555  }
556  break;
557  case REG_SRC_SWDA:
558  case REG_SRC_DPP:
559  case REG_SRC_LITERAL:
560  assert(NumDwords == 1);
561  srfData[0] = _gpuDynInst->srcLiteral();
562  break;
563  case REG_POS_HALF:
564  {
565  typename OpTraits<DataType>::FloatT pos_half = 0.5;
566  std::memcpy((void*)srfData.data(), (void*)&pos_half,
567  sizeof(pos_half));
568 
569  }
570  break;
571  case REG_NEG_HALF:
572  {
573  typename OpTraits<DataType>::FloatT neg_half = -0.5;
574  std::memcpy((void*)srfData.data(), (void*)&neg_half,
575  sizeof(neg_half));
576  }
577  break;
578  case REG_POS_ONE:
579  {
580  typename OpTraits<DataType>::FloatT pos_one = 1.0;
581  std::memcpy(srfData.data(), &pos_one, sizeof(pos_one));
582  }
583  break;
584  case REG_NEG_ONE:
585  {
586  typename OpTraits<DataType>::FloatT neg_one = -1.0;
587  std::memcpy(srfData.data(), &neg_one, sizeof(neg_one));
588  }
589  break;
590  case REG_POS_TWO:
591  {
592  typename OpTraits<DataType>::FloatT pos_two = 2.0;
593  std::memcpy(srfData.data(), &pos_two, sizeof(pos_two));
594  }
595  break;
596  case REG_NEG_TWO:
597  {
598  typename OpTraits<DataType>::FloatT neg_two = -2.0;
599  std::memcpy(srfData.data(), &neg_two, sizeof(neg_two));
600  }
601  break;
602  case REG_POS_FOUR:
603  {
604  typename OpTraits<DataType>::FloatT pos_four = 4.0;
605  std::memcpy(srfData.data(), &pos_four, sizeof(pos_four));
606  }
607  break;
608  case REG_NEG_FOUR:
609  {
610  typename OpTraits<DataType>::FloatT neg_four = -4.0;
611  std::memcpy((void*)srfData.data(), (void*)&neg_four ,
612  sizeof(neg_four));
613  }
614  break;
615  case REG_PI:
616  {
617  assert(sizeof(DataType) == sizeof(ScalarRegF64)
618  || sizeof(DataType) == sizeof(ScalarRegF32));
619 
620  const ScalarRegU32 pi_u32(0x3e22f983UL);
621  const ScalarRegU64 pi_u64(0x3fc45f306dc9c882ULL);
622 
623  if (sizeof(DataType) == sizeof(ScalarRegF64)) {
624  std::memcpy((void*)srfData.data(),
625  (void*)&pi_u64, sizeof(pi_u64));
626  } else {
627  std::memcpy((void*)srfData.data(),
628  (void*)&pi_u32, sizeof(pi_u32));
629  }
630  }
631  break;
632  default:
633  {
634  assert(sizeof(DataType) <= sizeof(srfData));
635  DataType misc_val(0);
636  if (isConstVal(_opIdx)) {
637  misc_val = (DataType)_gpuDynInst
638  ->readConstVal<DataType>(_opIdx);
639  } else {
640  misc_val = (DataType)_gpuDynInst->readMiscReg(_opIdx);
641  }
642  std::memcpy((void*)srfData.data(), (void*)&misc_val,
643  sizeof(DataType));
644  }
645  }
646  }
647 
653  int
654  regIdx(int dword) const
655  {
656  Wavefront *wf = _gpuDynInst->wavefront();
657  ComputeUnit *cu = _gpuDynInst->computeUnit();
658  int sgprIdx(-1);
659 
660  if (_opIdx == REG_VCC_LO) {
661  sgprIdx = cu->registerManager
662  ->mapSgpr(wf, wf->reservedScalarRegs - 2 + dword);
663  } else if (_opIdx == REG_FLAT_SCRATCH_HI) {
664  sgprIdx = cu->registerManager
665  ->mapSgpr(wf, wf->reservedScalarRegs - 3 + dword);
666  } else if (_opIdx == REG_FLAT_SCRATCH_LO) {
667  assert(NumDwords == 1);
668  sgprIdx = cu->registerManager
669  ->mapSgpr(wf, wf->reservedScalarRegs - 4 + dword);
670  } else {
671  sgprIdx = cu->registerManager->mapSgpr(wf, _opIdx + dword);
672  }
673 
674  assert(sgprIdx > -1);
675 
676  return sgprIdx;
677  }
678 
687  std::array<ScalarRegU32, NumDwords> srfData;
688  };
689 
690  // typedefs for the various sizes/types of scalar operands
704  // non-writeable versions of scalar operands
718  // typedefs for the various sizes/types of vector operands
733  // non-writeable versions of vector operands
748 }
749 
750 #endif // __ARCH_GCN3_OPERAND_HH__
Gcn3ISA::Operand::read
virtual void read()=0
read from and write to the underlying register(s) that this operand is referring to.
Gcn3ISA::OpTraits< ScalarRegU64 >::FloatT
double FloatT
Definition: operand.hh:60
Gcn3ISA::Operand
Definition: operand.hh:62
Gcn3ISA::VecElemU16
uint16_t VecElemU16
Definition: registers.hh:162
Gcn3ISA::REG_SRC_DPP
@ REG_SRC_DPP
Definition: registers.hh:124
Gcn3ISA::NumVecElemPerVecReg
const int NumVecElemPerVecReg(64)
Gcn3ISA::Operand::Operand
Operand(GPUDynInstPtr gpuDynInst, int opIdx)
Definition: operand.hh:67
Gcn3ISA::REG_POS_FOUR
@ REG_POS_FOUR
Definition: registers.hh:119
Gcn3ISA::VecOperand::readScalar
void readScalar()
if we determine that this operand is a scalar (reg or constant) then we read the scalar data into the...
Definition: operand.hh:323
Gcn3ISA::ScalarOperand::rawDataPtr
void * rawDataPtr()
Definition: operand.hh:405
Gcn3ISA::VecOperand::absModifier
void absModifier()
Definition: operand.hh:254
Gcn3ISA::ScalarRegF64
double ScalarRegF64
Definition: registers.hh:157
ArmISA::i
Bitfield< 7 > i
Definition: miscregs_types.hh:63
Gcn3ISA::VecOperand::scalar
bool scalar
whether this operand a scalar or not.
Definition: operand.hh:339
Gcn3ISA::isScalarReg
bool isScalarReg(int opIdx)
Definition: registers.cc:215
Gcn3ISA::REG_FLAT_SCRATCH_LO
@ REG_FLAT_SCRATCH_LO
Definition: registers.hh:51
Gcn3ISA::REG_POS_HALF
@ REG_POS_HALF
Definition: registers.hh:113
Gcn3ISA::ScalarRegF32
float ScalarRegF32
Definition: registers.hh:154
Gcn3ISA::ScalarRegU64
uint64_t ScalarRegU64
Definition: registers.hh:155
RegisterManager::mapSgpr
int mapSgpr(Wavefront *w, int sgprIndex)
Definition: register_manager.cc:101
ComputeUnit::registerManager
RegisterManager * registerManager
Definition: compute_unit.hh:277
Gcn3ISA::VecOperand::absMod
bool absMod
absolute value and negative modifiers.
Definition: operand.hh:346
Gcn3ISA::REG_VCC_LO
@ REG_VCC_LO
Definition: registers.hh:55
Gcn3ISA::REG_EXEC_LO
@ REG_EXEC_LO
Definition: registers.hh:75
registers.hh
Gcn3ISA::ScalarOperand::~ScalarOperand
~ScalarOperand()
Definition: operand.hh:381
Gcn3ISA::Operand::Operand
Operand()=delete
Gcn3ISA::VecElemU32
uint32_t VecElemU32
Definition: registers.hh:164
Gcn3ISA::isVectorReg
bool isVectorReg(int opIdx)
Definition: registers.cc:228
Gcn3ISA::OpTraits::FloatT
float FloatT
Definition: operand.hh:58
wavefront.hh
Gcn3ISA::ScalarOperand::regIdx
int regIdx(int dword) const
for scalars we need to do some extra work to figure out how to map the op selector to the sgpr idx be...
Definition: operand.hh:654
Gcn3ISA::VecOperand::negMod
bool negMod
Definition: operand.hh:347
ComputeUnit
Definition: compute_unit.hh:200
Gcn3ISA::REG_SRC_LITERAL
@ REG_SRC_LITERAL
Definition: registers.hh:129
Gcn3ISA::VecOperand::VecOperand
VecOperand()=delete
ComputeUnit::srf
std::vector< ScalarRegisterFile * > srf
Definition: compute_unit.hh:296
vector_register_file.hh
Gcn3ISA
classes that represnt vector/scalar operands in GCN3 ISA.
Definition: decoder.cc:41
Gcn3ISA::VecOperand::operator[]
std::enable_if_t< Condition, DataType & > operator[](size_t idx)
setter [] operator.
Definition: operand.hh:309
Gcn3ISA::OpTraits< ScalarRegF64 >::FloatT
double FloatT
Definition: operand.hh:59
Gcn3ISA::VecOperand
Definition: operand.hh:100
DPRINTF
#define DPRINTF(x,...)
Definition: trace.hh:237
Gcn3ISA::Operand::_opIdx
int _opIdx
op selector value for this operand.
Definition: operand.hh:92
Gcn3ISA::opSelectorToRegIdx
int opSelectorToRegIdx(int idx, int numScalarRegs)
Definition: registers.cc:121
Gcn3ISA::VecOperand::VecOperand
VecOperand(GPUDynInstPtr gpuDynInst, int opIdx)
Definition: operand.hh:108
ComputeUnit::vrf
std::vector< VectorRegisterFile * > vrf
Definition: compute_unit.hh:294
Gcn3ISA::Operand::_gpuDynInst
GPUDynInstPtr _gpuDynInst
instruction object that owns this operand
Definition: operand.hh:85
Gcn3ISA::ScalarOperand::write
void write() override
Definition: operand.hh:429
Gcn3ISA::VecOperand::operator[]
std::enable_if_t< Condition, const DataType > operator[](size_t idx) const
getter [] operator.
Definition: operand.hh:266
Gcn3ISA::VecRegContainerU16
VecRegU16::Container VecRegContainerU16
Definition: registers.hh:195
scalar_register_file.hh
Gcn3ISA::VecRegContainerU64
VecRegU64::Container VecRegContainerU64
Definition: registers.hh:197
Gcn3ISA::REG_FLAT_SCRATCH_HI
@ REG_FLAT_SCRATCH_HI
Definition: registers.hh:52
Gcn3ISA::OpTraits
convenience traits so we can automatically infer the correct FP type without looking at the number of...
Definition: operand.hh:58
Gcn3ISA::ScalarOperand::readSpecialVal
void readSpecialVal()
we have determined that we are not reading our scalar operand data from the register file,...
Definition: operand.hh:515
Gcn3ISA::REG_POS_TWO
@ REG_POS_TWO
Definition: registers.hh:117
Wavefront::simdId
const int simdId
Definition: wavefront.hh:97
Gcn3ISA::VecOperand::readSrc
void readSrc()
certain vector operands can read from the vrf/srf or constants.
Definition: operand.hh:129
Gcn3ISA::ScalarOperand::setBit
std::enable_if_t< Condition, void > setBit(int bit, int bit_val)
bit access to scalar data.
Definition: operand.hh:493
Gcn3ISA::REG_NEG_ONE
@ REG_NEG_ONE
Definition: registers.hh:116
vec_reg.hh
Gcn3ISA::REG_POS_ONE
@ REG_POS_ONE
Definition: registers.hh:115
Gcn3ISA::VecOperand::~VecOperand
~VecOperand()
Definition: operand.hh:116
Gcn3ISA::ScalarOperand::ScalarOperand
ScalarOperand(GPUDynInstPtr gpuDynInst, int opIdx)
Definition: operand.hh:375
Gcn3ISA::Operand::write
virtual void write()=0
Gcn3ISA::VecOperand::scRegData
ScalarOperand< DataType, Const, NumDwords > scRegData
for src operands that read scalars (i.e., scalar regs or a scalar constant).
Definition: operand.hh:358
Gcn3ISA::VecOperand::negModifier
void negModifier()
Definition: operand.hh:248
Gcn3ISA::ScalarOperand::srfData
std::array< ScalarRegU32, NumDwords > srfData
in GCN3 each register is represented as a 32b unsigned value, however operands may require up to 16 r...
Definition: operand.hh:687
Wavefront
Definition: wavefront.hh:59
Gcn3ISA::ScalarOperand
Definition: operand.hh:96
Wavefront::execMask
VectorMask & execMask()
Definition: wavefront.cc:1377
GPUDynInstPtr
std::shared_ptr< GPUDynInst > GPUDynInstPtr
Definition: misc.hh:48
Gcn3ISA::ScalarRegU32
uint32_t ScalarRegU32
Definition: registers.hh:152
Gcn3ISA::REG_NEG_TWO
@ REG_NEG_TWO
Definition: registers.hh:118
Gcn3ISA::ScalarOperand::ScalarOperand
ScalarOperand()=delete
bits
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
Definition: bitfield.hh:73
RegisterManager::mapVgpr
int mapVgpr(Wavefront *w, int vgprIndex)
Definition: register_manager.cc:94
Gcn3ISA::VecElemU8
uint8_t VecElemU8
Definition: registers.hh:160
X86ISA::type
type
Definition: misc.hh:727
Gcn3ISA::REG_NEG_HALF
@ REG_NEG_HALF
Definition: registers.hh:114
Gcn3ISA::VecRegContainerU32
VecRegU32::Container VecRegContainerU32
Definition: registers.hh:196
Gcn3ISA::ScalarOperand::operator=
std::enable_if_t< Condition, ScalarOperand & > operator=(DataType rhs)
Definition: operand.hh:501
Gcn3ISA::REG_SRC_SWDA
@ REG_SRC_SWDA
Definition: registers.hh:123
Gcn3ISA::REG_NEG_FOUR
@ REG_NEG_FOUR
Definition: registers.hh:120
Gcn3ISA::VecOperand::read
void read() override
read from the vrf.
Definition: operand.hh:145
Gcn3ISA::VecElemU64
uint64_t VecElemU64
Definition: registers.hh:167
VectorMask
std::bitset< std::numeric_limits< unsigned long long >::digits > VectorMask
Definition: misc.hh:44
Gcn3ISA::ScalarOperand::rawData
std::enable_if_t< Condition, DataType > rawData() const
we store scalar data in a std::array, however if we need the full operand data we use this method to ...
Definition: operand.hh:394
Gcn3ISA::REG_PI
@ REG_PI
Definition: registers.hh:121
Gcn3ISA::ScalarOperand::read
void read() override
Definition: operand.hh:411
Wavefront::reservedScalarRegs
int reservedScalarRegs
Definition: wavefront.hh:194
Gcn3ISA::REG_EXEC_HI
@ REG_EXEC_HI
Definition: registers.hh:76
Gcn3ISA::MaxOperandDwords
constexpr size_t MaxOperandDwords(16)
Gcn3ISA::VecRegContainerU8
VecRegU8::Container VecRegContainerU8
Definition: registers.hh:194
Gcn3ISA::VecOperand::vecReg
VecRegCont vecReg
this holds all the operand data in a single vector register object (i.e., if an operand is 64b,...
Definition: operand.hh:353
Gcn3ISA::VecOperand::vrfData
std::array< VecRegContainerU32 *, NumDwords > vrfData
pointers to the underlyding registers (i.e., the actual registers in the register file).
Definition: operand.hh:363
replaceBits
constexpr void replaceBits(T &val, unsigned first, unsigned last, B bit_val)
A convenience function to replace bits first to last of val with bit_val in place.
Definition: bitfield.hh:174
Gcn3ISA::isConstVal
bool isConstVal(int opIdx)
Definition: registers.cc:184
Gcn3ISA::VecOperand::VecRegCont
typename std::conditional< NumDwords==2, VecRegContainerU64, typename std::conditional< sizeof(DataType)==sizeof(VecElemU16), VecRegContainerU16, typename std::conditional< sizeof(DataType)==sizeof(VecElemU8), VecRegContainerU8, VecRegContainerU32 >::type >::type >::type VecRegCont
Definition: operand.hh:334
Gcn3ISA::VecOperand::write
void write() override
write to the vrf.
Definition: operand.hh:197
panic
#define panic(...)
This implements a cprintf based panic() function.
Definition: logging.hh:171

Generated on Tue Jun 22 2021 15:28:24 for gem5 by doxygen 1.8.17