Go to the documentation of this file.
41 #include "debug/GCN3.hh"
42 #include "debug/GPUSync.hh"
74 >= 0x100000000ULL ? 1 : 0;
618 sdst = src0.
rawData() &~ src1.rawData();
648 sdst = src0.
rawData() &~ src1.rawData();
678 sdst = src0.
rawData() |~ src1.rawData();
708 sdst = src0.
rawData() |~ src1.rawData();
1428 scc = (src.rawData() == simm16) ? 1 : 0;
1453 scc = (src.rawData() != simm16) ? 1 : 0;
1478 scc = (src.rawData() > simm16) ? 1 : 0;
1503 scc = (src.rawData() >= simm16) ? 1 : 0;
1528 scc = (src.rawData() < simm16) ? 1 : 0;
1553 scc = (src.rawData() <= simm16) ? 1 : 0;
1578 scc = (src.rawData() == simm16) ? 1 : 0;
1603 scc = (src.rawData() != simm16) ? 1 : 0;
1628 scc = (src.rawData() > simm16) ? 1 : 0;
1653 scc = (src.rawData() >= simm16) ? 1 : 0;
1678 scc = (src.rawData() < simm16) ? 1 : 0;
1703 scc = (src.rawData() <= simm16) ? 1 : 0;
1835 if (hwregId==1 && size==2
1837 warn_once(
"Be cautious that s_setreg_b32 has no real effect "
1838 "on FP modes: %s\n", gpuDynInst->disassemble());
2476 sdst = sext<std::numeric_limits<ScalarRegI8>::digits>(
2501 sdst = sext<std::numeric_limits<ScalarRegI16>::digits>(
2618 Wavefront *wf = gpuDynInst->wavefront();
2642 Wavefront *wf = gpuDynInst->wavefront();
2665 Wavefront *wf = gpuDynInst->wavefront();
2711 Wavefront *wf = gpuDynInst->wavefront();
2720 scc = wf->
execMask().any() ? 1 : 0;
2743 Wavefront *wf = gpuDynInst->wavefront();
2752 scc = wf->
execMask().any() ? 1 : 0;
2775 Wavefront *wf = gpuDynInst->wavefront();
2784 scc = wf->
execMask().any() ? 1 : 0;
2792 :
Inst_SOP1(iFmt,
"s_andn2_saveexec_b64")
2807 Wavefront *wf = gpuDynInst->wavefront();
2816 scc = wf->
execMask().any() ? 1 : 0;
2824 :
Inst_SOP1(iFmt,
"s_orn2_saveexec_b64")
2839 Wavefront *wf = gpuDynInst->wavefront();
2848 scc = wf->
execMask().any() ? 1 : 0;
2856 :
Inst_SOP1(iFmt,
"s_nand_saveexec_b64")
2871 Wavefront *wf = gpuDynInst->wavefront();
2880 scc = wf->
execMask().any() ? 1 : 0;
2903 Wavefront *wf = gpuDynInst->wavefront();
2912 scc = wf->
execMask().any() ? 1 : 0;
2920 :
Inst_SOP1(iFmt,
"s_xnor_saveexec_b64")
2935 Wavefront *wf = gpuDynInst->wavefront();
2944 scc = wf->
execMask().any() ? 1 : 0;
3154 sdst = std::abs(src.
rawData());
3739 Wavefront *wf = gpuDynInst->wavefront();
3769 DPRINTF(GPUSync,
"CU[%d] WF[%d][%d] Wave[%d] - Exiting the "
3770 "program and decrementing max barrier count for "
3771 "barrier Id%d. New max count: %d.\n", cu->
cu_id,
3776 DPRINTF(GPUExec,
"CU%d: decrease ref ctr WG[%d] to [%d]\n",
3786 DPRINTF(GPUExec,
"Doing return for CU%d: WF[%d][%d][%d]\n",
3806 DPRINTF(GPUSync,
"CU[%d] WF[%d][%d] Wave[%d] - All waves are "
3807 "now complete. Releasing barrier Id%d.\n", cu->
cu_id,
3830 if (!kernelEnd || !relNeeded) {
3846 gpuDynInst->simdId = wf->
simdId;
3847 gpuDynInst->wfSlotId = wf->
wfSlotId;
3848 gpuDynInst->wfDynId = wf->
wfDynId;
3850 DPRINTF(GPUExec,
"inject global memory fence for CU%d: "
3878 Wavefront *wf = gpuDynInst->wavefront();
3920 Wavefront *wf = gpuDynInst->wavefront();
3949 Wavefront *wf = gpuDynInst->wavefront();
3979 Wavefront *wf = gpuDynInst->wavefront();
4009 Wavefront *wf = gpuDynInst->wavefront();
4037 Wavefront *wf = gpuDynInst->wavefront();
4062 Wavefront *wf = gpuDynInst->wavefront();
4091 Wavefront *wf = gpuDynInst->wavefront();
4099 DPRINTF(GPUSync,
"CU[%d] WF[%d][%d] Wave[%d] - Stalling at "
4100 "barrier Id%d. %d waves now at barrier, %d waves "
4148 gpuDynInst->wavefront()->setWaitCnts(vm_cnt, exp_cnt, lgkm_cnt);
4342 :
Inst_SOPP(iFmt,
"s_cbranch_cdbgsys_or_user")
4360 :
Inst_SOPP(iFmt,
"s_cbranch_cdbgsys_and_user")
4452 Wavefront *wf = gpuDynInst->wavefront();
4454 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4455 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4471 gpuDynInst->computeUnit()->scalarMemoryPipe
4472 .getGMReqFIFO().push(gpuDynInst);
4476 gpuDynInst->wavefront()->outstandingReqs++;
4477 gpuDynInst->wavefront()->validateRequestCounters();
4483 initMemRead<1>(gpuDynInst);
4511 Wavefront *wf = gpuDynInst->wavefront();
4513 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4514 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4530 gpuDynInst->computeUnit()->scalarMemoryPipe.
4531 getGMReqFIFO().push(gpuDynInst);
4535 gpuDynInst->wavefront()->outstandingReqs++;
4536 gpuDynInst->wavefront()->validateRequestCounters();
4542 initMemRead<2>(gpuDynInst);
4568 Wavefront *wf = gpuDynInst->wavefront();
4570 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4571 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4587 gpuDynInst->computeUnit()->scalarMemoryPipe.
4588 getGMReqFIFO().push(gpuDynInst);
4592 gpuDynInst->wavefront()->outstandingReqs++;
4593 gpuDynInst->wavefront()->validateRequestCounters();
4599 initMemRead<4>(gpuDynInst);
4625 Wavefront *wf = gpuDynInst->wavefront();
4627 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4628 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4644 gpuDynInst->computeUnit()->scalarMemoryPipe.
4645 getGMReqFIFO().push(gpuDynInst);
4649 gpuDynInst->wavefront()->outstandingReqs++;
4650 gpuDynInst->wavefront()->validateRequestCounters();
4656 initMemRead<8>(gpuDynInst);
4682 Wavefront *wf = gpuDynInst->wavefront();
4684 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4685 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4701 gpuDynInst->computeUnit()->scalarMemoryPipe.
4702 getGMReqFIFO().push(gpuDynInst);
4706 gpuDynInst->wavefront()->outstandingReqs++;
4707 gpuDynInst->wavefront()->validateRequestCounters();
4713 initMemRead<16>(gpuDynInst);
4725 :
Inst_SMEM(iFmt,
"s_buffer_load_dword")
4740 Wavefront *wf = gpuDynInst->wavefront();
4742 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4743 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4759 gpuDynInst->computeUnit()->scalarMemoryPipe
4760 .getGMReqFIFO().push(gpuDynInst);
4764 gpuDynInst->wavefront()->outstandingReqs++;
4765 gpuDynInst->wavefront()->validateRequestCounters();
4771 initMemRead<1>(gpuDynInst);
4784 :
Inst_SMEM(iFmt,
"s_buffer_load_dwordx2")
4799 Wavefront *wf = gpuDynInst->wavefront();
4801 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4802 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4818 gpuDynInst->computeUnit()->scalarMemoryPipe
4819 .getGMReqFIFO().push(gpuDynInst);
4823 gpuDynInst->wavefront()->outstandingReqs++;
4824 gpuDynInst->wavefront()->validateRequestCounters();
4830 initMemRead<2>(gpuDynInst);
4843 :
Inst_SMEM(iFmt,
"s_buffer_load_dwordx4")
4858 Wavefront *wf = gpuDynInst->wavefront();
4860 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4861 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4877 gpuDynInst->computeUnit()->scalarMemoryPipe
4878 .getGMReqFIFO().push(gpuDynInst);
4882 gpuDynInst->wavefront()->outstandingReqs++;
4883 gpuDynInst->wavefront()->validateRequestCounters();
4889 initMemRead<4>(gpuDynInst);
4902 :
Inst_SMEM(iFmt,
"s_buffer_load_dwordx8")
4917 Wavefront *wf = gpuDynInst->wavefront();
4919 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4920 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4936 gpuDynInst->computeUnit()->scalarMemoryPipe
4937 .getGMReqFIFO().push(gpuDynInst);
4941 gpuDynInst->wavefront()->outstandingReqs++;
4942 gpuDynInst->wavefront()->validateRequestCounters();
4948 initMemRead<8>(gpuDynInst);
4961 :
Inst_SMEM(iFmt,
"s_buffer_load_dwordx16")
4976 Wavefront *wf = gpuDynInst->wavefront();
4978 gpuDynInst->latency.init(gpuDynInst->computeUnit());
4979 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
4995 gpuDynInst->computeUnit()->scalarMemoryPipe
4996 .getGMReqFIFO().push(gpuDynInst);
5000 gpuDynInst->wavefront()->outstandingReqs++;
5001 gpuDynInst->wavefront()->validateRequestCounters();
5007 initMemRead<16>(gpuDynInst);
5037 Wavefront *wf = gpuDynInst->wavefront();
5039 gpuDynInst->latency.init(gpuDynInst->computeUnit());
5040 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
5056 gpuDynInst->computeUnit()->scalarMemoryPipe.
5057 getGMReqFIFO().push(gpuDynInst);
5061 gpuDynInst->wavefront()->outstandingReqs++;
5062 gpuDynInst->wavefront()->validateRequestCounters();
5070 std::memcpy((
void*)gpuDynInst->scalar_data, sdata.
rawDataPtr(),
5072 initMemWrite<1>(gpuDynInst);
5096 Wavefront *wf = gpuDynInst->wavefront();
5098 gpuDynInst->latency.init(gpuDynInst->computeUnit());
5099 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
5115 gpuDynInst->computeUnit()->scalarMemoryPipe.
5116 getGMReqFIFO().push(gpuDynInst);
5120 gpuDynInst->wavefront()->outstandingReqs++;
5121 gpuDynInst->wavefront()->validateRequestCounters();
5129 std::memcpy((
void*)gpuDynInst->scalar_data, sdata.
rawDataPtr(),
5131 initMemWrite<2>(gpuDynInst);
5155 Wavefront *wf = gpuDynInst->wavefront();
5157 gpuDynInst->latency.init(gpuDynInst->computeUnit());
5158 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
5174 gpuDynInst->computeUnit()->scalarMemoryPipe.
5175 getGMReqFIFO().push(gpuDynInst);
5179 gpuDynInst->wavefront()->outstandingReqs++;
5180 gpuDynInst->wavefront()->validateRequestCounters();
5188 std::memcpy((
void*)gpuDynInst->scalar_data, sdata.
rawDataPtr(),
5190 initMemWrite<4>(gpuDynInst);
5200 :
Inst_SMEM(iFmt,
"s_buffer_store_dword")
5230 :
Inst_SMEM(iFmt,
"s_buffer_store_dwordx2")
5260 :
Inst_SMEM(iFmt,
"s_buffer_store_dwordx4")
5431 Wavefront *wf = gpuDynInst->wavefront();
5444 =
bits(vcc.
rawData(), lane) ? src1[lane] : src0[lane];
5466 Wavefront *wf = gpuDynInst->wavefront();
5478 DPRINTF(GCN3,
"Handling V_ADD_F32 SRC DPP. SRC0: register v[%d], "
5479 "DPP_CTRL: 0x%#x, SRC0_ABS: %d, SRC0_NEG: %d, "
5480 "SRC1_ABS: %d, SRC1_NEG: %d, BOUND_CTRL: %d, "
5495 vdst[lane] = src0_dpp[lane] + src1[lane];
5501 vdst[lane] = src0[lane] + src1[lane];
5524 Wavefront *wf = gpuDynInst->wavefront();
5534 vdst[lane] = src0[lane] - src1[lane];
5556 Wavefront *wf = gpuDynInst->wavefront();
5566 vdst[lane] = src1[lane] - src0[lane];
5588 Wavefront *wf = gpuDynInst->wavefront();
5598 vdst[lane] = src0[lane] * src1[lane];
5620 Wavefront *wf = gpuDynInst->wavefront();
5630 if (std::isnan(src0[lane]) ||
5631 std::isnan(src1[lane])) {
5633 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
5634 std::fpclassify(src0[lane]) == FP_ZERO) &&
5635 !std::signbit(src0[lane])) {
5636 if (std::isinf(src1[lane])) {
5638 }
else if (!std::signbit(src1[lane])) {
5643 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
5644 std::fpclassify(src0[lane]) == FP_ZERO) &&
5645 std::signbit(src0[lane])) {
5646 if (std::isinf(src1[lane])) {
5648 }
else if (std::signbit(src1[lane])) {
5653 }
else if (std::isinf(src0[lane]) &&
5654 !std::signbit(src0[lane])) {
5655 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
5656 std::fpclassify(src1[lane]) == FP_ZERO) {
5658 }
else if (!std::signbit(src1[lane])) {
5659 vdst[lane] = +INFINITY;
5661 vdst[lane] = -INFINITY;
5663 }
else if (std::isinf(src0[lane]) &&
5664 std::signbit(src0[lane])) {
5665 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
5666 std::fpclassify(src1[lane]) == FP_ZERO) {
5668 }
else if (std::signbit(src1[lane])) {
5669 vdst[lane] = +INFINITY;
5671 vdst[lane] = -INFINITY;
5674 vdst[lane] = src0[lane] * src1[lane];
5696 Wavefront *wf = gpuDynInst->wavefront();
5706 vdst[lane] = sext<24>(
bits(src0[lane], 23, 0))
5707 * sext<24>(
bits(src1[lane], 23, 0));
5728 Wavefront *wf = gpuDynInst->wavefront();
5743 vdst[lane] = (
VecElemI32)((tmp_src0 * tmp_src1) >> 32);
5764 Wavefront *wf = gpuDynInst->wavefront();
5781 origSrc0_sdwa.
read();
5784 DPRINTF(GCN3,
"Handling V_MUL_U32_U24 SRC SDWA. SRC0: register "
5785 "v[%d], DST_SEL: %d, DST_UNUSED: %d, CLAMP: %d, SRC0_SEL: "
5786 "%d, SRC0_SEXT: %d, SRC0_NEG: %d, SRC0_ABS: %d, SRC1_SEL: "
5787 "%d, SRC1_SEXT: %d, SRC1_NEG: %d, SRC1_ABS: %d\n",
5805 vdst[lane] =
bits(src0_sdwa[lane], 23, 0) *
5806 bits(src1[lane], 23, 0);
5807 origVdst[lane] = vdst[lane];
5815 vdst[lane] =
bits(src0[lane], 23, 0) *
5816 bits(src1[lane], 23, 0);
5839 Wavefront *wf = gpuDynInst->wavefront();
5851 vdst[lane] = (
VecElemU32)((tmp_src0 * tmp_src1) >> 32);
5873 Wavefront *wf = gpuDynInst->wavefront();
5883 vdst[lane] = std::fmin(src0[lane], src1[lane]);
5905 Wavefront *wf = gpuDynInst->wavefront();
5915 vdst[lane] = std::fmax(src0[lane], src1[lane]);
5936 Wavefront *wf = gpuDynInst->wavefront();
5946 vdst[lane] = std::min(src0[lane], src1[lane]);
5967 Wavefront *wf = gpuDynInst->wavefront();
5977 vdst[lane] = std::max(src0[lane], src1[lane]);
5998 Wavefront *wf = gpuDynInst->wavefront();
6008 vdst[lane] = std::min(src0[lane], src1[lane]);
6029 Wavefront *wf = gpuDynInst->wavefront();
6039 vdst[lane] = std::max(src0[lane], src1[lane]);
6061 Wavefront *wf = gpuDynInst->wavefront();
6071 vdst[lane] = src1[lane] >>
bits(src0[lane], 4, 0);
6093 Wavefront *wf = gpuDynInst->wavefront();
6103 vdst[lane] = src1[lane] >>
bits(src0[lane], 4, 0);
6124 Wavefront *wf = gpuDynInst->wavefront();
6141 origSrc0_sdwa.
read();
6144 DPRINTF(GCN3,
"Handling V_LSHLREV_B32 SRC SDWA. SRC0: register "
6145 "v[%d], DST_SEL: %d, DST_UNUSED: %d, CLAMP: %d, SRC0_SEL: "
6146 "%d, SRC0_SEXT: %d, SRC0_NEG: %d, SRC0_ABS: %d, SRC1_SEL: "
6147 "%d, SRC1_SEXT: %d, SRC1_NEG: %d, SRC1_ABS: %d\n",
6165 vdst[lane] = src1[lane] <<
bits(src0_sdwa[lane], 4, 0);
6166 origVdst[lane] = vdst[lane];
6174 vdst[lane] = src1[lane] <<
bits(src0[lane], 4, 0);
6197 Wavefront *wf = gpuDynInst->wavefront();
6207 vdst[lane] = src0[lane] & src1[lane];
6229 Wavefront *wf = gpuDynInst->wavefront();
6246 origSrc0_sdwa.
read();
6249 DPRINTF(GCN3,
"Handling V_OR_B32 SRC SDWA. SRC0: register v[%d], "
6250 "DST_SEL: %d, DST_UNUSED: %d, CLAMP: %d, SRC0_SEL: %d, "
6251 "SRC0_SEXT: %d, SRC0_NEG: %d, SRC0_ABS: %d, SRC1_SEL: %d, "
6252 "SRC1_SEXT: %d, SRC1_NEG: %d, SRC1_ABS: %d\n",
6270 vdst[lane] = src0_sdwa[lane] | src1[lane];
6271 origVdst[lane] = vdst[lane];
6279 vdst[lane] = src0[lane] | src1[lane];
6302 Wavefront *wf = gpuDynInst->wavefront();
6312 vdst[lane] = src0[lane] ^ src1[lane];
6335 Wavefront *wf = gpuDynInst->wavefront();
6348 DPRINTF(GCN3,
"Handling V_MAC_F32 SRC DPP. SRC0: register v[%d], "
6349 "DPP_CTRL: 0x%#x, SRC0_ABS: %d, SRC0_NEG: %d, "
6350 "SRC1_ABS: %d, SRC1_NEG: %d, BOUND_CTRL: %d, "
6365 vdst[lane] = std::fma(src0_dpp[lane], src1[lane],
6372 vdst[lane] = std::fma(src0[lane], src1[lane], vdst[lane]);
6397 Wavefront *wf = gpuDynInst->wavefront();
6408 vdst[lane] = std::fma(src0[lane],
k, src1[lane]);
6432 Wavefront *wf = gpuDynInst->wavefront();
6443 vdst[lane] = std::fma(src0[lane], src1[lane],
k);
6468 Wavefront *wf = gpuDynInst->wavefront();
6486 origSrc0_sdwa.
read();
6489 DPRINTF(GCN3,
"Handling V_ADD_U32 SRC SDWA. SRC0: register v[%d], "
6490 "DST_SEL: %d, DST_UNUSED: %d, CLAMP: %d, SRC0_SEL: %d, "
6491 "SRC0_SEXT: %d, SRC0_NEG: %d, SRC0_ABS: %d, SRC1_SEL: %d, "
6492 "SRC1_SEXT: %d, SRC1_NEG: %d, SRC1_ABS: %d\n",
6510 vdst[lane] = src0_sdwa[lane] + src1[lane];
6511 origVdst[lane] = vdst[lane];
6513 + (
VecElemU64)src1[lane] >= 0x100000000ULL) ? 1 : 0);
6521 vdst[lane] = src0[lane] + src1[lane];
6523 + (
VecElemU64)src1[lane] >= 0x100000000ULL) ? 1 : 0);
6550 Wavefront *wf = gpuDynInst->wavefront();
6561 vdst[lane] = src0[lane] - src1[lane];
6562 vcc.
setBit(lane, src1[lane] > src0[lane] ? 1 : 0);
6588 Wavefront *wf = gpuDynInst->wavefront();
6599 vdst[lane] = src1[lane] - src0[lane];
6600 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
6628 Wavefront *wf = gpuDynInst->wavefront();
6640 vdst[lane] = src0[lane] + src1[lane]
6645 >= 0x100000000 ? 1 : 0);
6673 Wavefront *wf = gpuDynInst->wavefront();
6686 = src0[lane] - src1[lane] -
bits(vcc.
rawData(), lane);
6688 > src0[lane] ? 1 : 0);
6716 Wavefront *wf = gpuDynInst->wavefront();
6729 = src1[lane] - src0[lane] -
bits(vcc.
rawData(), lane);
6731 > src1[lane] ? 1 : 0);
6888 Wavefront *wf = gpuDynInst->wavefront();
6898 vdst[lane] = src0[lane] + src1[lane];
6919 Wavefront *wf = gpuDynInst->wavefront();
6929 vdst[lane] = src0[lane] - src1[lane];
6950 Wavefront *wf = gpuDynInst->wavefront();
6960 vdst[lane] = src1[lane] - src0[lane];
6981 Wavefront *wf = gpuDynInst->wavefront();
6991 vdst[lane] = src0[lane] * src1[lane];
7012 Wavefront *wf = gpuDynInst->wavefront();
7022 vdst[lane] = src1[lane] <<
bits(src0[lane], 3, 0);
7044 Wavefront *wf = gpuDynInst->wavefront();
7054 vdst[lane] = src1[lane] >> src0[lane];
7076 Wavefront *wf = gpuDynInst->wavefront();
7086 vdst[lane] = src1[lane] >> src0[lane];
7143 Wavefront *wf = gpuDynInst->wavefront();
7153 vdst[lane] = std::max(src0[lane], src1[lane]);
7174 Wavefront *wf = gpuDynInst->wavefront();
7184 vdst[lane] = std::max(src0[lane], src1[lane]);
7205 Wavefront *wf = gpuDynInst->wavefront();
7215 vdst[lane] = std::min(src0[lane], src1[lane]);
7236 Wavefront *wf = gpuDynInst->wavefront();
7246 vdst[lane] = std::min(src0[lane], src1[lane]);
7303 Wavefront *wf = gpuDynInst->wavefront();
7313 DPRINTF(GCN3,
"Handling V_MOV_B32 SRC DPP. SRC0: register v[%d], "
7314 "DPP_CTRL: 0x%#x, SRC0_ABS: %d, SRC0_NEG: %d, "
7315 "SRC1_ABS: %d, SRC1_NEG: %d, BOUND_CTRL: %d, "
7334 vdst[lane] = src_dpp[lane];
7340 vdst[lane] = src[lane];
7350 :
Inst_VOP1(iFmt,
"v_readfirstlane_b32")
7366 Wavefront *wf = gpuDynInst->wavefront();
7378 sdst = src[src_lane];
7400 Wavefront *wf = gpuDynInst->wavefront();
7409 std::frexp(src[lane],&exp);
7410 if (std::isnan(src[lane])) {
7412 }
else if (std::isinf(src[lane]) || exp > 30) {
7413 if (std::signbit(src[lane])) {
7414 vdst[lane] = INT_MIN;
7416 vdst[lane] = INT_MAX;
7442 Wavefront *wf = gpuDynInst->wavefront();
7472 Wavefront *wf = gpuDynInst->wavefront();
7502 Wavefront *wf = gpuDynInst->wavefront();
7534 Wavefront *wf = gpuDynInst->wavefront();
7543 std::frexp(src[lane],&exp);
7544 if (std::isnan(src[lane])) {
7546 }
else if (std::isinf(src[lane])) {
7547 if (std::signbit(src[lane])) {
7550 vdst[lane] = UINT_MAX;
7552 }
else if (exp > 31) {
7553 vdst[lane] = UINT_MAX;
7580 Wavefront *wf = gpuDynInst->wavefront();
7589 std::frexp(src[lane],&exp);
7590 if (std::isnan(src[lane])) {
7592 }
else if (std::isinf(src[lane]) || exp > 30) {
7593 if (std::signbit(src[lane])) {
7594 vdst[lane] = INT_MIN;
7596 vdst[lane] = INT_MAX;
7677 Wavefront *wf = gpuDynInst->wavefront();
7685 vdst[lane] = (
VecElemI32)std::floor(src[lane] + 0.5);
7708 Wavefront *wf = gpuDynInst->wavefront();
7716 vdst[lane] = (
VecElemI32)std::floor(src[lane]);
7756 Wavefront *wf = gpuDynInst->wavefront();
7786 Wavefront *wf = gpuDynInst->wavefront();
7816 Wavefront *wf = gpuDynInst->wavefront();
7846 Wavefront *wf = gpuDynInst->wavefront();
7876 Wavefront *wf = gpuDynInst->wavefront();
7906 Wavefront *wf = gpuDynInst->wavefront();
7938 Wavefront *wf = gpuDynInst->wavefront();
7947 std::frexp(src[lane],&exp);
7948 if (std::isnan(src[lane])) {
7950 }
else if (std::isinf(src[lane])) {
7951 if (std::signbit(src[lane])) {
7954 vdst[lane] = UINT_MAX;
7956 }
else if (exp > 31) {
7957 vdst[lane] = UINT_MAX;
7982 Wavefront *wf = gpuDynInst->wavefront();
8012 Wavefront *wf = gpuDynInst->wavefront();
8020 vdst[lane] = std::trunc(src[lane]);
8042 Wavefront *wf = gpuDynInst->wavefront();
8050 vdst[lane] = std::ceil(src[lane]);
8072 Wavefront *wf = gpuDynInst->wavefront();
8102 Wavefront *wf = gpuDynInst->wavefront();
8110 vdst[lane] = std::floor(src[lane]);
8132 Wavefront *wf = gpuDynInst->wavefront();
8141 vdst[lane] = std::modf(src[lane], &int_part);
8163 Wavefront *wf = gpuDynInst->wavefront();
8171 vdst[lane] = std::trunc(src[lane]);
8193 Wavefront *wf = gpuDynInst->wavefront();
8201 vdst[lane] = std::ceil(src[lane]);
8223 Wavefront *wf = gpuDynInst->wavefront();
8253 Wavefront *wf = gpuDynInst->wavefront();
8261 vdst[lane] = std::floor(src[lane]);
8283 Wavefront *wf = gpuDynInst->wavefront();
8291 vdst[lane] = std::pow(2.0, src[lane]);
8313 Wavefront *wf = gpuDynInst->wavefront();
8321 vdst[lane] = std::log2(src[lane]);
8343 Wavefront *wf = gpuDynInst->wavefront();
8351 vdst[lane] = 1.0 / src[lane];
8373 Wavefront *wf = gpuDynInst->wavefront();
8381 vdst[lane] = 1.0 / src[lane];
8403 Wavefront *wf = gpuDynInst->wavefront();
8411 vdst[lane] = 1.0 / std::sqrt(src[lane]);
8433 Wavefront *wf = gpuDynInst->wavefront();
8441 if (std::fpclassify(src[lane]) == FP_ZERO) {
8442 vdst[lane] = +INFINITY;
8443 }
else if (std::isnan(src[lane])) {
8445 }
else if (std::isinf(src[lane])) {
8446 if (std::signbit(src[lane])) {
8452 vdst[lane] = 1.0 / src[lane];
8475 Wavefront *wf = gpuDynInst->wavefront();
8483 if (std::fpclassify(src[lane]) == FP_ZERO) {
8484 vdst[lane] = +INFINITY;
8485 }
else if (std::isnan(src[lane])) {
8487 }
else if (std::isinf(src[lane])
8488 && !std::signbit(src[lane])) {
8490 }
else if (std::signbit(src[lane])) {
8493 vdst[lane] = 1.0 / std::sqrt(src[lane]);
8516 Wavefront *wf = gpuDynInst->wavefront();
8524 vdst[lane] = std::sqrt(src[lane]);
8546 Wavefront *wf = gpuDynInst->wavefront();
8554 vdst[lane] = std::sqrt(src[lane]);
8576 Wavefront *wf = gpuDynInst->wavefront();
8586 if (src[lane] < -256.0 || src[lane] > 256.0) {
8589 vdst[lane] = std::sin(src[lane] * 2.0 * pi.
rawData());
8612 Wavefront *wf = gpuDynInst->wavefront();
8622 if (src[lane] < -256.0 || src[lane] > 256.0) {
8625 vdst[lane] = std::cos(src[lane] * 2.0 * pi.
rawData());
8648 Wavefront *wf = gpuDynInst->wavefront();
8656 vdst[lane] = ~src[lane];
8678 Wavefront *wf = gpuDynInst->wavefront();
8708 Wavefront *wf = gpuDynInst->wavefront();
8738 Wavefront *wf = gpuDynInst->wavefront();
8768 Wavefront *wf = gpuDynInst->wavefront();
8785 :
Inst_VOP1(iFmt,
"v_frexp_exp_i32_f64")
8798 Wavefront *wf = gpuDynInst->wavefront();
8806 if (std::isinf(src[lane]) || std::isnan(src[lane])) {
8810 std::frexp(src[lane], &exp);
8833 Wavefront *wf = gpuDynInst->wavefront();
8841 if (std::isinf(src[lane]) || std::isnan(src[lane])) {
8842 vdst[lane] = src[lane];
8845 vdst[lane] = std::frexp(src[lane], &exp);
8867 Wavefront *wf = gpuDynInst->wavefront();
8876 vdst[lane] = std::modf(src[lane], &int_part);
8885 :
Inst_VOP1(iFmt,
"v_frexp_exp_i32_f32")
8901 Wavefront *wf = gpuDynInst->wavefront();
8909 if (std::isinf(src[lane]) || std::isnan(src[lane])) {
8913 std::frexp(src[lane], &exp);
8938 Wavefront *wf = gpuDynInst->wavefront();
8946 if (std::isinf(src[lane]) || std::isnan(src[lane])) {
8947 vdst[lane] = src[lane];
8950 vdst[lane] = std::frexp(src[lane], &exp);
9174 :
Inst_VOP1(iFmt,
"v_frexp_exp_i16_f16")
9336 Wavefront *wf = gpuDynInst->wavefront();
9344 vdst[lane] = std::pow(2.0, src[lane]);
9366 Wavefront *wf = gpuDynInst->wavefront();
9374 vdst[lane] = std::log2(src[lane]);
9408 Wavefront *wf = gpuDynInst->wavefront();
9418 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
9420 if (std::isnan(src0[lane])) {
9425 if (
bits(src1[lane], 2)) {
9427 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
9432 if (
bits(src1[lane], 3)) {
9434 if (std::isnormal(src0[lane])
9435 && std::signbit(src0[lane])) {
9440 if (
bits(src1[lane], 4)) {
9442 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9443 && std::signbit(src0[lane])) {
9448 if (
bits(src1[lane], 5)) {
9450 if (std::fpclassify(src0[lane]) == FP_ZERO
9451 && std::signbit(src0[lane])) {
9456 if (
bits(src1[lane], 6)) {
9458 if (std::fpclassify(src0[lane]) == FP_ZERO
9459 && !std::signbit(src0[lane])) {
9464 if (
bits(src1[lane], 7)) {
9466 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9467 && !std::signbit(src0[lane])) {
9472 if (
bits(src1[lane], 8)) {
9474 if (std::isnormal(src0[lane])
9475 && !std::signbit(src0[lane])) {
9480 if (
bits(src1[lane], 9)) {
9482 if (std::isinf(src0[lane]) && !std::signbit(src0[lane])) {
9520 Wavefront *wf = gpuDynInst->wavefront();
9530 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
9532 if (std::isnan(src0[lane])) {
9537 if (
bits(src1[lane], 2)) {
9539 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
9544 if (
bits(src1[lane], 3)) {
9546 if (std::isnormal(src0[lane])
9547 && std::signbit(src0[lane])) {
9552 if (
bits(src1[lane], 4)) {
9554 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9555 && std::signbit(src0[lane])) {
9560 if (
bits(src1[lane], 5)) {
9562 if (std::fpclassify(src0[lane]) == FP_ZERO
9563 && std::signbit(src0[lane])) {
9568 if (
bits(src1[lane], 6)) {
9570 if (std::fpclassify(src0[lane]) == FP_ZERO
9571 && !std::signbit(src0[lane])) {
9576 if (
bits(src1[lane], 7)) {
9578 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9579 && !std::signbit(src0[lane])) {
9584 if (
bits(src1[lane], 8)) {
9586 if (std::isnormal(src0[lane])
9587 && !std::signbit(src0[lane])) {
9592 if (
bits(src1[lane], 9)) {
9594 if (std::isinf(src0[lane]) && !std::signbit(src0[lane])) {
9633 Wavefront *wf = gpuDynInst->wavefront();
9643 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
9645 if (std::isnan(src0[lane])) {
9650 if (
bits(src1[lane], 2)) {
9652 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
9657 if (
bits(src1[lane], 3)) {
9659 if (std::isnormal(src0[lane])
9660 && std::signbit(src0[lane])) {
9665 if (
bits(src1[lane], 4)) {
9667 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9668 && std::signbit(src0[lane])) {
9673 if (
bits(src1[lane], 5)) {
9675 if (std::fpclassify(src0[lane]) == FP_ZERO
9676 && std::signbit(src0[lane])) {
9681 if (
bits(src1[lane], 6)) {
9683 if (std::fpclassify(src0[lane]) == FP_ZERO
9684 && !std::signbit(src0[lane])) {
9689 if (
bits(src1[lane], 7)) {
9691 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9692 && !std::signbit(src0[lane])) {
9697 if (
bits(src1[lane], 8)) {
9699 if (std::isnormal(src0[lane])
9700 && !std::signbit(src0[lane])) {
9705 if (
bits(src1[lane], 9)) {
9707 if (std::isinf(src0[lane])
9708 && !std::signbit(src0[lane])) {
9746 Wavefront *wf = gpuDynInst->wavefront();
9756 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
9758 if (std::isnan(src0[lane])) {
9763 if (
bits(src1[lane], 2)) {
9765 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
9770 if (
bits(src1[lane], 3)) {
9772 if (std::isnormal(src0[lane])
9773 && std::signbit(src0[lane])) {
9778 if (
bits(src1[lane], 4)) {
9780 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9781 && std::signbit(src0[lane])) {
9786 if (
bits(src1[lane], 5)) {
9788 if (std::fpclassify(src0[lane]) == FP_ZERO
9789 && std::signbit(src0[lane])) {
9794 if (
bits(src1[lane], 6)) {
9796 if (std::fpclassify(src0[lane]) == FP_ZERO
9797 && !std::signbit(src0[lane])) {
9802 if (
bits(src1[lane], 7)) {
9804 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
9805 && !std::signbit(src0[lane])) {
9810 if (
bits(src1[lane], 8)) {
9812 if (std::isnormal(src0[lane])
9813 && !std::signbit(src0[lane])) {
9818 if (
bits(src1[lane], 9)) {
9820 if (std::isinf(src0[lane])
9821 && !std::signbit(src0[lane])) {
10487 Wavefront *wf = gpuDynInst->wavefront();
10514 Wavefront *wf = gpuDynInst->wavefront();
10524 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
10546 Wavefront *wf = gpuDynInst->wavefront();
10556 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
10578 Wavefront *wf = gpuDynInst->wavefront();
10588 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
10610 Wavefront *wf = gpuDynInst->wavefront();
10620 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
10642 Wavefront *wf = gpuDynInst->wavefront();
10652 vcc.
setBit(lane, (src0[lane] < src1[lane]
10653 || src0[lane] > src1[lane]) ? 1 : 0);
10675 Wavefront *wf = gpuDynInst->wavefront();
10685 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
10707 Wavefront *wf = gpuDynInst->wavefront();
10717 vcc.
setBit(lane, (!std::isnan(src0[lane])
10718 && !std::isnan(src1[lane])) ? 1 : 0);
10740 Wavefront *wf = gpuDynInst->wavefront();
10750 vcc.
setBit(lane, (std::isnan(src0[lane])
10751 || std::isnan(src1[lane])) ? 1 : 0);
10773 Wavefront *wf = gpuDynInst->wavefront();
10783 vcc.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
10805 Wavefront *wf = gpuDynInst->wavefront();
10815 vcc.
setBit(lane, !(src0[lane] < src1[lane]
10816 || src0[lane] > src1[lane]) ? 1 : 0);
10838 Wavefront *wf = gpuDynInst->wavefront();
10848 vcc.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
10870 Wavefront *wf = gpuDynInst->wavefront();
10880 vcc.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
10902 Wavefront *wf = gpuDynInst->wavefront();
10912 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
10934 Wavefront *wf = gpuDynInst->wavefront();
10944 vcc.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
10966 Wavefront *wf = gpuDynInst->wavefront();
10993 Wavefront *wf = gpuDynInst->wavefront();
11021 Wavefront *wf = gpuDynInst->wavefront();
11031 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
11054 Wavefront *wf = gpuDynInst->wavefront();
11064 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
11087 Wavefront *wf = gpuDynInst->wavefront();
11097 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
11120 Wavefront *wf = gpuDynInst->wavefront();
11130 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
11153 Wavefront *wf = gpuDynInst->wavefront();
11163 vcc.
setBit(lane, (src0[lane] < src1[lane]
11164 || src0[lane] > src1[lane]) ? 1 : 0);
11187 Wavefront *wf = gpuDynInst->wavefront();
11197 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
11221 Wavefront *wf = gpuDynInst->wavefront();
11231 vcc.
setBit(lane, (!std::isnan(src0[lane])
11232 && !std::isnan(src1[lane])) ? 1 : 0);
11256 Wavefront *wf = gpuDynInst->wavefront();
11266 vcc.
setBit(lane, (std::isnan(src0[lane])
11267 || std::isnan(src1[lane])) ? 1 : 0);
11290 Wavefront *wf = gpuDynInst->wavefront();
11300 vcc.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
11323 Wavefront *wf = gpuDynInst->wavefront();
11333 vcc.
setBit(lane, !(src0[lane] < src1[lane]
11334 || src0[lane] > src1[lane]) ? 1 : 0);
11357 Wavefront *wf = gpuDynInst->wavefront();
11367 vcc.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
11390 Wavefront *wf = gpuDynInst->wavefront();
11400 vcc.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
11423 Wavefront *wf = gpuDynInst->wavefront();
11433 vcc.
setBit(lane, !(src0[lane] == src1[lane]) ? 1 : 0);
11455 Wavefront *wf = gpuDynInst->wavefront();
11465 vcc.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
11488 Wavefront *wf = gpuDynInst->wavefront();
11516 Wavefront *wf = gpuDynInst->wavefront();
11543 Wavefront *wf = gpuDynInst->wavefront();
11553 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
11575 Wavefront *wf = gpuDynInst->wavefront();
11585 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
11607 Wavefront *wf = gpuDynInst->wavefront();
11617 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
11639 Wavefront *wf = gpuDynInst->wavefront();
11649 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
11671 Wavefront *wf = gpuDynInst->wavefront();
11681 vcc.
setBit(lane, (src0[lane] < src1[lane]
11682 || src0[lane] > src1[lane]) ? 1 : 0);
11704 Wavefront *wf = gpuDynInst->wavefront();
11714 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
11736 Wavefront *wf = gpuDynInst->wavefront();
11746 vcc.
setBit(lane, (!std::isnan(src0[lane])
11747 && !std::isnan(src1[lane])) ? 1 : 0);
11769 Wavefront *wf = gpuDynInst->wavefront();
11779 vcc.
setBit(lane, (std::isnan(src0[lane])
11780 || std::isnan(src1[lane])) ? 1 : 0);
11802 Wavefront *wf = gpuDynInst->wavefront();
11812 vcc.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
11834 Wavefront *wf = gpuDynInst->wavefront();
11844 vcc.
setBit(lane, !(src0[lane] < src1[lane]
11845 || src0[lane] > src1[lane]) ? 1 : 0);
11867 Wavefront *wf = gpuDynInst->wavefront();
11877 vcc.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
11899 Wavefront *wf = gpuDynInst->wavefront();
11909 vcc.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
11931 Wavefront *wf = gpuDynInst->wavefront();
11941 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
11963 Wavefront *wf = gpuDynInst->wavefront();
11973 vcc.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
11995 Wavefront *wf = gpuDynInst->wavefront();
12022 Wavefront *wf = gpuDynInst->wavefront();
12050 Wavefront *wf = gpuDynInst->wavefront();
12060 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
12083 Wavefront *wf = gpuDynInst->wavefront();
12093 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
12116 Wavefront *wf = gpuDynInst->wavefront();
12126 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
12149 Wavefront *wf = gpuDynInst->wavefront();
12159 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
12182 Wavefront *wf = gpuDynInst->wavefront();
12192 vcc.
setBit(lane, (src0[lane] < src1[lane]
12193 || src0[lane] > src1[lane]) ? 1 : 0);
12216 Wavefront *wf = gpuDynInst->wavefront();
12226 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
12250 Wavefront *wf = gpuDynInst->wavefront();
12260 vcc.
setBit(lane, (!std::isnan(src0[lane])
12261 && !std::isnan(src1[lane])) ? 1 : 0);
12285 Wavefront *wf = gpuDynInst->wavefront();
12295 vcc.
setBit(lane, (std::isnan(src0[lane])
12296 || std::isnan(src1[lane])) ? 1 : 0);
12319 Wavefront *wf = gpuDynInst->wavefront();
12329 vcc.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
12352 Wavefront *wf = gpuDynInst->wavefront();
12362 vcc.
setBit(lane, !(src0[lane] < src1[lane]
12363 || src0[lane] > src1[lane]) ? 1 : 0);
12386 Wavefront *wf = gpuDynInst->wavefront();
12396 vcc.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
12419 Wavefront *wf = gpuDynInst->wavefront();
12429 vcc.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
12452 Wavefront *wf = gpuDynInst->wavefront();
12462 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
12485 Wavefront *wf = gpuDynInst->wavefront();
12495 vcc.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
12518 Wavefront *wf = gpuDynInst->wavefront();
12545 Wavefront *wf = gpuDynInst->wavefront();
12571 Wavefront *wf = gpuDynInst->wavefront();
12581 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
12602 Wavefront *wf = gpuDynInst->wavefront();
12612 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
12633 Wavefront *wf = gpuDynInst->wavefront();
12643 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
12664 Wavefront *wf = gpuDynInst->wavefront();
12674 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
12695 Wavefront *wf = gpuDynInst->wavefront();
12705 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
12726 Wavefront *wf = gpuDynInst->wavefront();
12736 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
12757 Wavefront *wf = gpuDynInst->wavefront();
12783 Wavefront *wf = gpuDynInst->wavefront();
12809 Wavefront *wf = gpuDynInst->wavefront();
12819 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
12840 Wavefront *wf = gpuDynInst->wavefront();
12850 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
12871 Wavefront *wf = gpuDynInst->wavefront();
12881 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
12902 Wavefront *wf = gpuDynInst->wavefront();
12912 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
12933 Wavefront *wf = gpuDynInst->wavefront();
12943 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
12964 Wavefront *wf = gpuDynInst->wavefront();
12974 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
12995 Wavefront *wf = gpuDynInst->wavefront();
13021 Wavefront *wf = gpuDynInst->wavefront();
13048 Wavefront *wf = gpuDynInst->wavefront();
13058 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
13080 Wavefront *wf = gpuDynInst->wavefront();
13090 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
13112 Wavefront *wf = gpuDynInst->wavefront();
13122 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
13144 Wavefront *wf = gpuDynInst->wavefront();
13154 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
13176 Wavefront *wf = gpuDynInst->wavefront();
13186 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
13208 Wavefront *wf = gpuDynInst->wavefront();
13218 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
13240 Wavefront *wf = gpuDynInst->wavefront();
13267 Wavefront *wf = gpuDynInst->wavefront();
13294 Wavefront *wf = gpuDynInst->wavefront();
13304 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
13326 Wavefront *wf = gpuDynInst->wavefront();
13336 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
13358 Wavefront *wf = gpuDynInst->wavefront();
13368 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
13390 Wavefront *wf = gpuDynInst->wavefront();
13400 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
13422 Wavefront *wf = gpuDynInst->wavefront();
13432 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
13454 Wavefront *wf = gpuDynInst->wavefront();
13464 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
13486 Wavefront *wf = gpuDynInst->wavefront();
13513 Wavefront *wf = gpuDynInst->wavefront();
13539 Wavefront *wf = gpuDynInst->wavefront();
13549 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
13570 Wavefront *wf = gpuDynInst->wavefront();
13580 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
13601 Wavefront *wf = gpuDynInst->wavefront();
13611 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
13632 Wavefront *wf = gpuDynInst->wavefront();
13642 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
13663 Wavefront *wf = gpuDynInst->wavefront();
13673 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
13694 Wavefront *wf = gpuDynInst->wavefront();
13704 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
13725 Wavefront *wf = gpuDynInst->wavefront();
13751 Wavefront *wf = gpuDynInst->wavefront();
13777 Wavefront *wf = gpuDynInst->wavefront();
13787 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
13808 Wavefront *wf = gpuDynInst->wavefront();
13818 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
13839 Wavefront *wf = gpuDynInst->wavefront();
13849 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
13870 Wavefront *wf = gpuDynInst->wavefront();
13880 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
13901 Wavefront *wf = gpuDynInst->wavefront();
13911 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
13932 Wavefront *wf = gpuDynInst->wavefront();
13942 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
13963 Wavefront *wf = gpuDynInst->wavefront();
13989 Wavefront *wf = gpuDynInst->wavefront();
14016 Wavefront *wf = gpuDynInst->wavefront();
14026 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
14048 Wavefront *wf = gpuDynInst->wavefront();
14058 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
14080 Wavefront *wf = gpuDynInst->wavefront();
14090 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
14112 Wavefront *wf = gpuDynInst->wavefront();
14122 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
14144 Wavefront *wf = gpuDynInst->wavefront();
14154 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
14176 Wavefront *wf = gpuDynInst->wavefront();
14186 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
14208 Wavefront *wf = gpuDynInst->wavefront();
14235 Wavefront *wf = gpuDynInst->wavefront();
14262 Wavefront *wf = gpuDynInst->wavefront();
14272 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
14294 Wavefront *wf = gpuDynInst->wavefront();
14304 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
14326 Wavefront *wf = gpuDynInst->wavefront();
14336 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
14358 Wavefront *wf = gpuDynInst->wavefront();
14368 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
14390 Wavefront *wf = gpuDynInst->wavefront();
14400 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
14422 Wavefront *wf = gpuDynInst->wavefront();
14432 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
14454 Wavefront *wf = gpuDynInst->wavefront();
14481 Wavefront *wf = gpuDynInst->wavefront();
14507 Wavefront *wf = gpuDynInst->wavefront();
14517 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
14538 Wavefront *wf = gpuDynInst->wavefront();
14548 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
14569 Wavefront *wf = gpuDynInst->wavefront();
14579 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
14600 Wavefront *wf = gpuDynInst->wavefront();
14610 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
14631 Wavefront *wf = gpuDynInst->wavefront();
14641 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
14662 Wavefront *wf = gpuDynInst->wavefront();
14672 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
14693 Wavefront *wf = gpuDynInst->wavefront();
14719 Wavefront *wf = gpuDynInst->wavefront();
14745 Wavefront *wf = gpuDynInst->wavefront();
14755 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
14776 Wavefront *wf = gpuDynInst->wavefront();
14786 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
14807 Wavefront *wf = gpuDynInst->wavefront();
14817 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
14838 Wavefront *wf = gpuDynInst->wavefront();
14848 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
14869 Wavefront *wf = gpuDynInst->wavefront();
14879 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
14900 Wavefront *wf = gpuDynInst->wavefront();
14910 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
14931 Wavefront *wf = gpuDynInst->wavefront();
14957 Wavefront *wf = gpuDynInst->wavefront();
14984 Wavefront *wf = gpuDynInst->wavefront();
14994 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
15016 Wavefront *wf = gpuDynInst->wavefront();
15026 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
15048 Wavefront *wf = gpuDynInst->wavefront();
15058 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
15080 Wavefront *wf = gpuDynInst->wavefront();
15090 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
15112 Wavefront *wf = gpuDynInst->wavefront();
15122 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
15144 Wavefront *wf = gpuDynInst->wavefront();
15154 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
15176 Wavefront *wf = gpuDynInst->wavefront();
15203 Wavefront *wf = gpuDynInst->wavefront();
15230 Wavefront *wf = gpuDynInst->wavefront();
15240 vcc.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
15262 Wavefront *wf = gpuDynInst->wavefront();
15272 vcc.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
15294 Wavefront *wf = gpuDynInst->wavefront();
15304 vcc.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
15326 Wavefront *wf = gpuDynInst->wavefront();
15336 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
15358 Wavefront *wf = gpuDynInst->wavefront();
15368 vcc.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
15390 Wavefront *wf = gpuDynInst->wavefront();
15400 vcc.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
15422 Wavefront *wf = gpuDynInst->wavefront();
15493 :
Inst_VOP3(iFmt,
"v_cmp_class_f32", true)
15519 Wavefront *wf = gpuDynInst->wavefront();
15529 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
15531 if (std::isnan(src0[lane])) {
15536 if (
bits(src1[lane], 2)) {
15538 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
15543 if (
bits(src1[lane], 3)) {
15545 if (std::isnormal(src0[lane])
15546 && std::signbit(src0[lane])) {
15551 if (
bits(src1[lane], 4)) {
15553 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15554 && std::signbit(src0[lane])) {
15559 if (
bits(src1[lane], 5)) {
15561 if (std::fpclassify(src0[lane]) == FP_ZERO
15562 && std::signbit(src0[lane])) {
15567 if (
bits(src1[lane], 6)) {
15569 if (std::fpclassify(src0[lane]) == FP_ZERO
15570 && !std::signbit(src0[lane])) {
15575 if (
bits(src1[lane], 7)) {
15577 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15578 && !std::signbit(src0[lane])) {
15583 if (
bits(src1[lane], 8)) {
15585 if (std::isnormal(src0[lane])
15586 && !std::signbit(src0[lane])) {
15591 if (
bits(src1[lane], 9)) {
15593 if (std::isinf(src0[lane])
15594 && !std::signbit(src0[lane])) {
15607 :
Inst_VOP3(iFmt,
"v_cmpx_class_f32", true)
15634 Wavefront *wf = gpuDynInst->wavefront();
15644 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
15646 if (std::isnan(src0[lane])) {
15651 if (
bits(src1[lane], 2)) {
15653 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
15658 if (
bits(src1[lane], 3)) {
15660 if (std::isnormal(src0[lane])
15661 && std::signbit(src0[lane])) {
15666 if (
bits(src1[lane], 4)) {
15668 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15669 && std::signbit(src0[lane])) {
15674 if (
bits(src1[lane], 5)) {
15676 if (std::fpclassify(src0[lane]) == FP_ZERO
15677 && std::signbit(src0[lane])) {
15682 if (
bits(src1[lane], 6)) {
15684 if (std::fpclassify(src0[lane]) == FP_ZERO
15685 && !std::signbit(src0[lane])) {
15690 if (
bits(src1[lane], 7)) {
15692 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15693 && !std::signbit(src0[lane])) {
15698 if (
bits(src1[lane], 8)) {
15700 if (std::isnormal(src0[lane])
15701 && !std::signbit(src0[lane])) {
15706 if (
bits(src1[lane], 9)) {
15708 if (std::isinf(src0[lane])
15709 && !std::signbit(src0[lane])) {
15723 :
Inst_VOP3(iFmt,
"v_cmp_class_f64", true)
15749 Wavefront *wf = gpuDynInst->wavefront();
15759 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
15761 if (std::isnan(src0[lane])) {
15766 if (
bits(src1[lane], 2)) {
15768 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
15773 if (
bits(src1[lane], 3)) {
15775 if (std::isnormal(src0[lane])
15776 && std::signbit(src0[lane])) {
15781 if (
bits(src1[lane], 4)) {
15783 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15784 && std::signbit(src0[lane])) {
15789 if (
bits(src1[lane], 5)) {
15791 if (std::fpclassify(src0[lane]) == FP_ZERO
15792 && std::signbit(src0[lane])) {
15797 if (
bits(src1[lane], 6)) {
15799 if (std::fpclassify(src0[lane]) == FP_ZERO
15800 && !std::signbit(src0[lane])) {
15805 if (
bits(src1[lane], 7)) {
15807 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15808 && !std::signbit(src0[lane])) {
15813 if (
bits(src1[lane], 8)) {
15815 if (std::isnormal(src0[lane])
15816 && !std::signbit(src0[lane])) {
15821 if (
bits(src1[lane], 9)) {
15823 if (std::isinf(src0[lane])
15824 && !std::signbit(src0[lane])) {
15837 :
Inst_VOP3(iFmt,
"v_cmpx_class_f64", true)
15864 Wavefront *wf = gpuDynInst->wavefront();
15874 if (
bits(src1[lane], 0) ||
bits(src1[lane], 1)) {
15876 if (std::isnan(src0[lane])) {
15881 if (
bits(src1[lane], 2)) {
15883 if (std::isinf(src0[lane]) && std::signbit(src0[lane])) {
15888 if (
bits(src1[lane], 3)) {
15890 if (std::isnormal(src0[lane])
15891 && std::signbit(src0[lane])) {
15896 if (
bits(src1[lane], 4)) {
15898 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15899 && std::signbit(src0[lane])) {
15904 if (
bits(src1[lane], 5)) {
15906 if (std::fpclassify(src0[lane]) == FP_ZERO
15907 && std::signbit(src0[lane])) {
15912 if (
bits(src1[lane], 6)) {
15914 if (std::fpclassify(src0[lane]) == FP_ZERO
15915 && !std::signbit(src0[lane])) {
15920 if (
bits(src1[lane], 7)) {
15922 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
15923 && !std::signbit(src0[lane])) {
15928 if (
bits(src1[lane], 8)) {
15930 if (std::isnormal(src0[lane])
15931 && !std::signbit(src0[lane])) {
15936 if (
bits(src1[lane], 9)) {
15938 if (std::isinf(src0[lane])
15939 && !std::signbit(src0[lane])) {
15953 :
Inst_VOP3(iFmt,
"v_cmp_class_f16", true)
15984 :
Inst_VOP3(iFmt,
"v_cmpx_class_f16", true)
16034 :
Inst_VOP3(iFmt,
"v_cmp_lt_f16", true)
16053 :
Inst_VOP3(iFmt,
"v_cmp_eq_f16", true)
16072 :
Inst_VOP3(iFmt,
"v_cmp_le_f16", true)
16091 :
Inst_VOP3(iFmt,
"v_cmp_gt_f16", true)
16110 :
Inst_VOP3(iFmt,
"v_cmp_lg_f16", true)
16129 :
Inst_VOP3(iFmt,
"v_cmp_ge_f16", true)
16184 :
Inst_VOP3(iFmt,
"v_cmp_nge_f16", true)
16203 :
Inst_VOP3(iFmt,
"v_cmp_nlg_f16", true)
16222 :
Inst_VOP3(iFmt,
"v_cmp_ngt_f16", true)
16241 :
Inst_VOP3(iFmt,
"v_cmp_nle_f16", true)
16260 :
Inst_VOP3(iFmt,
"v_cmp_neq_f16", true)
16279 :
Inst_VOP3(iFmt,
"v_cmp_nlt_f16", true)
16298 :
Inst_VOP3(iFmt,
"v_cmp_tru_f16", true)
16312 Wavefront *wf = gpuDynInst->wavefront();
16326 :
Inst_VOP3(iFmt,
"v_cmpx_f_f16", true)
16339 Wavefront *wf = gpuDynInst->wavefront();
16354 :
Inst_VOP3(iFmt,
"v_cmpx_lt_f16", true)
16373 :
Inst_VOP3(iFmt,
"v_cmpx_eq_f16", true)
16392 :
Inst_VOP3(iFmt,
"v_cmpx_le_f16", true)
16411 :
Inst_VOP3(iFmt,
"v_cmpx_gt_f16", true)
16430 :
Inst_VOP3(iFmt,
"v_cmpx_lg_f16", true)
16449 :
Inst_VOP3(iFmt,
"v_cmpx_ge_f16", true)
16468 :
Inst_VOP3(iFmt,
"v_cmpx_o_f16", true)
16488 :
Inst_VOP3(iFmt,
"v_cmpx_u_f16", true)
16508 :
Inst_VOP3(iFmt,
"v_cmpx_nge_f16", true)
16527 :
Inst_VOP3(iFmt,
"v_cmpx_nlg_f16", true)
16546 :
Inst_VOP3(iFmt,
"v_cmpx_ngt_f16", true)
16565 :
Inst_VOP3(iFmt,
"v_cmpx_nle_f16", true)
16584 :
Inst_VOP3(iFmt,
"v_cmpx_neq_f16", true)
16603 :
Inst_VOP3(iFmt,
"v_cmpx_nlt_f16", true)
16622 :
Inst_VOP3(iFmt,
"v_cmpx_tru_f16", true)
16636 Wavefront *wf = gpuDynInst->wavefront();
16664 Wavefront *wf = gpuDynInst->wavefront();
16678 :
Inst_VOP3(iFmt,
"v_cmp_lt_f32", true)
16692 Wavefront *wf = gpuDynInst->wavefront();
16702 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
16711 :
Inst_VOP3(iFmt,
"v_cmp_eq_f32", true)
16725 Wavefront *wf = gpuDynInst->wavefront();
16735 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
16744 :
Inst_VOP3(iFmt,
"v_cmp_le_f32", true)
16758 Wavefront *wf = gpuDynInst->wavefront();
16768 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
16777 :
Inst_VOP3(iFmt,
"v_cmp_gt_f32", true)
16791 Wavefront *wf = gpuDynInst->wavefront();
16801 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
16810 :
Inst_VOP3(iFmt,
"v_cmp_lg_f32", true)
16824 Wavefront *wf = gpuDynInst->wavefront();
16834 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
16843 :
Inst_VOP3(iFmt,
"v_cmp_ge_f32", true)
16857 Wavefront *wf = gpuDynInst->wavefront();
16867 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
16889 Wavefront *wf = gpuDynInst->wavefront();
16899 sdst.
setBit(lane, (!std::isnan(src0[lane])
16900 && !std::isnan(src1[lane])) ? 1 : 0);
16922 Wavefront *wf = gpuDynInst->wavefront();
16932 sdst.
setBit(lane, (std::isnan(src0[lane])
16933 || std::isnan(src1[lane])) ? 1 : 0);
16942 :
Inst_VOP3(iFmt,
"v_cmp_nge_f32", true)
16956 Wavefront *wf = gpuDynInst->wavefront();
16966 sdst.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
16975 :
Inst_VOP3(iFmt,
"v_cmp_nlg_f32", true)
16989 Wavefront *wf = gpuDynInst->wavefront();
16999 sdst.
setBit(lane, !(src0[lane] < src1[lane]
17000 || src0[lane] > src1[lane]) ? 1 : 0);
17009 :
Inst_VOP3(iFmt,
"v_cmp_ngt_f32", true)
17023 Wavefront *wf = gpuDynInst->wavefront();
17033 sdst.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
17042 :
Inst_VOP3(iFmt,
"v_cmp_nle_f32", true)
17056 Wavefront *wf = gpuDynInst->wavefront();
17066 sdst.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
17075 :
Inst_VOP3(iFmt,
"v_cmp_neq_f32", true)
17089 Wavefront *wf = gpuDynInst->wavefront();
17099 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
17108 :
Inst_VOP3(iFmt,
"v_cmp_nlt_f32", true)
17122 Wavefront *wf = gpuDynInst->wavefront();
17132 sdst.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
17141 :
Inst_VOP3(iFmt,
"v_cmp_tru_f32", true)
17155 Wavefront *wf = gpuDynInst->wavefront();
17169 :
Inst_VOP3(iFmt,
"v_cmpx_f_f32", true)
17183 Wavefront *wf = gpuDynInst->wavefront();
17198 :
Inst_VOP3(iFmt,
"v_cmpx_lt_f32", true)
17212 Wavefront *wf = gpuDynInst->wavefront();
17222 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
17232 :
Inst_VOP3(iFmt,
"v_cmpx_eq_f32", true)
17246 Wavefront *wf = gpuDynInst->wavefront();
17256 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
17266 :
Inst_VOP3(iFmt,
"v_cmpx_le_f32", true)
17280 Wavefront *wf = gpuDynInst->wavefront();
17290 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
17300 :
Inst_VOP3(iFmt,
"v_cmpx_gt_f32", true)
17314 Wavefront *wf = gpuDynInst->wavefront();
17324 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
17334 :
Inst_VOP3(iFmt,
"v_cmpx_lg_f32", true)
17348 Wavefront *wf = gpuDynInst->wavefront();
17358 sdst.
setBit(lane, (src0[lane] < src1[lane]
17359 || src0[lane] > src1[lane]) ? 1 : 0);
17369 :
Inst_VOP3(iFmt,
"v_cmpx_ge_f32", true)
17383 Wavefront *wf = gpuDynInst->wavefront();
17393 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
17403 :
Inst_VOP3(iFmt,
"v_cmpx_o_f32", true)
17418 Wavefront *wf = gpuDynInst->wavefront();
17428 sdst.
setBit(lane, (!std::isnan(src0[lane])
17429 && !std::isnan(src1[lane])) ? 1 : 0);
17439 :
Inst_VOP3(iFmt,
"v_cmpx_u_f32", true)
17454 Wavefront *wf = gpuDynInst->wavefront();
17464 sdst.
setBit(lane, (std::isnan(src0[lane])
17465 || std::isnan(src1[lane])) ? 1 : 0);
17475 :
Inst_VOP3(iFmt,
"v_cmpx_nge_f32", true)
17489 Wavefront *wf = gpuDynInst->wavefront();
17499 sdst.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
17509 :
Inst_VOP3(iFmt,
"v_cmpx_nlg_f32", true)
17523 Wavefront *wf = gpuDynInst->wavefront();
17533 sdst.
setBit(lane, !(src0[lane] < src1[lane]
17534 || src0[lane] > src1[lane]) ? 1 : 0);
17544 :
Inst_VOP3(iFmt,
"v_cmpx_ngt_f32", true)
17558 Wavefront *wf = gpuDynInst->wavefront();
17568 sdst.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
17578 :
Inst_VOP3(iFmt,
"v_cmpx_nle_f32", true)
17592 Wavefront *wf = gpuDynInst->wavefront();
17602 sdst.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
17612 :
Inst_VOP3(iFmt,
"v_cmpx_neq_f32", true)
17626 Wavefront *wf = gpuDynInst->wavefront();
17636 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
17646 :
Inst_VOP3(iFmt,
"v_cmpx_nlt_f32", true)
17660 Wavefront *wf = gpuDynInst->wavefront();
17670 sdst.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
17680 :
Inst_VOP3(iFmt,
"v_cmpx_tru_f32", true)
17694 Wavefront *wf = gpuDynInst->wavefront();
17722 Wavefront *wf = gpuDynInst->wavefront();
17736 :
Inst_VOP3(iFmt,
"v_cmp_lt_f64", true)
17750 Wavefront *wf = gpuDynInst->wavefront();
17782 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
17791 :
Inst_VOP3(iFmt,
"v_cmp_eq_f64", true)
17805 Wavefront *wf = gpuDynInst->wavefront();
17837 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
17846 :
Inst_VOP3(iFmt,
"v_cmp_le_f64", true)
17860 Wavefront *wf = gpuDynInst->wavefront();
17892 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
17901 :
Inst_VOP3(iFmt,
"v_cmp_gt_f64", true)
17915 Wavefront *wf = gpuDynInst->wavefront();
17947 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
17956 :
Inst_VOP3(iFmt,
"v_cmp_lg_f64", true)
17970 Wavefront *wf = gpuDynInst->wavefront();
18002 sdst.
setBit(lane, (src0[lane] < src1[lane]
18003 || src0[lane] > src1[lane]) ? 1 : 0);
18012 :
Inst_VOP3(iFmt,
"v_cmp_ge_f64", true)
18026 Wavefront *wf = gpuDynInst->wavefront();
18058 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
18080 Wavefront *wf = gpuDynInst->wavefront();
18112 sdst.
setBit(lane, (!std::isnan(src0[lane])
18113 && !std::isnan(src1[lane])) ? 1 : 0);
18135 Wavefront *wf = gpuDynInst->wavefront();
18167 sdst.
setBit(lane, (std::isnan(src0[lane])
18168 || std::isnan(src1[lane])) ? 1 : 0);
18177 :
Inst_VOP3(iFmt,
"v_cmp_nge_f64", true)
18191 Wavefront *wf = gpuDynInst->wavefront();
18223 sdst.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
18232 :
Inst_VOP3(iFmt,
"v_cmp_nlg_f64", true)
18246 Wavefront *wf = gpuDynInst->wavefront();
18278 sdst.
setBit(lane, !(src0[lane] < src1[lane]
18279 || src0[lane] > src1[lane]) ? 1 : 0);
18288 :
Inst_VOP3(iFmt,
"v_cmp_ngt_f64", true)
18302 Wavefront *wf = gpuDynInst->wavefront();
18334 sdst.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
18343 :
Inst_VOP3(iFmt,
"v_cmp_nle_f64", true)
18357 Wavefront *wf = gpuDynInst->wavefront();
18389 sdst.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
18398 :
Inst_VOP3(iFmt,
"v_cmp_neq_f64", true)
18412 Wavefront *wf = gpuDynInst->wavefront();
18444 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
18453 :
Inst_VOP3(iFmt,
"v_cmp_nlt_f64", true)
18467 Wavefront *wf = gpuDynInst->wavefront();
18499 sdst.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
18508 :
Inst_VOP3(iFmt,
"v_cmp_tru_f64", true)
18522 Wavefront *wf = gpuDynInst->wavefront();
18536 :
Inst_VOP3(iFmt,
"v_cmpx_f_f64", true)
18550 Wavefront *wf = gpuDynInst->wavefront();
18565 :
Inst_VOP3(iFmt,
"v_cmpx_lt_f64", true)
18579 Wavefront *wf = gpuDynInst->wavefront();
18611 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
18621 :
Inst_VOP3(iFmt,
"v_cmpx_eq_f64", true)
18635 Wavefront *wf = gpuDynInst->wavefront();
18667 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
18677 :
Inst_VOP3(iFmt,
"v_cmpx_le_f64", true)
18691 Wavefront *wf = gpuDynInst->wavefront();
18723 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
18733 :
Inst_VOP3(iFmt,
"v_cmpx_gt_f64", true)
18747 Wavefront *wf = gpuDynInst->wavefront();
18779 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
18789 :
Inst_VOP3(iFmt,
"v_cmpx_lg_f64", true)
18803 Wavefront *wf = gpuDynInst->wavefront();
18835 sdst.
setBit(lane, (src0[lane] < src1[lane]
18836 || src0[lane] > src1[lane]) ? 1 : 0);
18846 :
Inst_VOP3(iFmt,
"v_cmpx_ge_f64", true)
18860 Wavefront *wf = gpuDynInst->wavefront();
18892 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
18902 :
Inst_VOP3(iFmt,
"v_cmpx_o_f64", true)
18917 Wavefront *wf = gpuDynInst->wavefront();
18949 sdst.
setBit(lane, (!std::isnan(src0[lane])
18950 && !std::isnan(src1[lane])) ? 1 : 0);
18960 :
Inst_VOP3(iFmt,
"v_cmpx_u_f64", true)
18975 Wavefront *wf = gpuDynInst->wavefront();
19007 sdst.
setBit(lane, (std::isnan(src0[lane])
19008 || std::isnan(src1[lane])) ? 1 : 0);
19018 :
Inst_VOP3(iFmt,
"v_cmpx_nge_f64", true)
19032 Wavefront *wf = gpuDynInst->wavefront();
19064 sdst.
setBit(lane, !(src0[lane] >= src1[lane]) ? 1 : 0);
19074 :
Inst_VOP3(iFmt,
"v_cmpx_nlg_f64", true)
19088 Wavefront *wf = gpuDynInst->wavefront();
19120 sdst.
setBit(lane, !(src0[lane] < src1[lane]
19121 || src0[lane] > src1[lane]) ? 1 : 0);
19131 :
Inst_VOP3(iFmt,
"v_cmpx_ngt_f64", true)
19145 Wavefront *wf = gpuDynInst->wavefront();
19177 sdst.
setBit(lane, !(src0[lane] > src1[lane]) ? 1 : 0);
19187 :
Inst_VOP3(iFmt,
"v_cmpx_nle_f64", true)
19201 Wavefront *wf = gpuDynInst->wavefront();
19233 sdst.
setBit(lane, !(src0[lane] <= src1[lane]) ? 1 : 0);
19243 :
Inst_VOP3(iFmt,
"v_cmpx_neq_f64", true)
19257 Wavefront *wf = gpuDynInst->wavefront();
19289 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
19299 :
Inst_VOP3(iFmt,
"v_cmpx_nlt_f64", true)
19313 Wavefront *wf = gpuDynInst->wavefront();
19345 sdst.
setBit(lane, !(src0[lane] < src1[lane]) ? 1 : 0);
19355 :
Inst_VOP3(iFmt,
"v_cmpx_tru_f64", true)
19369 Wavefront *wf = gpuDynInst->wavefront();
19396 Wavefront *wf = gpuDynInst->wavefront();
19410 :
Inst_VOP3(iFmt,
"v_cmp_lt_i16", true)
19423 Wavefront *wf = gpuDynInst->wavefront();
19443 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
19452 :
Inst_VOP3(iFmt,
"v_cmp_eq_i16", true)
19465 Wavefront *wf = gpuDynInst->wavefront();
19485 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
19494 :
Inst_VOP3(iFmt,
"v_cmp_le_i16", true)
19507 Wavefront *wf = gpuDynInst->wavefront();
19527 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
19536 :
Inst_VOP3(iFmt,
"v_cmp_gt_i16", true)
19549 Wavefront *wf = gpuDynInst->wavefront();
19569 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
19578 :
Inst_VOP3(iFmt,
"v_cmp_ne_i16", true)
19591 Wavefront *wf = gpuDynInst->wavefront();
19611 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
19620 :
Inst_VOP3(iFmt,
"v_cmp_ge_i16", true)
19633 Wavefront *wf = gpuDynInst->wavefront();
19653 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
19674 Wavefront *wf = gpuDynInst->wavefront();
19700 Wavefront *wf = gpuDynInst->wavefront();
19714 :
Inst_VOP3(iFmt,
"v_cmp_lt_u16", true)
19727 Wavefront *wf = gpuDynInst->wavefront();
19747 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
19756 :
Inst_VOP3(iFmt,
"v_cmp_eq_u16", true)
19769 Wavefront *wf = gpuDynInst->wavefront();
19789 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
19798 :
Inst_VOP3(iFmt,
"v_cmp_le_u16", true)
19811 Wavefront *wf = gpuDynInst->wavefront();
19831 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
19840 :
Inst_VOP3(iFmt,
"v_cmp_gt_u16", true)
19853 Wavefront *wf = gpuDynInst->wavefront();
19873 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
19882 :
Inst_VOP3(iFmt,
"v_cmp_ne_u16", true)
19895 Wavefront *wf = gpuDynInst->wavefront();
19915 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
19924 :
Inst_VOP3(iFmt,
"v_cmp_ge_u16", true)
19937 Wavefront *wf = gpuDynInst->wavefront();
19957 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
19978 Wavefront *wf = gpuDynInst->wavefront();
19992 :
Inst_VOP3(iFmt,
"v_cmpx_f_i16", true)
20005 Wavefront *wf = gpuDynInst->wavefront();
20020 :
Inst_VOP3(iFmt,
"v_cmpx_lt_i16", true)
20033 Wavefront *wf = gpuDynInst->wavefront();
20053 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
20063 :
Inst_VOP3(iFmt,
"v_cmpx_eq_i16", true)
20076 Wavefront *wf = gpuDynInst->wavefront();
20096 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
20106 :
Inst_VOP3(iFmt,
"v_cmpx_le_i16", true)
20119 Wavefront *wf = gpuDynInst->wavefront();
20139 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
20149 :
Inst_VOP3(iFmt,
"v_cmpx_gt_i16", true)
20162 Wavefront *wf = gpuDynInst->wavefront();
20182 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
20192 :
Inst_VOP3(iFmt,
"v_cmpx_ne_i16", true)
20205 Wavefront *wf = gpuDynInst->wavefront();
20225 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
20235 :
Inst_VOP3(iFmt,
"v_cmpx_ge_i16", true)
20248 Wavefront *wf = gpuDynInst->wavefront();
20268 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
20278 :
Inst_VOP3(iFmt,
"v_cmpx_t_i16", true)
20291 Wavefront *wf = gpuDynInst->wavefront();
20306 :
Inst_VOP3(iFmt,
"v_cmpx_f_u16", true)
20319 Wavefront *wf = gpuDynInst->wavefront();
20334 :
Inst_VOP3(iFmt,
"v_cmpx_lt_u16", true)
20347 Wavefront *wf = gpuDynInst->wavefront();
20367 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
20377 :
Inst_VOP3(iFmt,
"v_cmpx_eq_u16", true)
20390 Wavefront *wf = gpuDynInst->wavefront();
20410 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
20420 :
Inst_VOP3(iFmt,
"v_cmpx_le_u16", true)
20433 Wavefront *wf = gpuDynInst->wavefront();
20453 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
20463 :
Inst_VOP3(iFmt,
"v_cmpx_gt_u16", true)
20476 Wavefront *wf = gpuDynInst->wavefront();
20496 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
20506 :
Inst_VOP3(iFmt,
"v_cmpx_ne_u16", true)
20519 Wavefront *wf = gpuDynInst->wavefront();
20539 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
20549 :
Inst_VOP3(iFmt,
"v_cmpx_ge_u16", true)
20562 Wavefront *wf = gpuDynInst->wavefront();
20582 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
20592 :
Inst_VOP3(iFmt,
"v_cmpx_t_u16", true)
20605 Wavefront *wf = gpuDynInst->wavefront();
20632 Wavefront *wf = gpuDynInst->wavefront();
20647 :
Inst_VOP3(iFmt,
"v_cmp_lt_i32", true)
20660 Wavefront *wf = gpuDynInst->wavefront();
20680 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
20689 :
Inst_VOP3(iFmt,
"v_cmp_eq_i32", true)
20702 Wavefront *wf = gpuDynInst->wavefront();
20722 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
20731 :
Inst_VOP3(iFmt,
"v_cmp_le_i32", true)
20744 Wavefront *wf = gpuDynInst->wavefront();
20764 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
20773 :
Inst_VOP3(iFmt,
"v_cmp_gt_i32", true)
20786 Wavefront *wf = gpuDynInst->wavefront();
20806 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
20815 :
Inst_VOP3(iFmt,
"v_cmp_ne_i32", true)
20828 Wavefront *wf = gpuDynInst->wavefront();
20848 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
20857 :
Inst_VOP3(iFmt,
"v_cmp_ge_i32", true)
20870 Wavefront *wf = gpuDynInst->wavefront();
20890 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
20911 Wavefront *wf = gpuDynInst->wavefront();
20937 Wavefront *wf = gpuDynInst->wavefront();
20951 :
Inst_VOP3(iFmt,
"v_cmp_lt_u32", true)
20964 Wavefront *wf = gpuDynInst->wavefront();
20984 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
20993 :
Inst_VOP3(iFmt,
"v_cmp_eq_u32", true)
21006 Wavefront *wf = gpuDynInst->wavefront();
21026 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
21035 :
Inst_VOP3(iFmt,
"v_cmp_le_u32", true)
21048 Wavefront *wf = gpuDynInst->wavefront();
21068 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
21077 :
Inst_VOP3(iFmt,
"v_cmp_gt_u32", true)
21090 Wavefront *wf = gpuDynInst->wavefront();
21110 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
21119 :
Inst_VOP3(iFmt,
"v_cmp_ne_u32", true)
21132 Wavefront *wf = gpuDynInst->wavefront();
21152 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
21161 :
Inst_VOP3(iFmt,
"v_cmp_ge_u32", true)
21174 Wavefront *wf = gpuDynInst->wavefront();
21194 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
21215 Wavefront *wf = gpuDynInst->wavefront();
21229 :
Inst_VOP3(iFmt,
"v_cmpx_f_i32", true)
21242 Wavefront *wf = gpuDynInst->wavefront();
21257 :
Inst_VOP3(iFmt,
"v_cmpx_lt_i32", true)
21270 Wavefront *wf = gpuDynInst->wavefront();
21290 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
21300 :
Inst_VOP3(iFmt,
"v_cmpx_eq_i32", true)
21313 Wavefront *wf = gpuDynInst->wavefront();
21333 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
21343 :
Inst_VOP3(iFmt,
"v_cmpx_le_i32", true)
21356 Wavefront *wf = gpuDynInst->wavefront();
21376 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
21386 :
Inst_VOP3(iFmt,
"v_cmpx_gt_i32", true)
21399 Wavefront *wf = gpuDynInst->wavefront();
21419 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
21429 :
Inst_VOP3(iFmt,
"v_cmpx_ne_i32", true)
21442 Wavefront *wf = gpuDynInst->wavefront();
21462 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
21472 :
Inst_VOP3(iFmt,
"v_cmpx_ge_i32", true)
21485 Wavefront *wf = gpuDynInst->wavefront();
21505 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
21515 :
Inst_VOP3(iFmt,
"v_cmpx_t_i32", true)
21528 Wavefront *wf = gpuDynInst->wavefront();
21543 :
Inst_VOP3(iFmt,
"v_cmpx_f_u32", true)
21556 Wavefront *wf = gpuDynInst->wavefront();
21571 :
Inst_VOP3(iFmt,
"v_cmpx_lt_u32", true)
21584 Wavefront *wf = gpuDynInst->wavefront();
21604 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
21614 :
Inst_VOP3(iFmt,
"v_cmpx_eq_u32", true)
21627 Wavefront *wf = gpuDynInst->wavefront();
21647 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
21657 :
Inst_VOP3(iFmt,
"v_cmpx_le_u32", true)
21670 Wavefront *wf = gpuDynInst->wavefront();
21690 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
21700 :
Inst_VOP3(iFmt,
"v_cmpx_gt_u32", true)
21713 Wavefront *wf = gpuDynInst->wavefront();
21733 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
21743 :
Inst_VOP3(iFmt,
"v_cmpx_ne_u32", true)
21756 Wavefront *wf = gpuDynInst->wavefront();
21776 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
21786 :
Inst_VOP3(iFmt,
"v_cmpx_ge_u32", true)
21799 Wavefront *wf = gpuDynInst->wavefront();
21819 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
21829 :
Inst_VOP3(iFmt,
"v_cmpx_t_u32", true)
21842 Wavefront *wf = gpuDynInst->wavefront();
21869 Wavefront *wf = gpuDynInst->wavefront();
21883 :
Inst_VOP3(iFmt,
"v_cmp_lt_i64", true)
21896 Wavefront *wf = gpuDynInst->wavefront();
21916 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
21925 :
Inst_VOP3(iFmt,
"v_cmp_eq_i64", true)
21938 Wavefront *wf = gpuDynInst->wavefront();
21958 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
21967 :
Inst_VOP3(iFmt,
"v_cmp_le_i64", true)
21980 Wavefront *wf = gpuDynInst->wavefront();
22000 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
22009 :
Inst_VOP3(iFmt,
"v_cmp_gt_i64", true)
22022 Wavefront *wf = gpuDynInst->wavefront();
22042 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
22051 :
Inst_VOP3(iFmt,
"v_cmp_ne_i64", true)
22064 Wavefront *wf = gpuDynInst->wavefront();
22084 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
22093 :
Inst_VOP3(iFmt,
"v_cmp_ge_i64", true)
22106 Wavefront *wf = gpuDynInst->wavefront();
22126 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
22147 Wavefront *wf = gpuDynInst->wavefront();
22173 Wavefront *wf = gpuDynInst->wavefront();
22187 :
Inst_VOP3(iFmt,
"v_cmp_lt_u64", true)
22200 Wavefront *wf = gpuDynInst->wavefront();
22220 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
22229 :
Inst_VOP3(iFmt,
"v_cmp_eq_u64", true)
22242 Wavefront *wf = gpuDynInst->wavefront();
22262 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
22271 :
Inst_VOP3(iFmt,
"v_cmp_le_u64", true)
22284 Wavefront *wf = gpuDynInst->wavefront();
22304 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
22313 :
Inst_VOP3(iFmt,
"v_cmp_gt_u64", true)
22326 Wavefront *wf = gpuDynInst->wavefront();
22346 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
22355 :
Inst_VOP3(iFmt,
"v_cmp_ne_u64", true)
22368 Wavefront *wf = gpuDynInst->wavefront();
22388 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
22397 :
Inst_VOP3(iFmt,
"v_cmp_ge_u64", true)
22410 Wavefront *wf = gpuDynInst->wavefront();
22430 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
22451 Wavefront *wf = gpuDynInst->wavefront();
22465 :
Inst_VOP3(iFmt,
"v_cmpx_f_i64", true)
22478 Wavefront *wf = gpuDynInst->wavefront();
22493 :
Inst_VOP3(iFmt,
"v_cmpx_lt_i64", true)
22506 Wavefront *wf = gpuDynInst->wavefront();
22526 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
22536 :
Inst_VOP3(iFmt,
"v_cmpx_eq_i64", true)
22549 Wavefront *wf = gpuDynInst->wavefront();
22569 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
22579 :
Inst_VOP3(iFmt,
"v_cmpx_le_i64", true)
22592 Wavefront *wf = gpuDynInst->wavefront();
22612 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
22622 :
Inst_VOP3(iFmt,
"v_cmpx_gt_i64", true)
22635 Wavefront *wf = gpuDynInst->wavefront();
22655 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
22665 :
Inst_VOP3(iFmt,
"v_cmpx_ne_i64", true)
22678 Wavefront *wf = gpuDynInst->wavefront();
22698 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
22708 :
Inst_VOP3(iFmt,
"v_cmpx_ge_i64", true)
22721 Wavefront *wf = gpuDynInst->wavefront();
22741 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
22751 :
Inst_VOP3(iFmt,
"v_cmpx_t_i64", true)
22764 Wavefront *wf = gpuDynInst->wavefront();
22779 :
Inst_VOP3(iFmt,
"v_cmpx_f_u64", true)
22792 Wavefront *wf = gpuDynInst->wavefront();
22807 :
Inst_VOP3(iFmt,
"v_cmpx_lt_u64", true)
22820 Wavefront *wf = gpuDynInst->wavefront();
22840 sdst.
setBit(lane, src0[lane] < src1[lane] ? 1 : 0);
22850 :
Inst_VOP3(iFmt,
"v_cmpx_eq_u64", true)
22863 Wavefront *wf = gpuDynInst->wavefront();
22883 sdst.
setBit(lane, src0[lane] == src1[lane] ? 1 : 0);
22893 :
Inst_VOP3(iFmt,
"v_cmpx_le_u64", true)
22906 Wavefront *wf = gpuDynInst->wavefront();
22926 sdst.
setBit(lane, src0[lane] <= src1[lane] ? 1 : 0);
22936 :
Inst_VOP3(iFmt,
"v_cmpx_gt_u64", true)
22949 Wavefront *wf = gpuDynInst->wavefront();
22969 sdst.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
22979 :
Inst_VOP3(iFmt,
"v_cmpx_ne_u64", true)
22992 Wavefront *wf = gpuDynInst->wavefront();
23012 sdst.
setBit(lane, src0[lane] != src1[lane] ? 1 : 0);
23022 :
Inst_VOP3(iFmt,
"v_cmpx_ge_u64", true)
23035 Wavefront *wf = gpuDynInst->wavefront();
23055 sdst.
setBit(lane, src0[lane] >= src1[lane] ? 1 : 0);
23065 :
Inst_VOP3(iFmt,
"v_cmpx_t_u64", true)
23078 Wavefront *wf = gpuDynInst->wavefront();
23102 :
Inst_VOP3(iFmt,
"v_cndmask_b32", false)
23117 Wavefront *wf = gpuDynInst->wavefront();
23140 ? src1[lane] : src0[lane];
23162 Wavefront *wf = gpuDynInst->wavefront();
23194 vdst[lane] = src0[lane] + src1[lane];
23216 Wavefront *wf = gpuDynInst->wavefront();
23248 vdst[lane] = src0[lane] - src1[lane];
23256 :
Inst_VOP3(iFmt,
"v_subrev_f32", false)
23270 Wavefront *wf = gpuDynInst->wavefront();
23302 vdst[lane] = src1[lane] - src0[lane];
23310 :
Inst_VOP3(iFmt,
"v_mul_legacy_f32", false)
23324 Wavefront *wf = gpuDynInst->wavefront();
23356 if (std::isnan(src0[lane]) ||
23357 std::isnan(src1[lane])) {
23359 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
23360 std::fpclassify(src0[lane]) == FP_ZERO) &&
23361 !std::signbit(src0[lane])) {
23362 if (std::isinf(src1[lane])) {
23364 }
else if (!std::signbit(src1[lane])) {
23369 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
23370 std::fpclassify(src0[lane]) == FP_ZERO) &&
23371 std::signbit(src0[lane])) {
23372 if (std::isinf(src1[lane])) {
23374 }
else if (std::signbit(src1[lane])) {
23379 }
else if (std::isinf(src0[lane]) &&
23380 !std::signbit(src0[lane])) {
23381 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
23382 std::fpclassify(src1[lane]) == FP_ZERO) {
23384 }
else if (!std::signbit(src1[lane])) {
23385 vdst[lane] = +INFINITY;
23387 vdst[lane] = -INFINITY;
23389 }
else if (std::isinf(src0[lane]) &&
23390 std::signbit(src0[lane])) {
23391 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
23392 std::fpclassify(src1[lane]) == FP_ZERO) {
23394 }
else if (std::signbit(src1[lane])) {
23395 vdst[lane] = +INFINITY;
23397 vdst[lane] = -INFINITY;
23400 vdst[lane] = src0[lane] * src1[lane];
23423 Wavefront *wf = gpuDynInst->wavefront();
23455 if (std::isnan(src0[lane]) ||
23456 std::isnan(src1[lane])) {
23458 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
23459 std::fpclassify(src0[lane]) == FP_ZERO) &&
23460 !std::signbit(src0[lane])) {
23461 if (std::isinf(src1[lane])) {
23463 }
else if (!std::signbit(src1[lane])) {
23468 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
23469 std::fpclassify(src0[lane]) == FP_ZERO) &&
23470 std::signbit(src0[lane])) {
23471 if (std::isinf(src1[lane])) {
23473 }
else if (std::signbit(src1[lane])) {
23478 }
else if (std::isinf(src0[lane]) &&
23479 !std::signbit(src0[lane])) {
23480 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
23481 std::fpclassify(src1[lane]) == FP_ZERO) {
23483 }
else if (!std::signbit(src1[lane])) {
23484 vdst[lane] = +INFINITY;
23486 vdst[lane] = -INFINITY;
23488 }
else if (std::isinf(src0[lane]) &&
23489 std::signbit(src0[lane])) {
23490 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
23491 std::fpclassify(src1[lane]) == FP_ZERO) {
23493 }
else if (std::signbit(src1[lane])) {
23494 vdst[lane] = +INFINITY;
23496 vdst[lane] = -INFINITY;
23499 vdst[lane] = src0[lane] * src1[lane];
23508 :
Inst_VOP3(iFmt,
"v_mul_i32_i24", false)
23521 Wavefront *wf = gpuDynInst->wavefront();
23541 vdst[lane] = sext<24>(
bits(src0[lane], 23, 0))
23542 * sext<24>(
bits(src1[lane], 23, 0));
23550 :
Inst_VOP3(iFmt,
"v_mul_hi_i32_i24", false)
23563 Wavefront *wf = gpuDynInst->wavefront();
23588 vdst[lane] = (
VecElemI32)((tmp_src0 * tmp_src1) >> 32);
23596 :
Inst_VOP3(iFmt,
"v_mul_u32_u24", false)
23609 Wavefront *wf = gpuDynInst->wavefront();
23629 vdst[lane] =
bits(src0[lane], 23, 0) *
bits(src1[lane], 23, 0);
23637 :
Inst_VOP3(iFmt,
"v_mul_hi_u32_u24", false)
23650 Wavefront *wf = gpuDynInst->wavefront();
23672 vdst[lane] = (
VecElemU32)((tmp_src0 * tmp_src1) >> 32);
23694 Wavefront *wf = gpuDynInst->wavefront();
23726 vdst[lane] = std::fmin(src0[lane], src1[lane]);
23748 Wavefront *wf = gpuDynInst->wavefront();
23780 vdst[lane] = std::fmax(src0[lane], src1[lane]);
23801 Wavefront *wf = gpuDynInst->wavefront();
23821 vdst[lane] = std::min(src0[lane], src1[lane]);
23842 Wavefront *wf = gpuDynInst->wavefront();
23862 vdst[lane] = std::max(src0[lane], src1[lane]);
23883 Wavefront *wf = gpuDynInst->wavefront();
23903 vdst[lane] = std::min(src0[lane], src1[lane]);
23924 Wavefront *wf = gpuDynInst->wavefront();
23944 vdst[lane] = std::max(src0[lane], src1[lane]);
23952 :
Inst_VOP3(iFmt,
"v_lshrrev_b32", false)
23966 Wavefront *wf = gpuDynInst->wavefront();
23986 vdst[lane] = src1[lane] >>
bits(src0[lane], 4, 0);
23994 :
Inst_VOP3(iFmt,
"v_ashrrev_i32", false)
24008 Wavefront *wf = gpuDynInst->wavefront();
24028 vdst[lane] = src1[lane] >>
bits(src0[lane], 4, 0);
24036 :
Inst_VOP3(iFmt,
"v_lshlrev_b32", false)
24049 Wavefront *wf = gpuDynInst->wavefront();
24069 vdst[lane] = src1[lane] <<
bits(src0[lane], 4, 0);
24091 Wavefront *wf = gpuDynInst->wavefront();
24111 vdst[lane] = src0[lane] & src1[lane];
24133 Wavefront *wf = gpuDynInst->wavefront();
24153 vdst[lane] = src0[lane] | src1[lane];
24175 Wavefront *wf = gpuDynInst->wavefront();
24195 vdst[lane] = src0[lane] ^ src1[lane];
24218 Wavefront *wf = gpuDynInst->wavefront();
24251 vdst[lane] = std::fma(src0[lane], src1[lane], vdst[lane]);
24276 Wavefront *wf = gpuDynInst->wavefront();
24294 vdst[lane] = src0[lane] + src1[lane];
24296 + (
VecElemU64)src1[lane]) >= 0x100000000ULL ? 1 : 0);
24322 Wavefront *wf = gpuDynInst->wavefront();
24340 vdst[lane] = src0[lane] - src1[lane];
24341 vcc.
setBit(lane, src1[lane] > src0[lane] ? 1 : 0);
24368 Wavefront *wf = gpuDynInst->wavefront();
24386 vdst[lane] = src1[lane] - src0[lane];
24387 vcc.
setBit(lane, src0[lane] > src1[lane] ? 1 : 0);
24415 Wavefront *wf = gpuDynInst->wavefront();
24435 vdst[lane] = src0[lane] + src1[lane]
24440 >= 0x100000000 ? 1 : 0);
24468 Wavefront *wf = gpuDynInst->wavefront();
24488 vdst[lane] = src0[lane] - src1[lane]
24491 > src0[lane] ? 1 : 0);
24520 Wavefront *wf = gpuDynInst->wavefront();
24540 vdst[lane] = src1[lane] - src0[lane]
24543 > src0[lane] ? 1 : 0);
24588 :
Inst_VOP3(iFmt,
"v_subrev_f16", false)
24656 Wavefront *wf = gpuDynInst->wavefront();
24676 vdst[lane] = src0[lane] + src1[lane];
24697 Wavefront *wf = gpuDynInst->wavefront();
24717 vdst[lane] = src0[lane] - src1[lane];
24725 :
Inst_VOP3(iFmt,
"v_subrev_u16", false)
24738 Wavefront *wf = gpuDynInst->wavefront();
24758 vdst[lane] = src1[lane] - src0[lane];
24766 :
Inst_VOP3(iFmt,
"v_mul_lo_u16", false)
24779 Wavefront *wf = gpuDynInst->wavefront();
24799 vdst[lane] = src0[lane] * src1[lane];
24807 :
Inst_VOP3(iFmt,
"v_lshlrev_b16", false)
24820 Wavefront *wf = gpuDynInst->wavefront();
24840 vdst[lane] = src1[lane] <<
bits(src0[lane], 3, 0);
24848 :
Inst_VOP3(iFmt,
"v_lshrrev_b16", false)
24862 Wavefront *wf = gpuDynInst->wavefront();
24888 vdst[lane] = src1[lane] >>
bits(src0[lane], 3, 0);
24896 :
Inst_VOP3(iFmt,
"v_ashrrev_i16", false)
24910 Wavefront *wf = gpuDynInst->wavefront();
24930 vdst[lane] = src1[lane] >>
bits(src0[lane], 3, 0);
24987 Wavefront *wf = gpuDynInst->wavefront();
25013 vdst[lane] = std::max(src0[lane], src1[lane]);
25034 Wavefront *wf = gpuDynInst->wavefront();
25060 vdst[lane] = std::max(src0[lane], src1[lane]);
25081 Wavefront *wf = gpuDynInst->wavefront();
25107 vdst[lane] = std::min(src0[lane], src1[lane]);
25128 Wavefront *wf = gpuDynInst->wavefront();
25154 vdst[lane] = std::min(src0[lane], src1[lane]);
25162 :
Inst_VOP3(iFmt,
"v_ldexp_f16", false)
25211 Wavefront *wf = gpuDynInst->wavefront();
25219 vdst[lane] = src[lane];
25227 :
Inst_VOP3(iFmt,
"v_cvt_i32_f64", false)
25243 Wavefront *wf = gpuDynInst->wavefront();
25260 std::frexp(src[lane],&exp);
25261 if (std::isnan(src[lane])) {
25263 }
else if (std::isinf(src[lane]) || exp > 30) {
25264 if (std::signbit(src[lane])) {
25265 vdst[lane] = INT_MIN;
25267 vdst[lane] = INT_MAX;
25279 :
Inst_VOP3(iFmt,
"v_cvt_f64_i32", false)
25293 Wavefront *wf = gpuDynInst->wavefront();
25317 :
Inst_VOP3(iFmt,
"v_cvt_f32_i32", false)
25331 Wavefront *wf = gpuDynInst->wavefront();
25357 :
Inst_VOP3(iFmt,
"v_cvt_f32_u32", false)
25371 Wavefront *wf = gpuDynInst->wavefront();
25395 :
Inst_VOP3(iFmt,
"v_cvt_u32_f32", false)
25411 Wavefront *wf = gpuDynInst->wavefront();
25428 std::frexp(src[lane],&exp);
25429 if (std::isnan(src[lane])) {
25431 }
else if (std::isinf(src[lane])) {
25432 if (std::signbit(src[lane])) {
25435 vdst[lane] = UINT_MAX;
25437 }
else if (exp > 31) {
25438 vdst[lane] = UINT_MAX;
25449 :
Inst_VOP3(iFmt,
"v_cvt_i32_f32", false)
25465 Wavefront *wf = gpuDynInst->wavefront();
25490 std::frexp(src[lane],&exp);
25491 if (std::isnan(src[lane])) {
25493 }
else if (std::isinf(src[lane]) || exp > 30) {
25494 if (std::signbit(src[lane])) {
25495 vdst[lane] = INT_MIN;
25497 vdst[lane] = INT_MAX;
25509 :
Inst_VOP3(iFmt,
"v_mov_fed_b32", false)
25527 :
Inst_VOP3(iFmt,
"v_cvt_f16_f32", false)
25545 :
Inst_VOP3(iFmt,
"v_cvt_f32_f16", false)
25564 :
Inst_VOP3(iFmt,
"v_cvt_rpi_i32_f32", false)
25578 Wavefront *wf = gpuDynInst->wavefront();
25594 vdst[lane] = (
VecElemI32)std::floor(src[lane] + 0.5);
25603 :
Inst_VOP3(iFmt,
"v_cvt_flr_i32_f32", false)
25617 Wavefront *wf = gpuDynInst->wavefront();
25633 vdst[lane] = (
VecElemI32)std::floor(src[lane]);
25641 :
Inst_VOP3(iFmt,
"v_cvt_off_f32_i4", false)
25659 :
Inst_VOP3(iFmt,
"v_cvt_f32_f64", false)
25673 Wavefront *wf = gpuDynInst->wavefront();
25705 :
Inst_VOP3(iFmt,
"v_cvt_f64_f32", false)
25719 Wavefront *wf = gpuDynInst->wavefront();
25751 :
Inst_VOP3(iFmt,
"v_cvt_f32_ubyte0", false)
25765 Wavefront *wf = gpuDynInst->wavefront();
25789 :
Inst_VOP3(iFmt,
"v_cvt_f32_ubyte1", false)
25803 Wavefront *wf = gpuDynInst->wavefront();
25827 :
Inst_VOP3(iFmt,
"v_cvt_f32_ubyte2", false)
25841 Wavefront *wf = gpuDynInst->wavefront();
25865 :
Inst_VOP3(iFmt,
"v_cvt_f32_ubyte3", false)
25879 Wavefront *wf = gpuDynInst->wavefront();
25903 :
Inst_VOP3(iFmt,
"v_cvt_u32_f64", false)
25919 Wavefront *wf = gpuDynInst->wavefront();
25936 std::frexp(src[lane],&exp);
25937 if (std::isnan(src[lane])) {
25939 }
else if (std::isinf(src[lane])) {
25940 if (std::signbit(src[lane])) {
25943 vdst[lane] = UINT_MAX;
25945 }
else if (exp > 31) {
25946 vdst[lane] = UINT_MAX;
25957 :
Inst_VOP3(iFmt,
"v_cvt_f64_u32", false)
25971 Wavefront *wf = gpuDynInst->wavefront();
25995 :
Inst_VOP3(iFmt,
"v_trunc_f64", false)
26009 Wavefront *wf = gpuDynInst->wavefront();
26025 vdst[lane] = std::trunc(src[lane]);
26047 Wavefront *wf = gpuDynInst->wavefront();
26063 vdst[lane] = std::ceil(src[lane]);
26071 :
Inst_VOP3(iFmt,
"v_rndne_f64", false)
26085 Wavefront *wf = gpuDynInst->wavefront();
26109 :
Inst_VOP3(iFmt,
"v_floor_f64", false)
26123 Wavefront *wf = gpuDynInst->wavefront();
26139 vdst[lane] = std::floor(src[lane]);
26147 :
Inst_VOP3(iFmt,
"v_fract_f32", false)
26161 Wavefront *wf = gpuDynInst->wavefront();
26178 vdst[lane] = std::modf(src[lane], &int_part);
26186 :
Inst_VOP3(iFmt,
"v_trunc_f32", false)
26200 Wavefront *wf = gpuDynInst->wavefront();
26216 vdst[lane] = std::trunc(src[lane]);
26238 Wavefront *wf = gpuDynInst->wavefront();
26254 vdst[lane] = std::ceil(src[lane]);
26262 :
Inst_VOP3(iFmt,
"v_rndne_f32", false)
26276 Wavefront *wf = gpuDynInst->wavefront();
26300 :
Inst_VOP3(iFmt,
"v_floor_f32", false)
26314 Wavefront *wf = gpuDynInst->wavefront();
26330 vdst[lane] = std::floor(src[lane]);
26352 Wavefront *wf = gpuDynInst->wavefront();
26368 vdst[lane] = std::pow(2.0, src[lane]);
26390 Wavefront *wf = gpuDynInst->wavefront();
26414 vdst[lane] = std::log2(src[lane]);
26436 Wavefront *wf = gpuDynInst->wavefront();
26452 vdst[lane] = 1.0 / src[lane];
26460 :
Inst_VOP3(iFmt,
"v_rcp_iflag_f32", false)
26474 Wavefront *wf = gpuDynInst->wavefront();
26490 vdst[lane] = 1.0 / src[lane];
26512 Wavefront *wf = gpuDynInst->wavefront();
26528 vdst[lane] = 1.0 / std::sqrt(src[lane]);
26550 Wavefront *wf = gpuDynInst->wavefront();
26566 if (std::fpclassify(src[lane]) == FP_ZERO) {
26567 vdst[lane] = +INFINITY;
26568 }
else if (std::isnan(src[lane])) {
26570 }
else if (std::isinf(src[lane])) {
26571 if (std::signbit(src[lane])) {
26577 vdst[lane] = 1.0 / src[lane];
26600 Wavefront *wf = gpuDynInst->wavefront();
26616 if (std::fpclassify(src[lane]) == FP_ZERO) {
26617 vdst[lane] = +INFINITY;
26618 }
else if (std::isnan(src[lane])) {
26620 }
else if (std::isinf(src[lane]) && !std::signbit(src[lane])) {
26622 }
else if (std::signbit(src[lane])) {
26625 vdst[lane] = 1.0 / std::sqrt(src[lane]);
26648 Wavefront *wf = gpuDynInst->wavefront();
26664 vdst[lane] = std::sqrt(src[lane]);
26686 Wavefront *wf = gpuDynInst->wavefront();
26702 vdst[lane] = std::sqrt(src[lane]);
26724 Wavefront *wf = gpuDynInst->wavefront();
26742 vdst[lane] = std::sin(src[lane] * 2 * pi.
rawData());
26764 Wavefront *wf = gpuDynInst->wavefront();
26782 vdst[lane] = std::cos(src[lane] * 2 * pi.
rawData());
26804 Wavefront *wf = gpuDynInst->wavefront();
26812 vdst[lane] = ~src[lane];
26820 :
Inst_VOP3(iFmt,
"v_bfrev_b32", false)
26834 Wavefront *wf = gpuDynInst->wavefront();
26864 Wavefront *wf = gpuDynInst->wavefront();
26902 Wavefront *wf = gpuDynInst->wavefront();
26940 Wavefront *wf = gpuDynInst->wavefront();
26965 :
Inst_VOP3(iFmt,
"v_frexp_exp_i32_f64", false)
26979 Wavefront *wf = gpuDynInst->wavefront();
26995 if (std::isinf(src[lane]) || std::isnan(src[lane])) {
26999 std::frexp(src[lane], &exp);
27009 :
Inst_VOP3(iFmt,
"v_frexp_mant_f64", false)
27022 Wavefront *wf = gpuDynInst->wavefront();
27039 vdst[lane] = std::frexp(src[lane], &exp);
27047 :
Inst_VOP3(iFmt,
"v_fract_f64", false)
27060 Wavefront *wf = gpuDynInst->wavefront();
27077 vdst[lane] = std::modf(src[lane], &int_part);
27086 :
Inst_VOP3(iFmt,
"v_frexp_exp_i32_f32", false)
27102 Wavefront *wf = gpuDynInst->wavefront();
27118 if (std::isinf(src[lane])|| std::isnan(src[lane])) {
27122 std::frexp(src[lane], &exp);
27132 :
Inst_VOP3(iFmt,
"v_frexp_mant_f32", false)
27147 Wavefront *wf = gpuDynInst->wavefront();
27163 if (std::isinf(src[lane]) || std::isnan(src[lane])) {
27164 vdst[lane] = src[lane];
27167 vdst[lane] = std::frexp(src[lane], &exp);
27191 :
Inst_VOP3(iFmt,
"v_cvt_f16_u16", false)
27209 :
Inst_VOP3(iFmt,
"v_cvt_f16_i16", false)
27227 :
Inst_VOP3(iFmt,
"v_cvt_u16_f16", false)
27245 :
Inst_VOP3(iFmt,
"v_cvt_i16_f16", false)
27368 :
Inst_VOP3(iFmt,
"v_frexp_mant_f16", false)
27390 :
Inst_VOP3(iFmt,
"v_frexp_exp_i16_f16", false)
27407 :
Inst_VOP3(iFmt,
"v_floor_f16", false)
27443 :
Inst_VOP3(iFmt,
"v_trunc_f16", false)
27461 :
Inst_VOP3(iFmt,
"v_rndne_f16", false)
27479 :
Inst_VOP3(iFmt,
"v_fract_f16", false)
27533 :
Inst_VOP3(iFmt,
"v_exp_legacy_f32", false)
27547 Wavefront *wf = gpuDynInst->wavefront();
27571 vdst[lane] = std::pow(2.0, src[lane]);
27579 :
Inst_VOP3(iFmt,
"v_log_legacy_f32", false)
27593 Wavefront *wf = gpuDynInst->wavefront();
27601 vdst[lane] = std::log2(src[lane]);
27609 :
Inst_VOP3(iFmt,
"v_mad_legacy_f32", false)
27624 Wavefront *wf = gpuDynInst->wavefront();
27660 vdst[lane] = std::fma(src0[lane], src1[lane], src2[lane]);
27683 Wavefront *wf = gpuDynInst->wavefront();
27719 vdst[lane] = std::fma(src0[lane], src1[lane], src2[lane]);
27727 :
Inst_VOP3(iFmt,
"v_mad_i32_i24", false)
27741 Wavefront *wf = gpuDynInst->wavefront();
27763 vdst[lane] = sext<24>(
bits(src0[lane], 23, 0))
27764 * sext<24>(
bits(src1[lane], 23, 0)) + src2[lane];
27772 :
Inst_VOP3(iFmt,
"v_mad_u32_u24", false)
27786 Wavefront *wf = gpuDynInst->wavefront();
27808 vdst[lane] =
bits(src0[lane], 23, 0) *
bits(src1[lane], 23, 0)
27817 :
Inst_VOP3(iFmt,
"v_cubeid_f32", false)
27834 :
Inst_VOP3(iFmt,
"v_cubesc_f32", false)
27851 :
Inst_VOP3(iFmt,
"v_cubetc_f32", false)
27868 :
Inst_VOP3(iFmt,
"v_cubema_f32", false)
27899 Wavefront *wf = gpuDynInst->wavefront();
27921 vdst[lane] = (src0[lane] >>
bits(src1[lane], 4, 0))
27922 & ((1 <<
bits(src2[lane], 4, 0)) - 1);
27944 Wavefront *wf = gpuDynInst->wavefront();
27966 vdst[lane] = (src0[lane] >>
bits(src1[lane], 4, 0))
27967 & ((1 <<
bits(src2[lane], 4, 0)) - 1);
27988 Wavefront *wf = gpuDynInst->wavefront();
28010 vdst[lane] = (src0[lane] & src1[lane]) | (~src0[lane]
28034 Wavefront *wf = gpuDynInst->wavefront();
28070 vdst[lane] = std::fma(src0[lane], src1[lane], src2[lane]);
28093 Wavefront *wf = gpuDynInst->wavefront();
28129 vdst[lane] = std::fma(src0[lane], src1[lane], src2[lane]);
28153 Wavefront *wf = gpuDynInst->wavefront();
28175 vdst[lane] = ((
bits(src0[lane], 31, 24)
28176 +
bits(src1[lane], 31, 24) +
bits(src2[lane], 24)) >> 1)
28178 vdst[lane] += ((
bits(src0[lane], 23, 16)
28179 +
bits(src1[lane], 23, 16) +
bits(src2[lane], 16)) >> 1)
28181 vdst[lane] += ((
bits(src0[lane], 15, 8)
28182 +
bits(src1[lane], 15, 8) +
bits(src2[lane], 8)) >> 1)
28184 vdst[lane] += ((
bits(src0[lane], 7, 0) +
bits(src1[lane], 7, 0)
28185 +
bits(src2[lane], 0)) >> 1);
28193 :
Inst_VOP3(iFmt,
"v_alignbit_b32", false)
28206 Wavefront *wf = gpuDynInst->wavefront();
28239 :
Inst_VOP3(iFmt,
"v_alignbyte_b32", false)
28252 Wavefront *wf = gpuDynInst->wavefront();
28300 Wavefront *wf = gpuDynInst->wavefront();
28336 VecElemF32 min_0_1 = std::fmin(src0[lane], src1[lane]);
28337 vdst[lane] = std::fmin(min_0_1, src2[lane]);
28358 Wavefront *wf = gpuDynInst->wavefront();
28380 VecElemI32 min_0_1 = std::min(src0[lane], src1[lane]);
28381 vdst[lane] = std::min(min_0_1, src2[lane]);
28402 Wavefront *wf = gpuDynInst->wavefront();
28424 VecElemU32 min_0_1 = std::min(src0[lane], src1[lane]);
28425 vdst[lane] = std::min(min_0_1, src2[lane]);
28447 Wavefront *wf = gpuDynInst->wavefront();
28483 VecElemF32 max_0_1 = std::fmax(src0[lane], src1[lane]);
28484 vdst[lane] = std::fmax(max_0_1, src2[lane]);
28505 Wavefront *wf = gpuDynInst->wavefront();
28527 VecElemI32 max_0_1 = std::max(src0[lane], src1[lane]);
28528 vdst[lane] = std::max(max_0_1, src2[lane]);
28549 Wavefront *wf = gpuDynInst->wavefront();
28571 VecElemU32 max_0_1 = std::max(src0[lane], src1[lane]);
28572 vdst[lane] = std::max(max_0_1, src2[lane]);
28594 Wavefront *wf = gpuDynInst->wavefront();
28630 vdst[lane] =
median(src0[lane], src1[lane], src2[lane]);
28651 Wavefront *wf = gpuDynInst->wavefront();
28673 vdst[lane] =
median(src0[lane], src1[lane], src2[lane]);
28694 Wavefront *wf = gpuDynInst->wavefront();
28716 vdst[lane] =
median(src0[lane], src1[lane], src2[lane]);
28740 Wavefront *wf = gpuDynInst->wavefront();
28762 vdst[lane] = std::abs(
bits(src0[lane], 31, 24)
28763 -
bits(src1[lane], 31, 24))
28764 + std::abs(
bits(src0[lane], 23, 16)
28765 -
bits(src1[lane], 23, 16))
28766 + std::abs(
bits(src0[lane], 15, 8)
28767 -
bits(src1[lane], 15, 8))
28768 + std::abs(
bits(src0[lane], 7, 0)
28769 -
bits(src1[lane], 7, 0)) + src2[lane];
28777 :
Inst_VOP3(iFmt,
"v_sad_hi_u8", false)
28791 Wavefront *wf = gpuDynInst->wavefront();
28813 vdst[lane] = (((
bits(src0[lane], 31, 24)
28814 -
bits(src1[lane], 31, 24)) + (
bits(src0[lane], 23, 16)
28815 -
bits(src1[lane], 23, 16)) + (
bits(src0[lane], 15, 8)
28816 -
bits(src1[lane], 15, 8)) + (
bits(src0[lane], 7, 0)
28817 -
bits(src1[lane], 7, 0))) << 16) + src2[lane];
28840 Wavefront *wf = gpuDynInst->wavefront();
28862 vdst[lane] = std::abs(
bits(src0[lane], 31, 16)
28863 -
bits(src1[lane], 31, 16))
28864 + std::abs(
bits(src0[lane], 15, 0)
28865 -
bits(src1[lane], 15, 0)) + src2[lane];
28887 Wavefront *wf = gpuDynInst->wavefront();
28909 vdst[lane] = std::abs(src0[lane] - src1[lane]) + src2[lane];
28917 :
Inst_VOP3(iFmt,
"v_cvt_pk_u8_f32", false)
28934 Wavefront *wf = gpuDynInst->wavefront();
28963 vdst[lane] = (((
VecElemU8)src0[lane] & 0xff)
28964 << (8 *
bits(src1[lane], 1, 0)))
28965 | (src2[lane] & ~(0xff << (8 *
bits(src1[lane], 1, 0))));
28973 :
Inst_VOP3(iFmt,
"v_div_fixup_f32", false)
28988 Wavefront *wf = gpuDynInst->wavefront();
29024 if (std::fpclassify(src1[lane]) == FP_ZERO) {
29025 if (std::signbit(src1[lane])) {
29026 vdst[lane] = -INFINITY;
29028 vdst[lane] = +INFINITY;
29030 }
else if (std::isnan(src2[lane]) || std::isnan(src1[lane])) {
29032 }
else if (std::isinf(src1[lane])) {
29033 if (std::signbit(src1[lane])) {
29034 vdst[lane] = -INFINITY;
29036 vdst[lane] = +INFINITY;
29039 vdst[lane] = src2[lane] / src1[lane];
29049 :
Inst_VOP3(iFmt,
"v_div_fixup_f64", false)
29064 Wavefront *wf = gpuDynInst->wavefront();
29100 int sign_out = std::signbit(src1[lane])
29101 ^ std::signbit(src2[lane]);
29104 std::frexp(src1[lane], &exp1);
29105 std::frexp(src2[lane], &exp2);
29107 if (std::isnan(src1[lane]) || std::isnan(src2[lane])) {
29108 vdst[lane] = std::numeric_limits<VecElemF64>::quiet_NaN();
29109 }
else if (std::fpclassify(src1[lane]) == FP_ZERO
29110 && std::fpclassify(src2[lane]) == FP_ZERO) {
29112 = std::numeric_limits<VecElemF64>::signaling_NaN();
29113 }
else if (std::isinf(src1[lane]) && std::isinf(src2[lane])) {
29115 = std::numeric_limits<VecElemF64>::signaling_NaN();
29116 }
else if (std::fpclassify(src1[lane]) == FP_ZERO
29117 || std::isinf(src2[lane])) {
29118 vdst[lane] = sign_out ? -INFINITY : +INFINITY;
29119 }
else if (std::isinf(src1[lane])
29120 || std::fpclassify(src2[lane]) == FP_ZERO) {
29121 vdst[lane] = sign_out ? -0.0 : +0.0;
29122 }
else if (exp2 - exp1 < -1075) {
29123 vdst[lane] = src0[lane];
29124 }
else if (exp1 == 2047) {
29125 vdst[lane] = src0[lane];
29127 vdst[lane] = sign_out ? -std::fabs(src0[lane])
29128 : std::fabs(src0[lane]);
29157 Wavefront *wf = gpuDynInst->wavefront();
29182 vdst[lane] = src0[lane];
29213 Wavefront *wf = gpuDynInst->wavefront();
29240 std::frexp(src1[lane], &exp1);
29241 std::frexp(src2[lane], &exp2);
29244 if (std::fpclassify(src1[lane]) == FP_ZERO
29245 || std::fpclassify(src2[lane]) == FP_ZERO) {
29247 }
else if (exp2 - exp1 >= 768) {
29249 if (src0[lane] == src1[lane]) {
29250 vdst[lane] = std::ldexp(src0[lane], 128);
29252 }
else if (std::fpclassify(src1[lane]) == FP_SUBNORMAL) {
29253 vdst[lane] = std::ldexp(src0[lane], 128);
29254 }
else if (std::fpclassify(1.0 / src1[lane]) == FP_SUBNORMAL
29255 && std::fpclassify(src2[lane] / src1[lane])
29258 if (src0[lane] == src1[lane]) {
29259 vdst[lane] = std::ldexp(src0[lane], 128);
29261 }
else if (std::fpclassify(1.0 / src1[lane]) == FP_SUBNORMAL) {
29262 vdst[lane] = std::ldexp(src0[lane], -128);
29263 }
else if (std::fpclassify(src2[lane] / src1[lane])
29266 if (src0[lane] == src2[lane]) {
29267 vdst[lane] = std::ldexp(src0[lane], 128);
29269 }
else if (exp2 <= 53) {
29270 vdst[lane] = std::ldexp(src0[lane], 128);
29280 :
Inst_VOP3(iFmt,
"v_div_fmas_f32", false)
29297 Wavefront *wf = gpuDynInst->wavefront();
29333 vdst[lane] = std::fma(src0[lane], src1[lane], src2[lane]);
29342 :
Inst_VOP3(iFmt,
"v_div_fmas_f64", false)
29359 Wavefront *wf = gpuDynInst->wavefront();
29398 vdst[lane] = std::pow(2, 64)
29399 * std::fma(src0[lane], src1[lane], src2[lane]);
29401 vdst[lane] = std::fma(src0[lane], src1[lane], src2[lane]);
29427 :
Inst_VOP3(iFmt,
"v_qsad_pk_u16_u8", false)
29446 :
Inst_VOP3(iFmt,
"v_mqsad_pk_u16_u8", false)
29464 :
Inst_VOP3(iFmt,
"v_mqsad_u32_u8", false)
29498 Wavefront *wf = gpuDynInst->wavefront();
29519 vcc.
setBit(lane,
muladd(vdst[lane], src0[lane], src1[lane],
29545 Wavefront *wf = gpuDynInst->wavefront();
29565 vcc.
setBit(lane,
muladd(vdst[lane], src0[lane], src1[lane],
29610 Wavefront *wf = gpuDynInst->wavefront();
29632 vdst[lane] = src0[lane] * src1[lane] + src2[lane];
29655 Wavefront *wf = gpuDynInst->wavefront();
29677 vdst[lane] = src0[lane] * src1[lane] + src2[lane];
29710 Wavefront *wf = gpuDynInst->wavefront();
29726 DPRINTF(GCN3,
"Executing v_perm_b32 src_0 0x%08x, src_1 "
29727 "0x%08x, src_2 0x%08x, vdst 0x%08x\n", src0[lane],
29728 src1[lane], src2[lane], vdst[lane]);
29731 for (
int i = 0;
i < 4 ; ++
i) {
29734 vdst[lane] |= (permuted_val <<
i);
29737 DPRINTF(GCN3,
"v_perm result: 0x%08x\n", vdst[lane]);
29765 :
Inst_VOP3(iFmt,
"v_div_fixup_f16", false)
29812 :
Inst_VOP3(iFmt,
"v_cvt_pkaccum_u8_f32", false)
29834 :
Inst_VOP3(iFmt,
"v_interp_p1_f32", false)
29852 :
Inst_VOP3(iFmt,
"v_interp_p2_f32", false)
29870 :
Inst_VOP3(iFmt,
"v_interp_mov_f32", false)
29889 :
Inst_VOP3(iFmt,
"v_interp_p1ll_f16", false)
29908 :
Inst_VOP3(iFmt,
"v_interp_p1lv_f16", false)
29925 :
Inst_VOP3(iFmt,
"v_interp_p2_f16", false)
29957 Wavefront *wf = gpuDynInst->wavefront();
29989 if (std::isnan(src0[lane]) ||
29990 std::isnan(src1[lane]) ) {
29992 }
else if (std::isinf(src0[lane]) &&
29993 std::isinf(src1[lane])) {
29994 if (std::signbit(src0[lane]) !=
29995 std::signbit(src1[lane])) {
29998 vdst[lane] = src0[lane];
30000 }
else if (std::isinf(src0[lane])) {
30001 vdst[lane] = src0[lane];
30002 }
else if (std::isinf(src1[lane])) {
30003 vdst[lane] = src1[lane];
30004 }
else if (std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
30005 std::fpclassify(src0[lane]) == FP_ZERO) {
30006 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
30007 std::fpclassify(src1[lane]) == FP_ZERO) {
30008 if (std::signbit(src0[lane]) &&
30009 std::signbit(src1[lane])) {
30015 vdst[lane] = src1[lane];
30017 }
else if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
30018 std::fpclassify(src1[lane]) == FP_ZERO) {
30019 if (std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
30020 std::fpclassify(src0[lane]) == FP_ZERO) {
30021 if (std::signbit(src0[lane]) &&
30022 std::signbit(src1[lane])) {
30028 vdst[lane] = src0[lane];
30031 vdst[lane] = src0[lane] + src1[lane];
30054 Wavefront *wf = gpuDynInst->wavefront();
30086 if (std::isnan(src0[lane]) ||
30087 std::isnan(src1[lane])) {
30089 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
30090 std::fpclassify(src0[lane]) == FP_ZERO) &&
30091 !std::signbit(src0[lane])) {
30092 if (std::isinf(src1[lane])) {
30094 }
else if (!std::signbit(src1[lane])) {
30099 }
else if ((std::fpclassify(src0[lane]) == FP_SUBNORMAL ||
30100 std::fpclassify(src0[lane]) == FP_ZERO) &&
30101 std::signbit(src0[lane])) {
30102 if (std::isinf(src1[lane])) {
30104 }
else if (std::signbit(src1[lane])) {
30109 }
else if (std::isinf(src0[lane]) &&
30110 !std::signbit(src0[lane])) {
30111 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
30112 std::fpclassify(src1[lane]) == FP_ZERO) {
30114 }
else if (!std::signbit(src1[lane])) {
30115 vdst[lane] = +INFINITY;
30117 vdst[lane] = -INFINITY;
30119 }
else if (std::isinf(src0[lane]) &&
30120 std::signbit(src0[lane])) {
30121 if (std::fpclassify(src1[lane]) == FP_SUBNORMAL ||
30122 std::fpclassify(src1[lane]) == FP_ZERO) {
30124 }
else if (std::signbit(src1[lane])) {
30125 vdst[lane] = +INFINITY;
30127 vdst[lane] = -INFINITY;
30130 vdst[lane] = src0[lane] * src1[lane];
30153 Wavefront *wf = gpuDynInst->wavefront();
30185 vdst[lane] = std::fmin(src0[lane], src1[lane]);
30207 Wavefront *wf = gpuDynInst->wavefront();
30239 vdst[lane] = std::fmax(src0[lane], src1[lane]);
30247 :
Inst_VOP3(iFmt,
"v_ldexp_f64", false)
30261 Wavefront *wf = gpuDynInst->wavefront();
30287 if (std::isnan(src0[lane]) || std::isinf(src0[lane])) {
30288 vdst[lane] = src0[lane];
30289 }
else if (std::fpclassify(src0[lane]) == FP_SUBNORMAL
30290 || std::fpclassify(src0[lane]) == FP_ZERO) {
30291 if (std::signbit(src0[lane])) {
30297 vdst[lane] = std::ldexp(src0[lane], src1[lane]);
30306 :
Inst_VOP3(iFmt,
"v_mul_lo_u32", false)
30319 Wavefront *wf = gpuDynInst->wavefront();
30349 :
Inst_VOP3(iFmt,
"v_mul_hi_u32", false)
30362 Wavefront *wf = gpuDynInst->wavefront();
30385 = (
VecElemU32)(((s0 * s1) >> 32) & 0xffffffffLL);
30393 :
Inst_VOP3(iFmt,
"v_mul_hi_i32", false)
30406 Wavefront *wf = gpuDynInst->wavefront();
30437 :
Inst_VOP3(iFmt,
"v_ldexp_f32", false)
30451 Wavefront *wf = gpuDynInst->wavefront();
30469 vdst[lane] = std::ldexp(src0[lane], src1[lane]);
30477 :
Inst_VOP3(iFmt,
"v_readlane_b32", true)
30510 sdst = src0[src1.
rawData() & 0x3f];
30516 :
Inst_VOP3(iFmt,
"v_writelane_b32", false)
30557 :
Inst_VOP3(iFmt,
"v_bcnt_u32_b32", false)
30570 Wavefront *wf = gpuDynInst->wavefront();
30590 vdst[lane] =
popCount(src0[lane]) + src1[lane];
30599 :
Inst_VOP3(iFmt,
"v_mbcnt_lo_u32_b32", false)
30613 Wavefront *wf = gpuDynInst->wavefront();
30617 uint64_t threadMask = 0;
30634 threadMask = ((1
LL << lane) - 1
LL);
30635 vdst[lane] =
popCount(src0[lane] &
bits(threadMask, 31, 0)) +
30646 :
Inst_VOP3(iFmt,
"v_mbcnt_hi_u32_b32", false)
30662 Wavefront *wf = gpuDynInst->wavefront();
30666 uint64_t threadMask = 0;
30683 threadMask = ((1
LL << lane) - 1
LL);
30684 vdst[lane] =
popCount(src0[lane] &
bits(threadMask, 63, 32)) +
30694 :
Inst_VOP3(iFmt,
"v_lshlrev_b64", false)
30707 Wavefront *wf = gpuDynInst->wavefront();
30727 vdst[lane] = src1[lane] <<
bits(src0[lane], 5, 0);
30735 :
Inst_VOP3(iFmt,
"v_lshrrev_b64", false)
30749 Wavefront *wf = gpuDynInst->wavefront();
30769 vdst[lane] = src1[lane] >>
bits(src0[lane], 5, 0);
30777 :
Inst_VOP3(iFmt,
"v_ashrrev_i64", false)
30791 Wavefront *wf = gpuDynInst->wavefront();
30812 = src1[lane] >>
bits(src0[lane], 5, 0);
30820 :
Inst_VOP3(iFmt,
"v_trig_preop_f64", false)
30850 Wavefront *wf = gpuDynInst->wavefront();
30870 vdst[lane] = ((1 <<
bits(src0[lane], 4, 0)) - 1)
30871 <<
bits(src1[lane], 4, 0);
30880 :
Inst_VOP3(iFmt,
"v_cvt_pknorm_i16_f32", false)
30899 :
Inst_VOP3(iFmt,
"v_cvt_pknorm_u16_f32", false)
30918 :
Inst_VOP3(iFmt,
"v_cvt_pkrtz_f16_f32", false)
30935 :
Inst_VOP3(iFmt,
"v_cvt_pk_u16_u32", false)
30952 :
Inst_VOP3(iFmt,
"v_cvt_pk_i16_i32", false)
30969 :
Inst_DS(iFmt,
"ds_add_u32")
30987 :
Inst_DS(iFmt,
"ds_sub_u32")
31005 :
Inst_DS(iFmt,
"ds_rsub_u32")
31024 :
Inst_DS(iFmt,
"ds_inc_u32")
31042 :
Inst_DS(iFmt,
"ds_dec_u32")
31060 :
Inst_DS(iFmt,
"ds_min_i32")
31078 :
Inst_DS(iFmt,
"ds_max_i32")
31096 :
Inst_DS(iFmt,
"ds_min_u32")
31114 :
Inst_DS(iFmt,
"ds_max_u32")
31132 :
Inst_DS(iFmt,
"ds_and_b32")
31168 :
Inst_DS(iFmt,
"ds_xor_b32")
31186 :
Inst_DS(iFmt,
"ds_mskor_b32")
31204 :
Inst_DS(iFmt,
"ds_write_b32")
31219 Wavefront *wf = gpuDynInst->wavefront();
31221 gpuDynInst->exec_mask = wf->
execMask();
31222 gpuDynInst->latency.init(gpuDynInst->computeUnit());
31223 gpuDynInst->latency.set(
31224 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
31235 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane]
31240 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
31255 initMemWrite<VecElemU32>(gpuDynInst,
offset);
31264 :
Inst_DS(iFmt,
"ds_write2_b32")
31280 Wavefront *wf = gpuDynInst->wavefront();
31282 gpuDynInst->exec_mask = wf->
execMask();
31283 gpuDynInst->latency.init(gpuDynInst->computeUnit());
31284 gpuDynInst->latency.set(
31285 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
31298 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane * 2]
31301 gpuDynInst->d_data))[lane * 2 + 1] = data1[lane];
31305 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
31319 initDualMemWrite<VecElemU32>(gpuDynInst, offset0, offset1);
31328 :
Inst_DS(iFmt,
"ds_write2st64_b32")
31344 Wavefront *wf = gpuDynInst->wavefront();
31346 gpuDynInst->exec_mask = wf->
execMask();
31347 gpuDynInst->latency.init(gpuDynInst->computeUnit());
31348 gpuDynInst->latency.set(
31349 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
31362 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane * 2]
31365 gpuDynInst->d_data))[lane * 2 + 1] = data1[lane];
31369 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
31383 initDualMemWrite<VecElemU32>(gpuDynInst, offset0, offset1);
31393 :
Inst_DS(iFmt,
"ds_cmpst_b32")
31414 :
Inst_DS(iFmt,
"ds_cmpst_f32")
31435 :
Inst_DS(iFmt,
"ds_min_f32")
31455 :
Inst_DS(iFmt,
"ds_max_f32")
31491 :
Inst_DS(iFmt,
"ds_add_f32")
31510 :
Inst_DS(iFmt,
"ds_write_b8")
31524 Wavefront *wf = gpuDynInst->wavefront();
31526 gpuDynInst->exec_mask = wf->
execMask();
31527 gpuDynInst->latency.init(gpuDynInst->computeUnit());
31528 gpuDynInst->latency.set(
31529 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
31540 (
reinterpret_cast<VecElemU8*
>(gpuDynInst->d_data))[lane]
31545 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
31560 initMemWrite<VecElemU8>(gpuDynInst,
offset);
31570 :
Inst_DS(iFmt,
"ds_write_b16")
31584 Wavefront *wf = gpuDynInst->wavefront();
31586 gpuDynInst->exec_mask = wf->
execMask();
31587 gpuDynInst->latency.init(gpuDynInst->computeUnit());
31588 gpuDynInst->latency.set(
31589 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
31600 (
reinterpret_cast<VecElemU16*
>(gpuDynInst->d_data))[lane]
31605 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
31620 initMemWrite<VecElemU16>(gpuDynInst,
offset);
31630 :
Inst_DS(iFmt,
"ds_add_rtn_u32")
31648 :
Inst_DS(iFmt,
"ds_sub_rtn_u32")
31666 :
Inst_DS(iFmt,
"ds_rsub_rtn_u32")
31684 :
Inst_DS(iFmt,
"ds_inc_rtn_u32")
31702 :
Inst_DS(iFmt,
"ds_dec_rtn_u32")
31720 :
Inst_DS(iFmt,
"ds_min_rtn_i32")
31738 :
Inst_DS(iFmt,
"ds_max_rtn_i32")
31756 :
Inst_DS(iFmt,
"ds_min_rtn_u32")
31774 :
Inst_DS(iFmt,
"ds_max_rtn_u32")
31792 :
Inst_DS(iFmt,
"ds_and_rtn_b32")
31810 :
Inst_DS(iFmt,
"ds_or_rtn_b32")
31828 :
Inst_DS(iFmt,
"ds_xor_rtn_b32")
31846 :
Inst_DS(iFmt,
"ds_mskor_rtn_b32")
31864 :
Inst_DS(iFmt,
"ds_wrxchg_rtn_b32")
31883 :
Inst_DS(iFmt,
"ds_wrxchg2_rtn_b32")
31900 :
Inst_DS(iFmt,
"ds_wrxchg2st64_rtn_b32")
31916 :
Inst_DS(iFmt,
"ds_cmpst_rtn_b32")
31937 :
Inst_DS(iFmt,
"ds_cmpst_rtn_f32")
31958 :
Inst_DS(iFmt,
"ds_min_rtn_f32")
31978 :
Inst_DS(iFmt,
"ds_max_rtn_f32")
31998 :
Inst_DS(iFmt,
"ds_wrap_rtn_b32")
32016 :
Inst_DS(iFmt,
"ds_add_rtn_f32")
32034 :
Inst_DS(iFmt,
"ds_read_b32")
32049 Wavefront *wf = gpuDynInst->wavefront();
32051 gpuDynInst->exec_mask = wf->
execMask();
32052 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32053 gpuDynInst->latency.set(
32054 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32061 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32076 initMemRead<VecElemU32>(gpuDynInst,
offset);
32085 if (gpuDynInst->exec_mask[lane]) {
32086 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
32087 gpuDynInst->d_data))[lane];
32095 :
Inst_DS(iFmt,
"ds_read2_b32")
32111 Wavefront *wf = gpuDynInst->wavefront();
32113 gpuDynInst->exec_mask = wf->
execMask();
32114 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32115 gpuDynInst->latency.set(
32116 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32123 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32137 initDualMemRead<VecElemU32>(gpuDynInst, offset0, offset1);
32147 if (gpuDynInst->exec_mask[lane]) {
32148 vdst0[lane] = (
reinterpret_cast<VecElemU32*
>(
32149 gpuDynInst->d_data))[lane * 2];
32150 vdst1[lane] = (
reinterpret_cast<VecElemU32*
>(
32151 gpuDynInst->d_data))[lane * 2 + 1];
32160 :
Inst_DS(iFmt,
"ds_read2st64_b32")
32176 Wavefront *wf = gpuDynInst->wavefront();
32178 gpuDynInst->exec_mask = wf->
execMask();
32179 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32180 gpuDynInst->latency.set(
32181 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32188 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32202 initDualMemRead<VecElemU32>(gpuDynInst, offset0, offset1);
32212 if (gpuDynInst->exec_mask[lane]) {
32213 vdst0[lane] = (
reinterpret_cast<VecElemU64*
>(
32214 gpuDynInst->d_data))[lane * 2];
32215 vdst1[lane] = (
reinterpret_cast<VecElemU64*
>(
32216 gpuDynInst->d_data))[lane * 2 + 1];
32226 :
Inst_DS(iFmt,
"ds_read_i8")
32245 :
Inst_DS(iFmt,
"ds_read_u8")
32260 Wavefront *wf = gpuDynInst->wavefront();
32262 gpuDynInst->exec_mask = wf->
execMask();
32263 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32264 gpuDynInst->latency.set(
32265 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32272 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32287 initMemRead<VecElemU8>(gpuDynInst,
offset);
32296 if (gpuDynInst->exec_mask[lane]) {
32298 gpuDynInst->d_data))[lane];
32307 :
Inst_DS(iFmt,
"ds_read_i16")
32326 :
Inst_DS(iFmt,
"ds_read_u16")
32341 Wavefront *wf = gpuDynInst->wavefront();
32343 gpuDynInst->exec_mask = wf->
execMask();
32344 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32345 gpuDynInst->latency.set(
32346 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32353 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32367 initMemRead<VecElemU16>(gpuDynInst,
offset);
32376 if (gpuDynInst->exec_mask[lane]) {
32378 gpuDynInst->d_data))[lane];
32387 :
Inst_DS(iFmt,
"ds_swizzle_b32")
32401 Wavefront *wf = gpuDynInst->wavefront();
32405 if (gpuDynInst->exec_mask.none()) {
32410 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32411 gpuDynInst->latency.set(gpuDynInst->computeUnit()
32412 ->cyclesToTicks(
Cycles(24)));
32437 if (
bits(ds_pattern, 15)) {
32445 if (gpuDynInst->exec_mask[lane]) {
32446 int index0 = lane +
bits(ds_pattern, 1, 0);
32448 "is out of bounds.\n", gpuDynInst->disassemble(),
32451 = gpuDynInst->exec_mask[index0] ?
data[index0]: 0;
32453 if (gpuDynInst->exec_mask[lane + 1]) {
32454 int index1 = lane +
bits(ds_pattern, 3, 2);
32456 "is out of bounds.\n", gpuDynInst->disassemble(),
32459 = gpuDynInst->exec_mask[index1] ?
data[index1]: 0;
32461 if (gpuDynInst->exec_mask[lane + 2]) {
32462 int index2 = lane +
bits(ds_pattern, 5, 4);
32464 "is out of bounds.\n", gpuDynInst->disassemble(),
32467 = gpuDynInst->exec_mask[index2] ?
data[index2]: 0;
32469 if (gpuDynInst->exec_mask[lane + 3]) {
32470 int index3 = lane +
bits(ds_pattern, 7, 6);
32472 "is out of bounds.\n", gpuDynInst->disassemble(),
32475 = gpuDynInst->exec_mask[index3] ?
data[index3]: 0;
32480 int and_mask =
bits(ds_pattern, 4, 0);
32481 int or_mask =
bits(ds_pattern, 9, 5);
32482 int xor_mask =
bits(ds_pattern, 14, 10);
32484 if (gpuDynInst->exec_mask[lane]) {
32485 int index = (((lane & and_mask) | or_mask) ^ xor_mask);
32491 "out of bounds.\n", gpuDynInst->disassemble(),
32504 :
Inst_DS(iFmt,
"ds_permute_b32")
32523 Wavefront *wf = gpuDynInst->wavefront();
32525 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32526 gpuDynInst->latency.set(gpuDynInst->computeUnit()
32527 ->cyclesToTicks(
Cycles(24)));
32552 "of bounds.\n", gpuDynInst->disassemble(),
index);
32575 :
Inst_DS(iFmt,
"ds_bpermute_b32")
32594 Wavefront *wf = gpuDynInst->wavefront();
32596 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32597 gpuDynInst->latency.set(gpuDynInst->computeUnit()
32598 ->cyclesToTicks(
Cycles(24)));
32623 "of bounds.\n", gpuDynInst->disassemble(),
index);
32647 :
Inst_DS(iFmt,
"ds_add_u64")
32665 :
Inst_DS(iFmt,
"ds_sub_u64")
32683 :
Inst_DS(iFmt,
"ds_rsub_u64")
32702 :
Inst_DS(iFmt,
"ds_inc_u64")
32720 :
Inst_DS(iFmt,
"ds_dec_u64")
32739 :
Inst_DS(iFmt,
"ds_min_i64")
32757 :
Inst_DS(iFmt,
"ds_max_i64")
32775 :
Inst_DS(iFmt,
"ds_min_u64")
32793 :
Inst_DS(iFmt,
"ds_max_u64")
32811 :
Inst_DS(iFmt,
"ds_and_b64")
32847 :
Inst_DS(iFmt,
"ds_xor_b64")
32865 :
Inst_DS(iFmt,
"ds_mskor_b64")
32883 :
Inst_DS(iFmt,
"ds_write_b64")
32898 Wavefront *wf = gpuDynInst->wavefront();
32900 gpuDynInst->exec_mask = wf->
execMask();
32901 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32902 gpuDynInst->latency.set(
32903 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32914 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->d_data))[lane]
32919 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32934 initMemWrite<VecElemU64>(gpuDynInst,
offset);
32943 :
Inst_DS(iFmt,
"ds_write2_b64")
32959 Wavefront *wf = gpuDynInst->wavefront();
32961 gpuDynInst->exec_mask = wf->
execMask();
32962 gpuDynInst->latency.init(gpuDynInst->computeUnit());
32963 gpuDynInst->latency.set(
32964 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
32978 gpuDynInst->d_data))[lane * 2] = data0[lane];
32980 gpuDynInst->d_data))[lane * 2 + 1] = data1[lane];
32984 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
32998 initDualMemWrite<VecElemU64>(gpuDynInst, offset0, offset1);
33007 :
Inst_DS(iFmt,
"ds_write2st64_b64")
33027 :
Inst_DS(iFmt,
"ds_cmpst_b64")
33048 :
Inst_DS(iFmt,
"ds_cmpst_f64")
33069 :
Inst_DS(iFmt,
"ds_min_f64")
33089 :
Inst_DS(iFmt,
"ds_max_f64")
33109 :
Inst_DS(iFmt,
"ds_add_rtn_u64")
33127 :
Inst_DS(iFmt,
"ds_sub_rtn_u64")
33145 :
Inst_DS(iFmt,
"ds_rsub_rtn_u64")
33164 :
Inst_DS(iFmt,
"ds_inc_rtn_u64")
33182 :
Inst_DS(iFmt,
"ds_dec_rtn_u64")
33201 :
Inst_DS(iFmt,
"ds_min_rtn_i64")
33219 :
Inst_DS(iFmt,
"ds_max_rtn_i64")
33237 :
Inst_DS(iFmt,
"ds_min_rtn_u64")
33255 :
Inst_DS(iFmt,
"ds_max_rtn_u64")
33273 :
Inst_DS(iFmt,
"ds_and_rtn_b64")
33291 :
Inst_DS(iFmt,
"ds_or_rtn_b64")
33309 :
Inst_DS(iFmt,
"ds_xor_rtn_b64")
33327 :
Inst_DS(iFmt,
"ds_mskor_rtn_b64")
33346 :
Inst_DS(iFmt,
"ds_wrxchg_rtn_b64")
33365 :
Inst_DS(iFmt,
"ds_wrxchg2_rtn_b64")
33382 :
Inst_DS(iFmt,
"ds_wrxchg2st64_rtn_b64")
33398 :
Inst_DS(iFmt,
"ds_cmpst_rtn_b64")
33419 :
Inst_DS(iFmt,
"ds_cmpst_rtn_f64")
33440 :
Inst_DS(iFmt,
"ds_min_rtn_f64")
33460 :
Inst_DS(iFmt,
"ds_max_rtn_f64")
33480 :
Inst_DS(iFmt,
"ds_read_b64")
33495 Wavefront *wf = gpuDynInst->wavefront();
33497 gpuDynInst->exec_mask = wf->
execMask();
33498 gpuDynInst->latency.init(gpuDynInst->computeUnit());
33499 gpuDynInst->latency.set(
33500 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
33507 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
33522 initMemRead<VecElemU64>(gpuDynInst,
offset);
33531 if (gpuDynInst->exec_mask[lane]) {
33532 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
33533 gpuDynInst->d_data))[lane];
33541 :
Inst_DS(iFmt,
"ds_read2_b64")
33557 Wavefront *wf = gpuDynInst->wavefront();
33559 gpuDynInst->exec_mask = wf->
execMask();
33560 gpuDynInst->latency.init(gpuDynInst->computeUnit());
33561 gpuDynInst->latency.set(
33562 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
33569 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
33583 initDualMemRead<VecElemU64>(gpuDynInst, offset0, offset1);
33593 if (gpuDynInst->exec_mask[lane]) {
33594 vdst0[lane] = (
reinterpret_cast<VecElemU64*
>(
33595 gpuDynInst->d_data))[lane * 2];
33596 vdst1[lane] = (
reinterpret_cast<VecElemU64*
>(
33597 gpuDynInst->d_data))[lane * 2 + 1];
33606 :
Inst_DS(iFmt,
"ds_read2st64_b64")
33622 Wavefront *wf = gpuDynInst->wavefront();
33624 gpuDynInst->exec_mask = wf->
execMask();
33625 gpuDynInst->latency.init(gpuDynInst->computeUnit());
33626 gpuDynInst->latency.set(
33627 gpuDynInst->computeUnit()->cyclesToTicks(
Cycles(24)));
33634 gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
33648 initDualMemRead<VecElemU64>(gpuDynInst, offset0, offset1);
33658 if (gpuDynInst->exec_mask[lane]) {
33659 vdst0[lane] = (
reinterpret_cast<VecElemU64*
>(
33660 gpuDynInst->d_data))[lane * 2];
33661 vdst1[lane] = (
reinterpret_cast<VecElemU64*
>(
33662 gpuDynInst->d_data))[lane * 2 + 1];
33672 :
Inst_DS(iFmt,
"ds_condxchg32_rtn_b64")
33688 :
Inst_DS(iFmt,
"ds_add_src2_u32")
33707 :
Inst_DS(iFmt,
"ds_sub_src2_u32")
33726 :
Inst_DS(iFmt,
"ds_rsub_src2_u32")
33745 :
Inst_DS(iFmt,
"ds_inc_src2_u32")
33764 :
Inst_DS(iFmt,
"ds_dec_src2_u32")
33784 :
Inst_DS(iFmt,
"ds_min_src2_i32")
33803 :
Inst_DS(iFmt,
"ds_max_src2_i32")
33822 :
Inst_DS(iFmt,
"ds_min_src2_u32")
33841 :
Inst_DS(iFmt,
"ds_max_src2_u32")
33860 :
Inst_DS(iFmt,
"ds_and_src2_b32")
33879 :
Inst_DS(iFmt,
"ds_or_src2_b32")
33898 :
Inst_DS(iFmt,
"ds_xor_src2_b32")
33917 :
Inst_DS(iFmt,
"ds_write_src2_b32")
33939 :
Inst_DS(iFmt,
"ds_min_src2_f32")
33959 :
Inst_DS(iFmt,
"ds_max_src2_f32")
33979 :
Inst_DS(iFmt,
"ds_add_src2_f32")
34000 :
Inst_DS(iFmt,
"ds_gws_sema_release_all")
34015 :
Inst_DS(iFmt,
"ds_gws_init")
34030 :
Inst_DS(iFmt,
"ds_gws_sema_v")
34045 :
Inst_DS(iFmt,
"ds_gws_sema_br")
34060 :
Inst_DS(iFmt,
"ds_gws_sema_p")
34075 :
Inst_DS(iFmt,
"ds_gws_barrier")
34090 :
Inst_DS(iFmt,
"ds_consume")
34120 :
Inst_DS(iFmt,
"ds_ordered_count")
34135 :
Inst_DS(iFmt,
"ds_add_src2_u64")
34154 :
Inst_DS(iFmt,
"ds_sub_src2_u64")
34173 :
Inst_DS(iFmt,
"ds_rsub_src2_u64")
34192 :
Inst_DS(iFmt,
"ds_inc_src2_u64")
34211 :
Inst_DS(iFmt,
"ds_dec_src2_u64")
34231 :
Inst_DS(iFmt,
"ds_min_src2_i64")
34250 :
Inst_DS(iFmt,
"ds_max_src2_i64")
34269 :
Inst_DS(iFmt,
"ds_min_src2_u64")
34288 :
Inst_DS(iFmt,
"ds_max_src2_u64")
34307 :
Inst_DS(iFmt,
"ds_and_src2_b64")
34326 :
Inst_DS(iFmt,
"ds_or_src2_b64")
34345 :
Inst_DS(iFmt,
"ds_xor_src2_b64")
34364 :
Inst_DS(iFmt,
"ds_write_src2_b64")
34386 :
Inst_DS(iFmt,
"ds_min_src2_f64")
34406 :
Inst_DS(iFmt,
"ds_max_src2_f64")
34426 :
Inst_DS(iFmt,
"ds_write_b96")
34445 :
Inst_DS(iFmt,
"ds_write_b128")
34464 :
Inst_DS(iFmt,
"ds_read_b96")
34482 :
Inst_DS(iFmt,
"ds_read_b128")
34503 setFlag(MemoryRef);
34505 setFlag(GlobalSegment);
34533 setFlag(MemoryRef);
34535 setFlag(GlobalSegment);
34561 :
Inst_MUBUF(iFmt,
"buffer_load_format_xyz")
34563 setFlag(MemoryRef);
34565 setFlag(GlobalSegment);
34591 :
Inst_MUBUF(iFmt,
"buffer_load_format_xyzw")
34593 setFlag(MemoryRef);
34595 setFlag(GlobalSegment);
34623 setFlag(MemoryRef);
34625 setFlag(GlobalSegment);
34651 :
Inst_MUBUF(iFmt,
"buffer_store_format_xy")
34653 setFlag(MemoryRef);
34655 setFlag(GlobalSegment);
34681 :
Inst_MUBUF(iFmt,
"buffer_store_format_xyz")
34683 setFlag(MemoryRef);
34685 setFlag(GlobalSegment);
34711 :
Inst_MUBUF(iFmt,
"buffer_store_format_xyzw")
34713 setFlag(MemoryRef);
34715 setFlag(GlobalSegment);
34742 :
Inst_MUBUF(iFmt,
"buffer_load_format_d16_x")
34744 setFlag(MemoryRef);
34746 setFlag(GlobalSegment);
34773 :
Inst_MUBUF(iFmt,
"buffer_load_format_d16_xy")
34775 setFlag(MemoryRef);
34777 setFlag(GlobalSegment);
34806 :
Inst_MUBUF(iFmt,
"buffer_load_format_d16_xyz")
34808 setFlag(MemoryRef);
34810 setFlag(GlobalSegment);
34839 :
Inst_MUBUF(iFmt,
"buffer_load_format_d16_xyzw")
34841 setFlag(MemoryRef);
34843 setFlag(GlobalSegment);
34872 :
Inst_MUBUF(iFmt,
"buffer_store_format_d16_x")
34874 setFlag(MemoryRef);
34876 setFlag(GlobalSegment);
34905 :
Inst_MUBUF(iFmt,
"buffer_store_format_d16_xy")
34907 setFlag(MemoryRef);
34909 setFlag(GlobalSegment);
34938 :
Inst_MUBUF(iFmt,
"buffer_store_format_d16_xyz")
34940 setFlag(MemoryRef);
34942 setFlag(GlobalSegment);
34971 :
Inst_MUBUF(iFmt,
"buffer_store_format_d16_xyzw")
34973 setFlag(MemoryRef);
34975 setFlag(GlobalSegment);
35006 setFlag(MemoryRef);
35008 if (instData.LDS) {
35009 setFlag(GroupSegment);
35011 setFlag(GlobalSegment);
35023 Wavefront *wf = gpuDynInst->wavefront();
35025 gpuDynInst->exec_mask = wf->
execMask();
35026 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35027 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35042 addr0, addr1, rsrcDesc,
offset, inst_offset);
35047 addr0, addr1, rsrcDesc,
offset, inst_offset);
35052 addr1, addr0, rsrcDesc,
offset, inst_offset);
35058 addr1, addr0, rsrcDesc,
offset, inst_offset);
35062 gpuDynInst->computeUnit()->localMemoryPipe.
35063 issueRequest(gpuDynInst);
35067 gpuDynInst->computeUnit()->globalMemoryPipe.
35068 issueRequest(gpuDynInst);
35080 initMemRead<VecElemU8>(gpuDynInst);
35089 if (gpuDynInst->exec_mask[lane]) {
35092 gpuDynInst->d_data))[lane]);
35107 setFlag(MemoryRef);
35109 setFlag(GlobalSegment);
35137 setFlag(MemoryRef);
35139 if (instData.LDS) {
35140 setFlag(GroupSegment);
35142 setFlag(GlobalSegment);
35154 Wavefront *wf = gpuDynInst->wavefront();
35156 gpuDynInst->exec_mask = wf->
execMask();
35157 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35158 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35173 addr0, addr1, rsrcDesc,
offset, inst_offset);
35178 addr0, addr1, rsrcDesc,
offset, inst_offset);
35183 addr1, addr0, rsrcDesc,
offset, inst_offset);
35189 addr1, addr0, rsrcDesc,
offset, inst_offset);
35193 gpuDynInst->computeUnit()->localMemoryPipe
35194 .issueRequest(gpuDynInst);
35198 gpuDynInst->computeUnit()->globalMemoryPipe
35199 .issueRequest(gpuDynInst);
35211 initMemRead<VecElemU16>(gpuDynInst);
35220 if (gpuDynInst->exec_mask[lane]) {
35223 gpuDynInst->d_data))[lane]);
35238 setFlag(MemoryRef);
35240 setFlag(GlobalSegment);
35268 setFlag(MemoryRef);
35270 if (instData.LDS) {
35271 setFlag(GroupSegment);
35273 setFlag(GlobalSegment);
35285 Wavefront *wf = gpuDynInst->wavefront();
35287 gpuDynInst->exec_mask = wf->
execMask();
35288 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35289 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35304 addr0, addr1, rsrcDesc,
offset, inst_offset);
35309 addr0, addr1, rsrcDesc,
offset, inst_offset);
35314 addr1, addr0, rsrcDesc,
offset, inst_offset);
35320 addr1, addr0, rsrcDesc,
offset, inst_offset);
35324 gpuDynInst->computeUnit()->localMemoryPipe
35325 .issueRequest(gpuDynInst);
35329 gpuDynInst->computeUnit()->globalMemoryPipe
35330 .issueRequest(gpuDynInst);
35342 initMemRead<VecElemU32>(gpuDynInst);
35351 if (gpuDynInst->exec_mask[lane]) {
35353 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
35354 gpuDynInst->d_data))[lane];
35368 setFlag(MemoryRef);
35370 if (instData.LDS) {
35371 setFlag(GroupSegment);
35373 setFlag(GlobalSegment);
35385 Wavefront *wf = gpuDynInst->wavefront();
35387 gpuDynInst->exec_mask = wf->
execMask();
35388 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35389 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35404 addr0, addr1, rsrcDesc,
offset, inst_offset);
35409 addr0, addr1, rsrcDesc,
offset, inst_offset);
35414 addr1, addr0, rsrcDesc,
offset, inst_offset);
35420 addr1, addr0, rsrcDesc,
offset, inst_offset);
35424 gpuDynInst->computeUnit()->localMemoryPipe
35425 .issueRequest(gpuDynInst);
35429 gpuDynInst->computeUnit()->globalMemoryPipe
35430 .issueRequest(gpuDynInst);
35442 initMemRead<2>(gpuDynInst);
35452 if (gpuDynInst->exec_mask[lane]) {
35454 vdst0[lane] = (
reinterpret_cast<VecElemU32*
>(
35455 gpuDynInst->d_data))[lane * 2];
35456 vdst1[lane] = (
reinterpret_cast<VecElemU32*
>(
35457 gpuDynInst->d_data))[lane * 2 + 1];
35473 setFlag(MemoryRef);
35475 if (instData.LDS) {
35476 setFlag(GroupSegment);
35478 setFlag(GlobalSegment);
35490 Wavefront *wf = gpuDynInst->wavefront();
35492 gpuDynInst->exec_mask = wf->
execMask();
35493 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35494 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35509 addr0, addr1, rsrcDesc,
offset, inst_offset);
35514 addr0, addr1, rsrcDesc,
offset, inst_offset);
35519 addr1, addr0, rsrcDesc,
offset, inst_offset);
35525 addr1, addr0, rsrcDesc,
offset, inst_offset);
35529 gpuDynInst->computeUnit()->localMemoryPipe
35530 .issueRequest(gpuDynInst);
35534 gpuDynInst->computeUnit()->globalMemoryPipe
35535 .issueRequest(gpuDynInst);
35547 initMemRead<3>(gpuDynInst);
35558 if (gpuDynInst->exec_mask[lane]) {
35560 vdst0[lane] = (
reinterpret_cast<VecElemU32*
>(
35561 gpuDynInst->d_data))[lane * 3];
35562 vdst1[lane] = (
reinterpret_cast<VecElemU32*
>(
35563 gpuDynInst->d_data))[lane * 3 + 1];
35564 vdst2[lane] = (
reinterpret_cast<VecElemU32*
>(
35565 gpuDynInst->d_data))[lane * 3 + 2];
35583 setFlag(MemoryRef);
35585 if (instData.LDS) {
35586 setFlag(GroupSegment);
35588 setFlag(GlobalSegment);
35600 Wavefront *wf = gpuDynInst->wavefront();
35602 gpuDynInst->exec_mask = wf->
execMask();
35603 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35604 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35619 addr0, addr1, rsrcDesc,
offset, inst_offset);
35624 addr0, addr1, rsrcDesc,
offset, inst_offset);
35629 addr1, addr0, rsrcDesc,
offset, inst_offset);
35635 addr1, addr0, rsrcDesc,
offset, inst_offset);
35639 gpuDynInst->computeUnit()->localMemoryPipe
35640 .issueRequest(gpuDynInst);
35644 gpuDynInst->computeUnit()->globalMemoryPipe
35645 .issueRequest(gpuDynInst);
35657 initMemRead<4>(gpuDynInst);
35669 if (gpuDynInst->exec_mask[lane]) {
35671 vdst0[lane] = (
reinterpret_cast<VecElemU32*
>(
35672 gpuDynInst->d_data))[lane * 4];
35673 vdst1[lane] = (
reinterpret_cast<VecElemU32*
>(
35674 gpuDynInst->d_data))[lane * 4 + 1];
35675 vdst2[lane] = (
reinterpret_cast<VecElemU32*
>(
35676 gpuDynInst->d_data))[lane * 4 + 2];
35677 vdst3[lane] = (
reinterpret_cast<VecElemU32*
>(
35678 gpuDynInst->d_data))[lane * 4 + 3];
35698 setFlag(MemoryRef);
35700 if (instData.LDS) {
35701 setFlag(GroupSegment);
35703 setFlag(GlobalSegment);
35715 Wavefront *wf = gpuDynInst->wavefront();
35717 gpuDynInst->exec_mask = wf->
execMask();
35718 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35719 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35734 addr0, addr1, rsrcDesc,
offset, inst_offset);
35739 addr0, addr1, rsrcDesc,
offset, inst_offset);
35744 addr1, addr0, rsrcDesc,
offset, inst_offset);
35750 addr1, addr0, rsrcDesc,
offset, inst_offset);
35754 gpuDynInst->computeUnit()->localMemoryPipe
35755 .issueRequest(gpuDynInst);
35759 gpuDynInst->computeUnit()->globalMemoryPipe
35760 .issueRequest(gpuDynInst);
35776 if (gpuDynInst->exec_mask[lane]) {
35777 (
reinterpret_cast<VecElemI8*
>(gpuDynInst->d_data))[lane]
35782 initMemWrite<VecElemI8>(gpuDynInst);
35794 setFlag(MemoryRef);
35796 if (instData.LDS) {
35797 setFlag(GroupSegment);
35799 setFlag(GlobalSegment);
35811 Wavefront *wf = gpuDynInst->wavefront();
35813 gpuDynInst->exec_mask = wf->
execMask();
35814 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35815 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35830 addr0, addr1, rsrcDesc,
offset, inst_offset);
35835 addr0, addr1, rsrcDesc,
offset, inst_offset);
35840 addr1, addr0, rsrcDesc,
offset, inst_offset);
35846 addr1, addr0, rsrcDesc,
offset, inst_offset);
35850 gpuDynInst->computeUnit()->localMemoryPipe
35851 .issueRequest(gpuDynInst);
35855 gpuDynInst->computeUnit()->globalMemoryPipe
35856 .issueRequest(gpuDynInst);
35872 if (gpuDynInst->exec_mask[lane]) {
35873 (
reinterpret_cast<VecElemI16*
>(gpuDynInst->d_data))[lane]
35878 initMemWrite<VecElemI16>(gpuDynInst);
35907 Wavefront *wf = gpuDynInst->wavefront();
35909 gpuDynInst->exec_mask = wf->
execMask();
35910 gpuDynInst->latency.init(gpuDynInst->computeUnit());
35911 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
35926 addr0, addr1, rsrcDesc,
offset, inst_offset);
35931 addr0, addr1, rsrcDesc,
offset, inst_offset);
35936 addr1, addr0, rsrcDesc,
offset, inst_offset);
35942 addr1, addr0, rsrcDesc,
offset, inst_offset);
35946 gpuDynInst->computeUnit()->localMemoryPipe
35947 .issueRequest(gpuDynInst);
35951 gpuDynInst->computeUnit()->globalMemoryPipe
35952 .issueRequest(gpuDynInst);
35968 if (gpuDynInst->exec_mask[lane]) {
35969 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane]
35974 initMemWrite<VecElemU32>(gpuDynInst);
35986 setFlag(MemoryRef);
35988 if (instData.LDS) {
35989 setFlag(GroupSegment);
35991 setFlag(GlobalSegment);
36003 Wavefront *wf = gpuDynInst->wavefront();
36005 gpuDynInst->exec_mask = wf->
execMask();
36006 gpuDynInst->latency.init(gpuDynInst->computeUnit());
36007 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
36026 addr0, addr1, rsrcDesc,
offset, inst_offset);
36031 addr0, addr1, rsrcDesc,
offset, inst_offset);
36036 addr1, addr0, rsrcDesc,
offset, inst_offset);
36042 addr1, addr0, rsrcDesc,
offset, inst_offset);
36046 gpuDynInst->computeUnit()->localMemoryPipe
36047 .issueRequest(gpuDynInst);
36051 gpuDynInst->computeUnit()->globalMemoryPipe
36052 .issueRequest(gpuDynInst);
36058 if (gpuDynInst->exec_mask[lane]) {
36059 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane * 4]
36061 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane*4 + 1]
36073 initMemWrite<2>(gpuDynInst);
36085 setFlag(MemoryRef);
36087 if (instData.LDS) {
36088 setFlag(GroupSegment);
36090 setFlag(GlobalSegment);
36102 Wavefront *wf = gpuDynInst->wavefront();
36104 gpuDynInst->exec_mask = wf->
execMask();
36105 gpuDynInst->latency.init(gpuDynInst->computeUnit());
36106 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
36127 addr0, addr1, rsrcDesc,
offset, inst_offset);
36132 addr0, addr1, rsrcDesc,
offset, inst_offset);
36137 addr1, addr0, rsrcDesc,
offset, inst_offset);
36143 addr1, addr0, rsrcDesc,
offset, inst_offset);
36147 gpuDynInst->computeUnit()->localMemoryPipe
36148 .issueRequest(gpuDynInst);
36152 gpuDynInst->computeUnit()->globalMemoryPipe
36153 .issueRequest(gpuDynInst);
36159 if (gpuDynInst->exec_mask[lane]) {
36160 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane * 4]
36162 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane*4 + 1]
36164 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane*4 + 2]
36176 initMemWrite<3>(gpuDynInst);
36188 setFlag(MemoryRef);
36190 if (instData.LDS) {
36191 setFlag(GroupSegment);
36193 setFlag(GlobalSegment);
36205 Wavefront *wf = gpuDynInst->wavefront();
36207 gpuDynInst->exec_mask = wf->
execMask();
36208 gpuDynInst->latency.init(gpuDynInst->computeUnit());
36209 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
36232 addr0, addr1, rsrcDesc,
offset, inst_offset);
36237 addr0, addr1, rsrcDesc,
offset, inst_offset);
36242 addr1, addr0, rsrcDesc,
offset, inst_offset);
36248 addr1, addr0, rsrcDesc,
offset, inst_offset);
36252 gpuDynInst->computeUnit()->localMemoryPipe
36253 .issueRequest(gpuDynInst);
36257 gpuDynInst->computeUnit()->globalMemoryPipe
36258 .issueRequest(gpuDynInst);
36264 if (gpuDynInst->exec_mask[lane]) {
36265 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane * 4]
36267 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane*4 + 1]
36269 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane*4 + 2]
36271 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane*4 + 3]
36283 initMemWrite<4>(gpuDynInst);
36293 :
Inst_MUBUF(iFmt,
"buffer_store_lds_dword")
36295 setFlag(GlobalSegment);
36314 setFlag(GPUStaticInst::MemSync);
36328 Wavefront *wf = gpuDynInst->wavefront();
36330 gpuDynInst->exec_mask = wf->
execMask();
36331 gpuDynInst->latency.init(gpuDynInst->computeUnit());
36332 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
36334 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
36335 gpuDynInst->computeUnit()->globalMemoryPipe.
36336 issueRequest(gpuDynInst);
36343 fatal(
"Non global flat instructions not implemented yet.\n");
36371 setFlag(MemoryRef);
36372 setFlag(GPUStaticInst::MemSync);
36373 setFlag(GlobalSegment);
36386 Wavefront *wf = gpuDynInst->wavefront();
36388 gpuDynInst->exec_mask = wf->
execMask();
36389 gpuDynInst->latency.init(gpuDynInst->computeUnit());
36390 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
36392 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
36393 gpuDynInst->computeUnit()->globalMemoryPipe.
36394 issueRequest(gpuDynInst);
36401 fatal(
"Non global flat instructions not implemented yet.\n");
36421 setFlag(AtomicExch);
36422 if (instData.GLC) {
36423 setFlag(AtomicReturn);
36425 setFlag(AtomicNoReturn);
36427 setFlag(MemoryRef);
36428 setFlag(GlobalSegment);
36448 setFlag(AtomicCAS);
36449 if (instData.GLC) {
36450 setFlag(AtomicReturn);
36452 setFlag(AtomicNoReturn);
36454 setFlag(MemoryRef);
36455 setFlag(GlobalSegment);
36477 setFlag(AtomicAdd);
36478 if (instData.GLC) {
36479 setFlag(AtomicReturn);
36481 setFlag(AtomicNoReturn);
36483 setFlag(MemoryRef);
36484 setFlag(GlobalSegment);
36504 setFlag(AtomicSub);
36505 if (instData.GLC) {
36506 setFlag(AtomicReturn);
36508 setFlag(AtomicNoReturn);
36510 setFlag(MemoryRef);
36511 setFlag(GlobalSegment);
36531 setFlag(AtomicMin);
36532 if (instData.GLC) {
36533 setFlag(AtomicReturn);
36535 setFlag(AtomicNoReturn);
36537 setFlag(MemoryRef);
36538 setFlag(GlobalSegment);
36558 setFlag(AtomicMin);
36559 if (instData.GLC) {
36560 setFlag(AtomicReturn);
36562 setFlag(AtomicNoReturn);
36564 setFlag(MemoryRef);
36565 setFlag(GlobalSegment);
36585 setFlag(AtomicMax);
36586 if (instData.GLC) {
36587 setFlag(AtomicReturn);
36589 setFlag(AtomicNoReturn);
36591 setFlag(MemoryRef);
36592 setFlag(GlobalSegment);
36612 setFlag(AtomicMax);
36613 if (instData.GLC) {
36614 setFlag(AtomicReturn);
36616 setFlag(AtomicNoReturn);
36618 setFlag(MemoryRef);
36619 setFlag(GlobalSegment);
36639 setFlag(AtomicAnd);
36640 if (instData.GLC) {
36641 setFlag(AtomicReturn);
36643 setFlag(AtomicNoReturn);
36645 setFlag(MemoryRef);
36646 setFlag(GlobalSegment);
36667 if (instData.GLC) {
36668 setFlag(AtomicReturn);
36670 setFlag(AtomicNoReturn);
36672 setFlag(MemoryRef);
36673 setFlag(GlobalSegment);
36693 setFlag(AtomicXor);
36694 if (instData.GLC) {
36695 setFlag(AtomicReturn);
36697 setFlag(AtomicNoReturn);
36699 setFlag(MemoryRef);
36700 setFlag(GlobalSegment);
36720 setFlag(AtomicInc);
36721 if (instData.GLC) {
36722 setFlag(AtomicReturn);
36724 setFlag(AtomicNoReturn);
36726 setFlag(MemoryRef);
36727 setFlag(GlobalSegment);
36747 setFlag(AtomicDec);
36748 if (instData.GLC) {
36749 setFlag(AtomicReturn);
36751 setFlag(AtomicNoReturn);
36753 setFlag(MemoryRef);
36754 setFlag(GlobalSegment);
36774 setFlag(AtomicExch);
36775 if (instData.GLC) {
36776 setFlag(AtomicReturn);
36778 setFlag(AtomicNoReturn);
36780 setFlag(MemoryRef);
36781 setFlag(GlobalSegment);
36799 :
Inst_MUBUF(iFmt,
"buffer_atomic_cmpswap_x2")
36801 setFlag(AtomicCAS);
36802 if (instData.GLC) {
36803 setFlag(AtomicReturn);
36805 setFlag(AtomicNoReturn);
36807 setFlag(MemoryRef);
36808 setFlag(GlobalSegment);
36831 setFlag(AtomicAdd);
36832 if (instData.GLC) {
36833 setFlag(AtomicReturn);
36835 setFlag(AtomicNoReturn);
36837 setFlag(MemoryRef);
36838 setFlag(GlobalSegment);
36858 setFlag(AtomicSub);
36859 if (instData.GLC) {
36860 setFlag(AtomicReturn);
36862 setFlag(AtomicNoReturn);
36864 setFlag(MemoryRef);
36865 setFlag(GlobalSegment);
36885 setFlag(AtomicMin);
36886 if (instData.GLC) {
36887 setFlag(AtomicReturn);
36889 setFlag(AtomicNoReturn);
36891 setFlag(MemoryRef);
36892 setFlag(GlobalSegment);
36912 setFlag(AtomicMin);
36913 if (instData.GLC) {
36914 setFlag(AtomicReturn);
36916 setFlag(AtomicNoReturn);
36918 setFlag(MemoryRef);
36919 setFlag(GlobalSegment);
36939 setFlag(AtomicMax);
36940 if (instData.GLC) {
36941 setFlag(AtomicReturn);
36943 setFlag(AtomicNoReturn);
36945 setFlag(MemoryRef);
36946 setFlag(GlobalSegment);
36966 setFlag(AtomicMax);
36967 if (instData.GLC) {
36968 setFlag(AtomicReturn);
36970 setFlag(AtomicNoReturn);
36972 setFlag(MemoryRef);
36973 setFlag(GlobalSegment);
36993 setFlag(AtomicAnd);
36994 if (instData.GLC) {
36995 setFlag(AtomicReturn);
36997 setFlag(AtomicNoReturn);
36999 setFlag(MemoryRef);
37000 setFlag(GlobalSegment);
37021 if (instData.GLC) {
37022 setFlag(AtomicReturn);
37024 setFlag(AtomicNoReturn);
37026 setFlag(MemoryRef);
37027 setFlag(GlobalSegment);
37047 setFlag(AtomicXor);
37048 if (instData.GLC) {
37049 setFlag(AtomicReturn);
37051 setFlag(AtomicNoReturn);
37053 setFlag(MemoryRef);
37054 setFlag(GlobalSegment);
37074 setFlag(AtomicInc);
37075 if (instData.GLC) {
37076 setFlag(AtomicReturn);
37078 setFlag(AtomicNoReturn);
37080 setFlag(MemoryRef);
37081 setFlag(GlobalSegment);
37101 setFlag(AtomicDec);
37102 if (instData.GLC) {
37103 setFlag(AtomicReturn);
37105 setFlag(AtomicNoReturn);
37107 setFlag(MemoryRef);
37108 setFlag(GlobalSegment);
37129 setFlag(MemoryRef);
37131 setFlag(GlobalSegment);
37157 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_xy")
37159 setFlag(MemoryRef);
37161 setFlag(GlobalSegment);
37187 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_xyz")
37189 setFlag(MemoryRef);
37191 setFlag(GlobalSegment);
37217 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_xyzw")
37219 setFlag(MemoryRef);
37221 setFlag(GlobalSegment);
37248 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_x")
37250 setFlag(MemoryRef);
37252 setFlag(GlobalSegment);
37278 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_xy")
37280 setFlag(MemoryRef);
37282 setFlag(GlobalSegment);
37308 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_xyz")
37310 setFlag(MemoryRef);
37312 setFlag(GlobalSegment);
37339 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_xyzw")
37341 setFlag(MemoryRef);
37343 setFlag(GlobalSegment);
37372 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_d16_x")
37374 setFlag(MemoryRef);
37376 setFlag(GlobalSegment);
37405 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_d16_xy")
37407 setFlag(MemoryRef);
37409 setFlag(GlobalSegment);
37439 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_d16_xyz")
37441 setFlag(MemoryRef);
37443 setFlag(GlobalSegment);
37473 :
Inst_MTBUF(iFmt,
"tbuffer_load_format_d16_xyzw")
37475 setFlag(MemoryRef);
37477 setFlag(GlobalSegment);
37506 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_d16_x")
37508 setFlag(MemoryRef);
37510 setFlag(GlobalSegment);
37539 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_d16_xy")
37541 setFlag(MemoryRef);
37543 setFlag(GlobalSegment);
37572 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_d16_xyz")
37574 setFlag(MemoryRef);
37576 setFlag(GlobalSegment);
37605 :
Inst_MTBUF(iFmt,
"tbuffer_store_format_d16_xyzw")
37607 setFlag(MemoryRef);
37609 setFlag(GlobalSegment);
37724 :
Inst_MIMG(iFmt,
"image_load_pck_sgn")
37754 :
Inst_MIMG(iFmt,
"image_load_mip_pck")
37784 :
Inst_MIMG(iFmt,
"image_load_mip_pck_sgn")
37900 :
Inst_MIMG(iFmt,
"image_store_mip_pck")
37974 :
Inst_MIMG(iFmt,
"image_atomic_cmpswap")
38472 :
Inst_MIMG(iFmt,
"image_sample_c_d_cl")
38521 :
Inst_MIMG(iFmt,
"image_sample_c_b_cl")
38604 :
Inst_MIMG(iFmt,
"image_sample_d_cl_o")
38653 :
Inst_MIMG(iFmt,
"image_sample_b_cl_o")
38703 :
Inst_MIMG(iFmt,
"image_sample_c_cl_o")
38720 :
Inst_MIMG(iFmt,
"image_sample_c_d_o")
38737 :
Inst_MIMG(iFmt,
"image_sample_c_d_cl_o")
38754 :
Inst_MIMG(iFmt,
"image_sample_c_l_o")
38771 :
Inst_MIMG(iFmt,
"image_sample_c_b_o")
38788 :
Inst_MIMG(iFmt,
"image_sample_c_b_cl_o")
38805 :
Inst_MIMG(iFmt,
"image_sample_c_lz_o")
38886 :
Inst_MIMG(iFmt,
"image_gather4_b_cl")
38935 :
Inst_MIMG(iFmt,
"image_gather4_c_cl")
38986 :
Inst_MIMG(iFmt,
"image_gather4_c_b_cl")
39003 :
Inst_MIMG(iFmt,
"image_gather4_c_lz")
39036 :
Inst_MIMG(iFmt,
"image_gather4_cl_o")
39087 :
Inst_MIMG(iFmt,
"image_gather4_b_cl_o")
39104 :
Inst_MIMG(iFmt,
"image_gather4_lz_o")
39138 :
Inst_MIMG(iFmt,
"image_gather4_c_cl_o")
39155 :
Inst_MIMG(iFmt,
"image_gather4_c_l_o")
39172 :
Inst_MIMG(iFmt,
"image_gather4_c_b_o")
39189 :
Inst_MIMG(iFmt,
"image_gather4_c_b_cl_o")
39206 :
Inst_MIMG(iFmt,
"image_gather4_c_lz_o")
39255 :
Inst_MIMG(iFmt,
"image_sample_cd_cl")
39289 :
Inst_MIMG(iFmt,
"image_sample_c_cd_cl")
39323 :
Inst_MIMG(iFmt,
"image_sample_cd_cl_o")
39340 :
Inst_MIMG(iFmt,
"image_sample_c_cd_o")
39357 :
Inst_MIMG(iFmt,
"image_sample_c_cd_cl_o")
39402 Wavefront *wf = gpuDynInst->wavefront();
39409 gpuDynInst->exec_mask = wf->
execMask();
39411 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
39416 gpuDynInst->exec_mask = gpuDynInst->wavefront()->execMask();
39417 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39418 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39426 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39427 gpuDynInst->computeUnit()->globalMemoryPipe
39428 .issueRequest(gpuDynInst);
39432 fatal(
"Non global flat instructions not implemented yet.\n");
39435 gpuDynInst->wavefront()->outstandingReqs++;
39436 gpuDynInst->wavefront()->validateRequestCounters();
39442 initMemRead<VecElemU8>(gpuDynInst);
39451 if (gpuDynInst->exec_mask[lane]) {
39453 gpuDynInst->d_data))[lane]);
39503 Wavefront *wf = gpuDynInst->wavefront();
39510 gpuDynInst->exec_mask = wf->
execMask();
39512 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
39517 gpuDynInst->exec_mask = gpuDynInst->wavefront()->execMask();
39518 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39519 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39527 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39528 gpuDynInst->computeUnit()->globalMemoryPipe
39529 .issueRequest(gpuDynInst);
39533 fatal(
"Non global flat instructions not implemented yet.\n");
39536 gpuDynInst->wavefront()->outstandingReqs++;
39537 gpuDynInst->wavefront()->validateRequestCounters();
39543 initMemRead<VecElemU16>(gpuDynInst);
39552 if (gpuDynInst->exec_mask[lane]) {
39554 gpuDynInst->d_data))[lane]);
39604 Wavefront *wf = gpuDynInst->wavefront();
39611 gpuDynInst->exec_mask = wf->
execMask();
39613 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
39618 gpuDynInst->exec_mask = gpuDynInst->wavefront()->execMask();
39619 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39620 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39628 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39629 gpuDynInst->computeUnit()->globalMemoryPipe
39630 .issueRequest(gpuDynInst);
39634 fatal(
"Non global flat instructions not implemented yet.\n");
39637 gpuDynInst->wavefront()->outstandingReqs++;
39638 gpuDynInst->wavefront()->validateRequestCounters();
39644 initMemRead<VecElemU32>(gpuDynInst);
39653 if (gpuDynInst->exec_mask[lane]) {
39654 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
39655 gpuDynInst->d_data))[lane];
39677 Wavefront *wf = gpuDynInst->wavefront();
39684 gpuDynInst->exec_mask = wf->
execMask();
39686 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
39691 gpuDynInst->exec_mask = gpuDynInst->wavefront()->execMask();
39692 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39693 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39701 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39702 gpuDynInst->computeUnit()->globalMemoryPipe
39703 .issueRequest(gpuDynInst);
39707 fatal(
"Non global flat instructions not implemented yet.\n");
39710 gpuDynInst->wavefront()->outstandingReqs++;
39711 gpuDynInst->wavefront()->validateRequestCounters();
39717 initMemRead<VecElemU64>(gpuDynInst);
39726 if (gpuDynInst->exec_mask[lane]) {
39727 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
39728 gpuDynInst->d_data))[lane];
39750 Wavefront *wf = gpuDynInst->wavefront();
39757 gpuDynInst->exec_mask = wf->
execMask();
39759 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
39764 gpuDynInst->exec_mask = wf->
execMask();
39765 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39766 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39774 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39775 gpuDynInst->computeUnit()->globalMemoryPipe
39776 .issueRequest(gpuDynInst);
39780 fatal(
"Non global flat instructions not implemented yet.\n");
39783 gpuDynInst->wavefront()->outstandingReqs++;
39784 gpuDynInst->wavefront()->validateRequestCounters();
39790 initMemRead<3>(gpuDynInst);
39801 if (gpuDynInst->exec_mask[lane]) {
39802 vdst0[lane] = (
reinterpret_cast<VecElemU32*
>(
39803 gpuDynInst->d_data))[lane * 3];
39804 vdst1[lane] = (
reinterpret_cast<VecElemU32*
>(
39805 gpuDynInst->d_data))[lane * 3 + 1];
39806 vdst2[lane] = (
reinterpret_cast<VecElemU32*
>(
39807 gpuDynInst->d_data))[lane * 3 + 2];
39832 Wavefront *wf = gpuDynInst->wavefront();
39839 gpuDynInst->exec_mask = wf->
execMask();
39841 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
39846 gpuDynInst->exec_mask = wf->
execMask();
39847 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39848 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39856 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39857 gpuDynInst->computeUnit()->globalMemoryPipe
39858 .issueRequest(gpuDynInst);
39862 fatal(
"Non global flat instructions not implemented yet.\n");
39865 gpuDynInst->wavefront()->outstandingReqs++;
39866 gpuDynInst->wavefront()->validateRequestCounters();
39872 initMemRead<4>(gpuDynInst);
39884 if (gpuDynInst->exec_mask[lane]) {
39885 vdst0[lane] = (
reinterpret_cast<VecElemU32*
>(
39886 gpuDynInst->d_data))[lane * 4];
39887 vdst1[lane] = (
reinterpret_cast<VecElemU32*
>(
39888 gpuDynInst->d_data))[lane * 4 + 1];
39889 vdst2[lane] = (
reinterpret_cast<VecElemU32*
>(
39890 gpuDynInst->d_data))[lane * 4 + 2];
39891 vdst3[lane] = (
reinterpret_cast<VecElemU32*
>(
39892 gpuDynInst->d_data))[lane * 4 + 3];
39917 Wavefront *wf = gpuDynInst->wavefront();
39928 gpuDynInst->exec_mask = wf->
execMask();
39929 gpuDynInst->latency.init(gpuDynInst->computeUnit());
39930 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
39938 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
39939 gpuDynInst->computeUnit()->globalMemoryPipe
39940 .issueRequest(gpuDynInst);
39944 fatal(
"Non global flat instructions not implemented yet.\n");
39947 gpuDynInst->wavefront()->outstandingReqs++;
39948 gpuDynInst->wavefront()->validateRequestCounters();
39958 if (gpuDynInst->exec_mask[lane]) {
39959 (
reinterpret_cast<VecElemU8*
>(gpuDynInst->d_data))[lane]
39964 initMemWrite<VecElemU8>(gpuDynInst);
39987 Wavefront *wf = gpuDynInst->wavefront();
39998 gpuDynInst->exec_mask = wf->
execMask();
39999 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40000 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40008 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40009 gpuDynInst->computeUnit()->globalMemoryPipe
40010 .issueRequest(gpuDynInst);
40014 fatal(
"Non global flat instructions not implemented yet.\n");
40017 gpuDynInst->wavefront()->outstandingReqs++;
40018 gpuDynInst->wavefront()->validateRequestCounters();
40029 if (gpuDynInst->exec_mask[lane]) {
40030 (
reinterpret_cast<VecElemU16*
>(gpuDynInst->d_data))[lane]
40035 initMemWrite<VecElemU16>(gpuDynInst);
40058 Wavefront *wf = gpuDynInst->wavefront();
40069 gpuDynInst->exec_mask = wf->
execMask();
40070 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40071 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40079 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40080 gpuDynInst->computeUnit()->globalMemoryPipe
40081 .issueRequest(gpuDynInst);
40085 fatal(
"Non global flat instructions not implemented yet.\n");
40088 gpuDynInst->wavefront()->outstandingReqs++;
40089 gpuDynInst->wavefront()->validateRequestCounters();
40099 if (gpuDynInst->exec_mask[lane]) {
40100 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->d_data))[lane]
40105 initMemWrite<VecElemU32>(gpuDynInst);
40115 :
Inst_FLAT(iFmt,
"flat_store_dwordx2")
40129 Wavefront *wf = gpuDynInst->wavefront();
40140 gpuDynInst->exec_mask = wf->
execMask();
40141 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40142 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40150 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40151 gpuDynInst->computeUnit()->globalMemoryPipe
40152 .issueRequest(gpuDynInst);
40156 fatal(
"Non global flat instructions not implemented yet.\n");
40170 if (gpuDynInst->exec_mask[lane]) {
40171 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->d_data))[lane]
40176 initMemWrite<VecElemU64>(gpuDynInst);
40186 :
Inst_FLAT(iFmt,
"flat_store_dwordx3")
40200 Wavefront *wf = gpuDynInst->wavefront();
40211 gpuDynInst->exec_mask = wf->
execMask();
40212 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40213 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40221 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40222 gpuDynInst->computeUnit()->globalMemoryPipe
40223 .issueRequest(gpuDynInst);
40227 fatal(
"Non global flat instructions not implemented yet.\n");
40230 gpuDynInst->wavefront()->outstandingReqs++;
40231 gpuDynInst->wavefront()->validateRequestCounters();
40246 if (gpuDynInst->exec_mask[lane]) {
40248 gpuDynInst->d_data))[lane * 3] = data0[lane];
40250 gpuDynInst->d_data))[lane * 3 + 1] = data1[lane];
40252 gpuDynInst->d_data))[lane * 3 + 2] = data2[lane];
40256 initMemWrite<3>(gpuDynInst);
40266 :
Inst_FLAT(iFmt,
"flat_store_dwordx4")
40280 Wavefront *wf = gpuDynInst->wavefront();
40291 gpuDynInst->exec_mask = wf->
execMask();
40292 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40293 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40301 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40302 gpuDynInst->computeUnit()->globalMemoryPipe
40303 .issueRequest(gpuDynInst);
40307 fatal(
"Non global flat instructions not implemented yet.\n");
40310 gpuDynInst->wavefront()->outstandingReqs++;
40311 gpuDynInst->wavefront()->validateRequestCounters();
40328 if (gpuDynInst->exec_mask[lane]) {
40330 gpuDynInst->d_data))[lane * 4] = data0[lane];
40332 gpuDynInst->d_data))[lane * 4 + 1] = data1[lane];
40334 gpuDynInst->d_data))[lane * 4 + 2] = data2[lane];
40336 gpuDynInst->d_data))[lane * 4 + 3] = data3[lane];
40340 initMemWrite<4>(gpuDynInst);
40370 Wavefront *wf = gpuDynInst->wavefront();
40380 gpuDynInst->exec_mask = wf->
execMask();
40382 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
40388 gpuDynInst->exec_mask = wf->
execMask();
40389 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40390 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40398 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL ||
40399 gpuDynInst->executedAs() == Enums::SC_PRIVATE) {
40401 panic_if(gpuDynInst->executedAs() == Enums::SC_PRIVATE,
40402 "Flats to private aperture not tested yet\n");
40403 gpuDynInst->computeUnit()->globalMemoryPipe.
40404 issueRequest(gpuDynInst);
40410 fatal(
"Non global flat instructions not implemented yet.\n");
40413 gpuDynInst->wavefront()->outstandingReqs++;
40414 gpuDynInst->wavefront()->validateRequestCounters();
40421 if (gpuDynInst->exec_mask[lane]) {
40422 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->a_data))[lane]
40432 initAtomicAccess<VecElemU32>(gpuDynInst);
40442 if (gpuDynInst->exec_mask[lane]) {
40443 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
40444 gpuDynInst->d_data))[lane];
40456 :
Inst_FLAT(iFmt,
"flat_atomic_cmpswap")
40458 setFlag(AtomicCAS);
40459 if (instData.GLC) {
40460 setFlag(AtomicReturn);
40462 setFlag(AtomicNoReturn);
40464 setFlag(MemoryRef);
40479 Wavefront *wf = gpuDynInst->wavefront();
40489 gpuDynInst->exec_mask = wf->
execMask();
40491 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
40497 gpuDynInst->exec_mask = wf->
execMask();
40498 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40499 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40512 if (gpuDynInst->exec_mask[lane]) {
40513 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->x_data))[lane]
40515 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->a_data))[lane]
40520 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL ||
40521 gpuDynInst->executedAs() == Enums::SC_PRIVATE) {
40528 panic_if(gpuDynInst->executedAs() == Enums::SC_PRIVATE,
40529 "Flats to private aperture not tested yet\n");
40530 gpuDynInst->computeUnit()->globalMemoryPipe.
40531 issueRequest(gpuDynInst);
40537 fatal(
"Non global flat instructions not implemented yet.\n");
40540 gpuDynInst->wavefront()->outstandingReqs++;
40541 gpuDynInst->wavefront()->validateRequestCounters();
40547 initAtomicAccess<VecElemU32>(gpuDynInst);
40557 if (gpuDynInst->exec_mask[lane]) {
40558 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
40559 gpuDynInst->d_data))[lane];
40589 Wavefront *wf = gpuDynInst->wavefront();
40599 gpuDynInst->exec_mask = wf->
execMask();
40601 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
40607 gpuDynInst->exec_mask = wf->
execMask();
40608 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40609 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40620 if (gpuDynInst->exec_mask[lane]) {
40621 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->a_data))[lane]
40626 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40627 gpuDynInst->computeUnit()->globalMemoryPipe.
40628 issueRequest(gpuDynInst);
40634 fatal(
"Non global flat instructions not implemented yet.\n");
40637 gpuDynInst->wavefront()->outstandingReqs++;
40638 gpuDynInst->wavefront()->validateRequestCounters();
40644 initAtomicAccess<VecElemU32>(gpuDynInst);
40654 if (gpuDynInst->exec_mask[lane]) {
40655 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
40656 gpuDynInst->d_data))[lane];
40686 Wavefront *wf = gpuDynInst->wavefront();
40696 gpuDynInst->exec_mask = wf->
execMask();
40698 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
40704 gpuDynInst->exec_mask = wf->
execMask();
40705 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40706 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40717 if (gpuDynInst->exec_mask[lane]) {
40718 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->a_data))[lane]
40723 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40724 gpuDynInst->computeUnit()->globalMemoryPipe.
40725 issueRequest(gpuDynInst);
40731 fatal(
"Non global flat instructions not implemented yet.\n");
40734 gpuDynInst->wavefront()->outstandingReqs++;
40735 gpuDynInst->wavefront()->validateRequestCounters();
40740 initAtomicAccess<VecElemU32>(gpuDynInst);
40750 if (gpuDynInst->exec_mask[lane]) {
40751 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
40752 gpuDynInst->d_data))[lane];
40957 Wavefront *wf = gpuDynInst->wavefront();
40967 gpuDynInst->exec_mask = wf->
execMask();
40969 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
40975 gpuDynInst->exec_mask = wf->
execMask();
40976 gpuDynInst->latency.init(gpuDynInst->computeUnit());
40977 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
40988 if (gpuDynInst->exec_mask[lane]) {
40989 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->a_data))[lane]
40994 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
40995 gpuDynInst->computeUnit()->globalMemoryPipe.
40996 issueRequest(gpuDynInst);
41002 fatal(
"Non global flat instructions not implemented yet.\n");
41005 gpuDynInst->wavefront()->outstandingReqs++;
41006 gpuDynInst->wavefront()->validateRequestCounters();
41012 initAtomicAccess<VecElemU32>(gpuDynInst);
41022 if (gpuDynInst->exec_mask[lane]) {
41023 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
41024 gpuDynInst->d_data))[lane];
41054 Wavefront *wf = gpuDynInst->wavefront();
41064 gpuDynInst->exec_mask = wf->
execMask();
41066 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
41072 gpuDynInst->exec_mask = wf->
execMask();
41073 gpuDynInst->latency.init(gpuDynInst->computeUnit());
41074 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
41085 if (gpuDynInst->exec_mask[lane]) {
41086 (
reinterpret_cast<VecElemU32*
>(gpuDynInst->a_data))[lane]
41091 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
41092 gpuDynInst->computeUnit()->globalMemoryPipe.
41093 issueRequest(gpuDynInst);
41099 fatal(
"Non global flat instructions not implemented yet.\n");
41102 gpuDynInst->wavefront()->outstandingReqs++;
41103 gpuDynInst->wavefront()->validateRequestCounters();
41109 initAtomicAccess<VecElemU32>(gpuDynInst);
41119 if (gpuDynInst->exec_mask[lane]) {
41120 vdst[lane] = (
reinterpret_cast<VecElemU32*
>(
41121 gpuDynInst->d_data))[lane];
41131 :
Inst_FLAT(iFmt,
"flat_atomic_swap_x2")
41157 :
Inst_FLAT(iFmt,
"flat_atomic_cmpswap_x2")
41180 Wavefront *wf = gpuDynInst->wavefront();
41190 gpuDynInst->exec_mask = wf->
execMask();
41192 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
41198 gpuDynInst->exec_mask = wf->
execMask();
41199 gpuDynInst->latency.init(gpuDynInst->computeUnit());
41200 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
41213 if (gpuDynInst->exec_mask[lane]) {
41214 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->x_data))[lane]
41216 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->a_data))[lane]
41221 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL ||
41222 gpuDynInst->executedAs() == Enums::SC_PRIVATE) {
41229 panic_if(gpuDynInst->executedAs() == Enums::SC_PRIVATE,
41230 "Flats to private aperture not tested yet\n");
41231 gpuDynInst->computeUnit()->globalMemoryPipe.
41232 issueRequest(gpuDynInst);
41238 fatal(
"Non global flat instructions not implemented yet.\n");
41241 gpuDynInst->wavefront()->outstandingReqs++;
41242 gpuDynInst->wavefront()->validateRequestCounters();
41248 initAtomicAccess<VecElemU64>(gpuDynInst);
41258 if (gpuDynInst->exec_mask[lane]) {
41259 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
41260 gpuDynInst->d_data))[lane];
41270 :
Inst_FLAT(iFmt,
"flat_atomic_add_x2")
41291 Wavefront *wf = gpuDynInst->wavefront();
41301 gpuDynInst->exec_mask = wf->
execMask();
41303 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
41309 gpuDynInst->exec_mask = wf->
execMask();
41310 gpuDynInst->latency.init(gpuDynInst->computeUnit());
41311 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
41322 if (gpuDynInst->exec_mask[lane]) {
41323 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->a_data))[lane]
41328 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
41329 gpuDynInst->computeUnit()->globalMemoryPipe.
41330 issueRequest(gpuDynInst);
41336 fatal(
"Non global flat instructions not implemented yet.\n");
41339 gpuDynInst->wavefront()->outstandingReqs++;
41340 gpuDynInst->wavefront()->validateRequestCounters();
41346 initAtomicAccess<VecElemU64>(gpuDynInst);
41357 if (gpuDynInst->exec_mask[lane]) {
41358 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
41359 gpuDynInst->d_data))[lane];
41369 :
Inst_FLAT(iFmt,
"flat_atomic_sub_x2")
41390 Wavefront *wf = gpuDynInst->wavefront();
41400 gpuDynInst->exec_mask = wf->
execMask();
41402 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
41408 gpuDynInst->exec_mask = wf->
execMask();
41409 gpuDynInst->latency.init(gpuDynInst->computeUnit());
41410 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
41421 if (gpuDynInst->exec_mask[lane]) {
41422 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->a_data))[lane]
41427 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
41428 gpuDynInst->computeUnit()->globalMemoryPipe.
41429 issueRequest(gpuDynInst);
41435 fatal(
"Non global flat instructions not implemented yet.\n");
41438 gpuDynInst->wavefront()->outstandingReqs++;
41439 gpuDynInst->wavefront()->validateRequestCounters();
41445 initAtomicAccess<VecElemU64>(gpuDynInst);
41456 if (gpuDynInst->exec_mask[lane]) {
41457 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
41458 gpuDynInst->d_data))[lane];
41468 :
Inst_FLAT(iFmt,
"flat_atomic_smin_x2")
41494 :
Inst_FLAT(iFmt,
"flat_atomic_umin_x2")
41520 :
Inst_FLAT(iFmt,
"flat_atomic_smax_x2")
41546 :
Inst_FLAT(iFmt,
"flat_atomic_umax_x2")
41572 :
Inst_FLAT(iFmt,
"flat_atomic_and_x2")
41624 :
Inst_FLAT(iFmt,
"flat_atomic_xor_x2")
41650 :
Inst_FLAT(iFmt,
"flat_atomic_inc_x2")
41671 Wavefront *wf = gpuDynInst->wavefront();
41681 gpuDynInst->exec_mask = wf->
execMask();
41683 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
41689 gpuDynInst->exec_mask = wf->
execMask();
41690 gpuDynInst->latency.init(gpuDynInst->computeUnit());
41691 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
41702 if (gpuDynInst->exec_mask[lane]) {
41703 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->a_data))[lane]
41708 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
41709 gpuDynInst->computeUnit()->globalMemoryPipe.
41710 issueRequest(gpuDynInst);
41716 fatal(
"Non global flat instructions not implemented yet.\n");
41719 gpuDynInst->wavefront()->outstandingReqs++;
41720 gpuDynInst->wavefront()->validateRequestCounters();
41726 initAtomicAccess<VecElemU64>(gpuDynInst);
41737 if (gpuDynInst->exec_mask[lane]) {
41738 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
41739 gpuDynInst->d_data))[lane];
41749 :
Inst_FLAT(iFmt,
"flat_atomic_dec_x2")
41771 Wavefront *wf = gpuDynInst->wavefront();
41781 gpuDynInst->exec_mask = wf->
execMask();
41783 scheduleWriteOperandsFromLoad(wf, gpuDynInst);
41789 gpuDynInst->exec_mask = wf->
execMask();
41790 gpuDynInst->latency.init(gpuDynInst->computeUnit());
41791 gpuDynInst->latency.set(gpuDynInst->computeUnit()->clockPeriod());
41802 if (gpuDynInst->exec_mask[lane]) {
41803 (
reinterpret_cast<VecElemU64*
>(gpuDynInst->a_data))[lane]
41808 if (gpuDynInst->executedAs() == Enums::SC_GLOBAL) {
41809 gpuDynInst->computeUnit()->globalMemoryPipe.
41810 issueRequest(gpuDynInst);
41816 fatal(
"Non global flat instructions not implemented yet.\n");
41819 gpuDynInst->wavefront()->outstandingReqs++;
41820 gpuDynInst->wavefront()->validateRequestCounters();
41826 initAtomicAccess<VecElemU64>(gpuDynInst);
41837 if (gpuDynInst->exec_mask[lane]) {
41838 vdst[lane] = (
reinterpret_cast<VecElemU64*
>(
41839 gpuDynInst->d_data))[lane];
~Inst_MIMG__IMAGE_SAMPLE_CD_CL()
Inst_VOP3__V_RCP_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_NGT_F32()
Inst_VOPC__V_CMP_LT_U16(InFmt_VOPC *)
Inst_SOPP__S_CBRANCH_CDBGSYS(InFmt_SOPP *)
Inst_DS__DS_OR_SRC2_B64(InFmt_DS *)
Inst_VOPC__V_CMP_LG_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_SOPK__S_CMPK_GE_I32()
Inst_DS__DS_XOR_RTN_B32(InFmt_DS *)
Inst_DS__DS_MIN_F64(InFmt_DS *)
~Inst_VOP3__V_CMP_O_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_F_F32()
~Inst_VOP3__V_CMP_GE_U32()
~Inst_MIMG__IMAGE_GATHER4_O()
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRITE_B128(InFmt_DS *)
~Inst_DS__DS_WRITE2_B32()
Inst_FLAT__FLAT_ATOMIC_ADD_X2(InFmt_FLAT *)
Inst_VOP2__V_MIN_F32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LT_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_RTN_I64(InFmt_DS *)
~Inst_VOPC__V_CMP_EQ_F16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MUL_F32(InFmt_VOP3 *)
Inst_VOP2__V_ADD_U32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_GE_I32()
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_SRC2_I64(InFmt_DS *)
~Inst_VOP3__V_RCP_IFLAG_F32()
#define fatal(...)
This implements a cprintf based fatal() function.
~Inst_VOPC__V_CMPX_F_F16()
Inst_VOP3__V_CVT_F32_F16(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_F_I32(InFmt_VOP3 *)
Inst_VOP3__V_SUBREV_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_F_U64(InFmt_VOPC *)
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LT_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP2__V_MADMK_F32()
Inst_VOP3__V_TRUNC_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_READ_B128(InFmt_DS *)
Inst_VOP3__V_ALIGNBYTE_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_F16(InFmt_VOP3 *)
~Inst_VOP3__V_DIV_FIXUP_F64()
~Inst_VINTRP__V_INTERP_P1_F32()
~Inst_VOP3__V_CVT_PK_U16_U32()
Inst_VOPC__V_CMP_F_U16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_FREXP_EXP_I32_F64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MUL_LO_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_LOAD_DWORDX3()
void execute(GPUDynInstPtr) override
void calcAddr(GPUDynInstPtr gpu_dyn_inst, ConstScalarOperandU64 &addr, ScalarRegU32 offset)
For normal s_load_dword/s_store_dword instruction addresses.
Inst_VOP3__V_CMP_F_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_B_CL_O()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP2__V_MIN_U32(InFmt_VOP2 *)
Inst_DS__DS_AND_RTN_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_GT_U32(InFmt_VOP3 *)
Inst_VOPC__V_CMP_NLE_F16(InFmt_VOPC *)
~Inst_SOPK__S_CMPK_LT_U32()
Inst_VOPC__V_CMP_NLE_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LE_F16(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_LG_F16()
Inst_MIMG__IMAGE_SAMPLE_CL(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_T_U16(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_ADD_F16(InFmt_VOP2 *)
Inst_EXP__EXP(InFmt_EXP *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_XOR_RTN_B64()
~Inst_SMEM__S_STORE_DWORDX2()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_BITSET1_B32(InFmt_SOP1 *)
~Inst_VOPC__V_CMPX_GE_I16()
Inst_SOP1__S_SET_GPR_IDX_IDX(InFmt_SOP1 *)
Inst_SOP2__S_MIN_U32(InFmt_SOP2 *)
const int NumVecElemPerVecReg(64)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_C_CL_O()
void execute(GPUDynInstPtr) override
ScalarOperand< ScalarRegU32, true, 4 > ConstScalarOperandU128
Inst_VOP3__V_CMPX_NLE_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NE_U16()
Inst_VOP3__V_CMPX_GT_I32(InFmt_VOP3 *)
Inst_VOP3__V_WRITELANE_B32(InFmt_VOP3 *)
Inst_VOP1__V_SIN_F16(InFmt_VOP1 *)
Inst_VOPC__V_CMP_LE_F16(InFmt_VOPC *)
Inst_DS__DS_MIN_I32(InFmt_DS *)
Inst_MIMG__IMAGE_SAMPLE(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NEQ_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
std::enable_if< Condition, DataType >::type rawData() const
we store scalar data in a std::array, however if we need the full operand data we use this method to ...
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_TRU_F32(InFmt_VOPC *)
~Inst_FLAT__FLAT_ATOMIC_OR_X2()
Inst_VOP3__V_CVT_U32_F32(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_LE_U32()
Inst_VOPC__V_CMP_F_F32(InFmt_VOPC *)
Inst_VOP3__V_MUL_LO_U16(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_NE_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_DEC_X2()
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_LG_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CVT_PKNORM_I16_F32()
Inst_MIMG__IMAGE_GATHER4_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_NGE_F64(InFmt_VOPC *)
Inst_FLAT__FLAT_ATOMIC_UMIN(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
~Inst_SMEM__S_LOAD_DWORDX4()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_T_I16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_RSUB_SRC2_U64(InFmt_DS *)
~Inst_VOP3__V_CMP_GT_U32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_LZ_O()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_EQ_F64(InFmt_VOPC *)
Inst_VOP3__V_CMP_GT_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NGE_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_SOPP__S_CBRANCH_CDBGSYS_AND_USER(InFmt_SOPP *)
~Inst_VOP3__V_BFREV_B32()
Inst_VOP3__V_CMP_O_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_NLT_F32()
Inst_FLAT__FLAT_ATOMIC_UMAX_X2(InFmt_FLAT *)
void completeAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GT_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_CSELECT_B64(InFmt_SOP2 *)
~Inst_VOPC__V_CMP_LT_I64()
~Inst_MIMG__IMAGE_ATOMIC_SMIN()
~Inst_VOP3__V_CMP_LG_F64()
Inst_VOPC__V_CMP_EQ_U16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_GT_I16(InFmt_VOPC *)
Inst_VOP3__V_RCP_F16(InFmt_VOP3 *)
void panicUnimplemented() const
void execute(GPUDynInstPtr) override
Inst_VOP3__V_NOT_B32(InFmt_VOP3 *)
~Inst_MIMG__IMAGE_GATHER4_C_LZ_O()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_SMIN_X2()
Inst_MUBUF__BUFFER_ATOMIC_OR(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NE_I64(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_GT_I64()
~Inst_VOP3__V_BCNT_U32_B32()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NGT_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_F32(InFmt_DS *)
void execute(GPUDynInstPtr) override
#define LL(N)
int64_t constant
~Inst_VOP1__V_RNDNE_F64()
~Inst_SOP1__S_BITSET0_B64()
Inst_VOPC__V_CMPX_GT_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_T_U64()
void execute(GPUDynInstPtr) override
Inst_SOPP__S_CBRANCH_VCCNZ(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_F_I64()
Inst_VINTRP__V_INTERP_MOV_F32(InFmt_VINTRP *)
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_SEXT_I32_I8()
~Inst_DS__DS_MAX_RTN_F32()
Inst_VOPC__V_CMPX_GE_U32(InFmt_VOPC *)
Inst_VOP1__V_CVT_F64_U32(InFmt_VOP1 *)
void initiateAcc(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_DS__DS_SUB_RTN_U64()
Inst_VOP2__V_MIN_I32(InFmt_VOP2 *)
Inst_SOPC__S_BITCMP0_B64(InFmt_SOPC *)
~Inst_VOPC__V_CMPX_NLT_F16()
~Inst_SOPC__S_CMP_LE_I32()
~Inst_VOP3__V_DIV_SCALE_F64()
Inst_MUBUF__BUFFER_STORE_SHORT(InFmt_MUBUF *)
~Inst_VOP3__V_ASHRREV_I32()
~Inst_VOP3__V_CMP_LE_U16()
Inst_SOPK__S_CMPK_GE_I32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_BCNT0_I32_B32()
Inst_VOP2__V_SUBB_U32(InFmt_VOP2 *)
~Inst_MIMG__IMAGE_GET_RESINFO()
~Inst_FLAT__FLAT_ATOMIC_UMIN()
Inst_SOP2__S_SUB_I32(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_CL()
Inst_SMEM__S_BUFFER_STORE_DWORDX2(InFmt_SMEM *)
void initiateAcc(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_INC()
Inst_VOP3__V_CMP_LE_U64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_F16_U16(InFmt_VOP3 *)
Inst_VOP3__V_CMP_NLG_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_T_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_INTERP_P2_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAD_U64_U32(InFmt_VOP3_SDST_ENC *)
void initiateAcc(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_DS__DS_MAX_RTN_U64(InFmt_DS *)
Inst_VOP2__V_MIN_I16(InFmt_VOP2 *)
Inst_VOP3__V_CMPX_LT_U16(InFmt_VOP3 *)
Inst_VOP3__V_MAD_I64_I32(InFmt_VOP3_SDST_ENC *)
Inst_VOP3__V_CMPX_CLASS_F16(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_LG_F32(InFmt_VOP3 *)
Inst_MIMG__IMAGE_SAMPLE_C_CL(InFmt_MIMG *)
~Inst_VOPC__V_CMP_GE_F32()
Inst_SOP1__S_SWAPPC_B64(InFmt_SOP1 *)
Inst_VOPC__V_CMPX_NE_U64(InFmt_VOPC *)
Inst_SOP2__S_MIN_I32(InFmt_SOP2 *)
~Inst_VOPC__V_CMP_GE_U64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_ASHRREV_I64()
~Inst_VOP3__V_CMP_LT_I32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SMEM__S_LOAD_DWORDX2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LT_F64(InFmt_VOP3 *)
~Inst_DS__DS_DEC_RTN_U64()
~Inst_DS__DS_MIN_RTN_F32()
~Inst_VOPC__V_CMPX_LT_U64()
Inst_DS__DS_RSUB_RTN_U32(InFmt_DS *)
~Inst_VOPC__V_CMP_GT_I32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_LOAD_DWORDX4(InFmt_FLAT *)
Inst_VOP3__V_CMPX_TRU_F16(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LT_U32(InFmt_VOPC *)
~Inst_VOPC__V_CMP_GE_U16()
~Inst_VOPC__V_CMP_F_F32()
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_F_I32()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LG_F32()
Inst_DS__DS_MIN_U32(InFmt_DS *)
~Inst_MUBUF__BUFFER_ATOMIC_SMAX()
~Inst_VOPC__V_CMP_LE_I32()
Inst_SOP1__S_WQM_B32(InFmt_SOP1 *)
Inst_VOP3__V_LSHLREV_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOPK__S_CMPK_LE_I32()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_CD_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_CLASS_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_SUB_U16(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_TRU_F64(InFmt_VOP3 *)
~Inst_MUBUF__BUFFER_STORE_DWORDX3()
Inst_VOP3__V_MAX_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GT_U64()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_LZ()
void execute(GPUDynInstPtr) override
Inst_DS__DS_XOR_RTN_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NLG_F64()
Inst_SOP2__S_LSHR_B64(InFmt_SOP2 *)
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_EQ_I16()
Inst_VOP3__V_INTERP_P1_F32(InFmt_VOP3 *)
Inst_SOP2__S_LSHL_B32(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_XOR_B32(InFmt_SOP2 *)
Inst_VOP3__V_ADD_U16(InFmt_VOP3 *)
~Inst_VOP1__V_CVT_F64_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_CL_O()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_MOVRELD_B64(InFmt_SOP1 *)
Inst_SOP1__S_QUADMASK_B64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LE_F64()
void initiateAcc(GPUDynInstPtr) override
~Inst_SOPC__S_BITCMP1_B32()
~Inst_VOP1__V_CVT_F64_I32()
Inst_MIMG__IMAGE_SAMPLE_C_B_CL(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_ATOMIC_UMIN(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP2__V_CNDMASK_B32(InFmt_VOP2 *)
~Inst_VOP3__V_CMPX_F_U64()
Inst_VOP1__V_CVT_F16_U16(InFmt_VOP1 *)
Inst_DS__DS_MAX_I64(InFmt_DS *)
T median(T val_0, T val_1, T val_2)
Inst_SOPC__S_BITCMP1_B64(InFmt_SOPC *)
Inst_VOP3__V_MAX_I32(InFmt_VOP3 *)
Inst_DS__DS_INC_SRC2_U64(InFmt_DS *)
Inst_VOPC__V_CMP_NLG_F64(InFmt_VOPC *)
~Inst_VOP3__V_CMPX_LT_F32()
Inst_VOPC__V_CMPX_GT_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GE_F16()
Inst_VOP3__V_INTERP_P1LV_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_FREXP_EXP_I32_F32()
void initiateAcc(GPUDynInstPtr) override
~Inst_SOP1__S_MOVRELD_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_F_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_DIV_FMAS_F64()
~Inst_FLAT__FLAT_ATOMIC_SMAX()
Inst_VOP2__V_MUL_LEGACY_F32(InFmt_VOP2 *)
~Inst_VOP3__V_CMPX_GE_I16()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_MOV_FED_B32()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
std::vector< int > vecReads
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_BFE_U32(InFmt_VOP3 *)
Inst_DS__DS_READ_U8(InFmt_DS *)
~Inst_VOP3__V_CMPX_T_U16()
~Inst_FLAT__FLAT_LOAD_USHORT()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_EQ_U32()
void execute(GPUDynInstPtr) override
Inst_SOPP__S_SET_GPR_IDX_MODE(InFmt_SOPP *)
Inst_DS__DS_SUB_U32(InFmt_DS *)
Inst_VOP3__V_CMP_TRU_F16(InFmt_VOP3 *)
Inst_VOPC__V_CMP_LE_U16(InFmt_VOPC *)
Inst_SOP2__S_NAND_B32(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_B_O()
void execute(GPUDynInstPtr) override
Inst_SOPC__S_CMP_GE_I32(InFmt_SOPC *)
~Inst_VOPC__V_CMPX_CLASS_F16()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_EQ_I64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_T_I16()
Inst_VOPC__V_CMPX_TRU_F32(InFmt_VOPC *)
Inst_VOP3__V_CMPX_LT_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NLG_F32()
Inst_VOP2__V_SUB_F32(InFmt_VOP2 *)
~Inst_VOP2__V_MADMK_F16()
Inst_VOPC__V_CMP_LE_F64(InFmt_VOPC *)
Inst_SOP1__S_BCNT0_I32_B64(InFmt_SOP1 *)
~Inst_VOP3__V_CMPX_LT_U32()
~Inst_MIMG__IMAGE_SAMPLE_D_CL()
~Inst_VOP3__V_INTERP_P1LL_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GT_I16()
Inst_VOPC__V_CMP_NGE_F32(InFmt_VOPC *)
Inst_MUBUF__BUFFER_ATOMIC_ADD(InFmt_MUBUF *)
~Inst_VOP3__V_CMPX_NEQ_F32()
~Inst_VOP1__V_CVT_F16_U16()
~Inst_VOP3__V_INTERP_P2_F32()
~Inst_VOP1__V_CVT_F16_F32()
void execute(GPUDynInstPtr) override
Inst_DS__DS_ADD_SRC2_U64(InFmt_DS *)
Inst_VOPC__V_CMP_GE_I16(InFmt_VOPC *)
Inst_DS__DS_WRITE2_B64(InFmt_DS *)
~Inst_VOP3__V_CVT_F16_F32()
~Inst_VOP3__V_CVT_F32_I32()
Stats::Scalar completedWGs
~Inst_VOPC__V_CMP_U_F16()
~Inst_VOPC__V_CMP_NLE_F16()
~Inst_MUBUF__BUFFER_WBINVL1_VOL()
Inst_VOP3__V_CVT_I16_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CVT_F32_I32(InFmt_VOP1 *)
~Inst_VOP2__V_MUL_LO_U16()
~Inst_VOPC__V_CMPX_NGE_F32()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NE_U16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAX_I16(InFmt_VOP3 *)
Inst_SOP1__S_WQM_B64(InFmt_SOP1 *)
Inst_DS__DS_SUB_RTN_U32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LE_U32(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_LG_F64()
~Inst_SOP1__S_FF0_I32_B64()
Inst_SOPC__S_CMP_LE_I32(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_T_U32()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NLT_F32()
void execute(GPUDynInstPtr) override
Inst_SOPP__S_SETPRIO(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_ATOMIC_OR(InFmt_MIMG *)
Inst_VOPC__V_CMP_EQ_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_READ_B96(InFmt_DS *)
~Inst_VOP2__V_MUL_HI_U32_U24()
~Inst_VOP3__V_CMP_GE_F64()
Inst_VOP3__V_CMPX_NE_I32(InFmt_VOP3 *)
~Inst_VOP1__V_CVT_I32_F64()
Inst_MUBUF__BUFFER_ATOMIC_DEC_X2(InFmt_MUBUF *)
void incNumAtBarrier(int bar_id)
void execute(GPUDynInstPtr) override
Inst_DS__DS_XOR_SRC2_B32(InFmt_DS *)
Inst_VOPC__V_CMPX_GE_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_C_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_CMPST_B32(InFmt_DS *)
~Inst_VOPC__V_CMP_EQ_U16()
Inst_FLAT__FLAT_ATOMIC_INC(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_DEC_SRC2_U32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LE_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LG_F64()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_FF1_I32_B32(InFmt_SOP1 *)
~Inst_VOP3__V_CMPX_NLE_F32()
Inst_MUBUF__BUFFER_ATOMIC_AND(InFmt_MUBUF *)
Inst_FLAT__FLAT_STORE_DWORDX4(InFmt_FLAT *)
~Inst_DS__DS_MIN_SRC2_F64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_ASHRREV_I32(InFmt_VOP3 *)
Inst_VOP3__V_CMP_NEQ_F32(InFmt_VOP3 *)
~Inst_VOP1__V_LOG_LEGACY_F32()
~Inst_FLAT__FLAT_ATOMIC_SMIN()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GT_U32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_LOAD_DWORD()
~Inst_VOP3__V_MUL_HI_I32()
Inst_SOP1__S_ORN2_SAVEEXEC_B64(InFmt_SOP1 *)
void completeAcc(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_UMAX(InFmt_FLAT *)
Inst_VOPC__V_CMP_U_F16(InFmt_VOPC *)
Inst_MIMG__IMAGE_GATHER4_C_B(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CUBEID_F32()
Inst_VOP3__V_MUL_U32_U24(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_SUBREV_U32(InFmt_VOP3_SDST_ENC *)
Inst_VOP3__V_CMPX_LT_I64(InFmt_VOP3 *)
Inst_MIMG__IMAGE_STORE_MIP(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_VOP2__V_SUBREV_F32()
~Inst_SOP1__S_NOR_SAVEEXEC_B64()
~Inst_SOP1__S_FF1_I32_B64()
Inst_DS__DS_MAX_U32(InFmt_DS *)
~Inst_DS__DS_WRXCHG_RTN_B64()
Inst_VOP3__V_LSHRREV_B16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_U16_F16(InFmt_VOP3 *)
Inst_VOP3__V_CMP_LT_U64(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_LOAD_DWORDX2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_LT_F16()
~Inst_VOP3__V_CMP_LE_U64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_GE_F16()
~Inst_VOPC__V_CMPX_LT_U16()
Inst_DS__DS_READ_I8(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_XOR_RTN_B32()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_O_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_BITSET1_B32()
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_SUBBREV_U32(InFmt_VOP3_SDST_ENC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_RTN_F64(InFmt_DS *)
Inst_VOP3__V_CLREXCP(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_CD_CL_O()
Inst_VOPC__V_CMP_GT_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_ENDPGM_SAVED()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_FLBIT_I32()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_F_U64()
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_STORE_DWORD()
Inst_DS__DS_AND_RTN_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_SOPP__S_ENDPGM_SAVED(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GT_I32(InFmt_VOPC *)
Inst_DS__DS_READ_U16(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_EQ_F64()
~Inst_VOP3__V_CMPX_O_F32()
Inst_VOP3__V_CMPX_LE_F32(InFmt_VOP3 *)
~Inst_MIMG__IMAGE_GATHER4_C_B_CL()
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MADMK_F32(InFmt_VOP2 *)
~Inst_FLAT__FLAT_ATOMIC_AND_X2()
Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP_X2(InFmt_MUBUF *)
~Inst_SOP1__S_QUADMASK_B32()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4()
Inst_VOP2__V_MAX_I16(InFmt_VOP2 *)
~Inst_VOP3__V_CMPX_O_F16()
~Inst_VOP3__V_CMP_GT_F64()
Inst_VOP3__V_SQRT_F64(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_LG_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_LSHRREV_B16(InFmt_VOP2 *)
~Inst_VOPC__V_CMP_LE_I16()
ScalarRegI32 countZeroBits(T val)
Inst_VOP3__V_CMP_CLASS_F16(InFmt_VOP3 *)
Inst_MIMG__IMAGE_SAMPLE_C_B_O(InFmt_MIMG *)
~Inst_VOP3__V_CVT_U16_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_EQ_I16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOPC__S_CMP_GT_I32()
Inst_VOPC__V_CMP_T_I16(InFmt_VOPC *)
int numYetToReachBarrier(int bar_id)
~Inst_VOP3__V_CUBETC_F32()
~Inst_VOPC__V_CMP_EQ_U32()
~Inst_VOP3__V_CMP_NE_I64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_TRU_F16()
Inst_VOPC__V_CMP_LT_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP1__V_FREXP_EXP_I32_F32(InFmt_VOP1 *)
~Inst_VOP1__V_TRUNC_F32()
~Inst_VOPC__V_CMPX_LG_F64()
Inst_SOP1__S_FLBIT_I32(InFmt_SOP1 *)
Inst_VOPC__V_CMPX_NGT_F16(InFmt_VOPC *)
~Inst_SMEM__S_ATC_PROBE()
~Inst_VOP3__V_CMP_LE_I64()
void execute(GPUDynInstPtr) override
void prepareFlush(GPUDynInstPtr gpuDynInst)
dispatcher/shader arranges flush requests to the CUs
Inst_VOP1__V_FREXP_EXP_I16_F16(InFmt_VOP1 *)
Inst_VOP3__V_CMP_NGT_F64(InFmt_VOP3 *)
Inst_SOPC__S_BITCMP1_B32(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FLOOR_F32()
Inst_MIMG__IMAGE_ATOMIC_SMIN(InFmt_MIMG *)
Inst_VINTRP__V_INTERP_P1_F32(InFmt_VINTRP *)
~Inst_MIMG__IMAGE_SAMPLE_C_B_CL_O()
~Inst_VOP3__V_CMP_F_U32()
Inst_VOP1__V_RSQ_F32(InFmt_VOP1 *)
Inst_MIMG__IMAGE_SAMPLE_B(InFmt_MIMG *)
Inst_VOP3__V_CMP_NEQ_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_ADD_SRC2_F32(InFmt_DS *)
Inst_VOP3__V_BFI_B32(InFmt_VOP3 *)
Inst_VOP3__V_PERM_B32(InFmt_VOP3 *)
Inst_VOP3__V_CMP_T_I64(InFmt_VOP3 *)
Inst_SOPK__S_CMPK_GT_I32(InFmt_SOPK *)
~Inst_VOP3__V_CMPX_U_F16()
~Inst_VOP3__V_CVT_F32_F64()
Inst_DS__DS_CONDXCHG32_RTN_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NGT_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NEQ_F16()
~Inst_VOPC__V_CMP_GE_U32()
Inst_VOP3__V_CMPX_EQ_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_SMEM__S_DCACHE_INV_VOL()
~Inst_SOP1__S_SET_GPR_IDX_IDX()
Inst_VOP3__V_QSAD_PK_U16_U8(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_T_I16(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_NE_U16(InFmt_VOPC *)
~Inst_VOP3__V_MUL_LO_U16()
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_U64(InFmt_DS *)
~Inst_VOP3__V_CVT_F16_U16()
Inst_VOPC__V_CMP_GE_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GE_U16()
~Inst_VOP1__V_BFREV_B32()
~Inst_VOPC__V_CMPX_EQ_I16()
~Inst_FLAT__FLAT_LOAD_UBYTE()
~Inst_VOP3__V_CMPX_F_F16()
Inst_MUBUF__BUFFER_ATOMIC_XOR_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_AND_B64(InFmt_DS *)
Inst_SMEM__S_STORE_DWORD(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
Inst_SOPP__S_CBRANCH_CDBGUSER(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GT_U16()
Inst_DS__DS_CMPST_F32(InFmt_DS *)
Inst_SOP2__S_RFE_RESTORE_B64(InFmt_SOP2 *)
~Inst_VOPC__V_CMP_GT_U32()
~Inst_MIMG__IMAGE_GET_LOD()
Inst_VOP3__V_CMP_GE_U16(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_EQ_I32()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_EQ_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MUL_HI_U32()
~Inst_FLAT__FLAT_ATOMIC_SWAP_X2()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_EQ_I32(InFmt_VOPC *)
Inst_VOP3__V_CMPX_TRU_F64(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_NLE_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NLG_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_LE_I64(InFmt_VOPC *)
~Inst_VOP3__V_CMPX_TRU_F64()
~Inst_VOP3__V_CMP_LE_U32()
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NE_I32()
~Inst_MUBUF__BUFFER_LOAD_DWORDX4()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void decVMemInstsIssued()
~Inst_SMEM__S_DCACHE_INV()
Inst_SOP1__S_BREV_B32(InFmt_SOP1 *)
~Inst_FLAT__FLAT_ATOMIC_UMIN_X2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_D()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_OR_SAVEEXEC_B64(InFmt_SOP1 *)
Inst_DS__DS_AND_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_RTN_I64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_T_I32(InFmt_VOP3 *)
void barrierId(int bar_id)
void completeAcc(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_LZ_O(InFmt_MIMG *)
Inst_VOP1__V_TRUNC_F64(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_GWS_SEMA_BR(InFmt_DS *)
Inst_MIMG__IMAGE_ATOMIC_SWAP(InFmt_MIMG *)
Inst_MUBUF__BUFFER_LOAD_DWORDX4(InFmt_MUBUF *)
Inst_VOP1__V_SIN_F32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MSKOR_RTN_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_VINTRP__V_INTERP_MOV_F32()
~Inst_VOP3__V_CMP_LE_I32()
Inst_SOPK__S_CMPK_LE_I32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_RSUB_RTN_U64()
~Inst_DS__DS_MIN_SRC2_U64()
ScalarRegI32 findFirstZero(T val)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_EQ_F64()
Inst_VOP3__V_CMPX_T_U32(InFmt_VOP3 *)
~Inst_VOP2__V_SUBREV_F16()
~Inst_VOPC__V_CMPX_T_I16()
Inst_SOP1__S_NOT_B32(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_MIN_RTN_U32()
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_STORE_DWORDX2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CNDMASK_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_DIV_FMAS_F32()
~Inst_FLAT__FLAT_ATOMIC_SUB_X2()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NGE_F64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MOV_B32(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_GE_F32()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_T_I32()
Inst_VOP1__V_CVT_F16_I16(InFmt_VOP1 *)
Inst_SOP2__S_ABSDIFF_I32(InFmt_SOP2 *)
Inst_VOP2__V_ASHRREV_I32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MADAK_F16(InFmt_VOP2 *)
Inst_VOP3__V_CMPX_EQ_U32(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_ATOMIC_XOR(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_XOR_X2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_C_CL(InFmt_MIMG *)
Inst_VOP1__V_CVT_F16_F32(InFmt_VOP1 *)
void completeAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_NLG_F16(InFmt_VOPC *)
~Inst_DS__DS_SUB_SRC2_U32()
Inst_VOP3__V_RSQ_F32(InFmt_VOP3 *)
Inst_VOP1__V_READFIRSTLANE_B32(InFmt_VOP1 *)
Inst_VOP3__V_CVT_I32_F32(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_NE_I16()
void execute(GPUDynInstPtr) override
~Inst_SMEM__S_ATC_PROBE_BUFFER()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_O_F32()
~Inst_VOP2__V_LSHLREV_B32()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NLT_F16()
~Inst_FLAT__FLAT_ATOMIC_ADD()
Inst_VOPC__V_CMPX_NEQ_F16(InFmt_VOPC *)
Inst_VOPC__V_CMPX_O_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_TRUNC_F64()
Inst_SOP1__S_BITSET1_B64(InFmt_SOP1 *)
Inst_VOPC__V_CMPX_GT_F32(InFmt_VOPC *)
Inst_VOP3__V_CMP_NLT_F64(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_T_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GE_I32(InFmt_VOPC *)
~Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP_X2()
Inst_VOPC__V_CMPX_LE_F64(InFmt_VOPC *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_T_I16(InFmt_VOPC *)
Inst_MIMG__IMAGE_GATHER4_C_B_O(InFmt_MIMG *)
Inst_VOP2__V_MAC_F16(InFmt_VOP2 *)
Inst_MIMG__IMAGE_SAMPLE_C_CD_CL(InFmt_MIMG *)
~Inst_MUBUF__BUFFER_STORE_BYTE()
bool isReachingKernelEnd(Wavefront *wf)
Inst_SOP2__S_ANDN2_B32(InFmt_SOP2 *)
Inst_VOP1__V_BFREV_B32(InFmt_VOP1 *)
Inst_VOP1__V_NOT_B32(InFmt_VOP1 *)
~Inst_MUBUF__BUFFER_LOAD_SSHORT()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_GE_I64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_F32_U32(InFmt_VOP3 *)
~Inst_VOP3__V_MUL_HI_U32_U24()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAD_U32_U24(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_B_O()
~Inst_VINTRP__V_INTERP_P2_F32()
~Inst_DS__DS_MIN_RTN_F64()
void initiateAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_T_U16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_FFBL_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GT_I32()
Inst_SOP1__S_MOVRELS_B32(InFmt_SOP1 *)
Inst_MIMG__IMAGE_STORE_PCK(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_GETPC_B64(InFmt_SOP1 *)
~Inst_DS__DS_READ2ST64_B32()
Inst_VOPC__V_CMPX_EQ_F32(InFmt_VOPC *)
~Inst_VOP3__V_LSHLREV_B32()
Inst_MUBUF__BUFFER_LOAD_DWORD(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_LDEXP_F16(InFmt_VOP2 *)
~Inst_MIMG__IMAGE_LOAD_MIP_PCK_SGN()
Inst_VOP3__V_READLANE_B32(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_NLT_F64(InFmt_VOPC *)
~Inst_SOPC__S_CMP_LG_U64()
void execute(GPUDynInstPtr) override
~Inst_VOP2__V_SUBREV_U16()
Inst_MIMG__IMAGE_GATHER4_B_CL_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_EQ_U16(InFmt_VOP3 *)
RegisterManager * registerManager
Inst_VOP3__V_FREXP_EXP_I32_F32(InFmt_VOP3 *)
~Inst_SMEM__S_BUFFER_LOAD_DWORDX8()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_LOAD_SSHORT(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_DEC(InFmt_FLAT *)
~Inst_VOP1__V_CVT_F64_U32()
~Inst_SOPP__S_CBRANCH_CDBGUSER()
Inst_VOP3__V_CMP_T_U32(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_LE_F64()
Inst_SOP1__S_NOR_SAVEEXEC_B64(InFmt_SOP1 *)
~Inst_VOPC__V_CMP_NEQ_F32()
~Inst_DS__DS_XOR_SRC2_B32()
~Inst_VOPC__V_CMP_CLASS_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_FRACT_F16(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_LOAD_PCK()
Inst_VOP3__V_MIN_I16(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LE_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_LE_F32()
~Inst_VOP1__V_RNDNE_F16()
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_XOR()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_EQ_U16()
Inst_VOPC__V_CMP_U_F32(InFmt_VOPC *)
Inst_VOP3__V_MIN3_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NE_U32()
Inst_DS__DS_OR_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_DEC_RTN_U32(InFmt_DS *)
Inst_VOP3__V_FREXP_EXP_I16_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPP__S_SETHALT(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_L_O(InFmt_MIMG *)
Inst_VOP2__V_MAX_U16(InFmt_VOP2 *)
~Inst_DS__DS_MAX_RTN_U32()
Inst_MIMG__IMAGE_GET_RESINFO(InFmt_MIMG *)
Inst_DS__DS_CMPST_F64(InFmt_DS *)
void completeAcc(GPUDynInstPtr) override
~Inst_DS__DS_RSUB_SRC2_U64()
Inst_SOPP__S_CBRANCH_SCC1(InFmt_SOPP *)
~Inst_VOPC__V_CMP_CLASS_F64()
~Inst_VOP3__V_SUBREV_U16()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_CVT_U16_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MUL_U32_U24()
~Inst_SOPC__S_CMP_LG_I32()
Inst_SOP1__S_MOVRELD_B32(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_NLE_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_MOV_FED_B32()
~Inst_VOPC__V_CMP_NGT_F32()
Inst_MUBUF__BUFFER_WBINVL1(InFmt_MUBUF *)
Inst_VOP3__V_CMPX_NGT_F32(InFmt_VOP3 *)
~Inst_VOP1__V_TRUNC_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_EQ_F32()
~Inst_MUBUF__BUFFER_ATOMIC_ADD_X2()
~Inst_VOP3__V_TRUNC_F32()
Inst_VOP3__V_CMP_LG_F64(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_TRUNC_F16()
Inst_VOP3__V_DIV_FIXUP_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_SUB()
~Inst_VOP3__V_CMPX_LE_U32()
~Inst_DS__DS_GWS_SEMA_V()
Inst_VOP3__V_CMP_GE_I64(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_O_F64()
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_BCNT1_I32_B32()
Inst_VOP3__V_MED3_I32(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_NE_U16()
~Inst_DS__DS_MIN_SRC2_I64()
Inst_VOP3__V_CMP_GE_F16(InFmt_VOP3 *)
Inst_DS__DS_READ2_B64(InFmt_DS *)
Inst_VOP3__V_ALIGNBIT_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MIN_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MAD_U32_U24()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MQSAD_PK_U16_U8()
~Inst_VOP3__V_CMP_CLASS_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_MIN_SRC2_U32()
~Inst_SOPC__S_SET_GPR_IDX_ON()
void completeAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_TRU_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FREXP_EXP_I32_F64()
Inst_DS__DS_GWS_SEMA_RELEASE_ALL(InFmt_DS *)
ScalarRegI32 firstOppositeSignBit(ScalarRegI32 val)
Inst_VOPC__V_CMPX_T_U64(InFmt_VOPC *)
~Inst_SOP1__S_FLBIT_I32_B64()
Inst_FLAT__FLAT_STORE_DWORDX3(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NE_U32()
void execute(GPUDynInstPtr) override
Inst_VOP1__V_FLOOR_F64(InFmt_VOP1 *)
~Inst_VOP1__V_CVT_RPI_I32_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_FLOOR_F16()
~Inst_SOPK__S_CMPK_EQ_I32()
Inst_VOP3__V_CMPX_GT_I64(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_MIN_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_LOAD_UBYTE()
~Inst_DS__DS_MAX_SRC2_F32()
~Inst_VOP3__V_CMP_NLT_F64()
Inst_VOP3__V_CMP_LT_F32(InFmt_VOP3 *)
Inst_DS__DS_MAX_SRC2_I64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_LOAD_DWORD(InFmt_FLAT *)
Inst_VOP3__V_CVT_PK_U16_U32(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_NLT_F16(InFmt_VOPC *)
Inst_SOP1__S_SEXT_I32_I16(InFmt_SOP1 *)
~Inst_VOP3__V_SUBREV_F16()
Inst_VOP3__V_AND_B32(InFmt_VOP3 *)
~Inst_VOP3__V_FREXP_MANT_F64()
void execute(GPUDynInstPtr) override
~Inst_DS__DS_WRITE2_B64()
~Inst_DS__DS_MAX_SRC2_I64()
~Inst_VOPC__V_CMPX_GE_U16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NGE_F16()
Inst_DS__DS_DEC_RTN_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LE_F16()
~Inst_DS__DS_BPERMUTE_B32()
~Inst_VOP3__V_CVT_PKACCUM_U8_F32()
Inst_SOPC__S_CMP_GE_U32(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_INC_RTN_U64()
void execute(GPUDynInstPtr) override
T roundNearestEven(T val)
~Inst_SMEM__S_DCACHE_WB()
Inst_VOP3__V_XOR_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_SUBREV_F16(InFmt_VOP2 *)
~Inst_FLAT__FLAT_STORE_DWORD()
Inst_VOP3__V_MAX3_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_DEC_SRC2_U32()
Inst_SMEM__S_BUFFER_LOAD_DWORDX2(InFmt_SMEM *)
~Inst_SOPP__S_DECPERFLEVEL()
~Inst_MUBUF__BUFFER_ATOMIC_AND()
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MAX_U32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_EQ_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAX_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_SRC2_I32(InFmt_DS *)
Inst_VOP3__V_CMP_T_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_CBRANCH_CDBGSYS_AND_USER()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_LT_U16(InFmt_VOPC *)
~Inst_FLAT__FLAT_ATOMIC_XOR_X2()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_CLASS_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_WRXCHG2ST64_RTN_B64()
~Inst_VOP3__V_CMP_LT_F32()
void execute(GPUDynInstPtr) override
ScalarRegI32 findFirstOne(T val)
Inst_MIMG__IMAGE_SAMPLE_L(InFmt_MIMG *)
Inst_VOPC__V_CMPX_LT_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_SWIZZLE_B32()
Inst_SOPP__S_CBRANCH_EXECZ(InFmt_SOPP *)
Inst_VOP2__V_LSHLREV_B32(InFmt_VOP2 *)
LdsState & getLds() const
void execute(GPUDynInstPtr) override
Inst_VOP2__V_SUBREV_U16(InFmt_VOP2 *)
@ S_BARRIER
WF is stalled at a barrier.
Inst_VOPC__V_CMPX_EQ_F16(InFmt_VOPC *)
~Inst_SOPP__S_CBRANCH_EXECZ()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_SEXT_I32_I8(InFmt_SOP1 *)
Inst_VOP1__V_FFBH_U32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MAX_F32(InFmt_VOP2 *)
Inst_VOP2__V_MUL_HI_U32_U24(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_SEXT_I32_I16()
~Inst_FLAT__FLAT_ATOMIC_INC_X2()
Inst_FLAT__FLAT_ATOMIC_SMIN(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_DIV_FIXUP_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAD_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_GE_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_AND_X2(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_LE_I32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CVT_I32_F32(InFmt_VOP1 *)
Inst_FLAT__FLAT_LOAD_USHORT(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_FREXP_MANT_F16(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_GT_F16()
Inst_VOP3__V_CMPX_NEQ_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_WRITELANE_B32()
~Inst_MIMG__IMAGE_SAMPLE_C_L_O()
~Inst_SOP2__S_ANDN2_B32()
~Inst_MUBUF__BUFFER_STORE_SHORT()
~Inst_MIMG__IMAGE_SAMPLE_D_O()
Inst_VOPC__V_CMPX_NLG_F64(InFmt_VOPC *)
~Inst_SOPK__S_CBRANCH_I_FORK()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_DIV_FMAS_F64(InFmt_VOP3 *)
Inst_SOP2__S_XOR_B64(InFmt_SOP2 *)
Inst_VOPC__V_CMPX_GT_I32(InFmt_VOPC *)
Inst_MIMG__IMAGE_ATOMIC_CMPSWAP(InFmt_MIMG *)
~Inst_SOPP__S_CBRANCH_SCC0()
Inst_SOPC__S_CMP_LT_U32(InFmt_SOPC *)
~Inst_VOPC__V_CMP_TRU_F16()
~Inst_VOP3__V_QSAD_PK_U16_U8()
Inst_VOPC__V_CMP_O_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NLT_F16(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_LE_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NEQ_F16()
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LG_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_NOP(InFmt_VOP3 *)
Inst_VOP1__V_EXP_LEGACY_F32(InFmt_VOP1 *)
Inst_DS__DS_MIN_SRC2_F32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_ADD_F64(InFmt_VOP3 *)
~Inst_MUBUF__BUFFER_ATOMIC_AND_X2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_CLASS_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_SMAX_X2()
Inst_VOP1__V_COS_F32(InFmt_VOP1 *)
~Inst_MIMG__IMAGE_GATHER4_LZ()
Inst_VOPC__V_CMP_NLG_F32(InFmt_VOPC *)
~Inst_SOP1__S_SETPC_B64()
~Inst_VOPC__V_CMP_NLE_F64()
void completeAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_F_I16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP2__S_AND_B32(InFmt_SOP2 *)
Inst_DS__DS_SUB_RTN_U64(InFmt_DS *)
Inst_VOP3__V_LDEXP_F64(InFmt_VOP3 *)
Inst_MIMG__IMAGE_SAMPLE_C_B_CL_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_LOAD_MIP_PCK()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NGE_F64()
Inst_SOP1__S_FLBIT_I32_I64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_UMAX(InFmt_MUBUF *)
void initiateAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_CD_CL()
int scalarOutstandingReqsWrGm
Inst_VOP3__V_CVT_FLR_I32_F32(InFmt_VOP3 *)
Inst_VOP1__V_CVT_U32_F32(InFmt_VOP1 *)
Inst_DS__DS_MAX_RTN_I32(InFmt_DS *)
void initiateAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LE_I64()
~Inst_VOP3__V_CMP_NLG_F64()
Inst_DS__DS_MIN_SRC2_F64(InFmt_DS *)
~Inst_VOP3__V_RNDNE_F64()
Inst_VOP3__V_MED3_U32(InFmt_VOP3 *)
Inst_VOP3__V_CVT_I32_F64(InFmt_VOP3 *)
Inst_SOP2__S_ADD_U32(InFmt_SOP2 *)
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NGT_F64()
void execute(GPUDynInstPtr) override
Inst_SOPK__S_CBRANCH_I_FORK(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NE_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_STORE_DWORDX4()
~Inst_MIMG__IMAGE_ATOMIC_AND()
~Inst_VOPC__V_CMP_LE_U64()
void execute(GPUDynInstPtr) override
InFmt_VOP3_SDST_ENC instData
Inst_VOPC__V_CMP_LT_F16(InFmt_VOPC *)
Inst_VOPC__V_CMPX_LT_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CUBESC_F32()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_SMEM__S_BUFFER_LOAD_DWORDX4()
int popCount(uint64_t val)
Returns the number of set ones in the provided value.
Inst_SOP2__S_BFE_U32(InFmt_SOP2 *)
~Inst_VOP1__V_RNDNE_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_CVT_F32_UBYTE1()
Inst_VOP3__V_DIV_FIXUP_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NLE_F64(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_LE_U16()
Inst_DS__DS_CMPST_RTN_B64(InFmt_DS *)
~Inst_SOP1__S_FF0_I32_B32()
Inst_DS__DS_MIN_RTN_I32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NE_I16()
~Inst_MIMG__IMAGE_SAMPLE_L_O()
~Inst_SOPK__S_CMPK_LE_U32()
Inst_DS__DS_OR_RTN_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MIN_U16(InFmt_VOP2 *)
Inst_SOP1__S_MOV_B32(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CEIL_F32(InFmt_VOP1 *)
~Inst_VOP2__V_LDEXP_F16()
Inst_VOP1__V_RNDNE_F16(InFmt_VOP1 *)
~Inst_VOP3__V_CMPX_GE_F32()
~Inst_VOPC__V_CMP_T_U32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_CLASS_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_WRXCHG2_RTN_B32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NLT_F32(InFmt_VOP3 *)
~Inst_VOP2__V_MUL_HI_I32_I24()
Inst_VOP3__V_CMP_LE_U16(InFmt_VOP3 *)
Inst_VOP3__V_CMP_GT_I16(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_MUL_LO_U32()
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_CBRANCH_EXECNZ()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NLT_F32()
Inst_VOPC__V_CMP_NE_U64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_RCP_IFLAG_F32(InFmt_VOP3 *)
~Inst_VOP2__V_LSHRREV_B32()
~Inst_DS__DS_CMPST_RTN_F32()
Inst_VOPC__V_CMPX_NE_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_ORN2_B32(InFmt_SOP2 *)
Inst_VOP3__V_LERP_U8(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_LE_F32()
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_WRITE_B128()
Inst_VOP3__V_LSHLREV_B64(InFmt_VOP3 *)
Inst_VOP1__V_CVT_I16_F16(InFmt_VOP1 *)
~Inst_SOP1__S_MOVRELS_B64()
~Inst_MIMG__IMAGE_SAMPLE_LZ()
void execute(GPUDynInstPtr) override
Inst_DS__DS_READ2_B32(InFmt_DS *)
Inst_VOP3__V_CMPX_EQ_U64(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_EQ_F32()
~Inst_MIMG__IMAGE_GATHER4_C_CL()
Inst_MUBUF__BUFFER_ATOMIC_UMIN(InFmt_MUBUF *)
Inst_VOP3__V_CMPX_NLT_F64(InFmt_VOP3 *)
void calcAddr(GPUDynInstPtr gpuDynInst, VOFF v_off, VIDX v_idx, SRSRC s_rsrc_desc, SOFF s_offset, int inst_offset)
MUBUF instructions calculate their addresses as follows:
void execute(GPUDynInstPtr) override
Inst_VOP3__V_SUB_U32(InFmt_VOP3_SDST_ENC *)
Inst_SOP2__S_BFM_B32(InFmt_SOP2 *)
~Inst_VOP3__V_CMPX_LE_F16()
Inst_SOPK__S_MOVK_I32(InFmt_SOPK *)
def format Nop(code, *opt_flags)
~Inst_VOPC__V_CMP_LT_I16()
~Inst_VOP3__V_INTERP_P1LV_F16()
~Inst_VOPC__V_CMP_LE_U16()
~Inst_VOPC__V_CMP_NGE_F32()
~Inst_VOP3__V_CMPX_F_F32()
~Inst_DS__DS_WRXCHG2ST64_RTN_B32()
~Inst_VOP3__V_LSHLREV_B64()
Inst_VOPC__V_CMP_TRU_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_STORE_MIP_PCK()
Inst_MIMG__IMAGE_SAMPLE_B_CL(InFmt_MIMG *)
Inst_VOP3__V_CUBEID_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_INCPERFLEVEL()
~Inst_VOPC__V_CMPX_TRU_F16()
void setStatus(status_e newStatus)
~Inst_VOPC__V_CMP_F_F64()
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_CBRANCH_CDBGSYS()
void execute(GPUDynInstPtr) override
~Inst_SOPK__S_CMPK_LT_I32()
Inst_SMEM__S_LOAD_DWORDX2(InFmt_SMEM *)
Inst_VOPC__V_CMP_NGT_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_F_I16()
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_INC(InFmt_MUBUF *)
Inst_DS__DS_INC_U32(InFmt_DS *)
Inst_VOP2__V_MUL_F16(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CEIL_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_NE_I32(InFmt_VOPC *)
Inst_VOP1__V_CVT_F32_UBYTE2(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LE_I32(InFmt_VOP3 *)
Inst_VOP3__V_BCNT_U32_B32(InFmt_VOP3 *)
Inst_VOP3__V_MOV_FED_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPP__S_ICACHE_INV(InFmt_SOPP *)
Inst_FLAT__FLAT_ATOMIC_DEC_X2(InFmt_FLAT *)
Inst_MUBUF__BUFFER_ATOMIC_SMAX(InFmt_MUBUF *)
~Inst_VOPC__V_CMP_O_F32()
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_CBRANCH_JOIN()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_GT_U16(InFmt_VOP3 *)
Inst_VOP3__V_CMP_LT_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_LOAD_PCK_SGN()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MIN3_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_F_F64()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_FREXP_MANT_F16()
void execute(GPUDynInstPtr) override
Inst_SOP2__S_LSHR_B32(InFmt_SOP2 *)
~Inst_SOP2__S_ABSDIFF_I32()
~Inst_VOP3__V_CMPX_F_I64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_COS_F32(InFmt_VOP3 *)
Inst_FLAT__FLAT_ATOMIC_XOR_X2(InFmt_FLAT *)
Inst_VOP3__V_CMPX_F_F16(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_LOAD_SBYTE(InFmt_MUBUF *)
Inst_MIMG__IMAGE_ATOMIC_AND(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GE_U16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_EQ_I32(InFmt_VOP3 *)
Inst_MIMG__IMAGE_GATHER4(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP1__V_LOG_F16(InFmt_VOP1 *)
Inst_DS__DS_ORDERED_COUNT(InFmt_DS *)
Inst_VOP3__V_DIV_FIXUP_F16(InFmt_VOP3 *)
Inst_VOP3__V_LOG_F32(InFmt_VOP3 *)
Inst_VOP3__V_MAX3_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_ALIGNBIT_B32()
Inst_VOP1__V_CVT_F64_F32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_READ_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NE_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_FF0_I32_B64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LG_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_FLOOR_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_RTN_F32(InFmt_DS *)
Inst_VOPC__V_CMP_GE_F64(InFmt_VOPC *)
Inst_MUBUF__BUFFER_WBINVL1_VOL(InFmt_MUBUF *)
~Inst_VOP3__V_CMPX_LT_F16()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_STORE_LDS_DWORD()
~Inst_VOP2__V_SUBREV_U32()
~Inst_VOPC__V_CMPX_U_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE()
Inst_SOPC__S_CMP_EQ_I32(InFmt_SOPC *)
~Inst_VOPC__V_CMPX_F_I16()
~Inst_VOP3__V_LSHRREV_B32()
Inst_VOPC__V_CMPX_LT_I16(InFmt_VOPC *)
Stats::Scalar completedWfs
Inst_SOP1__S_BREV_B64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_LT_F64()
Inst_MIMG__IMAGE_SAMPLE_CL_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NGT_F16(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
void notifyWgCompl(Wavefront *wf)
When an end program instruction detects that the last WF in a WG has completed it will call this meth...
~Inst_SOPC__S_CMP_EQ_I32()
~Inst_MUBUF__BUFFER_ATOMIC_DEC()
~Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP()
GPUDispatcher & dispatcher()
~Inst_MIMG__IMAGE_GATHER4_C_O()
Inst_DS__DS_SUB_SRC2_U32(InFmt_DS *)
Inst_VOP3__V_CMPX_NE_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_O_F16()
Inst_VOP1__V_CVT_F32_F64(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_XOR_SAVEEXEC_B64(InFmt_SOP1 *)
Inst_MIMG__IMAGE_GATHER4_C(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_CVT_F32_UBYTE2()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_EQ_F16()
Inst_MIMG__IMAGE_GATHER4_C_LZ_O(InFmt_MIMG *)
~Inst_DS__DS_GWS_SEMA_BR()
~Inst_VOP3__V_MAD_I64_I32()
Inst_VOP3__V_CVT_OFF_F32_I4(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_SOP1__S_BCNT1_I32_B32(InFmt_SOP1 *)
void completeAcc(GPUDynInstPtr) override
Inst_DS__DS_READ_I16(InFmt_DS *)
~Inst_VOP3__V_CMPX_GE_U32()
void execute(GPUDynInstPtr) override
void flushBuf(int wfSlotId)
Inst_MIMG__IMAGE_SAMPLE_C_D_CL(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_D_CL_O(InFmt_MIMG *)
Inst_MIMG__IMAGE_SAMPLE_D_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_CONDXCHG32_RTN_B64()
~Inst_VOP3__V_CMP_LT_U16()
~Inst_VOPC__V_CMPX_NLE_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRXCHG2ST64_RTN_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_XNOR_B32(InFmt_SOP2 *)
Inst_VOP3__V_EXP_F32(InFmt_VOP3 *)
Inst_FLAT__FLAT_STORE_SHORT(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_GT_F32()
Inst_VOPC__V_CMPX_F_F64(InFmt_VOPC *)
Inst_VOP3__V_CMP_F_U64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_CMPST_RTN_B32(InFmt_DS *)
Inst_VOP3__V_LSHRREV_B32(InFmt_VOP3 *)
~Inst_VOP3__V_FRACT_F64()
ComputeUnit * computeUnit
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_B_CL_O()
Inst_VOP1__V_TRUNC_F32(InFmt_VOP1 *)
Inst_SOPP__S_SET_GPR_IDX_OFF(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_LT_F64(InFmt_VOPC *)
~Inst_SOPC__S_CMP_EQ_U64()
Inst_DS__DS_READ2ST64_B32(InFmt_DS *)
Inst_VOP3__V_ADDC_U32(InFmt_VOP3_SDST_ENC *)
Inst_VOP3__V_CMP_NE_U64(InFmt_VOP3 *)
void decMaxBarrierCnt(int bar_id)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP2__S_CSELECT_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_LOG_LEGACY_F32(InFmt_VOP1 *)
~Inst_SOPP__S_ICACHE_INV()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_FRACT_F16(InFmt_VOP3 *)
~Inst_VOP1__V_RCP_IFLAG_F32()
Inst_VOPC__V_CMPX_T_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MIN_RTN_U64(InFmt_DS *)
~Inst_FLAT__FLAT_LOAD_DWORDX2()
~Inst_VOPC__V_CMPX_EQ_U16()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_GT_F64(InFmt_VOPC *)
~Inst_VOPC__V_CMP_F_U32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_U_F64(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_O_F16(InFmt_VOP3 *)
Inst_VOPC__V_CMP_NLT_F32(InFmt_VOPC *)
~Inst_VOPC__V_CMP_GT_F64()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_O_F32(InFmt_VOPC *)
Inst_VOP2__V_LSHLREV_B16(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CVT_F32_UBYTE2()
Inst_VOP3__V_SUBREV_U16(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_LE_I16(InFmt_VOPC *)
~Inst_VOP3__V_CMP_GE_U64()
~Inst_VOP3__V_CMPX_LE_F32()
~Inst_VOP1__V_CVT_F32_UBYTE3()
Inst_VOP3__V_CMP_CLASS_F32(InFmt_VOP3 *)
Inst_VOPC__V_CMP_CLASS_F32(InFmt_VOPC *)
Inst_MUBUF__BUFFER_ATOMIC_AND_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_SAD_HI_U8()
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NLG_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_SMIN_X2()
Inst_VOP3__V_CMP_EQ_U64(InFmt_VOP3 *)
Inst_SMEM__S_LOAD_DWORDX4(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CVT_F32_UBYTE1(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_C_B_CL_O(InFmt_MIMG *)
~Inst_VOP1__V_FLOOR_F64()
~Inst_MIMG__IMAGE_SAMPLE_B()
~Inst_DS__DS_DEC_SRC2_U64()
Inst_DS__DS_GWS_SEMA_P(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_PKRTZ_F16_F32(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_F_U64()
~Inst_SOP1__S_XNOR_SAVEEXEC_B64()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_EQ_I32()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Read 1 dword from scalar data cache.
Inst_VOP3__V_RNDNE_F64(InFmt_VOP3 *)
~Inst_VOP1__V_CVT_FLR_I32_F32()
int scalarOutstandingReqsRdGm
void initiateAcc(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_SWAP_X2(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GT_U64()
Inst_VOPC__V_CMP_U_F64(InFmt_VOPC *)
Inst_VOP1__V_SQRT_F16(InFmt_VOP1 *)
~Inst_VOP2__V_ASHRREV_I32()
Inst_FLAT__FLAT_STORE_DWORD(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_U_F16()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_LZ(InFmt_MIMG *)
~Inst_VOPC__V_CMP_LE_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_EQ_U64()
Inst_MIMG__IMAGE_SAMPLE_CD_CL_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CUBEMA_F32()
Inst_MUBUF__BUFFER_STORE_LDS_DWORD(InFmt_MUBUF *)
~Inst_DS__DS_MIN_SRC2_F32()
Inst_VOP3__V_CMPX_U_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_F_F64(InFmt_VOP3 *)
Inst_VOP3__V_CMP_NE_U16(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_GT_F64(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP2__S_CBRANCH_G_FORK(InFmt_SOP2 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_O(InFmt_MIMG *)
~Inst_VOPC__V_CMP_LT_F32()
Inst_MUBUF__BUFFER_ATOMIC_UMIN_X2(InFmt_MUBUF *)
~Inst_VOP3__V_CMP_T_U16()
~Inst_SOPK__S_CMPK_GE_U32()
Inst_SOPC__S_SETVSKIP(InFmt_SOPC *)
Inst_MIMG__IMAGE_GATHER4_B_CL(InFmt_MIMG *)
~Inst_VOP3__V_CMPX_NLE_F16()
Inst_SOP1__S_ABS_I32(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPC__S_CMP_GT_U32(InFmt_SOPC *)
~Inst_VOP3__V_CMPX_CLASS_F64()
Inst_VOP3__V_SQRT_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LE_U32(InFmt_VOP3 *)
~Inst_VOP2__V_LSHLREV_B16()
~Inst_SOPK__S_GETREG_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_READ_B32(InFmt_DS *)
classes that represent vector/scalar operands in GCN3 ISA.
Inst_VOP3__V_CEIL_F16(InFmt_VOP3 *)
~Inst_VOP1__V_TRUNC_F64()
~Inst_VOP3__V_MBCNT_LO_U32_B32()
void initiateAcc(GPUDynInstPtr) override
Inst_SOP2__S_MAX_U32(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_TRU_F64(InFmt_VOPC *)
~Inst_VOP3__V_CMP_TRU_F64()
Inst_VOP3__V_CMP_NE_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_SWAP(InFmt_MUBUF *)
void initiateAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_NE_I32(InFmt_VOPC *)
VecOperand< VecElemU32, true > ConstVecOperandU32
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_O_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_LOAD_SBYTE()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NLG_F32()
~Inst_VOP3__V_CMPX_NGE_F64()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_QUADMASK_B32(InFmt_SOP1 *)
~Inst_FLAT__FLAT_ATOMIC_CMPSWAP_X2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_OR()
Inst_DS__DS_WRITE_B32(InFmt_DS *)
~Inst_VOP1__V_READFIRSTLANE_B32()
~Inst_VOP3__V_LSHRREV_B64()
Inst_VOP3__V_CMPX_LE_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GT_I64()
Inst_SOP1__S_MOV_B64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FREXP_EXP_I32_F32()
void execute(GPUDynInstPtr) override
Inst_SOPK__S_CMPK_LG_I32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
int maxBarrierCnt(int bar_id)
~Inst_VOPC__V_CMP_NEQ_F64()
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_DS__DS_OR_SRC2_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NGE_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_CD_CL_O()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MUL_I32_I24()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GE_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LE_U16()
~Inst_FLAT__FLAT_STORE_DWORDX4()
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAX_U16(InFmt_VOP3 *)
~Inst_MIMG__IMAGE_ATOMIC_XOR()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
ScalarRegI32 findFirstOneMsb(T val)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_L()
Inst_VOP3__V_FLOOR_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_ADD_SRC2_U32(InFmt_DS *)
Inst_VOP2__V_MUL_F32(InFmt_VOP2 *)
Inst_SOPC__S_CMP_LG_U32(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_F_I64()
Inst_SOPK__S_CMPK_GE_U32(InFmt_SOPK *)
Inst_SOP2__S_BFE_U64(InFmt_SOP2 *)
~Inst_DS__DS_WRAP_RTN_B32()
Inst_VOP3__V_CMPX_LG_F64(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_CLASS_F32()
~Inst_SOP1__S_AND_SAVEEXEC_B64()
Inst_MIMG__IMAGE_LOAD_PCK_SGN(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_ANDN2_SAVEEXEC_B64()
~Inst_VOP3__V_CMPX_LE_U64()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_O(InFmt_MIMG *)
Inst_MUBUF__BUFFER_ATOMIC_SMIN_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_CVT_F32_U32()
Inst_VOP3__V_CUBETC_F32(InFmt_VOP3 *)
Inst_FLAT__FLAT_ATOMIC_AND(InFmt_FLAT *)
Inst_VOP1__V_RCP_F64(InFmt_VOP1 *)
Inst_VOP1__V_RCP_IFLAG_F32(InFmt_VOP1 *)
Inst_VOP3__V_CMPX_NEQ_F16(InFmt_VOP3 *)
~Inst_VOP1__V_FLOOR_F16()
Inst_VOP3__V_MAD_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_ATOMIC_UMAX(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LE_U64(InFmt_VOPC *)
Inst_VOPC__V_CMP_EQ_F16(InFmt_VOPC *)
Inst_DS__DS_MSKOR_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_INC_RTN_U32()
Inst_VOP3__V_MIN_F16(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_ATOMIC_SWAP_X2(InFmt_MUBUF *)
Inst_VOP1__V_EXP_F32(InFmt_VOP1 *)
~Inst_VOPC__V_CMPX_LT_I32()
Inst_FLAT__FLAT_ATOMIC_CMPSWAP(InFmt_FLAT *)
~Inst_DS__DS_CMPST_RTN_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_WBINVL1()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_PKACCUM_U8_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_I32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GT_I16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_F64_F32(InFmt_VOP3 *)
Inst_VOPC__V_CMP_NLE_F64(InFmt_VOPC *)
uint8_t permute(uint64_t in_dword2x, uint32_t sel)
~Inst_VOPC__V_CMPX_LT_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_RFE_B64(InFmt_SOP1 *)
~Inst_VOP3__V_MAD_LEGACY_F32()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_ATOMIC_OR()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_TRUNC_F16(InFmt_VOP1 *)
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NE_I32()
Inst_VOP3__V_CMP_GE_F64(InFmt_VOP3 *)
Inst_VOPC__V_CMP_NEQ_F16(InFmt_VOPC *)
Inst_VOP2__V_MAX_I32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_DEC_SRC2_U64(InFmt_DS *)
std::vector< VectorRegisterFile * > vrf
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_EQ_F64()
void completeAcc(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_TRIG_PREOP_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_ATOMIC_CMPSWAP()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_SQRT_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_L_O()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_L_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_BFREV_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPK__S_SETREG_B32(InFmt_SOPK *)
~Inst_SOP1__S_BITSET0_B32()
~Inst_VOPC__V_CMPX_NE_I16()
~Inst_VOPC__V_CMPX_LE_U64()
Inst_VOPC__V_CMP_NGE_F16(InFmt_VOPC *)
Inst_DS__DS_APPEND(InFmt_DS *)
Inst_SMEM__S_DCACHE_INV_VOL(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_LOAD(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NE_U64()
~Inst_VOP3__V_CVT_I32_F64()
~Inst_FLAT__FLAT_LOAD_DWORD()
Inst_SOP1__S_AND_SAVEEXEC_B64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_RTN_F64(InFmt_DS *)
Inst_VOP1__V_CEIL_F64(InFmt_VOP1 *)
~Inst_DS__DS_ORDERED_COUNT()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_ANDN2_SAVEEXEC_B64(InFmt_SOP1 *)
Inst_DS__DS_ADD_RTN_F32(InFmt_DS *)
Inst_VOPC__V_CMPX_GT_U64(InFmt_VOPC *)
~Inst_VOP3__V_CVT_F32_UBYTE0()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LT_F64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_AND()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NGT_F64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_INTERP_P1LL_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_FRACT_F16()
~Inst_VOP3__V_CMPX_NEQ_F64()
Inst_MIMG__IMAGE_SAMPLE_C_CD(InFmt_MIMG *)
Inst_FLAT__FLAT_LOAD_UBYTE(InFmt_FLAT *)
~Inst_SMEM__S_DCACHE_WB_VOL()
Inst_VOPC__V_CMPX_NEQ_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_MAX_SRC2_F64()
Inst_VOP3__V_OR_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_C_B_CL_O()
~Inst_DS__DS_MIN_SRC2_I32()
~Inst_VOP1__V_CVT_U32_F64()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_O()
~Inst_MUBUF__BUFFER_ATOMIC_DEC_X2()
~Inst_SMEM__S_BUFFER_LOAD_DWORD()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_FFBL_B32(InFmt_VOP1 *)
Inst_VOP3__V_CMPX_NLG_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CVT_PKNORM_U16_F32(InFmt_VOP3 *)
Inst_MIMG__IMAGE_SAMPLE_C_CL_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NEQ_F16(InFmt_VOP3 *)
Inst_DS__DS_RSUB_RTN_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPC__S_CMP_LG_I32(InFmt_SOPC *)
~Inst_VOP3__V_CMP_LE_F64()
Inst_VOPC__V_CMPX_U_F32(InFmt_VOPC *)
~Inst_VOP2__V_MADAK_F16()
void execute(GPUDynInstPtr) override
Inst_VOP1__V_RCP_F16(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_SOP1__S_ORN2_SAVEEXEC_B64()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_T_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_NGE_F64(InFmt_VOPC *)
~Inst_VOP3__V_CMP_LG_F16()
Inst_SOPK__S_CMPK_EQ_I32(InFmt_SOPK *)
Inst_FLAT__FLAT_ATOMIC_SMAX_X2(InFmt_FLAT *)
Inst_MIMG__IMAGE_GATHER4_C_L(InFmt_MIMG *)
Inst_VOP3__V_CMPX_F_U64(InFmt_VOP3 *)
~Inst_DS__DS_OR_SRC2_B64()
~Inst_FLAT__FLAT_ATOMIC_CMPSWAP()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_FREXP_MANT_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_F_U16()
~Inst_DS__DS_INC_SRC2_U32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_FLBIT_I32_B64(InFmt_SOP1 *)
~Inst_VOP3__V_CMP_TRU_F32()
~Inst_VOP3__V_CVT_F64_F32()
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_INTERP_MOV_F32()
void execute(GPUDynInstPtr) override
Inst_DS__DS_ADD_U64(InFmt_DS *)
Inst_VOP3__V_CMP_NLG_F32(InFmt_VOP3 *)
Inst_FLAT__FLAT_ATOMIC_SUB(InFmt_FLAT *)
~Inst_VOP3__V_CMPX_T_I64()
Inst_MUBUF__BUFFER_STORE_DWORDX2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MIN_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NGE_F16()
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_STORE_SHORT()
Inst_VOP1__V_LOG_F32(InFmt_VOP1 *)
Inst_VOP3__V_MAX3_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GE_I32()
~Inst_DS__DS_GWS_SEMA_P()
void execute(GPUDynInstPtr) override
Inst_VOP2__V_SUBREV_F32(InFmt_VOP2 *)
Inst_MIMG__IMAGE_GATHER4_C_LZ(InFmt_MIMG *)
Inst_VOPC__V_CMPX_NLG_F16(InFmt_VOPC *)
~Inst_VOP3__V_CVT_PKNORM_U16_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_STORE(InFmt_MIMG *)
Inst_VOP3__V_CMP_GE_U64(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_NGT_F64()
Inst_VOPC__V_CMP_LE_I16(InFmt_VOPC *)
~Inst_VOP3__V_CMP_LT_I64()
Inst_SOP1__S_NOT_B64(InFmt_SOP1 *)
~Inst_DS__DS_WRITE2ST64_B64()
Inst_SMEM__S_LOAD_DWORDX8(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MIN_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_EQ_I32(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_LE_I16()
~Inst_VOP3__V_CVT_U32_F64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_WRITE2ST64_B32()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_SUBREV_F32(InFmt_VOP3 *)
Inst_MIMG__IMAGE_GATHER4_C_B_CL(InFmt_MIMG *)
Inst_VOPC__V_CMPX_GE_U16(InFmt_VOPC *)
Inst_VOP3__V_MQSAD_U32_U8(InFmt_VOP3 *)
~Inst_SOPC__S_BITCMP0_B64()
~Inst_VOP3__V_CMP_NLE_F32()
Inst_VOP1__V_CLREXCP(InFmt_VOP1 *)
~Inst_VOP3__V_CMP_GT_I32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_O_F64(InFmt_VOP3 *)
Inst_SOP1__S_SETPC_B64(InFmt_SOP1 *)
~Inst_MUBUF__BUFFER_LOAD_DWORDX3()
Inst_VOPC__V_CMPX_NGE_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_SOPP__S_CBRANCH_CDBGSYS_OR_USER(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_BFM_B64(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_U_F32()
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRITE2ST64_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_EQ_F64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void releaseBarrier(int bar_id)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_GE_I16(InFmt_VOPC *)
Inst_DS__DS_READ2ST64_B64(InFmt_DS *)
~Inst_VOP2__V_SUBBREV_U32()
Inst_VOP1__V_RNDNE_F32(InFmt_VOP1 *)
~Inst_VOPC__V_CMPX_GT_F64()
Inst_VOP1__V_MOV_FED_B32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_INC_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NE_U64(InFmt_VOP3 *)
Inst_VOP2__V_SUBBREV_U32(InFmt_VOP2 *)
Inst_DS__DS_MAX_RTN_U32(InFmt_DS *)
~Inst_VOP3__V_CMPX_LG_F16()
Inst_VOPC__V_CMP_LE_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_EQ_I64()
Inst_FLAT__FLAT_ATOMIC_SMAX(InFmt_FLAT *)
Inst_VOP3__V_CMPX_LE_U16(InFmt_VOP3 *)
~Inst_SOP1__S_BCNT0_I32_B64()
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NGT_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NE_I16()
~Inst_VOPC__V_CMPX_O_F64()
FetchUnit & fetchUnit(int simdId)
void initiateAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GT_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_B_CL()
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRITE2ST64_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_F_U16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LT_U16(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_NEQ_F16()
Inst_VOPC__V_CMPX_NGT_F32(InFmt_VOPC *)
~Inst_MIMG__IMAGE_GATHER4_B()
Inst_SOP2__S_ADD_I32(InFmt_SOP2 *)
~Inst_VOP3__V_CMPX_NLG_F32()
Inst_VOPC__V_CMP_O_F32(InFmt_VOPC *)
~Inst_MIMG__IMAGE_ATOMIC_SMAX()
Inst_SMEM__S_DCACHE_INV(InFmt_SMEM *)
void validateRequestCounters()
Inst_VOP1__V_CVT_F64_I32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_DEC_U32(InFmt_DS *)
~Inst_DS__DS_ADD_RTN_F32()
~Inst_SOPP__S_SENDMSGHALT()
Inst_VOPC__V_CMPX_LT_F16(InFmt_VOPC *)
~Inst_VOP3__V_SUBBREV_U32()
~Inst_VOPC__V_CMP_LE_I64()
~Inst_VOPC__V_CMPX_F_U32()
~Inst_VOP3__V_CVT_PK_U8_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_EXP_LEGACY_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_BCNT1_I32_B64()
Inst_VOPC__V_CMP_T_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_OR_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_CLASS_F64()
Inst_DS__DS_WRXCHG2ST64_RTN_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NGE_F16(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_NLG_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_NLT_F64(InFmt_VOPC *)
Inst_DS__DS_WRITE_B96(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_LSHLREV_B16()
void execute(GPUDynInstPtr) override
~Inst_DS__DS_AND_RTN_B32()
Inst_FLAT__FLAT_ATOMIC_SUB_X2(InFmt_FLAT *)
~Inst_FLAT__FLAT_LOAD_SSHORT()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP2__S_NAND_B64(InFmt_SOP2 *)
Inst_DS__DS_CMPST_RTN_F32(InFmt_DS *)
void initiateAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_CD()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GE_U64(InFmt_VOPC *)
~Inst_SOP1__S_XOR_SAVEEXEC_B64()
Inst_DS__DS_MIN_I64(InFmt_DS *)
~Inst_VOP3__V_CMP_U_F64()
~Inst_VOPC__V_CMPX_TRU_F64()
~Inst_VOP3__V_CMPX_GE_I64()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LT_F32(InFmt_VOPC *)
void initiateAcc(GPUDynInstPtr) override
Inst_SMEM__S_BUFFER_STORE_DWORDX4(InFmt_SMEM *)
Inst_VOPC__V_CMP_GE_U32(InFmt_VOPC *)
~Inst_VOPC__V_CMPX_NLG_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP2__V_CNDMASK_B32()
~Inst_VOPC__V_CMPX_NLE_F64()
Inst_VOPC__V_CMPX_F_I16(InFmt_VOPC *)
Inst_SOP2__S_BFE_I32(InFmt_SOP2 *)
~Inst_VOP3__V_CMPX_NLT_F16()
~Inst_VOPC__V_CMP_T_U16()
~Inst_VOPC__V_CMPX_LT_F16()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NEQ_F64()
Inst_VOP3__V_SIN_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_T_I64()
Inst_VOPC__V_CMPX_NGE_F32(InFmt_VOPC *)
Inst_SOPP__S_WAKEUP(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NLG_F16()
~Inst_VOP3__V_LSHRREV_B16()
~Inst_VOP1__V_CVT_I32_F32()
~Inst_VOPC__V_CMP_T_I16()
~Inst_VOPC__V_CMP_NLT_F64()
~Inst_VOP3__V_CNDMASK_B32()
void execute(GPUDynInstPtr) override
Inst_DS__DS_MSKOR_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MAX_F16(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_DIV_SCALE_F64(InFmt_VOP3_SDST_ENC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MIN_F16(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_F_U64()
~Inst_VOP3__V_CMPX_LT_U64()
Inst_DS__DS_MAX_SRC2_U64(InFmt_DS *)
Inst_VOP3__V_CMPX_F_F64(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_EQ_U16()
Inst_VOP3__V_CMPX_EQ_U16(InFmt_VOP3 *)
Inst_VOP1__V_COS_F16(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GE_I16()
Inst_VOPC__V_CMP_F_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LE_I16(InFmt_VOP3 *)
Inst_VOP3__V_MAD_I32_I24(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_CLASS_F16()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NEQ_F16()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_U_F64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_LDEXP_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_F_F64()
~Inst_SMEM__S_LOAD_DWORDX8()
~Inst_VOPC__V_CMP_NLG_F32()
Inst_VOP3__V_ADD_F16(InFmt_VOP3 *)
~Inst_MUBUF__BUFFER_LOAD_DWORDX2()
~Inst_DS__DS_MSKOR_RTN_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Read 2 dwords from scalar data cache.
~Inst_MIMG__IMAGE_STORE_MIP()
Inst_SMEM__S_BUFFER_LOAD_DWORDX16(InFmt_SMEM *)
Inst_SOP1__S_XNOR_SAVEEXEC_B64(InFmt_SOP1 *)
Inst_SOP2__S_NOR_B64(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_ADD_F32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_ADD_F32(InFmt_DS *)
Inst_SOPP__S_SENDMSGHALT(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_SUB_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_SRC2_F32(InFmt_DS *)
Inst_VOP3__V_MBCNT_LO_U32_B32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MUL_I32_I24(InFmt_VOP2 *)
~Inst_VOP3__V_CMPX_LE_I16()
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_SAD_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_T_U64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FREXP_EXP_I16_F16()
Inst_SOPP__S_BRANCH(InFmt_SOPP *)
Inst_VOPC__V_CMPX_LE_U64(InFmt_VOPC *)
Inst_VOP2__V_ADDC_U32(InFmt_VOP2 *)
~Inst_SOPC__S_CMP_EQ_U32()
Inst_VOPC__V_CMPX_NGT_F64(InFmt_VOPC *)
~Inst_VOP3__V_CMPX_NLE_F64()
~Inst_DS__DS_OR_RTN_B64()
Inst_FLAT__FLAT_ATOMIC_OR_X2(InFmt_FLAT *)
Inst_VOPC__V_CMP_NE_U32(InFmt_VOPC *)
Inst_VOP1__V_CVT_F32_U32(InFmt_VOP1 *)
Inst_MUBUF__BUFFER_LOAD_SSHORT(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_SET_GPR_IDX_MODE()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LT_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_F_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_OR_RTN_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
~Inst_SMEM__S_STORE_DWORD()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_U_F64()
Inst_VOPC__V_CMPX_EQ_I16(InFmt_VOPC *)
~Inst_VOP3__V_CVT_I16_F16()
Inst_VOP3__V_CMPX_GT_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_LOAD_MIP()
Inst_VOP3__V_CMPX_TRU_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_B_CL()
Inst_VOP3__V_CMPX_O_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_XOR_SRC2_B64(InFmt_DS *)
Inst_VOP2__V_MADMK_F16(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_F_I16(InFmt_VOP3 *)
Inst_SOP2__S_BFE_I64(InFmt_SOP2 *)
Inst_VOPC__V_CMP_GT_U64(InFmt_VOPC *)
~Inst_VOP3__V_CVT_F64_U32()
~Inst_VOPC__V_CMP_LT_U64()
void execute(GPUDynInstPtr) override
~Inst_SOPC__S_CMP_LT_U32()
Inst_SOP2__S_ASHR_I64(InFmt_SOP2 *)
~Inst_MUBUF__BUFFER_ATOMIC_UMAX()
Inst_MIMG__IMAGE_ATOMIC_SUB(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_LZ_O()
~Inst_VOP3__V_CMPX_GT_U32()
Inst_VOPC__V_CMP_EQ_U32(InFmt_VOPC *)
Inst_DS__DS_INC_RTN_U32(InFmt_DS *)
void initiateAcc(GPUDynInstPtr) override
Inst_DS__DS_SUB_SRC2_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_EQ_U16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GT_I64(InFmt_VOPC *)
Inst_SOPP__S_SENDMSG(InFmt_SOPP *)
Inst_MIMG__IMAGE_ATOMIC_SMAX(InFmt_MIMG *)
~Inst_MUBUF__BUFFER_ATOMIC_SWAP()
Inst_FLAT__FLAT_STORE_BYTE(InFmt_FLAT *)
Inst_VOP1__V_FLOOR_F16(InFmt_VOP1 *)
Inst_MIMG__IMAGE_SAMPLE_B_O(InFmt_MIMG *)
Inst_VOP3__V_CMP_LE_F32(InFmt_VOP3 *)
~Inst_DS__DS_WRXCHG2_RTN_B64()
Inst_MUBUF__BUFFER_STORE_DWORDX3(InFmt_MUBUF *)
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_FLOOR_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NE_I64()
ScalarRegI32 countZeroBitsMsb(T val)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_MAX_RTN_I64()
Inst_VOP3__V_MAX_F64(InFmt_VOP3 *)
Inst_VOPC__V_CMP_LE_I32(InFmt_VOPC *)
void readSrc()
Certain vector operands can read from the vrf/srf or constants.
Inst_VOP3__V_CMP_LE_F16(InFmt_VOP3 *)
~Inst_FLAT__FLAT_ATOMIC_SMAX_X2()
void initiateAcc(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_SMEM__S_LOAD_DWORDX16(InFmt_SMEM *)
~Inst_MIMG__IMAGE_STORE()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_ADD_F32(InFmt_VOP3 *)
Inst_DS__DS_MIN_RTN_U32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Synchronize waves within a workgroup.
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_F64_I32(InFmt_VOP3 *)
Inst_VOP3__V_CMP_GE_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LT_I64(InFmt_VOPC *)
Inst_VOP1__V_CVT_F32_UBYTE0(InFmt_VOP1 *)
Inst_SOPC__S_CMP_GT_I32(InFmt_SOPC *)
~Inst_VOP3__V_MAD_I32_I24()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GT_F16()
void execute(GPUDynInstPtr) override
~Inst_SMEM__S_LOAD_DWORDX16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NGT_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MAC_F32(InFmt_VOP2 *)
~Inst_VOP2__V_MUL_LEGACY_F32()
~Inst_VOPC__V_CMPX_NLT_F64()
Inst_VOPC__V_CMP_O_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NGT_F64(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_CL()
~Inst_VOPC__V_CMP_GT_I16()
~Inst_VOPC__V_CMP_LT_F16()
Inst_SOP1__S_BITSET0_B64(InFmt_SOP1 *)
Inst_VOP3__V_RCP_F64(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LT_U64(InFmt_VOPC *)
Inst_VOPC__V_CMPX_LG_F16(InFmt_VOPC *)
Inst_DS__DS_RSUB_SRC2_U32(InFmt_DS *)
Inst_DS__DS_WRXCHG_RTN_B64(InFmt_DS *)
Inst_VOP3__V_EXP_F16(InFmt_VOP3 *)
~Inst_VOP3__V_DIV_FIXUP_F32()
~Inst_VOPC__V_CMPX_F_U16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_LT_I32()
Inst_VOPC__V_CMP_NEQ_F64(InFmt_VOPC *)
Inst_VOP1__V_RSQ_F64(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
std::unordered_map< int, uint64_t > rawDist
~Inst_SOP2__S_CSELECT_B64()
Inst_VOP3__V_SAD_U8(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void decLGKMInstsIssued()
int numAtBarrier(int bar_id)
Inst_DS__DS_WRXCHG2_RTN_B64(InFmt_DS *)
~Inst_VOP3__V_LDEXP_F16()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_C_L_O()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_DS__DS_MSKOR_RTN_B64()
~Inst_DS__DS_MIN_RTN_I64()
Inst_SOP1__S_BCNT0_I32_B32(InFmt_SOP1 *)
~Inst_VOP3__V_CVT_F32_UBYTE3()
Inst_DS__DS_ADD_RTN_U64(InFmt_DS *)
Inst_DS__DS_NOP(InFmt_DS *)
~Inst_VOPC__V_CMPX_O_F16()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_NE_I32()
~Inst_VOPC__V_CMP_F_I64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LT_I32(InFmt_VOPC *)
~Inst_SOPK__S_SETREG_IMM32_B32()
Inst_SOP1__S_MOV_FED_B32(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_T_I64()
Inst_VOP3__V_CEIL_F64(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_NLE_F32(InFmt_VOP3 *)
Inst_VOP2__V_MUL_HI_I32_I24(InFmt_VOP2 *)
Inst_VOP1__V_CVT_F32_F16(InFmt_VOP1 *)
Inst_MIMG__IMAGE_GATHER4_LZ_O(InFmt_MIMG *)
Inst_VOP3__V_CMP_GT_I64(InFmt_VOP3 *)
Inst_VOP3__V_MUL_HI_U32(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_LT_U64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CUBEMA_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_GWS_SEMA_RELEASE_ALL()
~Inst_VOP3__V_LDEXP_F64()
Inst_SOP1__S_FF1_I32_B64(InFmt_SOP1 *)
~Inst_MIMG__IMAGE_SAMPLE_C_L()
~Inst_VOP3__V_CMP_NE_U64()
Inst_DS__DS_MIN_SRC2_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_ATOMIC_SWAP()
Inst_DS__DS_MIN_SRC2_I32(InFmt_DS *)
Inst_VOP3__V_FREXP_EXP_I32_F64(InFmt_VOP3 *)
Inst_DS__DS_WRXCHG_RTN_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_SOPK__S_CMPK_LG_U32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
~Inst_SOPK__S_CMOVK_I32()
Inst_VOP3__V_CMP_T_U64(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NLE_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_RNDNE_F32(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_GT_U16(InFmt_VOPC *)
Inst_FLAT__FLAT_LOAD_DWORDX3(InFmt_FLAT *)
Inst_VOP3__V_SUBB_U32(InFmt_VOP3_SDST_ENC *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_LZ(InFmt_MIMG *)
Inst_DS__DS_ADD_RTN_U32(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_PERMUTE_B32()
Inst_MUBUF__BUFFER_STORE_DWORD(InFmt_MUBUF *)
~Inst_VOPC__V_CMPX_NE_U64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GE_F64()
Inst_MUBUF__BUFFER_LOAD_DWORDX3(InFmt_MUBUF *)
Inst_VOP3__V_MIN_U32(InFmt_VOP3 *)
Inst_SOPK__S_CMPK_GT_U32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_T_U64()
~Inst_VOP3__V_CVT_F16_I16()
~Inst_VOP2__V_MADAK_F32()
Inst_VOP3__V_DIV_FMAS_F32(InFmt_VOP3 *)
Inst_VOP3__V_ASHRREV_I16(InFmt_VOP3 *)
Inst_VOP2__V_OR_B32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
~Inst_SOP2__S_ANDN2_B64()
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_UMIN_X2()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_U_F64()
Inst_VINTRP__V_INTERP_P2_F32(InFmt_VINTRP *)
Inst_VOPC__V_CMP_LG_F16(InFmt_VOPC *)
~Inst_FLAT__FLAT_ATOMIC_INC()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GT_U16()
Inst_MUBUF__BUFFER_ATOMIC_OR_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CVT_F64_I32()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NE_I32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_BFM_B32(InFmt_VOP3 *)
Inst_VOP1__V_FRACT_F64(InFmt_VOP1 *)
Inst_VOP3__V_LSHRREV_B64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_SOPK__S_ADDK_I32(InFmt_SOPK *)
Inst_SOP2__S_CSELECT_B32(InFmt_SOP2 *)
~Inst_SOPC__S_CMP_GE_I32()
~Inst_VOP3__V_FREXP_EXP_I16_F16()
~Inst_DS__DS_DEC_RTN_U32()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LG_F16()
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_SMIN()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NEQ_F32()
Inst_VOP3__V_CMP_GT_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_ATOMIC_UMAX()
Inst_VOP3__V_EXP_LEGACY_F32(InFmt_VOP3 *)
Inst_DS__DS_SUB_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Stats::Distribution readsPerWrite
~Inst_MIMG__IMAGE_SAMPLE_C_CL_O()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_EQ_I64()
Inst_VOP3__V_SUB_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_U_F32()
void execute(GPUDynInstPtr) override
Inst_SMEM__S_LOAD_DWORD(InFmt_SMEM *)
Inst_MIMG__IMAGE_GATHER4_C_CL_O(InFmt_MIMG *)
Inst_VOP3__V_INTERP_P2_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
VecElemU32 muladd(VecElemU64 &dst, VecElemU32 val_0, VecElemU32 val_1, VecElemU64 val_2)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_O()
Inst_VOP3__V_LOG_LEGACY_F32(InFmt_VOP3 *)
Inst_VOP3__V_SIN_F32(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_STORE_BYTE(InFmt_MUBUF *)
Inst_VOP1__V_FREXP_EXP_I32_F64(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GT_U64()
void execute(GPUDynInstPtr) override
Inst_VOP2__V_MUL_U32_U24(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NLT_F32()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_O_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_C_L_O(InFmt_MIMG *)
~Inst_VOP3__V_CMP_T_I32()
Inst_VOP2__V_SUB_U32(InFmt_VOP2 *)
~Inst_VOP3__V_CMP_NGE_F32()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GE_U32()
~Inst_FLAT__FLAT_LOAD_DWORDX4()
Inst_SOP2__S_ANDN2_B64(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
Inst_SOPK__S_SETREG_IMM32_B32(InFmt_SOPK *)
~Inst_VOPC__V_CMPX_NEQ_F64()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_CD_O(InFmt_MIMG *)
void completeAcc(GPUDynInstPtr) override
Inst_MIMG__IMAGE_ATOMIC_DEC(InFmt_MIMG *)
~Inst_VOP3__V_CMP_LT_I16()
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPP__S_NOP(InFmt_SOPP *)
Inst_VOP3__V_CUBESC_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_SQRT_F32(InFmt_VOP1 *)
~Inst_VOP3__V_CMPX_NGE_F16()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_BCNT1_I32_B64(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOP1__S_QUADMASK_B64()
~Inst_VOPC__V_CMPX_GE_I64()
~Inst_MUBUF__BUFFER_ATOMIC_SUB()
Inst_VOPC__V_CMPX_GE_U64(InFmt_VOPC *)
~Inst_MIMG__IMAGE_GATHER4_C_L()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NGE_F16()
Inst_VOP3__V_FMA_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_B_O()
void execute(GPUDynInstPtr) override
int decreaseRefCounter(const uint32_t dispatchId, const uint32_t wgId)
Decrease the reference count after making sure it is in the list; give back this chunk if the ref coun...
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_F_I16()
~Inst_VOPC__V_CMPX_EQ_U64()
Inst_VOP1__V_FREXP_MANT_F64(InFmt_VOP1 *)
~Inst_MIMG__IMAGE_GATHER4_C_B()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_U_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_GT_U32(InFmt_VOPC *)
Inst_VOP3__V_CMPX_F_U16(InFmt_VOP3 *)
Inst_SMEM__S_BUFFER_STORE_DWORD(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GE_F32()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FRACT_F64()
Inst_SOPK__S_CMPK_EQ_U32(InFmt_SOPK *)
Inst_MIMG__IMAGE_SAMPLE_D_CL_O(InFmt_MIMG *)
~Inst_VOP3__V_SUBREV_F32()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_CD_O()
Inst_VOP3__V_INTERP_MOV_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CVT_FLR_I32_F32()
Inst_VOP3__V_FREXP_MANT_F64(InFmt_VOP3 *)
Inst_VOP3__V_CMP_LT_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CVT_I32_F32()
Inst_VOP3__V_CMPX_F_U32(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
~Inst_DS__DS_RSUB_RTN_U32()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_CD_CL_O(InFmt_MIMG *)
Inst_VOPC__V_CMPX_F_I32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_LE_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NLE_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NLG_F16()
Inst_VOP3__V_CMPX_F_I64(InFmt_VOP3 *)
~Inst_SOP1__S_SWAPPC_B64()
Inst_VOPC__V_CMPX_CLASS_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MSKOR_RTN_B32(InFmt_DS *)
Inst_VOP3__V_CMP_U_F32(InFmt_VOP3 *)
void processSDWA_src(InFmt_VOP_SDWA sdwaInst, T &src0, T &origSrc0)
processSDWA_src is a helper function for implementing sub d-word addressing instructions for the src ...
Inst_SOPC__S_CMP_LG_U64(InFmt_SOPC *)
Inst_SOPP__S_WAITCNT(InFmt_SOPP *)
~Inst_VOP3__V_CVT_F32_F16()
void execute(GPUDynInstPtr) override
Inst_SOPC__S_BITCMP0_B32(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_ATOMIC_XOR()
Inst_VOPC__V_CMP_NGT_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOPK__S_CMPK_LG_U32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MUL_I32_I24(InFmt_VOP3 *)
Inst_FLAT__FLAT_ATOMIC_INC_X2(InFmt_FLAT *)
Inst_VOP3__V_CMP_F_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_F_U32()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_GT_F16()
Inst_VOPC__V_CMPX_GE_I32(InFmt_VOPC *)
Inst_DS__DS_DEC_U64(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_SUB_RTN_U32()
~Inst_FLAT__FLAT_ATOMIC_DEC()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_INC_X2(InFmt_MUBUF *)
Inst_MIMG__IMAGE_SAMPLE_CD_CL(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAX_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NE_U64()
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_EQ_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LG_F64(InFmt_VOPC *)
Inst_VOP3__V_LSHLREV_B16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NE_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MAD_U64_U32()
Inst_SOP1__S_BITSET0_B32(InFmt_SOP1 *)
~Inst_VOP3__V_CMP_F_F16()
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRAP_RTN_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_SRC2_U32(InFmt_DS *)
~Inst_VOPC__V_CMPX_NEQ_F32()
void execute(GPUDynInstPtr) override
Inst_SOP1__S_NAND_SAVEEXEC_B64(InFmt_SOP1 *)
Inst_VOP2__V_SUBREV_U32(InFmt_VOP2 *)
Inst_DS__DS_CMPST_RTN_F64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NLG_F64()
~Inst_VOPC__V_CMPX_F_F64()
Inst_MUBUF__BUFFER_ATOMIC_UMAX_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_LT_I16()
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_T_I32(InFmt_VOPC *)
~Inst_VOPC__V_CMP_TRU_F64()
~Inst_VOP3__V_CMPX_NGT_F32()
Inst_VOP3__V_MUL_HI_I32(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_NLE_F64()
Inst_VOP3__V_CMPX_GT_U64(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_GE_F64(InFmt_VOPC *)
~Inst_VOP1__V_CVT_OFF_F32_I4()
Inst_VOPC__V_CMPX_CLASS_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP2__S_OR_B32(InFmt_SOP2 *)
Inst_MIMG__IMAGE_ATOMIC_INC(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_GE_I16(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_F_I32()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FREXP_MANT_F32()
~Inst_VOPC__V_CMP_EQ_I16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPP__S_INCPERFLEVEL(InFmt_SOPP *)
Inst_DS__DS_WRITE_B16(InFmt_DS *)
Inst_VOP3__V_CMPX_EQ_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_LDEXP_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GATHER4_CL_O(InFmt_MIMG *)
Inst_VOP3__V_MUL_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_TRU_F32(InFmt_VOP3 *)
~Inst_SOP1__S_OR_SAVEEXEC_B64()
Inst_VOP3__V_FRACT_F32(InFmt_VOP3 *)
~Inst_DS__DS_AND_SRC2_B32()
Inst_VOP3__V_CMPX_EQ_F64(InFmt_VOP3 *)
Inst_VOP3__V_CMP_O_F64(InFmt_VOP3 *)
Inst_VOP3__V_CVT_F32_F64(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_ADD_RTN_U64()
~Inst_VOPC__V_CMPX_GE_I32()
~Inst_VOPC__V_CMPX_T_U64()
Inst_VOPC__V_CMP_NGT_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NLT_F16(InFmt_VOP3 *)
Inst_VOP3__V_FRACT_F64(InFmt_VOP3 *)
~Inst_MUBUF__BUFFER_ATOMIC_SWAP_X2()
~Inst_VOP3__V_CVT_U32_F32()
Inst_VOP3__V_CMP_LE_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NE_I64()
~Inst_VOP1__V_CVT_F16_I16()
~Inst_DS__DS_MIN_RTN_U64()
~Inst_MUBUF__BUFFER_LOAD_SBYTE()
Inst_SOPC__S_CMP_EQ_U64(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_DIV_SCALE_F32()
Inst_MIMG__IMAGE_SAMPLE_D_CL(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_DEC(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_LE_I16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_O_F64()
Inst_VOP3__V_CMP_EQ_F32(InFmt_VOP3 *)
~Inst_SMEM__S_MEMREALTIME()
Inst_VOP3__V_CMP_NLE_F32(InFmt_VOP3 *)
Inst_MIMG__IMAGE_SAMPLE_C(InFmt_MIMG *)
Inst_FLAT__FLAT_ATOMIC_ADD(InFmt_FLAT *)
~Inst_VOP3__V_CMPX_NE_I64()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GT_F16()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_LZ(InFmt_MIMG *)
Inst_VOPC__V_CMPX_LE_I32(InFmt_VOPC *)
~Inst_DS__DS_ADD_RTN_U32()
~Inst_VOP3__V_EXP_LEGACY_F32()
~Inst_FLAT__FLAT_STORE_BYTE()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FRACT_F16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LE_U64(InFmt_VOP3 *)
~Inst_SMEM__S_BUFFER_STORE_DWORDX2()
Inst_SOPC__S_CMP_LT_I32(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_RSUB_U32(InFmt_DS *)
Inst_VOP3__V_CMP_LT_U32(InFmt_VOP3 *)
~Inst_SOP2__S_RFE_RESTORE_B64()
Inst_DS__DS_AND_SRC2_B32(InFmt_DS *)
Inst_VOP3__V_CVT_F32_I32(InFmt_VOP3 *)
~Inst_VOP3__V_READLANE_B32()
Inst_VOP3__V_ASHRREV_I64(InFmt_VOP3 *)
~Inst_VOP3__V_SUBREV_U32()
Inst_SOPK__S_CMPK_LE_U32(InFmt_SOPK *)
~Inst_VOPC__V_CMPX_GT_I32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MUL_F16(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_LT_I32(InFmt_VOP3 *)
Inst_SOP2__S_NOR_B32(InFmt_SOP2 *)
~Inst_VOP1__V_CVT_F32_F64()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GT_I64()
~Inst_VOP3__V_CVT_PKRTZ_F16_F32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_T_U16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
T reverseBits(T val, std::size_t size=sizeof(T))
Takes a variable length word and returns the mirrored version (bit by bit, LSB=>MSB).
Inst_VOPC__V_CMP_F_I16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_WRXCHG_RTN_B32()
Inst_VOPC__V_CMP_F_F64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_DS__DS_ADD_SRC2_U32()
Inst_VOP3__V_CVT_F64_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_F16_I16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_NEQ_F32(InFmt_VOPC *)
Inst_SOPP__S_BARRIER(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_U_F32()
Inst_VOPC__V_CMPX_LG_F64(InFmt_VOPC *)
~Inst_VOPC__V_CMPX_GT_F32()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_GET_LOD(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
std::enable_if< Condition, void >::type setBit(int bit, int bit_val)
bit access to scalar data.
~Inst_DS__DS_AND_SRC2_B64()
Inst_VOP3__V_MAD_LEGACY_F32(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_NLE_F64(InFmt_VOPC *)
Inst_VOPC__V_CMPX_F_F32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_GT_U64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LT_F16(InFmt_VOP3 *)
~Inst_VOP3__V_CMPX_T_U32()
~Inst_MUBUF__BUFFER_ATOMIC_UMIN()
~Inst_VOPC__V_CMPX_LT_I64()
~Inst_SMEM__S_BUFFER_STORE_DWORD()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LT_U32()
~Inst_MIMG__IMAGE_GATHER4_C_B_O()
~Inst_VOPC__V_CMPX_F_I32()
Inst_SOPP__S_SLEEP(InFmt_SOPP *)
Inst_VOPC__V_CMPX_T_U16(InFmt_VOPC *)
~Inst_VOPC__V_CMP_F_F16()
Inst_VOPC__V_CMP_CLASS_F16(InFmt_VOPC *)
void completeAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_CL_O()
~Inst_FLAT__FLAT_ATOMIC_ADD_X2()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_CLASS_F64()
Inst_VOP1__V_CVT_U16_F16(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_RNDNE_F64(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_D()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPK__S_CMOVK_I32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_ADD_U32(InFmt_VOP3_SDST_ENC *)
Inst_SOPP__S_DECPERFLEVEL(InFmt_SOPP *)
Inst_VOPC__V_CMP_GE_U16(InFmt_VOPC *)
~Inst_DS__DS_MAX_SRC2_U32()
~Inst_SOPP__S_CBRANCH_CDBGSYS_OR_USER()
~Inst_MIMG__IMAGE_SAMPLE_C_D_CL()
Inst_DS__DS_GWS_INIT(InFmt_DS *)
~Inst_VOPC__V_CMP_EQ_F32()
Inst_VOP3__V_CMPX_GT_F16(InFmt_VOP3 *)
Inst_SOPC__S_CMP_LE_U32(InFmt_SOPC *)
Inst_VOPC__V_CMP_NLT_F16(InFmt_VOPC *)
~Inst_FLAT__FLAT_STORE_DWORDX2()
Inst_VOPC__V_CMP_T_U16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
std::shared_ptr< GPUDynInst > GPUDynInstPtr
Inst_MUBUF__BUFFER_LOAD_UBYTE(InFmt_MUBUF *)
~Inst_SOP1__S_MOVRELD_B64()
Inst_VOP1__V_CVT_U32_F64(InFmt_VOP1 *)
Inst_VOP1__V_CEIL_F16(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_LE_I64()
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_T_I64()
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_SWAP()
void completeAcc(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_F_I32()
Inst_DS__DS_OR_SRC2_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_RSQ_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_F_I64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_U_F64(InFmt_VOPC *)
~Inst_SOPC__S_CMP_LE_U32()
~Inst_VOPC__V_CMPX_NGT_F32()
void sample(const U &v, int n=1)
Add a value to the distribution n times.
Inst_DS__DS_XOR_B64(InFmt_DS *)
Inst_SOPC__S_SET_GPR_IDX_ON(InFmt_SOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Cycles is a wrapper class for representing cycle counts, i.e.
Inst_MIMG__IMAGE_GATHER4_B_O(InFmt_MIMG *)
Inst_VOPC__V_CMP_T_U64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_AND_B64(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOP1__V_FRACT_F32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_L_O(InFmt_MIMG *)
~Inst_MIMG__IMAGE_STORE_PCK()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_FREXP_MANT_F16(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_GE_U64()
Inst_SOP1__S_CMOV_B64(InFmt_SOP1 *)
Bitfield< 31, 16 > selector
~Inst_SOP1__S_FF1_I32_B32()
void execute(GPUDynInstPtr) override
Inst_VOP2__V_XOR_B32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
~Inst_SOPC__S_CMP_GT_U32()
void injectGlobalMemFence(GPUDynInstPtr gpuDynInst)
Inst_FLAT__FLAT_ATOMIC_UMIN_X2(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GE_U64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SMEM__S_STORE_DWORDX2(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_CD_O()
~Inst_VOP3__V_CMP_LT_U32()
Inst_VOPC__V_CMP_NE_U16(InFmt_VOPC *)
~Inst_VOP3__V_CMPX_GT_F64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_F_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
std::deque< GPUDynInstPtr > instructionBuffer
~Inst_VOP3__V_CMPX_LT_U16()
void execute(GPUDynInstPtr) override
Inst_SOPP__S_CBRANCH_VCCZ(InFmt_SOPP *)
~Inst_VOP3__V_CMPX_NLT_F64()
Inst_SOP1__S_CMOV_B32(InFmt_SOP1 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_CD()
void execute(GPUDynInstPtr) override
~Inst_DS__DS_AND_RTN_B64()
Inst_VOP3__V_MUL_HI_U32_U24(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_EQ_F32(InFmt_VOP3 *)
Inst_SOPP__S_TTRACEDATA(InFmt_SOPP *)
Inst_VOP1__V_FREXP_MANT_F32(InFmt_VOP1 *)
~Inst_SOPC__S_BITCMP0_B32()
Inst_MIMG__IMAGE_GATHER4_B(InFmt_MIMG *)
~Inst_VOPC__V_CMPX_GT_I16()
void execute(GPUDynInstPtr) override
void processSDWA_dst(InFmt_VOP_SDWA sdwaInst, T &dst, T &origDst)
processSDWA_dst is a helper function for implementing sub d-word addressing instructions for the dst ...
~Inst_VOP3__V_INTERP_P1_F32()
Inst_SOP2__S_MAX_I32(InFmt_SOP2 *)
Inst_VOP3__V_CMP_LE_I32(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_U_F64(InFmt_VOP3 *)
Inst_SMEM__S_ATC_PROBE_BUFFER(InFmt_SMEM *)
Inst_SOPK__S_GETREG_B32(InFmt_SOPK *)
~Inst_MIMG__IMAGE_ATOMIC_ADD()
~Inst_VOP3__V_CMP_GE_I64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MUL_LEGACY_F32()
void completeAcc(GPUDynInstPtr) override
~Inst_SOP1__S_NAND_SAVEEXEC_B64()
Inst_VOP3__V_CMPX_LT_U64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP2__S_ADDC_U32(InFmt_SOP2 *)
Inst_MIMG__IMAGE_STORE_MIP_PCK(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_EQ_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_DS__DS_GWS_SEMA_V(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CVT_FLR_I32_F32(InFmt_VOP1 *)
Inst_MIMG__IMAGE_ATOMIC_XOR(InFmt_MIMG *)
Inst_VOP1__V_EXP_F16(InFmt_VOP1 *)
~Inst_DS__DS_MAX_RTN_F64()
Inst_DS__DS_ADD_U32(InFmt_DS *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_U_F32()
Inst_SOP1__S_FF0_I32_B32(InFmt_SOP1 *)
Inst_DS__DS_BPERMUTE_B32(InFmt_DS *)
~Inst_VOPC__V_CMP_LT_I32()
~Inst_VOP3__V_CMPX_GT_U16()
Inst_VOP3__V_CMP_GE_F32(InFmt_VOP3 *)
~Inst_SOP1__S_MOVRELS_B32()
~Inst_VOP3__V_CMPX_EQ_I32()
~Inst_VOP3__V_TRIG_PREOP_F64()
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_LT_I16()
Inst_SMEM__S_BUFFER_LOAD_DWORDX8(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_D_CL_O()
Inst_MUBUF__BUFFER_ATOMIC_SMIN(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_LZ_O()
Inst_VOP3__V_CMPX_NE_U16(InFmt_VOP3 *)
Inst_VOPC__V_CMP_EQ_I32(InFmt_VOPC *)
Inst_VOP3__V_RNDNE_F16(InFmt_VOP3 *)
Inst_VOP3__V_FMA_F16(InFmt_VOP3 *)
Inst_SOP1__S_FLBIT_I32_B32(InFmt_SOP1 *)
Inst_VOP3__V_MED3_F32(InFmt_VOP3 *)
Inst_VOP3__V_MIN3_U32(InFmt_VOP3 *)
Inst_VOP3__V_RSQ_F64(InFmt_VOP3 *)
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_LOG_F16(InFmt_VOP3 *)
Inst_MIMG__IMAGE_GATHER4_L(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CVT_RPI_I32_F32()
Inst_VOP3__V_MUL_LEGACY_F32(InFmt_VOP3 *)
void completeAcc(GPUDynInstPtr) override
~Inst_DS__DS_MAX_RTN_U64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRITE_SRC2_B32(InFmt_DS *)
Inst_VOP3__V_MBCNT_HI_U32_B32(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_EQ_I32()
Inst_FLAT__FLAT_ATOMIC_SWAP(InFmt_FLAT *)
Inst_VOP3__V_CMPX_GT_F32(InFmt_VOP3 *)
Inst_VOP1__V_CVT_I32_F64(InFmt_VOP1 *)
Inst_VOP1__V_FLOOR_F32(InFmt_VOP1 *)
Inst_VOP3__V_FMA_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_STORE_DWORDX3()
Inst_VOP3__V_CVT_F32_UBYTE1(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_ATOMIC_CMPSWAP(InFmt_MUBUF *)
~Inst_FLAT__FLAT_ATOMIC_OR()
~Inst_VOP3__V_CMP_GT_F32()
void execute(GPUDynInstPtr) override
Inst_DS__DS_CONSUME(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_SMIN_X2(InFmt_FLAT *)
~Inst_VOPC__V_CMPX_T_U32()
Inst_VOPC__V_CMPX_LT_F32(InFmt_VOPC *)
Inst_SOP1__S_CBRANCH_JOIN(InFmt_SOP1 *)
Inst_VOP3__V_FFBH_U32(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_NGE_F32(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_EQ_I64()
int findLsbSet(uint64_t val)
Returns the bit position of the LSB that is set in the input.
~Inst_DS__DS_SUB_SRC2_U64()
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_CBRANCH_VCCNZ()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FREXP_MANT_F16()
void execute(GPUDynInstPtr) override
~Inst_SOPC__S_BITCMP1_B64()
~Inst_VOP3__V_CVT_PK_I16_I32()
~Inst_VOP2__V_ASHRREV_I16()
Inst_SOP2__S_LSHL_B64(InFmt_SOP2 *)
Inst_MIMG__IMAGE_SAMPLE_B_CL_O(InFmt_MIMG *)
void completeAcc(GPUDynInstPtr) override
void calcAddr(GPUDynInstPtr gpuDynInst, ConstVecOperandU32 &addr)
~Inst_DS__DS_MIN_RTN_I32()
Inst_VOP3__V_CVT_PK_U8_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NE_U16()
Inst_SOP2__S_OR_B64(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_NE_I64(InFmt_VOPC *)
Inst_VOP1__V_FFBH_I32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GE_U64(InFmt_VOP3 *)
Inst_SOP2__S_ORN2_B64(InFmt_SOP2 *)
~Inst_MUBUF__BUFFER_ATOMIC_UMAX_X2()
~Inst_VOP3__V_CMP_NGE_F64()
Inst_VOPC__V_CMPX_F_F16(InFmt_VOPC *)
~Inst_VOP3__V_MBCNT_HI_U32_B32()
~Inst_VOP2__V_MUL_I32_I24()
void execute(GPUDynInstPtr) override
Inst_SOPP__S_ENDPGM(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_LOAD_DWORDX2(InFmt_FLAT *)
~Inst_VOP3__V_CVT_OFF_F32_I4()
~Inst_SMEM__S_LOAD_DWORD()
~Inst_VOP3__V_ASHRREV_I16()
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LT_F64()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FRACT_F32()
Inst_MIMG__IMAGE_LOAD_PCK(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_MAX_SRC2_F64(InFmt_DS *)
~Inst_VOP3__V_CVT_F32_U32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NGE_F64(InFmt_VOP3 *)
~Inst_DS__DS_OR_RTN_B32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_T_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_F_I64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_SAMPLE_C_D_O()
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_STORE_DWORDX4(InFmt_MUBUF *)
Inst_VOP3__V_CMPX_NLT_F32(InFmt_VOP3 *)
Inst_SMEM__S_STORE_DWORDX4(InFmt_SMEM *)
~Inst_MIMG__IMAGE_ATOMIC_SUB()
void freeRegisters(Wavefront *w)
Inst_MIMG__IMAGE_ATOMIC_ADD(InFmt_MIMG *)
Inst_DS__DS_WRITE_B64(InFmt_DS *)
Inst_VOP3__V_CVT_F32_UBYTE3(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_F_U16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_EQ_U64()
Inst_DS__DS_MIN_SRC2_U32(InFmt_DS *)
~Inst_VOPC__V_CMPX_NE_U32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void read() override
read from the vrf.
Inst_DS__DS_GWS_BARRIER(InFmt_DS *)
Inst_VOP3__V_TRUNC_F32(InFmt_VOP3 *)
~Inst_SOPP__S_CBRANCH_VCCZ()
void initiateAcc(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LG_F32(InFmt_VOP3 *)
Inst_VOP3__V_CMPX_U_F32(InFmt_VOP3 *)
Inst_SOPK__S_CMPK_LT_U32(InFmt_SOPK *)
Inst_SMEM__S_MEMREALTIME(InFmt_SMEM *)
~Inst_SMEM__S_BUFFER_STORE_DWORDX4()
Inst_DS__DS_MAX_RTN_F32(InFmt_DS *)
Inst_DS__DS_WRITE_SRC2_B64(InFmt_DS *)
Inst_VOPC__V_CMP_EQ_I16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_MUBUF__BUFFER_LOAD_USHORT()
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_SOP2__S_MUL_I32(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_RNDNE_F16()
~Inst_VOP3__V_CMPX_GE_I32()
~Inst_VOP3__V_MOV_FED_B32()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
Inst_VOP3__V_CMP_F_F16(InFmt_VOP3 *)
~Inst_VOP2__V_LSHRREV_B16()
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_DS__DS_RSUB_U64(InFmt_DS *)
~Inst_DS__DS_WRITE_SRC2_B32()
Inst_VOP3__V_CMPX_GE_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MQSAD_PK_U16_U8(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_LG_F32()
~Inst_SMEM__S_BUFFER_LOAD_DWORDX2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP2__S_XNOR_B64(InFmt_SOP2 *)
Inst_VOP3__V_CMPX_GT_U16(InFmt_VOP3 *)
#define NAN
Define Not a number.
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_GE_F16()
Inst_VOP3__V_CVT_U32_F64(InFmt_VOP3 *)
Inst_VOP1__V_CVT_RPI_I32_F32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_LE_F64(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MQSAD_U32_U8()
~Inst_MUBUF__BUFFER_ATOMIC_SUB_X2()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_LE_I64(InFmt_VOPC *)
Inst_VOP3__V_SUB_F16(InFmt_VOP3 *)
Inst_DS__DS_INC_SRC2_U32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_EQ_U64(InFmt_VOPC *)
Inst_VOP3__V_CVT_PKNORM_I16_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_GATHER4_C_LZ()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_NOP(InFmt_VOP1 *)
Inst_VOP3__V_CMP_NGE_F32(InFmt_VOP3 *)
Inst_VOP3__V_CVT_F32_UBYTE2(InFmt_VOP3 *)
~Inst_MIMG__IMAGE_SAMPLE_C()
~Inst_SOPK__S_CMPK_EQ_U32()
~Inst_VOPC__V_CMP_CLASS_F32()
Inst_VOP3__V_CMP_EQ_I16(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_LE_F16(InFmt_VOPC *)
~Inst_VOP1__V_CVT_F32_F16()
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_B(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_SMAX_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_LOAD_SBYTE(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_F_I16(InFmt_VOP3 *)
void calcAddr(GPUDynInstPtr gpuDynInst, ConstVecOperandU64 &addr)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SMEM__S_MEMTIME(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
~Inst_DS__DS_INC_SRC2_U64()
Inst_MIMG__IMAGE_GATHER4_CL(InFmt_MIMG *)
void initiateAcc(GPUDynInstPtr) override
Inst_SOPP__S_TRAP(InFmt_SOPP *)
Inst_VOP3__V_SUB_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_SMEM__S_STORE_DWORDX4()
Inst_SMEM__S_ATC_PROBE(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NGT_F64()
~Inst_VOPC__V_CMP_T_I32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_RCP_F32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_EQ_U64(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LE_F64()
~Inst_VOP3__V_FLOOR_F64()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LT_U16()
Inst_SOPP__S_CBRANCH_EXECNZ(InFmt_SOPP *)
Inst_MIMG__IMAGE_SAMPLE_C_D(InFmt_MIMG *)
Inst_VOPC__V_CMP_LT_I16(InFmt_VOPC *)
Inst_VOP3__V_CVT_F16_F32(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_NGT_F16()
void execute(GPUDynInstPtr) override
~Inst_MIMG__IMAGE_ATOMIC_DEC()
Inst_DS__DS_AND_SRC2_B64(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_INTERP_P2_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_F_I32(InFmt_VOPC *)
Inst_SMEM__S_DCACHE_WB(InFmt_SMEM *)
~Inst_VOPC__V_CMPX_LE_I32()
~Inst_SOPK__S_CMPK_LG_I32()
~Inst_DS__DS_WRITE_SRC2_B64()
~Inst_VOPC__V_CMPX_LE_F16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_GT_F32(InFmt_VOP3 *)
Inst_VOP3__V_MSAD_U8(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_MAX_SRC2_I32()
Inst_SMEM__S_BUFFER_LOAD_DWORD(InFmt_SMEM *)
~Inst_VOP3__V_CMPX_GE_F64()
void completeAcc(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_CD(InFmt_MIMG *)
~Inst_VOP3__V_CMPX_NGE_F32()
~Inst_VOP3__V_CMPX_GT_F32()
Inst_DS__DS_XOR_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_RPI_I32_F32(InFmt_VOP3 *)
~Inst_SOP2__S_CBRANCH_G_FORK()
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_NE_U32()
Inst_VOP3__V_CMPX_GE_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_RNDNE_F32()
~Inst_VOP3__V_CMPX_TRU_F32()
~Inst_VOP3__V_CMP_TRU_F16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CVT_F32_UBYTE0(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOP2__V_SUB_F16(InFmt_VOP2 *)
void completeAcc(GPUDynInstPtr) override
Inst_VOP3__V_TRUNC_F64(InFmt_VOP3 *)
Inst_VOP3__V_SAD_HI_U8(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP2__V_LSHRREV_B32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_FREXP_MANT_F64()
~Inst_SOPC__S_CMP_GE_U32()
~Inst_DS__DS_MAX_SRC2_U64()
~Inst_MIMG__IMAGE_SAMPLE_C_B()
Inst_VOPC__V_CMP_EQ_I64(InFmt_VOPC *)
~Inst_VOPC__V_CMP_F_U16()
Inst_VOP3__V_CMP_GT_I32(InFmt_VOP3 *)
~Inst_DS__DS_CMPST_RTN_F64()
void execute(GPUDynInstPtr) override
Inst_DS__DS_WRITE_B8(InFmt_DS *)
Inst_VOPC__V_CMP_LE_U32(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_T_I32()
~Inst_SOP1__S_FLBIT_I32_I64()
Inst_VOP3__V_SAD_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_SOPK__S_CMPK_GT_U32()
Inst_VOP3__V_CMP_LT_F16(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_NLT_F16()
~Inst_VOP3__V_LOG_LEGACY_F32()
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_STORE_DWORDX2(InFmt_FLAT *)
~Inst_VOPC__V_CMP_GT_I64()
~Inst_VOP3__V_CMP_CLASS_F32()
~Inst_VOP2__V_MUL_U32_U24()
Inst_VOP3__V_COS_F16(InFmt_VOP3 *)
~Inst_MIMG__IMAGE_SAMPLE_L()
~Inst_VOP1__V_CVT_I16_F16()
void execute(GPUDynInstPtr) override
Inst_DS__DS_CMPST_B64(InFmt_DS *)
~Inst_SOPC__S_CMP_LT_I32()
~Inst_FLAT__FLAT_ATOMIC_UMAX()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_U_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_MUL_HI_I32_I24()
Inst_VOP3__V_BFE_I32(InFmt_VOP3 *)
~Inst_SOPC__S_CMP_LG_U32()
Inst_VOPC__V_CMPX_LT_I32(InFmt_VOPC *)
Inst_VOP3__V_CMP_GE_U32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_SOPP__S_SET_GPR_IDX_OFF()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_NLE_F32()
Inst_VOP3__V_MAC_F16(InFmt_VOP3 *)
~Inst_SOP1__S_GETPC_B64()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_GT_U32(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_T_U64()
Inst_SOPK__S_CMPK_LT_I32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_F_F16(InFmt_VOPC *)
Inst_SOPP__S_CBRANCH_SCC0(InFmt_SOPP *)
~Inst_VOP3__V_CMP_LT_U64()
Inst_VOPC__V_CMPX_NE_U32(InFmt_VOPC *)
Inst_VOP1__V_SQRT_F64(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_DS__DS_RSUB_SRC2_U32()
Inst_VOPC__V_CMP_NE_I16(InFmt_VOPC *)
~Inst_MUBUF__BUFFER_ATOMIC_OR_X2()
Inst_VOPC__V_CMP_F_U64(InFmt_VOPC *)
Inst_DS__DS_INC_RTN_U64(InFmt_DS *)
~Inst_DS__DS_ADD_SRC2_U64()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP1__V_RSQ_F16(InFmt_VOP1 *)
~Inst_DS__DS_READ2ST64_B64()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_CVT_F32_UBYTE0()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_DIV_SCALE_F32(InFmt_VOP3_SDST_ENC *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_SOPP__S_TTRACEDATA()
~Inst_MUBUF__BUFFER_ATOMIC_INC_X2()
void completeAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LE_U32()
void initiateAcc(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_FLOOR_F32()
void execute(GPUDynInstPtr) override
~Inst_DS__DS_GWS_BARRIER()
Inst_VOP2__V_MUL_LO_U16(InFmt_VOP2 *)
~Inst_DS__DS_MAX_RTN_I32()
~Inst_VOP3__V_CMP_LE_F16()
Inst_VOP3__V_MAD_F32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GT_F16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_SOP2__S_SUB_U32(InFmt_SOP2 *)
Inst_VOP3__V_CMP_GT_U64(InFmt_VOP3 *)
static const int InvalidID
Inst_SOP2__S_SUBB_U32(InFmt_SOP2 *)
#define ULL(N)
uint64_t constant
Inst_MIMG__IMAGE_SAMPLE_LZ_O(InFmt_MIMG *)
~Inst_VOPC__V_CMP_TRU_F32()
Inst_SMEM__S_DCACHE_WB_VOL(InFmt_SMEM *)
Inst_VOPC__V_CMPX_TRU_F16(InFmt_VOPC *)
Inst_VOP2__V_MADAK_F32(InFmt_VOP2 *)
void execute(GPUDynInstPtr) override
Inst_MUBUF__BUFFER_ATOMIC_SUB(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
~Inst_FLAT__FLAT_ATOMIC_UMAX_X2()
Inst_MUBUF__BUFFER_LOAD_USHORT(InFmt_MUBUF *)
~Inst_VOPC__V_CMPX_NLE_F32()
~Inst_MIMG__IMAGE_SAMPLE_B_CL()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_NLE_F16(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_GE_F16(InFmt_VOPC *)
Inst_VOP1__V_MOV_B32(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_LDEXP_F32()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MAD_F16(InFmt_VOP3 *)
~Inst_VOP3__V_CMP_LT_F64()
void completeAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NLG_F16()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_F_I32(InFmt_VOP3 *)
~Inst_SOPP__S_CBRANCH_SCC1()
~Inst_VOP1__V_CVT_U32_F32()
~Inst_VOP3__V_CMPX_EQ_U32()
~Inst_SOP1__S_BITSET1_B64()
Inst_VOPC__V_CMPX_NE_I16(InFmt_VOPC *)
Inst_VOPC__V_CMPX_NEQ_F32(InFmt_VOPC *)
Inst_DS__DS_PERMUTE_B32(InFmt_DS *)
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_ALIGNBYTE_B32()
~Inst_VOP3__V_CMP_EQ_U32()
~Inst_MUBUF__BUFFER_ATOMIC_ADD()
~Inst_VOPC__V_CMP_EQ_U64()
void processDPP(GPUDynInstPtr gpuDynInst, InFmt_VOP_DPP dppInst, T &src0)
processDPP is a helper function for implementing Data Parallel Primitive instructions.
Inst_DS__DS_MAX_F64(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CVT_OFF_F32_I4(InFmt_VOP1 *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMPX_LT_I64()
~Inst_VOPC__V_CMPX_TRU_F32()
Inst_DS__DS_WRITE2_B32(InFmt_DS *)
void execute(GPUDynInstPtr) override
void initiateAcc(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_NGT_F16()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_CLASS_F64(InFmt_VOP3 *)
Inst_VOP3__V_MAC_F32(InFmt_VOP3 *)
~Inst_SOPK__S_SETREG_B32()
Inst_MIMG__IMAGE_SAMPLE_C_D_O(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMPX_NLG_F64(InFmt_VOP3 *)
~Inst_MIMG__IMAGE_ATOMIC_INC()
~Inst_DS__DS_XOR_SRC2_B64()
Inst_FLAT__FLAT_ATOMIC_XOR(InFmt_FLAT *)
~Inst_SOP1__S_FLBIT_I32_B32()
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CVT_F32_UBYTE1()
void execute(GPUDynInstPtr) override
Inst_SOPK__S_MULK_I32(InFmt_SOPK *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_EQ_F64(InFmt_VOP3 *)
Inst_MUBUF__BUFFER_ATOMIC_ADD_X2(InFmt_MUBUF *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOP1__S_MOVRELS_B64(InFmt_SOP1 *)
Inst_VOPC__V_CMP_GT_I16(InFmt_VOPC *)
~Inst_MIMG__IMAGE_GATHER4_C()
~Inst_SMEM__S_BUFFER_LOAD_DWORDX16()
~Inst_MIMG__IMAGE_ATOMIC_UMIN()
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMPX_NLT_F32(InFmt_VOPC *)
~Inst_VOPC__V_CMP_GE_I16()
~Inst_VOPC__V_CMPX_CLASS_F32()
void execute(GPUDynInstPtr) override
void write() override
write to the vrf.
~Inst_VOPC__V_CMPX_EQ_F32()
Inst_VOP3__V_CMP_F_U32(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_NLG_F64()
Inst_SMEM__S_BUFFER_LOAD_DWORDX4(InFmt_SMEM *)
void execute(GPUDynInstPtr) override
Inst_MIMG__IMAGE_LOAD_MIP_PCK(InFmt_MIMG *)
Inst_VOP2__V_ASHRREV_I16(InFmt_VOP2 *)
Inst_MIMG__IMAGE_LOAD_MIP(InFmt_MIMG *)
~Inst_VOP3__V_CMPX_GE_F16()
void execute(GPUDynInstPtr) override
~Inst_VOP1__V_CVT_F32_I32()
Inst_DS__DS_SWIZZLE_B32(InFmt_DS *)
Inst_MIMG__IMAGE_LOAD_MIP_PCK_SGN(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_EQ_F16()
~Inst_MIMG__IMAGE_SAMPLE_CL()
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_LT_I32(InFmt_VOP3 *)
Inst_VOP3__V_CVT_PK_I16_I32(InFmt_VOP3 *)
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMPX_F_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOP3__V_CMP_EQ_F16(InFmt_VOP3 *)
Inst_VOP2__V_AND_B32(InFmt_VOP2 *)
Inst_SOP2__S_ASHR_I32(InFmt_SOP2 *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_SOPC__S_CMP_EQ_U32(InFmt_SOPC *)
Inst_VOPC__V_CMPX_EQ_I64(InFmt_VOPC *)
Inst_MIMG__IMAGE_SAMPLE_D(InFmt_MIMG *)
void execute(GPUDynInstPtr) override
void completeAcc(GPUDynInstPtr) override
Inst_MIMG__IMAGE_SAMPLE_C_L(InFmt_MIMG *)
Inst_DS__DS_MAX_F32(InFmt_DS *)
void execute(GPUDynInstPtr) override
Inst_VOP1__V_CVT_F32_UBYTE3(InFmt_VOP1 *)
Inst_VOP2__V_ADD_U16(InFmt_VOP2 *)
Inst_SOPP__S_SETKILL(InFmt_SOPP *)
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_LG_F32()
void execute(GPUDynInstPtr) override
void execute(GPUDynInstPtr) override
Inst_VOPC__V_CMP_GT_U16(InFmt_VOPC *)
void execute(GPUDynInstPtr) override
Inst_VOP3__V_MUL_HI_I32_I24(InFmt_VOP3 *)
~Inst_VOPC__V_CMPX_LT_U32()
Inst_DS__DS_WRXCHG2_RTN_B32(InFmt_DS *)
Inst_VOPC__V_CMP_GE_F32(InFmt_VOPC *)
~Inst_VOP3__V_FREXP_MANT_F32()
Inst_VOPC__V_CMPX_EQ_F64(InFmt_VOPC *)
Inst_VOP3__V_FFBH_I32(InFmt_VOP3 *)
Inst_VOPC__V_CMPX_T_I32(InFmt_VOPC *)
T bits(T val, int first, int last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
~Inst_MIMG__IMAGE_SAMPLE_D_CL_O()
~Inst_VOP3__V_FRACT_F32()
Inst_VOPC__V_CMPX_LE_U16(InFmt_VOPC *)
~Inst_DS__DS_CMPST_RTN_B64()
~Inst_DS__DS_ADD_SRC2_F32()
Inst_VOP3__V_CMPX_EQ_F16(InFmt_VOP3 *)
~Inst_VOPC__V_CMP_GE_F64()
void execute(GPUDynInstPtr) override
~Inst_VOPC__V_CMP_GT_U16()
void execute(GPUDynInstPtr) override
Inst_FLAT__FLAT_ATOMIC_OR(InFmt_FLAT *)
void execute(GPUDynInstPtr) override
~Inst_VOP3__V_CMP_O_F64()
~Inst_SOPK__S_CMPK_GT_I32()
Generated on Thu Mar 18 2021 12:09:11 for gem5 by doxygen 1.8.17