45 #include "arch/arm/generated/decoder.hh" 54 MacroMemOp::MacroMemOp(
const char *mnem,
ExtMachInst machInst,
57 bool load, uint32_t reglist) :
60 uint32_t regs = reglist;
62 uint32_t mem_ops = ones;
66 bool copy_base = (
bits(reglist, rn) && load) || !ones;
67 bool force_user = user & !
bits(reglist, 15);
68 bool exception_ret = user &
bits(reglist, 15);
69 bool pc_temp = load && writeback &&
bits(reglist, 15);
75 + ((ones % 2 == 0 && exception_ret) ? 1 : 0)
88 addr = (ones << 2) - 4;
98 *uop++ =
new MicroAddiUop(machInst,
INTREG_UREG0, rn, 0);
101 while (mem_ops != 0) {
103 if (load && mem_ops >= 2 &&
111 while (!
bits(regs, reg)) reg++;
116 while (!
bits(regs, reg)) reg++;
125 *uop =
new MicroLdr2Uop(machInst, reg_idx1, reg_idx2,
128 if (!writeback && reg_idx2 ==
INTREG_PC) {
130 (*uop)->setFlag(StaticInst::IsControl);
131 (*uop)->setFlag(StaticInst::IsIndirectControl);
134 (*uop)->setFlag(StaticInst::IsCondControl);
136 (*uop)->setFlag(StaticInst::IsUncondControl);
146 while (!
bits(regs, reg)) reg++;
157 }
else if (reg_idx ==
INTREG_PC && exception_ret) {
159 *uop =
new MicroLdrRetUop(machInst, reg_idx,
163 *uop =
new MicroLdrUop(machInst, reg_idx,
168 if (!writeback && reg_idx ==
INTREG_PC) {
169 (*uop)->setFlag(StaticInst::IsControl);
170 (*uop)->setFlag(StaticInst::IsIndirectControl);
173 (*uop)->setFlag(StaticInst::IsCondControl);
175 (*uop)->setFlag(StaticInst::IsUncondControl);
178 *uop =
new MicroStrUop(machInst, reg_idx, rn, up, addr);
190 if (writeback && ones) {
193 *uop++ =
new MicroAddiUop(machInst, rn, rn, ones * 4);
195 *uop++ =
new MicroSubiUop(machInst, rn, rn, ones * 4);
200 *uop =
new MicroUopRegMovRet(machInst, 0,
INTREG_UREG1);
204 (*uop)->setFlag(StaticInst::IsControl);
205 (*uop)->setFlag(StaticInst::IsIndirectControl);
208 (*uop)->setFlag(StaticInst::IsCondControl);
210 (*uop)->setFlag(StaticInst::IsUncondControl);
213 (*uop)->setFlag(StaticInst::IsReturn);
221 microOps[0]->setFirstMicroop();
224 if ((*uop)->isControl())
225 setFlag(StaticInst::IsControl);
226 if ((*uop)->isCondCtrl())
227 setFlag(StaticInst::IsCondControl);
228 if ((*uop)->isUncondCtrl())
229 setFlag(StaticInst::IsUncondControl);
230 if ((*uop)->isIndirectCtrl())
231 setFlag(StaticInst::IsIndirectControl);
232 if ((*uop)->isReturn())
236 (*uop)->setDelayedCommit();
241 uint32_t size,
bool fp,
bool load,
bool noAlloc,
242 bool signExt,
bool exclusive,
bool acrel,
252 numMicroops = (post ? 0 : 1) + ((size + 4) / 8) + (writeback ? 1 : 0);
254 numMicroops = (post ? 0 : 1) + (size / 4) + (writeback ? 1 : 0);
263 *uop++ =
new MicroAddXiSpAlignUop(machInst,
INTREG_UREG0, rn,
270 *uop++ =
new MicroLdFp16Uop(machInst, rt,
271 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
272 *uop++ =
new MicroLdFp16Uop(machInst, rt2,
273 post ? rn : INTREG_UREG0, 16, noAlloc, exclusive, acrel);
275 *uop++ =
new MicroStrQBFpXImmUop(machInst, rt,
276 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
277 *uop++ =
new MicroStrQTFpXImmUop(machInst, rt,
278 post ? rn : INTREG_UREG0, 0, noAlloc, exclusive, acrel);
279 *uop++ =
new MicroStrQBFpXImmUop(machInst, rt2,
280 post ? rn : INTREG_UREG0, 16, noAlloc, exclusive, acrel);
281 *uop++ =
new MicroStrQTFpXImmUop(machInst, rt2,
282 post ? rn : INTREG_UREG0, 16, noAlloc, exclusive, acrel);
284 }
else if (size == 8) {
286 *uop++ =
new MicroLdPairFp8Uop(machInst, rt, rt2,
287 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
289 *uop++ =
new MicroStrFpXImmUop(machInst, rt,
290 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
291 *uop++ =
new MicroStrFpXImmUop(machInst, rt2,
292 post ? rn : INTREG_UREG0, 8, noAlloc, exclusive, acrel);
294 }
else if (size == 4) {
296 *uop++ =
new MicroLdrDFpXImmUop(machInst, rt, rt2,
297 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
299 *uop++ =
new MicroStrDFpXImmUop(machInst, rt, rt2,
300 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
306 *uop++ =
new MicroLdPairUop(machInst, rt, rt2,
307 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
309 *uop++ =
new MicroStrXImmUop(machInst, rt, post ? rn :
INTREG_UREG0,
310 0, noAlloc, exclusive, acrel);
311 *uop++ =
new MicroStrXImmUop(machInst, rt2, post ? rn : INTREG_UREG0,
312 size, noAlloc, exclusive, acrel);
314 }
else if (size == 4) {
317 *uop++ =
new MicroLdrDSXImmUop(machInst, rt, rt2,
318 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
320 *uop++ =
new MicroLdrDUXImmUop(machInst, rt, rt2,
321 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
324 *uop++ =
new MicroStrDXImmUop(machInst, rt, rt2,
325 post ? rn :
INTREG_UREG0, 0, noAlloc, exclusive, acrel);
331 *uop++ =
new MicroAddXiUop(machInst, rn, post ? rn :
INTREG_UREG0,
341 (*curUop)->setDelayedCommit();
356 *uop =
new MicroLdFp16Uop(machInst, dest, base, imm);
358 *uop =
new MicroStrQBFpXImmUop(machInst, dest, base, imm);
359 (*uop)->setDelayedCommit();
360 *++uop =
new MicroStrQTFpXImmUop(machInst, dest, base, imm);
362 (*uop)->setLastMicroop();
377 *uop++ =
new MicroLdFp16Uop(machInst, dest, base, 0);
379 *uop++=
new MicroStrQBFpXImmUop(machInst, dest, base, 0);
380 *uop++ =
new MicroStrQTFpXImmUop(machInst, dest, base, 0);
382 *uop =
new MicroAddXiUop(machInst, base, base, imm);
383 (*uop)->setLastMicroop();
388 (*curUop)->setDelayedCommit();
403 *uop++ =
new MicroLdFp16Uop(machInst, dest, base, imm);
405 *uop++ =
new MicroStrQBFpXImmUop(machInst, dest, base, imm);
406 *uop++ =
new MicroStrQTFpXImmUop(machInst, dest, base, imm);
408 *uop =
new MicroAddXiUop(machInst, base, base, imm);
409 (*uop)->setLastMicroop();
414 (*curUop)->setDelayedCommit();
430 *uop =
new MicroLdFp16RegUop(machInst, dest, base,
433 *uop =
new MicroStrQBFpXRegUop(machInst, dest, base,
435 (*uop)->setDelayedCommit();
436 *++uop =
new MicroStrQTFpXRegUop(machInst, dest, base,
440 (*uop)->setLastMicroop();
452 microOps[0] =
new MicroLdFp16LitUop(machInst, dest, imm);
462 assert(regs > 0 && regs <= 4);
463 assert(regs % elems == 0);
466 bool wb = (rm != 15);
467 bool deinterleave = (elems > 1);
475 uint32_t noAlign = 0;
480 microOps[uopIdx++] = newNeonMemInst<MicroLdrNeon16Uop>(
482 microOps[uopIdx++] = newNeonMemInst<MicroLdrNeon16Uop>(
486 microOps[uopIdx++] = newNeonMemInst<MicroLdrNeon16Uop>(
488 microOps[uopIdx++] = newNeonMemInst<MicroLdrNeon8Uop>(
492 microOps[uopIdx++] = newNeonMemInst<MicroLdrNeon16Uop>(
496 microOps[uopIdx++] = newNeonMemInst<MicroLdrNeon8Uop>(
501 microOps[uopIdx++] =
new Unknown(machInst);
504 if (rm != 15 && rm != 13) {
506 new MicroAddUop(machInst, rn, rn, rm, 0,
ArmISA::LSL);
509 new MicroAddiUop(machInst, rn, rn, regs * 8);
516 microOps[uopIdx++] = newNeonMixInst<MicroDeintNeon8Uop>(
517 size,
machInst, vd * 2, rMid, inc * 2);
521 microOps[uopIdx++] = newNeonMixInst<MicroDeintNeon6Uop>(
522 size,
machInst, vd * 2, rMid, inc * 2);
525 assert(regs == 4 || regs == 2);
527 microOps[uopIdx++] = newNeonMixInst<MicroDeintNeon4Uop>(
528 size,
machInst, vd * 2, rMid, inc * 2);
529 microOps[uopIdx++] = newNeonMixInst<MicroDeintNeon4Uop>(
530 size,
machInst, vd * 2 + 2, rMid + 4, inc * 2);
532 microOps[uopIdx++] = newNeonMixInst<MicroDeintNeon4Uop>(
533 size,
machInst, vd * 2, rMid, inc * 2);
553 OpClass __opClass,
bool all,
unsigned elems,
555 unsigned inc, uint32_t size, uint32_t
align,
559 assert(regs > 0 && regs <= 4);
560 assert(regs % elems == 0);
562 unsigned eBytes = (1 << size);
563 unsigned loadSize = eBytes * elems;
564 unsigned loadRegs M5_VAR_USED =
565 (loadSize +
sizeof(uint32_t) - 1) /
sizeof(uint32_t);
567 assert(loadRegs > 0 && loadRegs <= 4);
570 bool wb = (rm != 15);
581 microOps[uopIdx++] =
new MicroLdrNeon1Uop<uint8_t>(
586 microOps[uopIdx++] =
new MicroLdrNeon2Uop<uint16_t>(
589 microOps[uopIdx++] =
new MicroLdrNeon2Uop<uint8_t>(
594 microOps[uopIdx++] =
new MicroLdrNeon3Uop<uint8_t>(
600 microOps[uopIdx++] =
new MicroLdrNeon4Uop<uint8_t>(
604 microOps[uopIdx++] =
new MicroLdrNeon4Uop<uint16_t>(
608 microOps[uopIdx++] =
new MicroLdrNeon4Uop<uint32_t>(
614 microOps[uopIdx++] =
new MicroLdrNeon6Uop<uint16_t>(
620 microOps[uopIdx++] =
new MicroLdrNeon8Uop<uint16_t>(
624 microOps[uopIdx++] =
new MicroLdrNeon8Uop<uint32_t>(
630 microOps[uopIdx++] =
new MicroLdrNeon12Uop<uint32_t>(
634 microOps[uopIdx++] =
new MicroLdrNeon16Uop<uint32_t>(
642 if (rm != 15 && rm != 13) {
644 new MicroAddUop(machInst, rn, rn, rm, 0,
ArmISA::LSL);
647 new MicroAddiUop(machInst, rn, rn, loadSize);
656 microOps[uopIdx++] =
new MicroUnpackAllNeon2to8Uop<uint8_t>(
659 microOps[uopIdx++] =
new MicroUnpackNeon2to8Uop<uint8_t>(
660 machInst, vd * 2, ufp0, inc * 2, lane);
665 microOps[uopIdx++] =
new MicroUnpackAllNeon2to8Uop<uint16_t>(
668 microOps[uopIdx++] =
new MicroUnpackNeon2to8Uop<uint16_t>(
669 machInst, vd * 2, ufp0, inc * 2, lane);
674 microOps[uopIdx++] =
new MicroUnpackAllNeon4to8Uop<uint32_t>(
677 microOps[uopIdx++] =
new MicroUnpackNeon4to8Uop<uint32_t>(
678 machInst, vd * 2, ufp0, inc * 2, lane);
692 microOps[uopIdx++] =
new MicroUnpackAllNeon2to6Uop<uint8_t>(
695 microOps[uopIdx++] =
new MicroUnpackNeon2to6Uop<uint8_t>(
696 machInst, vd * 2, ufp0, inc * 2, lane);
701 microOps[uopIdx++] =
new MicroUnpackAllNeon2to6Uop<uint16_t>(
704 microOps[uopIdx++] =
new MicroUnpackNeon2to6Uop<uint16_t>(
705 machInst, vd * 2, ufp0, inc * 2, lane);
710 microOps[uopIdx++] =
new MicroUnpackAllNeon4to6Uop<uint32_t>(
713 microOps[uopIdx++] =
new MicroUnpackNeon4to6Uop<uint32_t>(
714 machInst, vd * 2, ufp0, inc * 2, lane);
725 assert(loadRegs <= 2);
729 microOps[uopIdx++] =
new MicroUnpackAllNeon2to4Uop<uint8_t>(
732 microOps[uopIdx++] =
new MicroUnpackNeon2to4Uop<uint8_t>(
733 machInst, vd * 2, ufp0, inc * 2, lane);
738 microOps[uopIdx++] =
new MicroUnpackAllNeon2to4Uop<uint16_t>(
741 microOps[uopIdx++] =
new MicroUnpackNeon2to4Uop<uint16_t>(
742 machInst, vd * 2, ufp0, inc * 2, lane);
747 microOps[uopIdx++] =
new MicroUnpackAllNeon2to4Uop<uint32_t>(
750 microOps[uopIdx++] =
new MicroUnpackNeon2to4Uop<uint32_t>(
751 machInst, vd * 2, ufp0, inc * 2, lane);
761 assert(regs == 1 || (all && regs == 2));
762 assert(loadRegs <= 2);
768 new MicroUnpackAllNeon2to2Uop<uint8_t>(
772 new MicroUnpackNeon2to2Uop<uint8_t>(
779 new MicroUnpackAllNeon2to2Uop<uint16_t>(
783 new MicroUnpackNeon2to2Uop<uint16_t>(
790 new MicroUnpackAllNeon2to2Uop<uint32_t>(
794 new MicroUnpackNeon2to2Uop<uint32_t>(
825 assert(regs > 0 && regs <= 4);
826 assert(regs % elems == 0);
829 bool wb = (rm != 15);
830 bool interleave = (elems > 1);
836 uint32_t noAlign = 0;
845 microOps[uopIdx++] = newNeonMixInst<MicroInterNeon8Uop>(
846 size,
machInst, rMid, vd * 2, inc * 2);
850 microOps[uopIdx++] = newNeonMixInst<MicroInterNeon6Uop>(
851 size,
machInst, rMid, vd * 2, inc * 2);
854 assert(regs == 4 || regs == 2);
856 microOps[uopIdx++] = newNeonMixInst<MicroInterNeon4Uop>(
857 size,
machInst, rMid, vd * 2, inc * 2);
858 microOps[uopIdx++] = newNeonMixInst<MicroInterNeon4Uop>(
859 size,
machInst, rMid + 4, vd * 2 + 2, inc * 2);
861 microOps[uopIdx++] = newNeonMixInst<MicroInterNeon4Uop>(
862 size,
machInst, rMid, vd * 2, inc * 2);
872 microOps[uopIdx++] = newNeonMemInst<MicroStrNeon16Uop>(
874 microOps[uopIdx++] = newNeonMemInst<MicroStrNeon16Uop>(
878 microOps[uopIdx++] = newNeonMemInst<MicroStrNeon16Uop>(
880 microOps[uopIdx++] = newNeonMemInst<MicroStrNeon8Uop>(
884 microOps[uopIdx++] = newNeonMemInst<MicroStrNeon16Uop>(
888 microOps[uopIdx++] = newNeonMemInst<MicroStrNeon8Uop>(
893 microOps[uopIdx++] =
new Unknown(machInst);
896 if (rm != 15 && rm != 13) {
898 new MicroAddUop(machInst, rn, rn, rm, 0,
ArmISA::LSL);
901 new MicroAddiUop(machInst, rn, rn, regs * 8);
916 OpClass __opClass,
bool all,
unsigned elems,
918 unsigned inc, uint32_t size, uint32_t
align,
923 assert(regs > 0 && regs <= 4);
924 assert(regs % elems == 0);
926 unsigned eBytes = (1 << size);
927 unsigned storeSize = eBytes * elems;
928 unsigned storeRegs M5_VAR_USED =
929 (storeSize +
sizeof(uint32_t) - 1) /
sizeof(uint32_t);
931 assert(storeRegs > 0 && storeRegs <= 4);
934 bool wb = (rm != 15);
948 microOps[uopIdx++] =
new MicroPackNeon8to2Uop<uint8_t>(
949 machInst, ufp0, vd * 2, inc * 2, lane);
952 microOps[uopIdx++] =
new MicroPackNeon8to2Uop<uint16_t>(
953 machInst, ufp0, vd * 2, inc * 2, lane);
956 microOps[uopIdx++] =
new MicroPackNeon8to4Uop<uint32_t>(
957 machInst, ufp0, vd * 2, inc * 2, lane);
969 microOps[uopIdx++] =
new MicroPackNeon6to2Uop<uint8_t>(
970 machInst, ufp0, vd * 2, inc * 2, lane);
973 microOps[uopIdx++] =
new MicroPackNeon6to2Uop<uint16_t>(
974 machInst, ufp0, vd * 2, inc * 2, lane);
977 microOps[uopIdx++] =
new MicroPackNeon6to4Uop<uint32_t>(
978 machInst, ufp0, vd * 2, inc * 2, lane);
988 assert(storeRegs <= 2);
991 microOps[uopIdx++] =
new MicroPackNeon4to2Uop<uint8_t>(
992 machInst, ufp0, vd * 2, inc * 2, lane);
995 microOps[uopIdx++] =
new MicroPackNeon4to2Uop<uint16_t>(
996 machInst, ufp0, vd * 2, inc * 2, lane);
999 microOps[uopIdx++] =
new MicroPackNeon4to2Uop<uint32_t>(
1000 machInst, ufp0, vd * 2, inc * 2, lane);
1009 assert(regs == 1 || (all && regs == 2));
1010 assert(storeRegs <= 2);
1014 microOps[uopIdx++] =
new MicroPackNeon2to2Uop<uint8_t>(
1018 microOps[uopIdx++] =
new MicroPackNeon2to2Uop<uint16_t>(
1022 microOps[uopIdx++] =
new MicroPackNeon2to2Uop<uint32_t>(
1036 switch (storeSize) {
1038 microOps[uopIdx++] =
new MicroStrNeon1Uop<uint8_t>(
1043 microOps[uopIdx++] =
new MicroStrNeon2Uop<uint16_t>(
1046 microOps[uopIdx++] =
new MicroStrNeon2Uop<uint8_t>(
1051 microOps[uopIdx++] =
new MicroStrNeon3Uop<uint8_t>(
1057 microOps[uopIdx++] =
new MicroStrNeon4Uop<uint8_t>(
1061 microOps[uopIdx++] =
new MicroStrNeon4Uop<uint16_t>(
1065 microOps[uopIdx++] =
new MicroStrNeon4Uop<uint32_t>(
1071 microOps[uopIdx++] =
new MicroStrNeon6Uop<uint16_t>(
1077 microOps[uopIdx++] =
new MicroStrNeon8Uop<uint16_t>(
1081 microOps[uopIdx++] =
new MicroStrNeon8Uop<uint32_t>(
1087 microOps[uopIdx++] =
new MicroStrNeon12Uop<uint32_t>(
1091 microOps[uopIdx++] =
new MicroStrNeon16Uop<uint32_t>(
1099 if (rm != 15 && rm != 13) {
1101 new MicroAddUop(machInst, rn, rn, rm, 0,
ArmISA::LSL);
1104 new MicroAddiUop(machInst, rn, rn, storeSize);
1120 RegIndex rm, uint8_t eSize, uint8_t dataSize,
1121 uint8_t numStructElems, uint8_t numRegs,
bool wb) :
1130 int totNumBytes = numRegs * dataSize / 8;
1131 assert(totNumBytes <= 64);
1135 int numMemMicroops = totNumBytes / 16;
1136 int residuum = totNumBytes % 16;
1141 int numMarshalMicroops = numRegs / 2 + (numRegs % 2 ? 1 : 0);
1145 unsigned uopIdx = 0;
1149 for (; i < numMemMicroops - 1; ++
i) {
1150 microOps[uopIdx++] =
new MicroNeonLoad64(
1151 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags,
1152 baseIsSP, 16 , eSize);
1154 microOps[uopIdx++] =
new MicroNeonLoad64(
1155 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags, baseIsSP,
1156 residuum ? residuum : 16 , eSize);
1163 microOps[uopIdx++] =
new MicroAddXERegUop(machInst, rnsp, rnsp, rm,
1166 microOps[uopIdx++] =
new MicroAddXiUop(machInst, rnsp, rnsp,
1171 for (
int i = 0; i < numMarshalMicroops; ++
i) {
1173 case 1:
microOps[uopIdx++] =
new MicroDeintNeon64_1Reg(
1174 machInst, vd + (
RegIndex) (2 * i), vx, eSize, dataSize,
1175 numStructElems, 1, i );
1177 case 2:
microOps[uopIdx++] =
new MicroDeintNeon64_2Reg(
1178 machInst, vd + (
RegIndex) (2 * i), vx, eSize, dataSize,
1179 numStructElems, 2, i );
1181 case 3:
microOps[uopIdx++] =
new MicroDeintNeon64_3Reg(
1182 machInst, vd + (
RegIndex) (2 * i), vx, eSize, dataSize,
1183 numStructElems, 3, i );
1185 case 4:
microOps[uopIdx++] =
new MicroDeintNeon64_4Reg(
1186 machInst, vd + (
RegIndex) (2 * i), vx, eSize, dataSize,
1187 numStructElems, 4, i );
1189 default:
panic(
"Invalid number of registers");
1214 int totNumBytes = numRegs * dataSize / 8;
1215 assert(totNumBytes <= 64);
1219 int numMemMicroops = totNumBytes / 16;
1220 int residuum = totNumBytes % 16;
1225 int numMarshalMicroops = totNumBytes > 32 ? 2 : 1;
1229 unsigned uopIdx = 0;
1231 for (
int i = 0;
i < numMarshalMicroops; ++
i) {
1233 case 1:
microOps[uopIdx++] =
new MicroIntNeon64_1Reg(
1234 machInst, vx + (
RegIndex) (2 *
i), vd, eSize, dataSize,
1235 numStructElems, 1,
i );
1237 case 2:
microOps[uopIdx++] =
new MicroIntNeon64_2Reg(
1238 machInst, vx + (
RegIndex) (2 *
i), vd, eSize, dataSize,
1239 numStructElems, 2,
i );
1241 case 3:
microOps[uopIdx++] =
new MicroIntNeon64_3Reg(
1242 machInst, vx + (
RegIndex) (2 *
i), vd, eSize, dataSize,
1243 numStructElems, 3,
i );
1245 case 4:
microOps[uopIdx++] =
new MicroIntNeon64_4Reg(
1246 machInst, vx + (
RegIndex) (2 *
i), vd, eSize, dataSize,
1247 numStructElems, 4,
i );
1249 default:
panic(
"Invalid number of registers");
1256 for (; i < numMemMicroops - 1; ++
i) {
1257 microOps[uopIdx++] =
new MicroNeonStore64(
1258 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags,
1259 baseIsSP, 16 , eSize);
1261 microOps[uopIdx++] =
new MicroNeonStore64(
1262 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags, baseIsSP,
1263 residuum ? residuum : 16 , eSize);
1270 microOps[uopIdx++] =
new MicroAddXERegUop(machInst, rnsp, rnsp, rm,
1273 microOps[uopIdx++] =
new MicroAddXiUop(machInst, rnsp, rnsp,
1292 eSize(0), dataSize(0), numStructElems(0), index(0),
1293 wb(false), replicate(false)
1302 int eSizeBytes = 1 <<
eSize;
1303 int totNumBytes = numStructElems * eSizeBytes;
1304 assert(totNumBytes <= 64);
1308 int numMemMicroops = totNumBytes / 16;
1309 int residuum = totNumBytes % 16;
1314 int numMarshalMicroops = numStructElems / 2 + (numStructElems % 2 ? 1 : 0);
1318 unsigned uopIdx = 0;
1323 for (; i < numMemMicroops - 1; ++
i) {
1324 microOps[uopIdx++] =
new MicroNeonLoad64(
1325 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags,
1326 baseIsSP, 16 , eSize);
1328 microOps[uopIdx++] =
new MicroNeonLoad64(
1329 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags, baseIsSP,
1330 residuum ? residuum : 16 , eSize);
1337 microOps[uopIdx++] =
new MicroAddXERegUop(machInst, rnsp, rnsp, rm,
1340 microOps[uopIdx++] =
new MicroAddXiUop(machInst, rnsp, rnsp,
1345 for (
int i = 0; i < numMarshalMicroops; ++
i) {
1346 microOps[uopIdx++] =
new MicroUnpackNeon64(
1347 machInst, vd + (
RegIndex) (2 * i), vx, eSize, dataSize,
1348 numStructElems, index, i , replicate);
1365 eSize(0), dataSize(0), numStructElems(0), index(0),
1366 wb(false), replicate(false)
1374 int eSizeBytes = 1 <<
eSize;
1375 int totNumBytes = numStructElems * eSizeBytes;
1376 assert(totNumBytes <= 64);
1380 int numMemMicroops = totNumBytes / 16;
1381 int residuum = totNumBytes % 16;
1386 int numMarshalMicroops = totNumBytes > 32 ? 2 : 1;
1390 unsigned uopIdx = 0;
1392 for (
int i = 0;
i < numMarshalMicroops; ++
i) {
1393 microOps[uopIdx++] =
new MicroPackNeon64(
1394 machInst, vx + (
RegIndex) (2 *
i), vd, eSize, dataSize,
1395 numStructElems, index,
i , replicate);
1401 for (; i < numMemMicroops - 1; ++
i) {
1402 microOps[uopIdx++] =
new MicroNeonStore64(
1403 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags,
1404 baseIsSP, 16 , eSize);
1406 microOps[uopIdx++] =
new MicroNeonStore64(
1407 machInst, vx + (
RegIndex) i, rnsp, 16 * i, memaccessFlags, baseIsSP,
1408 residuum ? residuum : 16 , eSize);
1415 microOps[uopIdx++] =
new MicroAddXERegUop(machInst, rnsp, rnsp, rm,
1418 microOps[uopIdx++] =
new MicroAddXiUop(machInst, rnsp, rnsp,
1443 numMicroops = count * (single ? 1 : 2) + (writeback ? 1 : 0);
1455 microOps[i++] =
new MicroLdrFpUop(machInst, vd++, rn,
1458 microOps[i++] =
new MicroLdrDBFpUop(machInst, vd++, rn,
1460 microOps[i++] =
new MicroLdrDTFpUop(machInst, vd++, rn, tempUp,
1461 addr + (up ? 4 : -4));
1465 microOps[i++] =
new MicroStrFpUop(machInst, vd++, rn,
1468 microOps[i++] =
new MicroStrDBFpUop(machInst, vd++, rn,
1470 microOps[i++] =
new MicroStrDTFpUop(machInst, vd++, rn, tempUp,
1471 addr + (up ? 4 : -4));
1475 addr -= (single ? 4 : 8);
1483 addr += (single ? 4 : 8);
1490 new MicroAddiUop(machInst, rn, rn, 4 * offset);
1493 new MicroSubiUop(machInst, rn, rn, 4 * offset);
1512 std::stringstream
ss;
1526 std::stringstream
ss;
1540 std::stringstream
ss;
1550 std::stringstream
ss;
1563 std::stringstream
ss;
1575 std::stringstream
ss;
1589 std::stringstream
ss;
1607 std::stringstream
ss;
#define panic(...)
This implements a cprintf based panic() function.
void ccprintf(cp::Print &print)
static IntRegIndex makeSP(IntRegIndex reg)
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
void printMnemonic(std::ostream &os, const std::string &suffix="", bool withPred=true, bool withCond64=false, ConditionCode cond64=COND_UC) const
BigFpMemPostOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, bool load, IntRegIndex dest, IntRegIndex base, int64_t imm)
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
void printExtendOperand(bool firstOperand, std::ostream &os, IntRegIndex rm, ArmExtendType type, int64_t shiftAmt) const
VldSingleOp64(const char *mnem, ExtMachInst machInst, OpClass __opClass, RegIndex rn, RegIndex vd, RegIndex rm, uint8_t eSize, uint8_t dataSize, uint8_t numStructElems, uint8_t index, bool wb, bool replicate=false)
VstSingleOp64(const char *mnem, ExtMachInst machInst, OpClass __opClass, RegIndex rn, RegIndex vd, RegIndex rm, uint8_t eSize, uint8_t dataSize, uint8_t numStructElems, uint8_t index, bool wb, bool replicate=false)
MacroVFPMemOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, IntRegIndex rn, RegIndex vd, bool single, bool up, bool writeback, bool load, uint32_t offset)
Overload hash function for BasicBlockRange type.
BigFpMemLitOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, IntRegIndex dest, int64_t imm)
BigFpMemPreOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, bool load, IntRegIndex dest, IntRegIndex base, int64_t imm)
VstMultOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, unsigned width, RegIndex rn, RegIndex vd, unsigned regs, unsigned inc, uint32_t size, uint32_t align, RegIndex rm)
VldMultOp64(const char *mnem, ExtMachInst machInst, OpClass __opClass, RegIndex rn, RegIndex vd, RegIndex rm, uint8_t eSize, uint8_t dataSize, uint8_t numStructElems, uint8_t numRegs, bool wb)
static unsigned int number_of_ones(int32_t val)
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
PairMemOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, uint32_t size, bool fp, bool load, bool noAlloc, bool signExt, bool exclusive, bool acrel, int64_t imm, AddrMode mode, IntRegIndex rn, IntRegIndex rt, IntRegIndex rt2)
Utility functions and datatypes used by AArch64 NEON memory instructions.
BigFpMemImmOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, bool load, IntRegIndex dest, IntRegIndex base, int64_t imm)
const ExtMachInst machInst
The binary machine instruction.
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
void inc(scfx_mant &mant)
void align(const scfx_rep &lhs, const scfx_rep &rhs, int &new_wp, int &len_mant, scfx_mant_ref &lhs_mant, scfx_mant_ref &rhs_mant)
void replaceBits(T &val, int first, int last, B bit_val)
A convenience function to replace bits first to last of val with bit_val in place.
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
void printIntReg(std::ostream &os, RegIndex reg_idx, uint8_t opWidth=0) const
Print a register name for disassembly given the unique dependence tag number (FP or int)...
const int NumVecV8ArchRegs
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
VldMultOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, unsigned elems, RegIndex rn, RegIndex vd, unsigned regs, unsigned inc, uint32_t size, uint32_t align, RegIndex rm)
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
VstMultOp64(const char *mnem, ExtMachInst machInst, OpClass __opClass, RegIndex rn, RegIndex vd, RegIndex rm, uint8_t eSize, uint8_t dataSize, uint8_t numStructElems, uint8_t numRegs, bool wb)
VldSingleOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, bool all, unsigned elems, RegIndex rn, RegIndex vd, unsigned regs, unsigned inc, uint32_t size, uint32_t align, RegIndex rm, unsigned lane)
VstSingleOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, bool all, unsigned elems, RegIndex rn, RegIndex vd, unsigned regs, unsigned inc, uint32_t size, uint32_t align, RegIndex rm, unsigned lane)
Base class for predicated macro-operations.
Base class for Memory microops.
TheISA::ExtMachInst ExtMachInst
Binary extended machine instruction type.
void printFloatReg(std::ostream &os, RegIndex reg_idx) const
BigFpMemRegOp(const char *mnem, ExtMachInst machInst, OpClass __opClass, bool load, IntRegIndex dest, IntRegIndex base, IntRegIndex offset, ArmExtendType type, int64_t imm)
static bool isSP(IntRegIndex reg)
T bits(T val, int first, int last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it...
T * get() const
Directly access the pointer itself without taking a reference.
std::string generateDisassembly(Addr pc, const Loader::SymbolTable *symtab) const override
Internal function to generate disassembly string.
static int intRegInMode(OperatingMode mode, int reg)
bool isLastMicroop() const