// develop/ds_8cc_source.html

/*

 * Copyright (c) 2024 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#include "arch/amdgpu/vega/insts/instructions.hh"


namespace gem5

{


namespace VegaISA

{

    // --- Inst_DS__DS_ADD_U32 class methods ---


    Inst_DS__DS_ADD_U32::Inst_DS__DS_ADD_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_u32")
    {
        // Flag the instruction as a group-segment atomic add that does not
        // return a value.
        setFlag(MemoryRef);
        setFlag(GroupSegment);
        setFlag(AtomicAdd);
        setFlag(AtomicNoReturn);
    } // Inst_DS__DS_ADD_U32

    Inst_DS__DS_ADD_U32::~Inst_DS__DS_ADD_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // MEM[ADDR] += DATA;
    void
    Inst_DS__DS_ADD_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 addend(gpuDynInst, extData.DATA0);

        ldsAddr.read();
        addend.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Copy the DATA0 value of every enabled lane into a_data.
        auto *atomicSrc =
            reinterpret_cast<VecElemU32*>(gpuDynInst->a_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            atomicSrc[lane] = addend[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_ADD_U32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initAtomicAccess<VecElemU32>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_ADD_U32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: this variant writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_SUB_U32 class methods ---


    Inst_DS__DS_SUB_U32::Inst_DS__DS_SUB_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_sub_u32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_SUB_U32

    Inst_DS__DS_SUB_U32::~Inst_DS__DS_SUB_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= DATA;
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_SUB_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_RSUB_U32 class methods ---


    Inst_DS__DS_RSUB_U32::Inst_DS__DS_RSUB_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_rsub_u32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_RSUB_U32

    Inst_DS__DS_RSUB_U32::~Inst_DS__DS_RSUB_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = DATA - MEM[ADDR];
    // RETURN_DATA = tmp.
    // Subtraction with reversed operands.
    void
    Inst_DS__DS_RSUB_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_INC_U32 class methods ---


    Inst_DS__DS_INC_U32::Inst_DS__DS_INC_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_inc_u32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_INC_U32

    Inst_DS__DS_INC_U32::~Inst_DS__DS_INC_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (tmp >= DATA) ? 0 : tmp + 1 (unsigned compare);
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_INC_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_DEC_U32 class methods ---


    Inst_DS__DS_DEC_U32::Inst_DS__DS_DEC_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_dec_u32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_DEC_U32

    Inst_DS__DS_DEC_U32::~Inst_DS__DS_DEC_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (tmp == 0 || tmp > DATA) ? DATA : tmp - 1
    // (unsigned compare); RETURN_DATA = tmp.
    void
    Inst_DS__DS_DEC_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_I32 class methods ---


    Inst_DS__DS_MIN_I32::Inst_DS__DS_MIN_I32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_i32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_MIN_I32

    Inst_DS__DS_MIN_I32::~Inst_DS__DS_MIN_I32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (DATA < tmp) ? DATA : tmp (signed compare);
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_MIN_I32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_I32 class methods ---


    Inst_DS__DS_MAX_I32::Inst_DS__DS_MAX_I32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_i32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_MAX_I32

    Inst_DS__DS_MAX_I32::~Inst_DS__DS_MAX_I32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (DATA > tmp) ? DATA : tmp (signed compare);
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_MAX_I32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_U32 class methods ---


    Inst_DS__DS_MIN_U32::Inst_DS__DS_MIN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_u32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_MIN_U32

    Inst_DS__DS_MIN_U32::~Inst_DS__DS_MIN_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (DATA < tmp) ? DATA : tmp (unsigned compare);
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_MIN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_U32 class methods ---


    Inst_DS__DS_MAX_U32::Inst_DS__DS_MAX_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_u32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_MAX_U32

    Inst_DS__DS_MAX_U32::~Inst_DS__DS_MAX_U32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (DATA > tmp) ? DATA : tmp (unsigned compare);
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_MAX_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_AND_B32 class methods ---


    Inst_DS__DS_AND_B32::Inst_DS__DS_AND_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_and_b32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_AND_B32

    Inst_DS__DS_AND_B32::~Inst_DS__DS_AND_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] &= DATA;
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_AND_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_OR_B32 class methods ---


    Inst_DS__DS_OR_B32::Inst_DS__DS_OR_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_or_b32")
    {
        // Flag the instruction as a group-segment atomic OR that does not
        // return a value.
        setFlag(MemoryRef);
        setFlag(GroupSegment);
        setFlag(AtomicOr);
        setFlag(AtomicNoReturn);
    } // Inst_DS__DS_OR_B32

    Inst_DS__DS_OR_B32::~Inst_DS__DS_OR_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // MEM[ADDR] |= DATA;
    void
    Inst_DS__DS_OR_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 orMask(gpuDynInst, extData.DATA0);

        ldsAddr.read();
        orMask.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Copy the DATA0 value of every enabled lane into a_data.
        auto *atomicSrc =
            reinterpret_cast<VecElemU32*>(gpuDynInst->a_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            atomicSrc[lane] = orMask[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_OR_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initAtomicAccess<VecElemU32>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_OR_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: this variant writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_XOR_B32 class methods ---


    Inst_DS__DS_XOR_B32::Inst_DS__DS_XOR_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_xor_b32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_XOR_B32

    Inst_DS__DS_XOR_B32::~Inst_DS__DS_XOR_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] ^= DATA;
    // RETURN_DATA = tmp.
    void
    Inst_DS__DS_XOR_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MSKOR_B32 class methods ---


    Inst_DS__DS_MSKOR_B32::Inst_DS__DS_MSKOR_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_mskor_b32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_MSKOR_B32

    Inst_DS__DS_MSKOR_B32::~Inst_DS__DS_MSKOR_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (MEM_ADDR[ADDR] & ~DATA) | DATA2;
    // RETURN_DATA = tmp.
    // Masked dword OR, D0 contains the mask and D1 contains the new value.
    void
    Inst_DS__DS_MSKOR_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_WRITE_B32 class methods ---


    Inst_DS__DS_WRITE_B32::Inst_DS__DS_WRITE_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b32")
    {
        // Flag the instruction as a memory store.
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B32

    Inst_DS__DS_WRITE_B32::~Inst_DS__DS_WRITE_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // MEM[ADDR] = DATA.
    // Write dword.
    void
    Inst_DS__DS_WRITE_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 storeVal(gpuDynInst, extData.DATA0);

        ldsAddr.read();
        storeVal.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Copy the DATA0 dword of every enabled lane into d_data.
        auto *storeBuf =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            storeBuf[lane] = storeVal[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_WRITE_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initMemWrite<VecElemU32>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_WRITE_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: a store writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_WRITE2_B32 class methods ---


    Inst_DS__DS_WRITE2_B32::Inst_DS__DS_WRITE2_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write2_b32")
    {
        // Flag the instruction as a memory store.
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE2_B32

    Inst_DS__DS_WRITE2_B32::~Inst_DS__DS_WRITE2_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // MEM[ADDR_BASE + OFFSET0 * 4] = DATA;
    // MEM[ADDR_BASE + OFFSET1 * 4] = DATA2.
    // Write 2 dwords.
    void
    Inst_DS__DS_WRITE2_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 firstVal(gpuDynInst, extData.DATA0);
        ConstVecOperandU32 secondVal(gpuDynInst, extData.DATA1);

        ldsAddr.read();
        firstVal.read();
        secondVal.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Each enabled lane stores two adjacent dwords in d_data:
        // DATA0 at index 2*lane and DATA1 at index 2*lane + 1.
        auto *storeBuf =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            storeBuf[lane * 2] = firstVal[lane];
            storeBuf[lane * 2 + 1] = secondVal[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_WRITE2_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // Both offset fields are scaled by 4 (see the description above).
        Addr firstOffset = instData.OFFSET0 * 4;
        Addr secondOffset = instData.OFFSET1 * 4;

        initDualMemWrite<VecElemU32>(gpuDynInst, firstOffset, secondOffset);
    }

    void
    Inst_DS__DS_WRITE2_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: a store writes no destination register.
    }


    // --- Inst_DS__DS_WRITE2ST64_B32 class methods ---


    Inst_DS__DS_WRITE2ST64_B32::Inst_DS__DS_WRITE2ST64_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write2st64_b32")
    {
        // Flag the instruction as a memory store.
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE2ST64_B32

    Inst_DS__DS_WRITE2ST64_B32::~Inst_DS__DS_WRITE2ST64_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // MEM[ADDR_BASE + OFFSET0 * 4 * 64] = DATA;
    // MEM[ADDR_BASE + OFFSET1 * 4 * 64] = DATA2;
    // Write 2 dwords.
    void
    Inst_DS__DS_WRITE2ST64_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 firstVal(gpuDynInst, extData.DATA0);
        ConstVecOperandU32 secondVal(gpuDynInst, extData.DATA1);

        ldsAddr.read();
        firstVal.read();
        secondVal.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Each enabled lane stores two adjacent dwords in d_data:
        // DATA0 at index 2*lane and DATA1 at index 2*lane + 1.
        auto *storeBuf =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            storeBuf[lane * 2] = firstVal[lane];
            storeBuf[lane * 2 + 1] = secondVal[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_WRITE2ST64_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // Both offset fields are scaled by 4 * 64 (see the description
        // above).
        Addr firstOffset = instData.OFFSET0 * 4 * 64;
        Addr secondOffset = instData.OFFSET1 * 4 * 64;

        initDualMemWrite<VecElemU32>(gpuDynInst, firstOffset, secondOffset);
    }

    void
    Inst_DS__DS_WRITE2ST64_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: a store writes no destination register.
    }


    // --- Inst_DS__DS_CMPST_B32 class methods ---


    Inst_DS__DS_CMPST_B32::Inst_DS__DS_CMPST_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_cmpst_b32")
    {
        // No flags are set; execute() for this opcode is not implemented.
    } // Inst_DS__DS_CMPST_B32

    Inst_DS__DS_CMPST_B32::~Inst_DS__DS_CMPST_B32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // src = DATA2;
    // cmp = DATA;
    // MEM[ADDR] = (tmp == cmp) ? src : tmp;
    // RETURN_DATA[0] = tmp.
    // Compare and store.
    // Caution, the order of src and cmp are the *opposite* of the
    // ---  BUFFER_ATOMIC_CMPSWAP opcode.
    void
    Inst_DS__DS_CMPST_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_CMPST_F32 class methods ---


    Inst_DS__DS_CMPST_F32::Inst_DS__DS_CMPST_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_cmpst_f32")
    {
        // Only the F32 flag is set; execute() is not implemented.
        setFlag(F32);
    } // Inst_DS__DS_CMPST_F32

    Inst_DS__DS_CMPST_F32::~Inst_DS__DS_CMPST_F32() = default;

    // --- description from .arch file ---
    // 32b:
    // tmp = MEM[ADDR];
    // src = DATA2;
    // cmp = DATA;
    // MEM[ADDR] = (tmp == cmp) ? src : tmp;
    // RETURN_DATA[0] = tmp.
    // Floating point compare and store that handles NaN/INF/denormal values.
    // Caution, the order of src and cmp are the *opposite* of the
    // ---  BUFFER_ATOMIC_FCMPSWAP opcode.
    void
    Inst_DS__DS_CMPST_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_F32 class methods ---


    Inst_DS__DS_MIN_F32::Inst_DS__DS_MIN_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_f32")
    {
        // Only the F32 flag is set; execute() is not implemented.
        setFlag(F32);
    } // Inst_DS__DS_MIN_F32

    Inst_DS__DS_MIN_F32::~Inst_DS__DS_MIN_F32() = default;

    // --- description from .arch file ---
    // 32b.
    // tmp = MEM[ADDR];
    // src = DATA;
    // cmp = DATA2;
    // MEM[ADDR] = (cmp < tmp) ? src : tmp.
    // Floating point minimum that handles NaN/INF/denormal values.
    // Note that this opcode is slightly more general-purpose than
    // ---  BUFFER_ATOMIC_FMIN.
    void
    Inst_DS__DS_MIN_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_F32 class methods ---


    Inst_DS__DS_MAX_F32::Inst_DS__DS_MAX_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_f32")
    {
        // Only the F32 flag is set; execute() is not implemented.
        setFlag(F32);
    } // Inst_DS__DS_MAX_F32

    Inst_DS__DS_MAX_F32::~Inst_DS__DS_MAX_F32() = default;

    // --- description from .arch file ---
    // 32b.
    // tmp = MEM[ADDR];
    // src = DATA;
    // cmp = DATA2;
    // MEM[ADDR] = (tmp > cmp) ? src : tmp.
    // Floating point maximum that handles NaN/INF/denormal values.
    // Note that this opcode is slightly more general-purpose than
    // ---  BUFFER_ATOMIC_FMAX.
    void
    Inst_DS__DS_MAX_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not modeled: defer to the common unimplemented-instruction panic.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_NOP class methods ---


    Inst_DS__DS_NOP::Inst_DS__DS_NOP(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_nop")
    {
        // Flag the instruction as a no-op.
        setFlag(Nop);
    } // Inst_DS__DS_NOP

    Inst_DS__DS_NOP::~Inst_DS__DS_NOP() = default;

    // --- description from .arch file ---
    // Do nothing.
    void
    Inst_DS__DS_NOP::execute(GPUDynInstPtr gpuDynInst)
    {
        // Nothing is issued to memory; only the wavefront's LGKM
        // bookkeeping is updated.
        auto *wave = gpuDynInst->wavefront();

        wave->decLGKMInstsIssued();
        wave->untrackLGKMInst(gpuDynInst);
    } // execute


    // --- Inst_DS__DS_ADD_F32 class methods ---


    Inst_DS__DS_ADD_F32::Inst_DS__DS_ADD_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_f32")
    {
        // Flag the instruction as an F32, group-segment atomic add that
        // does not return a value.
        setFlag(F32);
        setFlag(MemoryRef);
        setFlag(GroupSegment);
        setFlag(AtomicAdd);
        setFlag(AtomicNoReturn);
    } // Inst_DS__DS_ADD_F32

    Inst_DS__DS_ADD_F32::~Inst_DS__DS_ADD_F32() = default;

    // --- description from .arch file ---
    // 32b:
    // MEM[ADDR] += DATA;
    // Floating point add that handles NaN/INF/denormal values.
    void
    Inst_DS__DS_ADD_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandF32 addend(gpuDynInst, extData.DATA0);

        ldsAddr.read();
        addend.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Copy the DATA0 float of every enabled lane into a_data.
        auto *atomicSrc =
            reinterpret_cast<VecElemF32*>(gpuDynInst->a_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            atomicSrc[lane] = addend[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_ADD_F32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initAtomicAccess<VecElemF32>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_ADD_F32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: this variant writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_WRITE_B8 class methods ---


    Inst_DS__DS_WRITE_B8::Inst_DS__DS_WRITE_B8(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b8")
    {
        // Flag the instruction as a memory store.
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B8

    Inst_DS__DS_WRITE_B8::~Inst_DS__DS_WRITE_B8() = default;

    // --- description from .arch file ---
    // MEM[ADDR] = DATA[7:0].
    // Byte write.
    void
    Inst_DS__DS_WRITE_B8::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU8 storeVal(gpuDynInst, extData.DATA0);

        ldsAddr.read();
        storeVal.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Copy the DATA0 byte of every enabled lane into d_data.
        auto *storeBuf =
            reinterpret_cast<VecElemU8*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            storeBuf[lane] = storeVal[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_WRITE_B8::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initMemWrite<VecElemU8>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_WRITE_B8::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: a store writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_WRITE_B8_D16_HI class methods ---


    Inst_DS__DS_WRITE_B8_D16_HI::Inst_DS__DS_WRITE_B8_D16_HI(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b8_d16_hi")
    {
        // Flag the instruction as a memory store.
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B8_D16_HI

    Inst_DS__DS_WRITE_B8_D16_HI::~Inst_DS__DS_WRITE_B8_D16_HI() = default;


    // --- description from .arch file ---

    // MEM[ADDR] = DATA[23:16].

    // Byte write in to high word.

    /**
     * Stage a per-lane byte store of DATA[23:16] and issue it to the
     * local memory pipeline.
     *
     * The source register is read as a full 32-bit dword. Reading it as an
     * 8-bit operand would leave bits 23:16 empty, so the extracted byte
     * would always be zero.
     *
     * @param gpuDynInst dynamic instruction carrying the exec mask, the
     *                   per-lane addresses and the d_data store buffer.
     */
    void
    Inst_DS__DS_WRITE_B8_D16_HI::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wf = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wf->decLGKMInstsIssued();
            wf->untrackLGKMInst(gpuDynInst);
            return;
        }

        gpuDynInst->execUnitId = wf->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(Cycles(24)));
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        // Full dword operand so that bits 23:16 are available below.
        ConstVecOperandU32 data(gpuDynInst, extData.DATA0);

        addr.read();
        data.read();

        calcAddr(gpuDynInst, addr);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (gpuDynInst->exec_mask[lane]) {
                // Low byte of the high 16-bit half of the source dword.
                (reinterpret_cast<VecElemU8*>(gpuDynInst->d_data))[lane]
                    = bits(data[lane], 23, 16);
            }
        }

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_WRITE_B8_D16_HI::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initMemWrite<VecElemU8>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_WRITE_B8_D16_HI::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: a store writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_WRITE_B16 class methods ---


    Inst_DS__DS_WRITE_B16::Inst_DS__DS_WRITE_B16(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b16")
    {
        // Flag the instruction as a memory store.
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B16

    Inst_DS__DS_WRITE_B16::~Inst_DS__DS_WRITE_B16() = default;

    // --- description from .arch file ---
    // MEM[ADDR] = DATA[15:0]
    // Short write.
    void
    Inst_DS__DS_WRITE_B16::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No lane is enabled: nothing is issued to the local memory pipe,
        // so update the wavefront's LGKM bookkeeping and stop here.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU16 storeVal(gpuDynInst, extData.DATA0);

        ldsAddr.read();
        storeVal.read();

        calcAddr(gpuDynInst, ldsAddr);

        // Copy the DATA0 short of every enabled lane into d_data.
        auto *storeBuf =
            reinterpret_cast<VecElemU16*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            storeBuf[lane] = storeVal[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute

    void
    Inst_DS__DS_WRITE_B16::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initMemWrite<VecElemU16>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_WRITE_B16::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: a store writes no destination register.
    } // completeAcc


    // --- Inst_DS__DS_ADD_RTN_U32 class methods ---


    /**
     * Build the ds_add_rtn_u32 instruction and flag it as a group-segment
     * atomic add that returns a value.
     *
     * @param iFmt decoded DS-format instruction fields, forwarded to
     *             Inst_DS.
     */
    Inst_DS__DS_ADD_RTN_U32::Inst_DS__DS_ADD_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_rtn_u32")
    {
        setFlag(MemoryRef);
        // Set the segment flag like the other DS atomics in this file
        // (ds_add_u32, ds_or_b32, ds_add_f32) do.
        setFlag(GroupSegment);
        setFlag(AtomicAdd);
        setFlag(AtomicReturn);
    } // Inst_DS__DS_ADD_RTN_U32
    Inst_DS__DS_ADD_RTN_U32::~Inst_DS__DS_ADD_RTN_U32()

    {

    } // ~Inst_DS__DS_ADD_RTN_U32


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] += DATA;

    // RETURN_DATA = tmp.

    /**
     * Stage the per-lane DATA0 operands of the atomic add in a_data and
     * issue the request to the local memory pipeline.
     *
     * When no lane is enabled the instruction is never issued, so it is
     * both uncounted and untracked in the wavefront's LGKM bookkeeping,
     * exactly as the other DS instructions in this file do.
     *
     * @param gpuDynInst dynamic instruction carrying the exec mask, the
     *                   per-lane addresses and the a_data operand buffer.
     */
    void
    Inst_DS__DS_ADD_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wf = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wf->decLGKMInstsIssued();
            // Also drop the instruction from the tracked set; otherwise it
            // stays tracked although it never completes.
            wf->untrackLGKMInst(gpuDynInst);
            return;
        }

        gpuDynInst->execUnitId = wf->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(Cycles(24)));
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 data(gpuDynInst, extData.DATA0);

        addr.read();
        data.read();

        calcAddr(gpuDynInst, addr);

        // Copy the DATA0 value of every enabled lane into a_data.
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (gpuDynInst->exec_mask[lane]) {
                (reinterpret_cast<VecElemU32*>(gpuDynInst->a_data))[lane]
                    = data[lane];
            }
        }

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_ADD_RTN_U32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // OFFSET0 forms the low 8 bits of the offset, OFFSET1 the bits
        // above them.
        Addr lowBits = instData.OFFSET0;
        Addr highBits = instData.OFFSET1;
        Addr combined = (highBits << 8) | lowBits;

        initAtomicAccess<VecElemU32>(gpuDynInst, combined);
    } // initiateAcc

    void
    Inst_DS__DS_ADD_RTN_U32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 result(gpuDynInst, extData.VDST);

        // Copy the dword found in d_data into VDST for every enabled lane.
        auto *returned =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            result[lane] = returned[lane];
        }

        result.write();
    } // completeAcc


    // --- Inst_DS__DS_SUB_RTN_U32 class methods ---


    // Forwards iFmt and the name "ds_sub_rtn_u32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_SUB_RTN_U32::Inst_DS__DS_SUB_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_sub_rtn_u32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_SUB_RTN_U32::~Inst_DS__DS_SUB_RTN_U32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] -= DATA;

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_SUB_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_RSUB_RTN_U32 class methods ---


    // Forwards iFmt and the name "ds_rsub_rtn_u32" to Inst_DS; no flags
    // are set here.
    Inst_DS__DS_RSUB_RTN_U32::Inst_DS__DS_RSUB_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_rsub_rtn_u32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_RSUB_RTN_U32::~Inst_DS__DS_RSUB_RTN_U32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = DATA - MEM[ADDR];

    // RETURN_DATA = tmp.

    // Subtraction with reversed operands.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_RSUB_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_INC_RTN_U32 class methods ---


    // Forwards iFmt and the name "ds_inc_rtn_u32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_INC_RTN_U32::Inst_DS__DS_INC_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_inc_rtn_u32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_INC_RTN_U32::~Inst_DS__DS_INC_RTN_U32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (tmp >= DATA) ? 0 : tmp + 1 (unsigned compare);

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_INC_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_DEC_RTN_U32 class methods ---


    // Forwards iFmt and the name "ds_dec_rtn_u32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_DEC_RTN_U32::Inst_DS__DS_DEC_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_dec_rtn_u32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_DEC_RTN_U32::~Inst_DS__DS_DEC_RTN_U32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (tmp == 0 || tmp > DATA) ? DATA : tmp - 1

    // (unsigned compare); RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_DEC_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MIN_RTN_I32 class methods ---


    // Forwards iFmt and the name "ds_min_rtn_i32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_MIN_RTN_I32::Inst_DS__DS_MIN_RTN_I32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_rtn_i32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MIN_RTN_I32::~Inst_DS__DS_MIN_RTN_I32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (DATA < tmp) ? DATA : tmp (signed compare);

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_RTN_I32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MAX_RTN_I32 class methods ---


    // Forwards iFmt and the name "ds_max_rtn_i32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_MAX_RTN_I32::Inst_DS__DS_MAX_RTN_I32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_rtn_i32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MAX_RTN_I32::~Inst_DS__DS_MAX_RTN_I32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (DATA > tmp) ? DATA : tmp (signed compare);

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_RTN_I32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MIN_RTN_U32 class methods ---


    // Forwards iFmt and the name "ds_min_rtn_u32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_MIN_RTN_U32::Inst_DS__DS_MIN_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_rtn_u32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MIN_RTN_U32::~Inst_DS__DS_MIN_RTN_U32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (DATA < tmp) ? DATA : tmp (unsigned compare);

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MAX_RTN_U32 class methods ---


    // Forwards iFmt and the name "ds_max_rtn_u32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_MAX_RTN_U32::Inst_DS__DS_MAX_RTN_U32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_rtn_u32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MAX_RTN_U32::~Inst_DS__DS_MAX_RTN_U32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (DATA > tmp) ? DATA : tmp (unsigned compare);

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_RTN_U32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_AND_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_and_rtn_b32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_AND_RTN_B32::Inst_DS__DS_AND_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_and_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_AND_RTN_B32::~Inst_DS__DS_AND_RTN_B32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] &= DATA;

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_AND_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_OR_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_or_rtn_b32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_OR_RTN_B32::Inst_DS__DS_OR_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_or_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_OR_RTN_B32::~Inst_DS__DS_OR_RTN_B32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] |= DATA;

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_OR_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_XOR_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_xor_rtn_b32" to Inst_DS; no flags are
    // set here.
    Inst_DS__DS_XOR_RTN_B32::Inst_DS__DS_XOR_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_xor_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_XOR_RTN_B32::~Inst_DS__DS_XOR_RTN_B32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] ^= DATA;

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_XOR_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MSKOR_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_mskor_rtn_b32" to Inst_DS; no flags
    // are set here.
    Inst_DS__DS_MSKOR_RTN_B32::Inst_DS__DS_MSKOR_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_mskor_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MSKOR_RTN_B32::~Inst_DS__DS_MSKOR_RTN_B32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (MEM_ADDR[ADDR] & ~DATA) | DATA2;

    // RETURN_DATA = tmp.

    // Masked dword OR, D0 contains the mask and D1 contains the new value.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MSKOR_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_WRXCHG_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_wrxchg_rtn_b32" to Inst_DS; no flags
    // are set here.
    Inst_DS__DS_WRXCHG_RTN_B32::Inst_DS__DS_WRXCHG_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_wrxchg_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_WRXCHG_RTN_B32::~Inst_DS__DS_WRXCHG_RTN_B32() = default;


    // --- description from .arch file ---

    // tmp = MEM[ADDR];

    // MEM[ADDR] = DATA;

    // RETURN_DATA = tmp.

    // Write-exchange operation.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_WRXCHG_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_WRXCHG2_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_wrxchg2_rtn_b32" to Inst_DS; no flags
    // are set here.
    Inst_DS__DS_WRXCHG2_RTN_B32::Inst_DS__DS_WRXCHG2_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_wrxchg2_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_WRXCHG2_RTN_B32::~Inst_DS__DS_WRXCHG2_RTN_B32() = default;


    // --- description from .arch file ---

    // Write-exchange 2 separate dwords.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_WRXCHG2_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_WRXCHG2ST64_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_wrxchg2st64_rtn_b32" to Inst_DS; no
    // flags are set here.
    Inst_DS__DS_WRXCHG2ST64_RTN_B32::Inst_DS__DS_WRXCHG2ST64_RTN_B32(
          InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_wrxchg2st64_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_WRXCHG2ST64_RTN_B32::~Inst_DS__DS_WRXCHG2ST64_RTN_B32()
        = default;


    // --- description from .arch file ---

    // Write-exchange 2 separate dwords with a stride of 64 dwords.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_WRXCHG2ST64_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_CMPST_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_cmpst_rtn_b32" to Inst_DS, then sets
    // the MemoryRef, AtomicCAS and AtomicReturn flags.
    Inst_DS__DS_CMPST_RTN_B32::Inst_DS__DS_CMPST_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_cmpst_rtn_b32")
    {
        setFlag(MemoryRef);
        setFlag(AtomicCAS);
        setFlag(AtomicReturn);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_CMPST_RTN_B32::~Inst_DS__DS_CMPST_RTN_B32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // src = DATA2;

    // cmp = DATA;

    // MEM[ADDR] = (tmp == cmp) ? src : tmp;

    // RETURN_DATA[0] = tmp.

    // Compare and store.

    // Caution, the order of src and cmp are the *opposite* of the

    // ---  BUFFER_ATOMIC_CMPSWAP opcode.

    // Issue stage: reads ADDR, DATA1 (the value to store) and DATA0 (the
    // compare value), passes the address operand to calcAddr(), then for
    // every enabled lane copies DATA1 into x_data and DATA0 into a_data
    // before issuing the request to the local memory pipe with a latency
    // of 24 cycles.
    //
    // NOTE(review): the DS_READ_* early-out paths in this file also call
    // wf->untrackLGKMInst(gpuDynInst); confirm whether it is needed here.
    void
    Inst_DS__DS_CMPST_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // No enabled lane: only decrement the LGKM-issued count.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 storeVal(gpuDynInst, extData.DATA1);
        ConstVecOperandU32 compareVal(gpuDynInst, extData.DATA0);

        laneAddr.read();
        storeVal.read();
        compareVal.read();
        calcAddr(gpuDynInst, laneAddr);

        auto *swapBuf = reinterpret_cast<VecElemU32*>(gpuDynInst->x_data);
        auto *cmpBuf = reinterpret_cast<VecElemU32*>(gpuDynInst->a_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            swapBuf[lane] = storeVal[lane];
            cmpBuf[lane] = compareVal[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // --- Inst_DS__DS_CMPST_RTN_B32 class methods (continued) ---


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts the 32-bit
    // atomic access with it.
    void
    Inst_DS__DS_CMPST_RTN_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initAtomicAccess<VecElemU32>(gpuDynInst, offset);
    }


    // Copies the 32-bit element found in d_data for each enabled lane into
    // VDST and writes the destination operand back.
    void
    Inst_DS__DS_CMPST_RTN_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);
        const VecElemU32 *returned =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst[lane] = returned[lane];
        }

        vdst.write();
    }


    // --- Inst_DS__DS_CMPST_RTN_F32 class methods ---


    // Forwards iFmt and the name "ds_cmpst_rtn_f32" to Inst_DS, then sets
    // the F32 flag.
    Inst_DS__DS_CMPST_RTN_F32::Inst_DS__DS_CMPST_RTN_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_cmpst_rtn_f32")
    {
        setFlag(F32);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_CMPST_RTN_F32::~Inst_DS__DS_CMPST_RTN_F32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // src = DATA2;

    // cmp = DATA;

    // MEM[ADDR] = (tmp == cmp) ? src : tmp;

    // RETURN_DATA[0] = tmp.

    // Floating point compare and store that handles NaN/INF/denormal values.

    // Caution, the order of src and cmp are the *opposite* of the

    // ---  BUFFER_ATOMIC_FCMPSWAP opcode.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_CMPST_RTN_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MIN_RTN_F32 class methods ---


    // Forwards iFmt and the name "ds_min_rtn_f32" to Inst_DS, then sets
    // the F32 flag.
    Inst_DS__DS_MIN_RTN_F32::Inst_DS__DS_MIN_RTN_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_rtn_f32")
    {
        setFlag(F32);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MIN_RTN_F32::~Inst_DS__DS_MIN_RTN_F32() = default;


    // --- description from .arch file ---

    // 32b.

    // tmp = MEM[ADDR];

    // src = DATA;

    // cmp = DATA2;

    // MEM[ADDR] = (cmp < tmp) ? src : tmp.

    // Floating point minimum that handles NaN/INF/denormal values.

    // Note that this opcode is slightly more general-purpose than

    // ---  BUFFER_ATOMIC_FMIN.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_RTN_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_MAX_RTN_F32 class methods ---


    // Forwards iFmt and the name "ds_max_rtn_f32" to Inst_DS, then sets
    // the F32 flag.
    Inst_DS__DS_MAX_RTN_F32::Inst_DS__DS_MAX_RTN_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_rtn_f32")
    {
        setFlag(F32);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_MAX_RTN_F32::~Inst_DS__DS_MAX_RTN_F32() = default;


    // --- description from .arch file ---

    // 32b.

    // tmp = MEM[ADDR];

    // src = DATA;

    // cmp = DATA2;

    // MEM[ADDR] = (tmp > cmp) ? src : tmp.

    // Floating point maximum that handles NaN/INF/denormal values.

    // Note that this opcode is slightly more general-purpose than

    // ---  BUFFER_ATOMIC_FMAX.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_RTN_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_WRAP_RTN_B32 class methods ---


    // Forwards iFmt and the name "ds_wrap_rtn_b32" to Inst_DS; no flags
    // are set here.
    Inst_DS__DS_WRAP_RTN_B32::Inst_DS__DS_WRAP_RTN_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_wrap_rtn_b32")
    {}


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_WRAP_RTN_B32::~Inst_DS__DS_WRAP_RTN_B32() = default;


    // --- description from .arch file ---

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (tmp >= DATA) ? tmp - DATA : tmp + DATA2;

    // RETURN_DATA = tmp.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_WRAP_RTN_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_ADD_RTN_F32 class methods ---


    // Forwards iFmt and the name "ds_add_rtn_f32" to Inst_DS, then sets
    // the F32 flag.
    Inst_DS__DS_ADD_RTN_F32::Inst_DS__DS_ADD_RTN_F32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_rtn_f32")
    {
        setFlag(F32);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_ADD_RTN_F32::~Inst_DS__DS_ADD_RTN_F32() = default;


    // --- description from .arch file ---

    // 32b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] += DATA;

    // RETURN_DATA = tmp.

    // Floating point add that handles NaN/INF/denormal values.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_ADD_RTN_F32::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_READ_B32 class methods ---


    // Forwards iFmt and the name "ds_read_b32" to Inst_DS, then sets the
    // MemoryRef and Load flags.
    Inst_DS__DS_READ_B32::Inst_DS__DS_READ_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b32")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_B32::~Inst_DS__DS_READ_B32() = default;


    // --- description from .arch file ---

    // RETURN_DATA = MEM[ADDR].

    // Dword read.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts a read of
    // VecElemU32 elements with it.
    void
    Inst_DS__DS_READ_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initMemRead<VecElemU32>(gpuDynInst, offset);
    }


    // Copies the 32-bit element found in d_data for each enabled lane into
    // VDST and writes the destination operand back.
    void
    Inst_DS__DS_READ_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);
        const VecElemU32 *loaded =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst[lane] = loaded[lane];
        }

        vdst.write();
    }


    // --- Inst_DS__DS_READ2_B32 class methods ---


    // Forwards iFmt and the name "ds_read2_b32" to Inst_DS, then sets the
    // MemoryRef and Load flags.
    Inst_DS__DS_READ2_B32::Inst_DS__DS_READ2_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read2_b32")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ2_B32::~Inst_DS__DS_READ2_B32() = default;


    // --- description from .arch file ---

    // RETURN_DATA[0] = MEM[ADDR_BASE + OFFSET0 * 4];

    // RETURN_DATA[1] = MEM[ADDR_BASE + OFFSET1 * 4].

    // Read 2 dwords.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ2_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Scales OFFSET0 and OFFSET1 by 4 and starts a dual read of
    // VecElemU32 elements at the two resulting offsets.
    void
    Inst_DS__DS_READ2_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        Addr firstOffset = instData.OFFSET0 * 4;
        Addr secondOffset = instData.OFFSET1 * 4;

        initDualMemRead<VecElemU32>(gpuDynInst, firstOffset, secondOffset);
    }


    // For each enabled lane, d_data holds two consecutive 32-bit elements
    // at indices 2*lane and 2*lane+1; the first goes to VDST and the
    // second to VDST + 1. Both destination operands are then written.
    void
    Inst_DS__DS_READ2_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst0(gpuDynInst, extData.VDST);
        VecOperandU32 vdst1(gpuDynInst, extData.VDST + 1);
        const VecElemU32 *loaded =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst0[lane] = loaded[lane * 2];
            vdst1[lane] = loaded[lane * 2 + 1];
        }

        vdst0.write();
        vdst1.write();
    }


    // --- Inst_DS__DS_READ2ST64_B32 class methods ---


    // Forwards iFmt and the name "ds_read2st64_b32" to Inst_DS, then sets
    // the MemoryRef and Load flags.
    Inst_DS__DS_READ2ST64_B32::Inst_DS__DS_READ2ST64_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read2st64_b32")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ2ST64_B32::~Inst_DS__DS_READ2ST64_B32() = default;


    // --- description from .arch file ---

    // RETURN_DATA[0] = MEM[ADDR_BASE + OFFSET0 * 4 * 64];

    // RETURN_DATA[1] = MEM[ADDR_BASE + OFFSET1 * 4 * 64].

    // Read 2 dwords.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ2ST64_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Scales OFFSET0 and OFFSET1 by 4 * 64 and starts a dual read of
    // VecElemU32 elements at the two resulting offsets.
    void
    Inst_DS__DS_READ2ST64_B32::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        Addr firstOffset = instData.OFFSET0 * 4 * 64;
        Addr secondOffset = instData.OFFSET1 * 4 * 64;

        initDualMemRead<VecElemU32>(gpuDynInst, firstOffset, secondOffset);
    } // initiateAcc


    // For each enabled lane, d_data holds two consecutive 32-bit elements
    // at indices 2*lane and 2*lane+1; the first goes to VDST and the
    // second to VDST + 1. Both destination operands are then written.
    void
    Inst_DS__DS_READ2ST64_B32::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst0(gpuDynInst, extData.VDST);
        VecOperandU32 vdst1(gpuDynInst, extData.VDST + 1);
        const VecElemU32 *loaded =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst0[lane] = loaded[lane * 2];
            vdst1[lane] = loaded[lane * 2 + 1];
        }

        vdst0.write();
        vdst1.write();
    } // completeAcc


    // --- Inst_DS__DS_READ_I8 class methods ---


    // Forwards iFmt and the name "ds_read_i8" to Inst_DS, then sets the
    // MemoryRef and Load flags.
    Inst_DS__DS_READ_I8::Inst_DS__DS_READ_I8(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_i8")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_I8::~Inst_DS__DS_READ_I8() = default;


    // --- description from .arch file ---

    // RETURN_DATA = signext(MEM[ADDR][7:0]).

    // Signed byte read.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ_I8::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts a read of
    // VecElemI8 elements with it.
    void
    Inst_DS__DS_READ_I8::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initMemRead<VecElemI8>(gpuDynInst, offset);
    }


    // For each enabled lane, takes the VecElemI8 element from d_data,
    // sign-extends it from 8 bits with sext<8>() and stores the result,
    // converted to VecElemU32, in VDST. VDST is then written back.
    void
    Inst_DS__DS_READ_I8::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);
        const VecElemI8 *loaded =
            reinterpret_cast<VecElemI8*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst[lane] = static_cast<VecElemU32>(sext<8>(loaded[lane]));
        }

        vdst.write();
    }


    // --- Inst_DS__DS_READ_U8 class methods ---


    // Forwards iFmt and the name "ds_read_u8" to Inst_DS, then sets the
    // MemoryRef and Load flags.
    Inst_DS__DS_READ_U8::Inst_DS__DS_READ_U8(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_u8")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_U8::~Inst_DS__DS_READ_U8() = default;


    // --- description from .arch file ---

    // RETURN_DATA = {24'h0,MEM[ADDR][7:0]}.

    // Unsigned byte read.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ_U8::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts a read of
    // VecElemU8 elements with it.
    void
    Inst_DS__DS_READ_U8::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initMemRead<VecElemU8>(gpuDynInst, offset);
    }


    // For each enabled lane, converts the VecElemU8 element from d_data to
    // VecElemU32 and stores it in VDST; VDST is then written back.
    void
    Inst_DS__DS_READ_U8::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);
        const VecElemU8 *loaded =
            reinterpret_cast<VecElemU8*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst[lane] = static_cast<VecElemU32>(loaded[lane]);
        }

        vdst.write();
    }


    // --- Inst_DS__DS_READ_I16 class methods ---


    // Forwards iFmt and the name "ds_read_i16" to Inst_DS, then sets the
    // MemoryRef and Load flags.
    Inst_DS__DS_READ_I16::Inst_DS__DS_READ_I16(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_i16")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_I16::~Inst_DS__DS_READ_I16() = default;


    // --- description from .arch file ---

    // RETURN_DATA = signext(MEM[ADDR][15:0]).

    // Signed short read.

    // Not implemented: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_READ_I16::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    }


    // --- Inst_DS__DS_READ_U16 class methods ---


    // Forwards iFmt and the name "ds_read_u16" to Inst_DS, then sets the
    // MemoryRef and Load flags.
    Inst_DS__DS_READ_U16::Inst_DS__DS_READ_U16(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_u16")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_U16::~Inst_DS__DS_READ_U16() = default;


    // --- description from .arch file ---

    // RETURN_DATA = {16'h0,MEM[ADDR][15:0]}.

    // Unsigned short read.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ_U16::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts a read of
    // VecElemU16 elements with it.
    void
    Inst_DS__DS_READ_U16::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initMemRead<VecElemU16>(gpuDynInst, offset);
    }


    // For each enabled lane, converts the VecElemU16 element from d_data
    // to VecElemU32 and stores it in VDST; VDST is then written back.
    void
    Inst_DS__DS_READ_U16::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);
        const VecElemU16 *loaded =
            reinterpret_cast<VecElemU16*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            vdst[lane] = static_cast<VecElemU32>(loaded[lane]);
        }

        vdst.write();
    }


    // --- Inst_DS__DS_READ_U16_D16 class methods ---


    // Forwards iFmt and the name "ds_read_u16_d16" to Inst_DS, then sets
    // the MemoryRef and Load flags. The name must not carry the "_hi"
    // suffix, which belongs to Inst_DS__DS_READ_U16_D16_HI.
    Inst_DS__DS_READ_U16_D16::
        Inst_DS__DS_READ_U16_D16(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_u16_d16")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    } // Inst_DS__DS_READ_U16_D16


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_U16_D16::~Inst_DS__DS_READ_U16_D16() = default;


    // --- description from .arch file ---

    // RETURN_DATA[15 : 0].u16 = MEM[ADDR].u16;

    // // RETURN_DATA[31:16] is preserved.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ_U16_D16::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts a read of
    // VecElemU16 elements with it.
    void
    Inst_DS__DS_READ_U16_D16::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initMemRead<VecElemU16>(gpuDynInst, offset);
    }


    // Completion stage: for each enabled lane, replaces bits [15:0] of
    // VDST with the VecElemU16 element from d_data, leaving bits [31:16]
    // as they were, then writes VDST back.
    void
    Inst_DS__DS_READ_U16_D16::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);

        // Load the register's current contents first: replaceBits() only
        // touches bits [15:0], so the upper half written back below must
        // come from the existing register value to be preserved.
        vdst.read();

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (gpuDynInst->exec_mask[lane]) {
                VecElemU16 ds_val = reinterpret_cast<VecElemU16*>(
                    gpuDynInst->d_data)[lane];
                replaceBits(vdst[lane], 15, 0, ds_val);
            }
        }

        vdst.write();
    } // completeAcc


    // --- Inst_DS__DS_READ_U16_D16_HI class methods ---


    // Forwards iFmt and the name "ds_read_u16_d16_hi" to Inst_DS, then
    // sets the MemoryRef and Load flags.
    Inst_DS__DS_READ_U16_D16_HI::Inst_DS__DS_READ_U16_D16_HI(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_u16_d16_hi")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    }


    // Destructor: performs no cleanup of its own.
    Inst_DS__DS_READ_U16_D16_HI::~Inst_DS__DS_READ_U16_D16_HI() = default;


    // --- description from .arch file ---

    // RETURN_DATA[31 : 16].u16 = MEM[ADDR].u16;

    // // RETURN_DATA[15:0] is preserved.

    // Issue stage: reads the ADDR operand, passes it to calcAddr() and
    // issues the request to the local memory pipe with a latency of 24
    // cycles. If no lane is enabled, only the wavefront's two LGKM
    // accounting calls are made.
    void
    Inst_DS__DS_READ_U16_D16_HI::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 laneAddr(gpuDynInst, extData.ADDR);
        laneAddr.read();
        calcAddr(gpuDynInst, laneAddr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    }


    // Builds the offset as (OFFSET1 << 8) | OFFSET0 and starts a read of
    // VecElemU16 elements with it.
    void
    Inst_DS__DS_READ_U16_D16_HI::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;
        Addr offset = (upper << 8) | lower;

        initMemRead<VecElemU16>(gpuDynInst, offset);
    }


    /**
     * Merge the 16-bit value returned from LDS into bits [31:16] of every
     * active lane of VDST and write the register back.
     *
     * The instruction description requires RETURN_DATA[15:0] to be
     * preserved, so VDST is read first: operands in this file are only
     * populated by an explicit read(), and without it the low half
     * written back would come from the operand's local buffer instead of
     * the live register.
     */
    void
    Inst_DS__DS_READ_U16_D16_HI::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU32 vdst(gpuDynInst, extData.VDST);

        // Load the current destination so the lower half is preserved.
        vdst.read();

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (gpuDynInst->exec_mask[lane]) {
                VecElemU16 ds_val = reinterpret_cast<VecElemU16*>(
                    gpuDynInst->d_data)[lane];
                replaceBits(vdst[lane], 31, 16, ds_val);
            }
        }

        vdst.write();
    } // completeAcc


    // --- Inst_DS__DS_SWIZZLE_B32 class methods ---


    /**
     * Forwards iFmt and the name "ds_swizzle_b32" to the Inst_DS base and
     * flags the instruction as Load and ALU (MemoryRef is not set).
     * NOTE(review): presumably tagged as a load because the result is
     * written back to a VGPR even though no LDS storage is accessed --
     * confirm against the pipeline code.
     */
    Inst_DS__DS_SWIZZLE_B32::Inst_DS__DS_SWIZZLE_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_swizzle_b32")
    {
         setFlag(Load);
         setFlag(ALU);
    } // Inst_DS__DS_SWIZZLE_B32


    /** Destructor with an empty body. */
    Inst_DS__DS_SWIZZLE_B32::~Inst_DS__DS_SWIZZLE_B32()
    {
    } // ~Inst_DS__DS_SWIZZLE_B32


    // --- description from .arch file ---
    // RETURN_DATA = swizzle(vgpr_data, offset1:offset0).
    // Dword swizzle, no data is written to LDS memory; See ds_opcodes.docx for
    // details.
    //
    // The pattern (OFFSET1 << 8) | OFFSET0 selects the mode:
    //  - bit 15 set: lanes are handled in groups of four; pattern bits
    //    1:0, 3:2, 5:4 and 7:6 give the source lane, relative to the group
    //    base, for lanes 0..3 of the group.
    //  - bit 15 clear: the source is ((lane & and) | or) ^ xor with the
    //    masks taken from pattern bits 4:0, 9:5 and 14:10; lanes above 31
    //    have 32 added to the result.
    // An active lane whose source lane is inactive receives 0.
    void
    Inst_DS__DS_SWIZZLE_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // LGKM bookkeeping is released up front, before the mask check.
        wave->decLGKMInstsIssued();
        wave->untrackLGKMInst(gpuDynInst);

        if (gpuDynInst->exec_mask.none()) {
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 src(gpuDynInst, extData.DATA0);
        VecOperandU32 vdst(gpuDynInst, extData.VDST);
        VecElemU16 pattern = ((instData.OFFSET1 << 8) | instData.OFFSET0);

        src.read();

        const bool quad_mode = bits(pattern, 15);

        if (quad_mode) {
            // Per-group source selectors; they do not depend on the lane.
            const int sel0 = bits(pattern, 1, 0);
            const int sel1 = bits(pattern, 3, 2);
            const int sel2 = bits(pattern, 5, 4);
            const int sel3 = bits(pattern, 7, 6);

            for (int base = 0; base < NumVecElemPerVecReg; base += 4) {
                if (gpuDynInst->exec_mask[base]) {
                    int from0 = base + sel0;
                    panic_if(from0 >= NumVecElemPerVecReg, "%s: index0 (%d) "
                             "is out of bounds.\n", gpuDynInst->disassemble(),
                             from0);
                    if (gpuDynInst->exec_mask[from0]) {
                        vdst[base] = src[from0];
                    } else {
                        vdst[base] = 0;
                    }
                }

                if (gpuDynInst->exec_mask[base + 1]) {
                    int from1 = base + sel1;
                    panic_if(from1 >= NumVecElemPerVecReg, "%s: index1 (%d) "
                             "is out of bounds.\n", gpuDynInst->disassemble(),
                             from1);
                    if (gpuDynInst->exec_mask[from1]) {
                        vdst[base + 1] = src[from1];
                    } else {
                        vdst[base + 1] = 0;
                    }
                }

                if (gpuDynInst->exec_mask[base + 2]) {
                    int from2 = base + sel2;
                    panic_if(from2 >= NumVecElemPerVecReg, "%s: index2 (%d) "
                             "is out of bounds.\n", gpuDynInst->disassemble(),
                             from2);
                    if (gpuDynInst->exec_mask[from2]) {
                        vdst[base + 2] = src[from2];
                    } else {
                        vdst[base + 2] = 0;
                    }
                }

                if (gpuDynInst->exec_mask[base + 3]) {
                    int from3 = base + sel3;
                    panic_if(from3 >= NumVecElemPerVecReg, "%s: index3 (%d) "
                             "is out of bounds.\n", gpuDynInst->disassemble(),
                             from3);
                    if (gpuDynInst->exec_mask[from3]) {
                        vdst[base + 3] = src[from3];
                    } else {
                        vdst[base + 3] = 0;
                    }
                }
            }
        } else {
            const int and_mask = bits(pattern, 4, 0);
            const int or_mask = bits(pattern, 9, 5);
            const int xor_mask = bits(pattern, 14, 10);

            for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
                if (!gpuDynInst->exec_mask[lane]) {
                    continue;
                }

                int from = ((lane & and_mask) | or_mask) ^ xor_mask;

                // The masks only cover the low lane bits, so lanes in the
                // upper half are moved back up by 32.
                if (lane >= 32) {
                    from += 32;
                }

                panic_if(from >= NumVecElemPerVecReg, "%s: index (%d) is "
                         "out of bounds.\n", gpuDynInst->disassemble(),
                         from);

                if (gpuDynInst->exec_mask[from]) {
                    vdst[lane] = src[from];
                } else {
                    vdst[lane] = 0;
                }
            }
        }

        vdst.write();

        // Completed here rather than through the local memory pipeline.
        wave->computeUnit->vrf[wave->simdId]->
            scheduleWriteOperandsFromLoad(wave, gpuDynInst);
        wave->rdLmReqsInPipe--;
    } // execute


    // --- Inst_DS__DS_PERMUTE_B32 class methods ---


    /**
     * Forwards iFmt and the name "ds_permute_b32" to the Inst_DS base and
     * flags the instruction as MemoryRef and Load.
     * NOTE(review): presumably tagged as a load because the result is
     * written back to a VGPR -- confirm against the pipeline code.
     */
    Inst_DS__DS_PERMUTE_B32::Inst_DS__DS_PERMUTE_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_permute_b32")
    {
        setFlag(MemoryRef);
         setFlag(Load);
    } // Inst_DS__DS_PERMUTE_B32


    /** Destructor with an empty body. */
    Inst_DS__DS_PERMUTE_B32::~Inst_DS__DS_PERMUTE_B32()
    {
    } // ~Inst_DS__DS_PERMUTE_B32


    // --- description from .arch file ---
    // Forward permute.
    //
    // Each active lane pushes its DATA0 value to the destination lane given
    // by bits [7:2] of (ADDR + OFFSET0). If that destination lane is not
    // set in the wavefront's exec mask, 0 is stored there instead. OFFSET1
    // must be zero.
    void
    Inst_DS__DS_PERMUTE_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // LGKM bookkeeping is released up front, before the mask check.
        wave->decLGKMInstsIssued();
        wave->untrackLGKMInst(gpuDynInst);

        if (gpuDynInst->exec_mask.none()) {
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 src(gpuDynInst, extData.DATA0);
        VecOperandU32 vdst(gpuDynInst, extData.VDST);

        addr.read();
        src.read();

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }

            assert(!instData.OFFSET1);

            // Bits [7:2] of the byte address select the target lane.
            const auto byte_addr = addr[lane] + instData.OFFSET0;
            int target = bits(byte_addr, 7, 2);
            panic_if(target >= NumVecElemPerVecReg, "%s: index (%d) is out "
                     "of bounds.\n", gpuDynInst->disassemble(), target);

            if (wave->execMask(target)) {
                vdst[target] = src[lane];
            } else {
                vdst[target] = 0;
            }
        }

        vdst.write();

        // Completed here rather than through the local memory pipeline.
        wave->computeUnit->vrf[wave->simdId]->
            scheduleWriteOperandsFromLoad(wave, gpuDynInst);
        wave->rdLmReqsInPipe--;
    } // execute


    // --- Inst_DS__DS_BPERMUTE_B32 class methods ---


    /**
     * Forwards iFmt and the name "ds_bpermute_b32" to the Inst_DS base and
     * flags the instruction as MemoryRef and Load.
     */
    Inst_DS__DS_BPERMUTE_B32::Inst_DS__DS_BPERMUTE_B32(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_bpermute_b32")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    } // Inst_DS__DS_BPERMUTE_B32


    /** Destructor with an empty body. */
    Inst_DS__DS_BPERMUTE_B32::~Inst_DS__DS_BPERMUTE_B32()
    {
    } // ~Inst_DS__DS_BPERMUTE_B32


    // --- description from .arch file ---
    // Backward permute.
    //
    // Each active lane pulls the DATA0 value of the source lane given by
    // bits [7:2] of (ADDR + OFFSET0). If that source lane is not set in the
    // wavefront's exec mask, the lane receives 0. OFFSET1 must be zero.
    void
    Inst_DS__DS_BPERMUTE_B32::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // LGKM bookkeeping is released up front, before the mask check.
        wave->decLGKMInstsIssued();
        wave->untrackLGKMInst(gpuDynInst);

        if (gpuDynInst->exec_mask.none()) {
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 src(gpuDynInst, extData.DATA0);
        VecOperandU32 vdst(gpuDynInst, extData.VDST);

        addr.read();
        src.read();

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }

            assert(!instData.OFFSET1);

            // Bits [7:2] of the byte address select the source lane.
            const auto byte_addr = addr[lane] + instData.OFFSET0;
            int origin = bits(byte_addr, 7, 2);
            panic_if(origin >= NumVecElemPerVecReg, "%s: index (%d) is out "
                     "of bounds.\n", gpuDynInst->disassemble(), origin);

            if (wave->execMask(origin)) {
                vdst[lane] = src[origin];
            } else {
                vdst[lane] = 0;
            }
        }

        vdst.write();

        // Completed here rather than through the local memory pipeline.
        wave->computeUnit->vrf[wave->simdId]->
            scheduleWriteOperandsFromLoad(wave, gpuDynInst);
        wave->rdLmReqsInPipe--;
    } // execute


    // --- Inst_DS__DS_ADD_U64 class methods ---


    /**
     * Forwards iFmt and the name "ds_add_u64" to the Inst_DS base and flags
     * the instruction as MemoryRef, GroupSegment, AtomicAdd and
     * AtomicNoReturn.
     */
    Inst_DS__DS_ADD_U64::Inst_DS__DS_ADD_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_u64")
    {
        setFlag(MemoryRef);
        setFlag(GroupSegment);
        setFlag(AtomicAdd);
        setFlag(AtomicNoReturn);
    } // Inst_DS__DS_ADD_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_ADD_U64::~Inst_DS__DS_ADD_U64()
    {
    } // ~Inst_DS__DS_ADD_U64


    // --- description from .arch file ---
    // 64b:
    // MEM[ADDR] += DATA[0:1];
    //
    // Issue stage: reads ADDR and the 64-bit DATA0 operand, computes the
    // per-lane addresses, copies each active lane's operand into a_data and
    // hands the instruction to the local memory pipeline. When no lane is
    // active only the LGKM bookkeeping is released.
    void
    Inst_DS__DS_ADD_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // Fully masked-off instruction: nothing is sent to the pipeline.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU64 addend(gpuDynInst, extData.DATA0);

        addr.read();
        addend.read();

        calcAddr(gpuDynInst, addr);

        // a_data is viewed as an array of 64-bit elements, one per lane.
        auto *staged = reinterpret_cast<VecElemU64*>(gpuDynInst->a_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            staged[lane] = addend[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Build the offset as (OFFSET1 << 8) | OFFSET0 and start the atomic
     * access on VecElemU64 elements at that offset.
     */
    void
    Inst_DS__DS_ADD_U64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr high_part = instData.OFFSET1;
        const Addr low_part = instData.OFFSET0;
        const Addr combined = low_part | (high_part << 8);

        initAtomicAccess<VecElemU64>(gpuDynInst, combined);
    } // initiateAcc


    /**
     * No completion work is done here: the body is empty and nothing is
     * written back (the constructor flags this as AtomicNoReturn).
     */
    void
    Inst_DS__DS_ADD_U64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
    } // completeAcc


    // --- Inst_DS__DS_SUB_U64 class methods ---


    /** Forwards iFmt and "ds_sub_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_SUB_U64::Inst_DS__DS_SUB_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_sub_u64")
    {
    } // Inst_DS__DS_SUB_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_SUB_U64::~Inst_DS__DS_SUB_U64()
    {
    } // ~Inst_DS__DS_SUB_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= DATA[0:1];
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_SUB_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_RSUB_U64 class methods ---


    /** Forwards iFmt and "ds_rsub_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_RSUB_U64::Inst_DS__DS_RSUB_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_rsub_u64")
    {
    } // Inst_DS__DS_RSUB_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_RSUB_U64::~Inst_DS__DS_RSUB_U64()
    {
    } // ~Inst_DS__DS_RSUB_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = DATA - MEM[ADDR];
    // RETURN_DATA = tmp.
    // Subtraction with reversed operands.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_RSUB_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_INC_U64 class methods ---


    /** Forwards iFmt and "ds_inc_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_INC_U64::Inst_DS__DS_INC_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_inc_u64")
    {
    } // Inst_DS__DS_INC_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_INC_U64::~Inst_DS__DS_INC_U64()
    {
    } // ~Inst_DS__DS_INC_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (tmp >= DATA[0:1]) ? 0 : tmp + 1 (unsigned compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_INC_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_DEC_U64 class methods ---


    /** Forwards iFmt and "ds_dec_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_DEC_U64::Inst_DS__DS_DEC_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_dec_u64")
    {
    } // Inst_DS__DS_DEC_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_DEC_U64::~Inst_DS__DS_DEC_U64()
    {
    } // ~Inst_DS__DS_DEC_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (tmp == 0 || tmp > DATA[0:1]) ? DATA[0:1] : tmp - 1
    // (unsigned compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_DEC_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_I64 class methods ---


    /** Forwards iFmt and "ds_min_i64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MIN_I64::Inst_DS__DS_MIN_I64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_i64")
    {
    } // Inst_DS__DS_MIN_I64


    /** Destructor with an empty body. */
    Inst_DS__DS_MIN_I64::~Inst_DS__DS_MIN_I64()
    {
    } // ~Inst_DS__DS_MIN_I64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= (DATA[0:1] < tmp) ? DATA[0:1] : tmp (signed compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // NOTE(review): the "-=" above is copied verbatim; for a minimum a
    // plain "=" is presumably intended -- confirm against the ISA manual.
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_I64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_I64 class methods ---


    /** Forwards iFmt and "ds_max_i64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MAX_I64::Inst_DS__DS_MAX_I64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_i64")
    {
    } // Inst_DS__DS_MAX_I64


    /** Destructor with an empty body. */
    Inst_DS__DS_MAX_I64::~Inst_DS__DS_MAX_I64()
    {
    } // ~Inst_DS__DS_MAX_I64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= (DATA[0:1] > tmp) ? DATA[0:1] : tmp (signed compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // NOTE(review): the "-=" above is copied verbatim; for a maximum a
    // plain "=" is presumably intended -- confirm against the ISA manual.
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_I64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_U64 class methods ---


    /** Forwards iFmt and "ds_min_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MIN_U64::Inst_DS__DS_MIN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_u64")
    {
    } // Inst_DS__DS_MIN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_MIN_U64::~Inst_DS__DS_MIN_U64()
    {
    } // ~Inst_DS__DS_MIN_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= (DATA[0:1] < tmp) ? DATA[0:1] : tmp (unsigned compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // NOTE(review): the "-=" above is copied verbatim; for a minimum a
    // plain "=" is presumably intended -- confirm against the ISA manual.
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_U64 class methods ---


    /** Forwards iFmt and "ds_max_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MAX_U64::Inst_DS__DS_MAX_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_u64")
    {
    } // Inst_DS__DS_MAX_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_MAX_U64::~Inst_DS__DS_MAX_U64()
    {
    } // ~Inst_DS__DS_MAX_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= (DATA[0:1] > tmp) ? DATA[0:1] : tmp (unsigned compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // NOTE(review): the "-=" above is copied verbatim; for a maximum a
    // plain "=" is presumably intended -- confirm against the ISA manual.
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_AND_B64 class methods ---


    /** Forwards iFmt and "ds_and_b64" to Inst_DS; sets no flags. */
    Inst_DS__DS_AND_B64::Inst_DS__DS_AND_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_and_b64")
    {
    } // Inst_DS__DS_AND_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_AND_B64::~Inst_DS__DS_AND_B64()
    {
    } // ~Inst_DS__DS_AND_B64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] &= DATA[0:1];
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_AND_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_OR_B64 class methods ---


    /** Forwards iFmt and "ds_or_b64" to Inst_DS; sets no flags. */
    Inst_DS__DS_OR_B64::Inst_DS__DS_OR_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_or_b64")
    {
    } // Inst_DS__DS_OR_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_OR_B64::~Inst_DS__DS_OR_B64()
    {
    } // ~Inst_DS__DS_OR_B64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] |= DATA[0:1];
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_OR_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_XOR_B64 class methods ---


    /** Forwards iFmt and "ds_xor_b64" to Inst_DS; sets no flags. */
    Inst_DS__DS_XOR_B64::Inst_DS__DS_XOR_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_xor_b64")
    {
    } // Inst_DS__DS_XOR_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_XOR_B64::~Inst_DS__DS_XOR_B64()
    {
    } // ~Inst_DS__DS_XOR_B64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] ^= DATA[0:1];
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_XOR_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MSKOR_B64 class methods ---


    /** Forwards iFmt and "ds_mskor_b64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MSKOR_B64::Inst_DS__DS_MSKOR_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_mskor_b64")
    {
    } // Inst_DS__DS_MSKOR_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_MSKOR_B64::~Inst_DS__DS_MSKOR_B64()
    {
    } // ~Inst_DS__DS_MSKOR_B64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (MEM_ADDR[ADDR] & ~DATA) | DATA2;
    // RETURN_DATA = tmp.
    // Masked dword OR, D0 contains the mask and D1 contains the new value.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MSKOR_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_WRITE_B64 class methods ---


    /**
     * Forwards iFmt and the name "ds_write_b64" to the Inst_DS base and
     * flags the instruction as MemoryRef and Store.
     */
    Inst_DS__DS_WRITE_B64::Inst_DS__DS_WRITE_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b64")
    {
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_WRITE_B64::~Inst_DS__DS_WRITE_B64()
    {
    } // ~Inst_DS__DS_WRITE_B64


    // --- description from .arch file ---
    // 64b:
    // MEM[ADDR] = DATA.
    // Write qword.
    //
    // Issue stage: reads ADDR and the 64-bit DATA0 operand, computes the
    // per-lane addresses, copies each active lane's value into d_data and
    // hands the instruction to the local memory pipeline. When no lane is
    // active only the LGKM bookkeeping is released.
    void
    Inst_DS__DS_WRITE_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // Fully masked-off instruction: nothing is sent to the pipeline.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU64 payload(gpuDynInst, extData.DATA0);

        addr.read();
        payload.read();

        calcAddr(gpuDynInst, addr);

        // d_data is viewed as an array of 64-bit elements, one per lane.
        auto *staged = reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            staged[lane] = payload[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Build the offset as (OFFSET1 << 8) | OFFSET0 and start a write of
     * VecElemU64 elements at that offset.
     */
    void
    Inst_DS__DS_WRITE_B64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr high_part = instData.OFFSET1;
        const Addr low_part = instData.OFFSET0;
        const Addr combined = low_part | (high_part << 8);

        initMemWrite<VecElemU64>(gpuDynInst, combined);
    } // initiateAcc


    /** No completion work is done here: the body is empty. */
    void
    Inst_DS__DS_WRITE_B64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
    } // completeAcc


    // --- Inst_DS__DS_WRITE2_B64 class methods ---


    /**
     * Forwards iFmt and the name "ds_write2_b64" to the Inst_DS base and
     * flags the instruction as MemoryRef and Store.
     */
    Inst_DS__DS_WRITE2_B64::Inst_DS__DS_WRITE2_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write2_b64")
    {
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE2_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_WRITE2_B64::~Inst_DS__DS_WRITE2_B64()
    {
    } // ~Inst_DS__DS_WRITE2_B64


    // --- description from .arch file ---
    // 64b:
    // MEM[ADDR_BASE + OFFSET0 * 8] = DATA;
    // MEM[ADDR_BASE + OFFSET1 * 8] = DATA2.
    // Write 2 qwords.
    //
    // Issue stage: reads ADDR, DATA0 and DATA1, computes the per-lane
    // addresses and stores each active lane's two values in d_data at
    // slots 2 * lane and 2 * lane + 1 before handing the instruction to
    // the local memory pipeline. When no lane is active only the LGKM
    // bookkeeping is released.
    void
    Inst_DS__DS_WRITE2_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // Fully masked-off instruction: nothing is sent to the pipeline.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU64 first(gpuDynInst, extData.DATA0);
        ConstVecOperandU64 second(gpuDynInst, extData.DATA1);

        addr.read();
        first.read();
        second.read();

        calcAddr(gpuDynInst, addr);

        // d_data is viewed as 64-bit elements, two consecutive per lane.
        auto *staged = reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            const int slot = lane * 2;
            staged[slot] = first[lane];
            staged[slot + 1] = second[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Scale OFFSET0 and OFFSET1 by 8 and start the dual write of
     * VecElemU64 elements at those two offsets.
     */
    void
    Inst_DS__DS_WRITE2_B64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // Each offset field is multiplied by 8, per the description.
        constexpr int scale = 8;

        const Addr first_off = instData.OFFSET0 * scale;
        const Addr second_off = instData.OFFSET1 * scale;

        initDualMemWrite<VecElemU64>(gpuDynInst, first_off, second_off);
    }


    /** No completion work is done here: the body is empty. */
    void
    Inst_DS__DS_WRITE2_B64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
    }


    // --- Inst_DS__DS_WRITE2ST64_B64 class methods ---


    /**
     * Forwards iFmt and the name "ds_write2st64_b64" to the Inst_DS base
     * and flags the instruction as MemoryRef and Store.
     */
    Inst_DS__DS_WRITE2ST64_B64::Inst_DS__DS_WRITE2ST64_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write2st64_b64")
    {
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE2ST64_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_WRITE2ST64_B64::~Inst_DS__DS_WRITE2ST64_B64()
    {
    } // ~Inst_DS__DS_WRITE2ST64_B64


    // --- description from .arch file ---
    // 64b:
    // MEM[ADDR_BASE + OFFSET0 * 8 * 64] = DATA;
    // MEM[ADDR_BASE + OFFSET1 * 8 * 64] = DATA2;
    // Write 2 qwords.
    //
    // Issue stage: reads ADDR, DATA0 and DATA1, computes the per-lane
    // addresses and stores each active lane's two values in d_data at
    // slots 2 * lane and 2 * lane + 1 before handing the instruction to
    // the local memory pipeline. When no lane is active only the LGKM
    // bookkeeping is released.
    void
    Inst_DS__DS_WRITE2ST64_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // Fully masked-off instruction: nothing is sent to the pipeline.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        auto *cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU64 first(gpuDynInst, extData.DATA0);
        ConstVecOperandU64 second(gpuDynInst, extData.DATA1);

        addr.read();
        first.read();
        second.read();

        calcAddr(gpuDynInst, addr);

        // d_data is viewed as 64-bit elements, two consecutive per lane.
        auto *staged = reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);
        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }
            const int slot = lane * 2;
            staged[slot] = first[lane];
            staged[slot + 1] = second[lane];
        }

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Scale OFFSET0 and OFFSET1 by 8 * 64 and start the dual write of
     * VecElemU64 elements at those two offsets.
     */
    void
    Inst_DS__DS_WRITE2ST64_B64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // Each offset field is multiplied by 8 * 64, per the description.
        constexpr int scale = 8 * 64;

        const Addr first_off = instData.OFFSET0 * scale;
        const Addr second_off = instData.OFFSET1 * scale;

        initDualMemWrite<VecElemU64>(gpuDynInst, first_off, second_off);
    }


    /** No completion work is done here: the body is empty. */
    void
    Inst_DS__DS_WRITE2ST64_B64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
    }


    // --- Inst_DS__DS_CMPST_B64 class methods ---


    /** Forwards iFmt and "ds_cmpst_b64" to Inst_DS; sets no flags. */
    Inst_DS__DS_CMPST_B64::Inst_DS__DS_CMPST_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_cmpst_b64")
    {
    } // Inst_DS__DS_CMPST_B64


    /** Destructor with an empty body. */
    Inst_DS__DS_CMPST_B64::~Inst_DS__DS_CMPST_B64()
    {
    } // ~Inst_DS__DS_CMPST_B64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // src = DATA2;
    // cmp = DATA;
    // MEM[ADDR] = (tmp == cmp) ? src : tmp;
    // RETURN_DATA[0] = tmp.
    // Compare and store.
    // Caution, the order of src and cmp are the *opposite* of the
    // BUFFER_ATOMIC_CMPSWAP_X2 opcode.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_CMPST_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_CMPST_F64 class methods ---


    /** Forwards iFmt and "ds_cmpst_f64" to Inst_DS; sets the F64 flag. */
    Inst_DS__DS_CMPST_F64::Inst_DS__DS_CMPST_F64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_cmpst_f64")
    {
        setFlag(F64);
    } // Inst_DS__DS_CMPST_F64


    /** Destructor with an empty body. */
    Inst_DS__DS_CMPST_F64::~Inst_DS__DS_CMPST_F64()
    {
    } // ~Inst_DS__DS_CMPST_F64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // src = DATA2;
    // cmp = DATA;
    // MEM[ADDR] = (tmp == cmp) ? src : tmp;
    // RETURN_DATA[0] = tmp.
    // Floating point compare and store that handles NaN/INF/denormal values.
    // Caution, the order of src and cmp are the *opposite* of the
    // BUFFER_ATOMIC_FCMPSWAP_X2 opcode.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_CMPST_F64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_F64 class methods ---


    /** Forwards iFmt and "ds_min_f64" to Inst_DS; sets the F64 flag. */
    Inst_DS__DS_MIN_F64::Inst_DS__DS_MIN_F64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_f64")
    {
        setFlag(F64);
    } // Inst_DS__DS_MIN_F64


    /** Destructor with an empty body. */
    Inst_DS__DS_MIN_F64::~Inst_DS__DS_MIN_F64()
    {
    } // ~Inst_DS__DS_MIN_F64


    // --- description from .arch file ---
    // 64b.
    // tmp = MEM[ADDR];
    // src = DATA;
    // cmp = DATA2;
    // MEM[ADDR] = (cmp < tmp) ? src : tmp.
    // Floating point minimum that handles NaN/INF/denormal values.
    // Note that this opcode is slightly more general-purpose than
    // BUFFER_ATOMIC_FMIN_X2.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_F64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_F64 class methods ---


    /** Forwards iFmt and "ds_max_f64" to Inst_DS; sets the F64 flag. */
    Inst_DS__DS_MAX_F64::Inst_DS__DS_MAX_F64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_f64")
    {
        setFlag(F64);
    } // Inst_DS__DS_MAX_F64


    /** Destructor with an empty body. */
    Inst_DS__DS_MAX_F64::~Inst_DS__DS_MAX_F64()
    {
    } // ~Inst_DS__DS_MAX_F64


    // --- description from .arch file ---
    // 64b.
    // tmp = MEM[ADDR];
    // src = DATA;
    // cmp = DATA2;
    // MEM[ADDR] = (tmp > cmp) ? src : tmp.
    // Floating point maximum that handles NaN/INF/denormal values.
    // Note that this opcode is slightly more general-purpose than
    // BUFFER_ATOMIC_FMAX_X2.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_F64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_ADD_RTN_U64 class methods ---


    /** Forwards iFmt and "ds_add_rtn_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_ADD_RTN_U64::Inst_DS__DS_ADD_RTN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_rtn_u64")
    {
    } // Inst_DS__DS_ADD_RTN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_ADD_RTN_U64::~Inst_DS__DS_ADD_RTN_U64()
    {
    } // ~Inst_DS__DS_ADD_RTN_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] += DATA[0:1];
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_ADD_RTN_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_SUB_RTN_U64 class methods ---


    /** Forwards iFmt and "ds_sub_rtn_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_SUB_RTN_U64::Inst_DS__DS_SUB_RTN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_sub_rtn_u64")
    {
    } // Inst_DS__DS_SUB_RTN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_SUB_RTN_U64::~Inst_DS__DS_SUB_RTN_U64()
    {
    } // ~Inst_DS__DS_SUB_RTN_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= DATA[0:1];
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_SUB_RTN_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_RSUB_RTN_U64 class methods ---


    /** Forwards iFmt and "ds_rsub_rtn_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_RSUB_RTN_U64::Inst_DS__DS_RSUB_RTN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_rsub_rtn_u64")
    {
    } // Inst_DS__DS_RSUB_RTN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_RSUB_RTN_U64::~Inst_DS__DS_RSUB_RTN_U64()
    {
    } // ~Inst_DS__DS_RSUB_RTN_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = DATA - MEM[ADDR];
    // RETURN_DATA = tmp.
    // Subtraction with reversed operands.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_RSUB_RTN_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_INC_RTN_U64 class methods ---


    /** Forwards iFmt and "ds_inc_rtn_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_INC_RTN_U64::Inst_DS__DS_INC_RTN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_inc_rtn_u64")
    {
    } // Inst_DS__DS_INC_RTN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_INC_RTN_U64::~Inst_DS__DS_INC_RTN_U64()
    {
    } // ~Inst_DS__DS_INC_RTN_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (tmp >= DATA[0:1]) ? 0 : tmp + 1 (unsigned compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_INC_RTN_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_DEC_RTN_U64 class methods ---


    /** Forwards iFmt and "ds_dec_rtn_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_DEC_RTN_U64::Inst_DS__DS_DEC_RTN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_dec_rtn_u64")
    {
    } // Inst_DS__DS_DEC_RTN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_DEC_RTN_U64::~Inst_DS__DS_DEC_RTN_U64()
    {
    } // ~Inst_DS__DS_DEC_RTN_U64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] = (tmp == 0 || tmp > DATA[0:1]) ? DATA[0:1] : tmp - 1
    // (unsigned compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_DEC_RTN_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_RTN_I64 class methods ---


    /** Forwards iFmt and "ds_min_rtn_i64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MIN_RTN_I64::Inst_DS__DS_MIN_RTN_I64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_rtn_i64")
    {
    } // Inst_DS__DS_MIN_RTN_I64


    /** Destructor with an empty body. */
    Inst_DS__DS_MIN_RTN_I64::~Inst_DS__DS_MIN_RTN_I64()
    {
    } // ~Inst_DS__DS_MIN_RTN_I64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= (DATA[0:1] < tmp) ? DATA[0:1] : tmp (signed compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // NOTE(review): the "-=" above is copied verbatim; for a minimum a
    // plain "=" is presumably intended -- confirm against the ISA manual.
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MIN_RTN_I64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_RTN_I64 class methods ---


    /** Forwards iFmt and "ds_max_rtn_i64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MAX_RTN_I64::Inst_DS__DS_MAX_RTN_I64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_rtn_i64")
    {
    } // Inst_DS__DS_MAX_RTN_I64


    /** Destructor with an empty body. */
    Inst_DS__DS_MAX_RTN_I64::~Inst_DS__DS_MAX_RTN_I64()
    {
    } // ~Inst_DS__DS_MAX_RTN_I64


    // --- description from .arch file ---
    // 64b:
    // tmp = MEM[ADDR];
    // MEM[ADDR] -= (DATA[0:1] > tmp) ? DATA[0:1] : tmp (signed compare);
    // RETURN_DATA[0:1] = tmp.
    //
    // NOTE(review): the "-=" above is copied verbatim; for a maximum a
    // plain "=" is presumably intended -- confirm against the ISA manual.
    // Not modeled: the body only calls panicUnimplemented().
    void
    Inst_DS__DS_MAX_RTN_I64::execute(GPUDynInstPtr gpuDynInst)
    {
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_RTN_U64 class methods ---


    /** Forwards iFmt and "ds_min_rtn_u64" to Inst_DS; sets no flags. */
    Inst_DS__DS_MIN_RTN_U64::Inst_DS__DS_MIN_RTN_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_rtn_u64")
    {
    } // Inst_DS__DS_MIN_RTN_U64


    /** Destructor with an empty body. */
    Inst_DS__DS_MIN_RTN_U64::~Inst_DS__DS_MIN_RTN_U64()
    {
    } // ~Inst_DS__DS_MIN_RTN_U64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (DATA[0:1] < tmp) ? DATA[0:1] : tmp (unsigned compare);

    // RETURN_DATA[0:1] = tmp.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MIN_RTN_U64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MAX_RTN_U64 class methods ---


    // Constructor for the "ds_max_rtn_u64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_MAX_RTN_U64::Inst_DS__DS_MAX_RTN_U64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_max_rtn_u64")

    {

    } // Inst_DS__DS_MAX_RTN_U64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MAX_RTN_U64::~Inst_DS__DS_MAX_RTN_U64()

    {

    } // ~Inst_DS__DS_MAX_RTN_U64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (DATA[0:1] > tmp) ? DATA[0:1] : tmp (unsigned compare);

    // RETURN_DATA[0:1] = tmp.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MAX_RTN_U64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_AND_RTN_B64 class methods ---


    // Constructor for the "ds_and_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_AND_RTN_B64::Inst_DS__DS_AND_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_and_rtn_b64")

    {

    } // Inst_DS__DS_AND_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_AND_RTN_B64::~Inst_DS__DS_AND_RTN_B64()

    {

    } // ~Inst_DS__DS_AND_RTN_B64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] &= DATA[0:1];

    // RETURN_DATA[0:1] = tmp.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_AND_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_OR_RTN_B64 class methods ---


    // Constructor for the "ds_or_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_OR_RTN_B64::Inst_DS__DS_OR_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_or_rtn_b64")

    {

    } // Inst_DS__DS_OR_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_OR_RTN_B64::~Inst_DS__DS_OR_RTN_B64()

    {

    } // ~Inst_DS__DS_OR_RTN_B64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] |= DATA[0:1];

    // RETURN_DATA[0:1] = tmp.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_OR_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_XOR_RTN_B64 class methods ---


    // Constructor for the "ds_xor_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_XOR_RTN_B64::Inst_DS__DS_XOR_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_xor_rtn_b64")

    {

    } // Inst_DS__DS_XOR_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_XOR_RTN_B64::~Inst_DS__DS_XOR_RTN_B64()

    {

    } // ~Inst_DS__DS_XOR_RTN_B64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] ^= DATA[0:1];

    // RETURN_DATA[0:1] = tmp.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_XOR_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MSKOR_RTN_B64 class methods ---


    // Constructor for the "ds_mskor_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_MSKOR_RTN_B64::Inst_DS__DS_MSKOR_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_mskor_rtn_b64")

    {

    } // Inst_DS__DS_MSKOR_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MSKOR_RTN_B64::~Inst_DS__DS_MSKOR_RTN_B64()

    {

    } // ~Inst_DS__DS_MSKOR_RTN_B64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // MEM[ADDR] = (MEM[ADDR] & ~DATA) | DATA2;

    // RETURN_DATA = tmp.

    // Masked dword OR, D0 contains the mask and D1 contains the new value.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MSKOR_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_WRXCHG_RTN_B64 class methods ---


    // Constructor for the "ds_wrxchg_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_WRXCHG_RTN_B64::Inst_DS__DS_WRXCHG_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_wrxchg_rtn_b64")

    {

    } // Inst_DS__DS_WRXCHG_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_WRXCHG_RTN_B64::~Inst_DS__DS_WRXCHG_RTN_B64()

    {

    } // ~Inst_DS__DS_WRXCHG_RTN_B64


    // --- description from .arch file ---

    // tmp = MEM[ADDR];

    // MEM[ADDR] = DATA;

    // RETURN_DATA = tmp.

    // Write-exchange operation.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_WRXCHG_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_WRXCHG2_RTN_B64 class methods ---


    // Constructor for the "ds_wrxchg2_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_WRXCHG2_RTN_B64::Inst_DS__DS_WRXCHG2_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_wrxchg2_rtn_b64")

    {

    } // Inst_DS__DS_WRXCHG2_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_WRXCHG2_RTN_B64::~Inst_DS__DS_WRXCHG2_RTN_B64()

    {

    } // ~Inst_DS__DS_WRXCHG2_RTN_B64


    // --- description from .arch file ---

    // Write-exchange 2 separate qwords.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_WRXCHG2_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_WRXCHG2ST64_RTN_B64 class methods ---


    // Constructor for the "ds_wrxchg2st64_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_WRXCHG2ST64_RTN_B64::Inst_DS__DS_WRXCHG2ST64_RTN_B64(

          InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_wrxchg2st64_rtn_b64")

    {

    } // Inst_DS__DS_WRXCHG2ST64_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_WRXCHG2ST64_RTN_B64::~Inst_DS__DS_WRXCHG2ST64_RTN_B64()

    {

    } // ~Inst_DS__DS_WRXCHG2ST64_RTN_B64


    // --- description from .arch file ---

    // Write-exchange 2 qwords with a stride of 64 qwords.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_WRXCHG2ST64_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_CMPST_RTN_B64 class methods ---


    // Constructor for the "ds_cmpst_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_CMPST_RTN_B64::Inst_DS__DS_CMPST_RTN_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_cmpst_rtn_b64")

    {

    } // Inst_DS__DS_CMPST_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_CMPST_RTN_B64::~Inst_DS__DS_CMPST_RTN_B64()

    {

    } // ~Inst_DS__DS_CMPST_RTN_B64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // src = DATA2;

    // cmp = DATA;

    // MEM[ADDR] = (tmp == cmp) ? src : tmp;

    // RETURN_DATA[0:1] = tmp.

    // Compare and store.

    // Caution, the order of src and cmp are the *opposite* of the

    // ---  BUFFER_ATOMIC_CMPSWAP_X2 opcode.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_CMPST_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_CMPST_RTN_F64 class methods ---


    // Constructor for the "ds_cmpst_rtn_f64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets the F64 flag.
    Inst_DS__DS_CMPST_RTN_F64::Inst_DS__DS_CMPST_RTN_F64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_cmpst_rtn_f64")

    {

        setFlag(F64);

    } // Inst_DS__DS_CMPST_RTN_F64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_CMPST_RTN_F64::~Inst_DS__DS_CMPST_RTN_F64()

    {

    } // ~Inst_DS__DS_CMPST_RTN_F64


    // --- description from .arch file ---

    // 64b:

    // tmp = MEM[ADDR];

    // src = DATA2;

    // cmp = DATA;

    // MEM[ADDR] = (tmp == cmp) ? src : tmp;

    // RETURN_DATA[0:1] = tmp.

    // Floating point compare and store that handles NaN/INF/denormal values.

    // Caution, the order of src and cmp are the *opposite* of the

    // ---  BUFFER_ATOMIC_FCMPSWAP_X2 opcode.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_CMPST_RTN_F64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MIN_RTN_F64 class methods ---


    // Constructor for the "ds_min_rtn_f64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets the F64 flag.
    Inst_DS__DS_MIN_RTN_F64::Inst_DS__DS_MIN_RTN_F64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_min_rtn_f64")

    {

        setFlag(F64);

    } // Inst_DS__DS_MIN_RTN_F64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MIN_RTN_F64::~Inst_DS__DS_MIN_RTN_F64()

    {

    } // ~Inst_DS__DS_MIN_RTN_F64


    // --- description from .arch file ---

    // 64b.

    // tmp = MEM[ADDR];

    // src = DATA;

    // cmp = DATA2;

    // MEM[ADDR] = (cmp < tmp) ? src : tmp.

    // Floating point minimum that handles NaN/INF/denormal values.

    // Note that this opcode is slightly more general-purpose than

    // ---  BUFFER_ATOMIC_FMIN_X2.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MIN_RTN_F64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MAX_RTN_F64 class methods ---


    // Constructor for the "ds_max_rtn_f64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets the F64 flag.
    Inst_DS__DS_MAX_RTN_F64::Inst_DS__DS_MAX_RTN_F64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_max_rtn_f64")

    {

        setFlag(F64);

    } // Inst_DS__DS_MAX_RTN_F64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MAX_RTN_F64::~Inst_DS__DS_MAX_RTN_F64()

    {

    } // ~Inst_DS__DS_MAX_RTN_F64


    // --- description from .arch file ---

    // 64b.

    // tmp = MEM[ADDR];

    // src = DATA;

    // cmp = DATA2;

    // MEM[ADDR] = (tmp > cmp) ? src : tmp.

    // Floating point maximum that handles NaN/INF/denormal values.

    // Note that this opcode is slightly more general-purpose than

    // ---  BUFFER_ATOMIC_FMAX_X2.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MAX_RTN_F64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_READ_B64 class methods ---


    // Constructor for the "ds_read_b64" opcode: passes iFmt and the mnemonic
    // to the Inst_DS base class, then sets the MemoryRef and Load flags.
    Inst_DS__DS_READ_B64::Inst_DS__DS_READ_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_read_b64")

    {

        setFlag(MemoryRef);

        setFlag(Load);

    } // Inst_DS__DS_READ_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_READ_B64::~Inst_DS__DS_READ_B64()

    {

    } // ~Inst_DS__DS_READ_B64


    // --- description from .arch file ---

    // RETURN_DATA = MEM[ADDR].

    // Read 1 qword.

    /**
     * Issue stage of ds_read_b64. If no lane is enabled in the exec mask the
     * wavefront's issued-LGKM count is decremented, the instruction is
     * untracked, and nothing is issued. Otherwise the latency is set to 24
     * cycles (converted to ticks), addresses are computed from the ADDR
     * operand, and the request goes to the local memory pipeline.
     */
    void
    Inst_DS__DS_READ_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            // Nothing to read: drop this instruction from LGKM bookkeeping.
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        gpuDynInst->execUnitId = wave->execUnitId;

        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const auto issueLatency =
            gpuDynInst->computeUnit()->cyclesToTicks(Cycles(24));
        gpuDynInst->latency.set(issueLatency);

        // Fetch the per-lane base addresses before computing final ones.
        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ldsAddr.read();
        calcAddr(gpuDynInst, ldsAddr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Starts the memory read. OFFSET1 and OFFSET0 are combined into a single
     * offset as (OFFSET1 << 8) | OFFSET0, and one VecElemU64 read is
     * initiated at that offset.
     */
    void
    Inst_DS__DS_READ_B64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr lowBits = instData.OFFSET0;
        const Addr highBits = instData.OFFSET1;
        const Addr combined = (highBits << 8) | lowBits;

        initMemRead<VecElemU64>(gpuDynInst, combined);
    } // initiateAcc


    /**
     * Write-back stage: for every lane enabled in the exec mask, copies the
     * lane's 64-bit element out of the d_data buffer into VDST, then calls
     * write() on the destination operand.
     */
    void
    Inst_DS__DS_READ_B64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU64 vdst(gpuDynInst, extData.VDST);
        VecElemU64 *loaded =
            reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue; // disabled lanes are skipped
            }
            vdst[lane] = loaded[lane];
        }

        vdst.write();
    } // completeAcc


    // --- Inst_DS__DS_READ2_B64 class methods ---


    // Constructor for the "ds_read2_b64" opcode: passes iFmt and the mnemonic
    // to the Inst_DS base class, then sets the MemoryRef and Load flags.
    Inst_DS__DS_READ2_B64::Inst_DS__DS_READ2_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_read2_b64")

    {

        setFlag(MemoryRef);

        setFlag(Load);

    } // Inst_DS__DS_READ2_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_READ2_B64::~Inst_DS__DS_READ2_B64()

    {

    } // ~Inst_DS__DS_READ2_B64


    // --- description from .arch file ---

    // RETURN_DATA[0] = MEM[ADDR_BASE + OFFSET0 * 8];

    // RETURN_DATA[1] = MEM[ADDR_BASE + OFFSET1 * 8].

    // Read 2 qwords.

    /**
     * Issue stage of ds_read2_b64. If no lane is enabled in the exec mask the
     * wavefront's issued-LGKM count is decremented, the instruction is
     * untracked, and nothing is issued. Otherwise the latency is set to 24
     * cycles (converted to ticks), addresses are computed from the ADDR
     * operand, and the request goes to the local memory pipeline.
     */
    void
    Inst_DS__DS_READ2_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            // Nothing to read: drop this instruction from LGKM bookkeeping.
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        gpuDynInst->execUnitId = wave->execUnitId;

        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const auto issueLatency =
            gpuDynInst->computeUnit()->cyclesToTicks(Cycles(24));
        gpuDynInst->latency.set(issueLatency);

        // Fetch the per-lane base addresses before computing final ones.
        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ldsAddr.read();
        calcAddr(gpuDynInst, ldsAddr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Starts the dual memory read. Each of OFFSET0 and OFFSET1 is scaled by
     * 8 and the pair is passed to initDualMemRead for VecElemU64 elements.
     */
    void
    Inst_DS__DS_READ2_B64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr firstOffset = instData.OFFSET0 * 8;
        const Addr secondOffset = instData.OFFSET1 * 8;

        initDualMemRead<VecElemU64>(gpuDynInst, firstOffset, secondOffset);
    } // initiateAcc


    /**
     * Write-back stage: d_data is read as interleaved 64-bit pairs. For each
     * enabled lane, element 2*lane goes to VDST and element 2*lane + 1 goes
     * to the operand at VDST + 2; both operands are then written.
     */
    void
    Inst_DS__DS_READ2_B64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU64 vdst0(gpuDynInst, extData.VDST);
        VecOperandU64 vdst1(gpuDynInst, extData.VDST + 2);
        VecElemU64 *loaded =
            reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue; // disabled lanes are skipped
            }
            vdst0[lane] = loaded[lane * 2];
            vdst1[lane] = loaded[lane * 2 + 1];
        }

        vdst0.write();
        vdst1.write();
    } // completeAcc


    // --- Inst_DS__DS_READ2ST64_B64 class methods ---


    // Constructor for the "ds_read2st64_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets MemoryRef and Load.
    Inst_DS__DS_READ2ST64_B64::Inst_DS__DS_READ2ST64_B64(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_read2st64_b64")

    {

        setFlag(MemoryRef);

        setFlag(Load);

    } // Inst_DS__DS_READ2ST64_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_READ2ST64_B64::~Inst_DS__DS_READ2ST64_B64()

    {

    } // ~Inst_DS__DS_READ2ST64_B64


    // --- description from .arch file ---

    // RETURN_DATA[0] = MEM[ADDR_BASE + OFFSET0 * 8 * 64];

    // RETURN_DATA[1] = MEM[ADDR_BASE + OFFSET1 * 8 * 64].

    // Read 2 qwords.

    /**
     * Issue stage of ds_read2st64_b64. If no lane is enabled in the exec
     * mask the wavefront's issued-LGKM count is decremented, the instruction
     * is untracked, and nothing is issued. Otherwise the latency is set to
     * 24 cycles (converted to ticks), addresses are computed from the ADDR
     * operand, and the request goes to the local memory pipeline.
     */
    void
    Inst_DS__DS_READ2ST64_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        if (gpuDynInst->exec_mask.none()) {
            // Nothing to read: drop this instruction from LGKM bookkeeping.
            wave->decLGKMInstsIssued();
            wave->untrackLGKMInst(gpuDynInst);
            return;
        }

        gpuDynInst->execUnitId = wave->execUnitId;

        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const auto issueLatency =
            gpuDynInst->computeUnit()->cyclesToTicks(Cycles(24));
        gpuDynInst->latency.set(issueLatency);

        // Fetch the per-lane base addresses before computing final ones.
        ConstVecOperandU32 ldsAddr(gpuDynInst, extData.ADDR);
        ldsAddr.read();
        calcAddr(gpuDynInst, ldsAddr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    /**
     * Starts the dual memory read. Each of OFFSET0 and OFFSET1 is scaled by
     * 8 * 64 and the pair is passed to initDualMemRead for VecElemU64
     * elements.
     */
    void
    Inst_DS__DS_READ2ST64_B64::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        const Addr firstOffset = (instData.OFFSET0 * 8 * 64);
        const Addr secondOffset = (instData.OFFSET1 * 8 * 64);

        initDualMemRead<VecElemU64>(gpuDynInst, firstOffset, secondOffset);
    } // initiateAcc


    /**
     * Write-back stage: d_data is read as interleaved 64-bit pairs. For each
     * enabled lane, element 2*lane goes to VDST and element 2*lane + 1 goes
     * to the operand at VDST + 2; both operands are then written.
     */
    void
    Inst_DS__DS_READ2ST64_B64::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU64 vdst0(gpuDynInst, extData.VDST);
        VecOperandU64 vdst1(gpuDynInst, extData.VDST + 2);
        VecElemU64 *loaded =
            reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue; // disabled lanes are skipped
            }
            vdst0[lane] = loaded[lane * 2];
            vdst1[lane] = loaded[lane * 2 + 1];
        }

        vdst0.write();
        vdst1.write();
    } // completeAcc


    // --- Inst_DS__DS_CONDXCHG32_RTN_B64 class methods ---


    // Constructor for the "ds_condxchg32_rtn_b64" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_CONDXCHG32_RTN_B64::Inst_DS__DS_CONDXCHG32_RTN_B64(

          InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_condxchg32_rtn_b64")

    {

    } // Inst_DS__DS_CONDXCHG32_RTN_B64


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_CONDXCHG32_RTN_B64::~Inst_DS__DS_CONDXCHG32_RTN_B64()

    {

    } // ~Inst_DS__DS_CONDXCHG32_RTN_B64


    // --- description from .arch file ---

    // Conditional write exchange.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_CONDXCHG32_RTN_B64::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_ADD_SRC2_U32 class methods ---


    // Constructor for the "ds_add_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_ADD_SRC2_U32::Inst_DS__DS_ADD_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_add_src2_u32")

    {

    } // Inst_DS__DS_ADD_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_ADD_SRC2_U32::~Inst_DS__DS_ADD_SRC2_U32()

    {

    } // ~Inst_DS__DS_ADD_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] + MEM[B].

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_ADD_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_SUB_SRC2_U32 class methods ---


    // Constructor for the "ds_sub_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_SUB_SRC2_U32::Inst_DS__DS_SUB_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_sub_src2_u32")

    {

    } // Inst_DS__DS_SUB_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_SUB_SRC2_U32::~Inst_DS__DS_SUB_SRC2_U32()

    {

    } // ~Inst_DS__DS_SUB_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] - MEM[B].

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_SUB_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_RSUB_SRC2_U32 class methods ---


    // Constructor for the "ds_rsub_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_RSUB_SRC2_U32::Inst_DS__DS_RSUB_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_rsub_src2_u32")

    {

    } // Inst_DS__DS_RSUB_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_RSUB_SRC2_U32::~Inst_DS__DS_RSUB_SRC2_U32()

    {

    } // ~Inst_DS__DS_RSUB_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[B] - MEM[A].

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_RSUB_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_INC_SRC2_U32 class methods ---


    // Constructor for the "ds_inc_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_INC_SRC2_U32::Inst_DS__DS_INC_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_inc_src2_u32")

    {

    } // Inst_DS__DS_INC_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_INC_SRC2_U32::~Inst_DS__DS_INC_SRC2_U32()

    {

    } // ~Inst_DS__DS_INC_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[A] >= MEM[B] ? 0 : MEM[A] + 1).

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_INC_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_DEC_SRC2_U32 class methods ---


    // Constructor for the "ds_dec_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_DEC_SRC2_U32::Inst_DS__DS_DEC_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_dec_src2_u32")

    {

    } // Inst_DS__DS_DEC_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_DEC_SRC2_U32::~Inst_DS__DS_DEC_SRC2_U32()

    {

    } // ~Inst_DS__DS_DEC_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[A] == 0 || MEM[A] > MEM[B] ? MEM[B] : MEM[A] - 1).

    // Uint decrement.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_DEC_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MIN_SRC2_I32 class methods ---


    // Constructor for the "ds_min_src2_i32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_MIN_SRC2_I32::Inst_DS__DS_MIN_SRC2_I32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_min_src2_i32")

    {

    } // Inst_DS__DS_MIN_SRC2_I32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MIN_SRC2_I32::~Inst_DS__DS_MIN_SRC2_I32()

    {

    } // ~Inst_DS__DS_MIN_SRC2_I32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = min(MEM[A], MEM[B]).

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MIN_SRC2_I32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MAX_SRC2_I32 class methods ---


    // Constructor for the "ds_max_src2_i32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_MAX_SRC2_I32::Inst_DS__DS_MAX_SRC2_I32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_max_src2_i32")

    {

    } // Inst_DS__DS_MAX_SRC2_I32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MAX_SRC2_I32::~Inst_DS__DS_MAX_SRC2_I32()

    {

    } // ~Inst_DS__DS_MAX_SRC2_I32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = max(MEM[A], MEM[B]).

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MAX_SRC2_I32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MIN_SRC2_U32 class methods ---


    // Constructor for the "ds_min_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_MIN_SRC2_U32::Inst_DS__DS_MIN_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_min_src2_u32")

    {

    } // Inst_DS__DS_MIN_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MIN_SRC2_U32::~Inst_DS__DS_MIN_SRC2_U32()

    {

    } // ~Inst_DS__DS_MIN_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = min(MEM[A], MEM[B]).

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MIN_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MAX_SRC2_U32 class methods ---


    // Constructor for the "ds_max_src2_u32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_MAX_SRC2_U32::Inst_DS__DS_MAX_SRC2_U32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_max_src2_u32")

    {

    } // Inst_DS__DS_MAX_SRC2_U32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MAX_SRC2_U32::~Inst_DS__DS_MAX_SRC2_U32()

    {

    } // ~Inst_DS__DS_MAX_SRC2_U32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = max(MEM[A], MEM[B]).

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MAX_SRC2_U32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_AND_SRC2_B32 class methods ---


    // Constructor for the "ds_and_src2_b32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_AND_SRC2_B32::Inst_DS__DS_AND_SRC2_B32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_and_src2_b32")

    {

    } // Inst_DS__DS_AND_SRC2_B32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_AND_SRC2_B32::~Inst_DS__DS_AND_SRC2_B32()

    {

    } // ~Inst_DS__DS_AND_SRC2_B32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] & MEM[B].

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_AND_SRC2_B32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_OR_SRC2_B32 class methods ---


    // Constructor for the "ds_or_src2_b32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_OR_SRC2_B32::Inst_DS__DS_OR_SRC2_B32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_or_src2_b32")

    {

    } // Inst_DS__DS_OR_SRC2_B32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_OR_SRC2_B32::~Inst_DS__DS_OR_SRC2_B32()

    {

    } // ~Inst_DS__DS_OR_SRC2_B32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] | MEM[B].

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_OR_SRC2_B32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_XOR_SRC2_B32 class methods ---


    // Constructor for the "ds_xor_src2_b32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_XOR_SRC2_B32::Inst_DS__DS_XOR_SRC2_B32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_xor_src2_b32")

    {

    } // Inst_DS__DS_XOR_SRC2_B32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_XOR_SRC2_B32::~Inst_DS__DS_XOR_SRC2_B32()

    {

    } // ~Inst_DS__DS_XOR_SRC2_B32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] ^ MEM[B].

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_XOR_SRC2_B32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_WRITE_SRC2_B32 class methods ---


    // Constructor for the "ds_write_src2_b32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets MemoryRef and Store.
    Inst_DS__DS_WRITE_SRC2_B32::Inst_DS__DS_WRITE_SRC2_B32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_write_src2_b32")

    {

        setFlag(MemoryRef);

        setFlag(Store);

    } // Inst_DS__DS_WRITE_SRC2_B32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_WRITE_SRC2_B32::~Inst_DS__DS_WRITE_SRC2_B32()

    {

    } // ~Inst_DS__DS_WRITE_SRC2_B32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[B].

    // Write dword.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_WRITE_SRC2_B32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MIN_SRC2_F32 class methods ---


    // Constructor for the "ds_min_src2_f32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets the F32 flag.
    Inst_DS__DS_MIN_SRC2_F32::Inst_DS__DS_MIN_SRC2_F32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_min_src2_f32")

    {

        setFlag(F32);

    } // Inst_DS__DS_MIN_SRC2_F32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MIN_SRC2_F32::~Inst_DS__DS_MIN_SRC2_F32()

    {

    } // ~Inst_DS__DS_MIN_SRC2_F32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[B] < MEM[A]) ? MEM[B] : MEM[A].

    // Float, handles NaN/INF/denorm.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MIN_SRC2_F32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_MAX_SRC2_F32 class methods ---


    // Constructor for the "ds_max_src2_f32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets the F32 flag.
    Inst_DS__DS_MAX_SRC2_F32::Inst_DS__DS_MAX_SRC2_F32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_max_src2_f32")

    {

        setFlag(F32);

    } // Inst_DS__DS_MAX_SRC2_F32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_MAX_SRC2_F32::~Inst_DS__DS_MAX_SRC2_F32()

    {

    } // ~Inst_DS__DS_MAX_SRC2_F32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[B] > MEM[A]) ? MEM[B] : MEM[A].

    // Float, handles NaN/INF/denorm.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_MAX_SRC2_F32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_ADD_SRC2_F32 class methods ---


    // Constructor for the "ds_add_src2_f32" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class, then sets the F32 flag.
    Inst_DS__DS_ADD_SRC2_F32::Inst_DS__DS_ADD_SRC2_F32(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_add_src2_f32")

    {

        setFlag(F32);

    } // Inst_DS__DS_ADD_SRC2_F32


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_ADD_SRC2_F32::~Inst_DS__DS_ADD_SRC2_F32()

    {

    } // ~Inst_DS__DS_ADD_SRC2_F32


    // --- description from .arch file ---

    // 32b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[B] + MEM[A].

    // Float, handles NaN/INF/denorm.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_ADD_SRC2_F32::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_GWS_SEMA_RELEASE_ALL class methods ---


    // Constructor for the "ds_gws_sema_release_all" opcode: passes iFmt and
    // the mnemonic to the Inst_DS base class. The body is empty (no flags).
    Inst_DS__DS_GWS_SEMA_RELEASE_ALL::Inst_DS__DS_GWS_SEMA_RELEASE_ALL(

          InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_gws_sema_release_all")

    {

    } // Inst_DS__DS_GWS_SEMA_RELEASE_ALL


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_GWS_SEMA_RELEASE_ALL::~Inst_DS__DS_GWS_SEMA_RELEASE_ALL()

    {

    } // ~Inst_DS__DS_GWS_SEMA_RELEASE_ALL


    // --- description from .arch file ---

    // GDS Only: The GWS resource (rid) indicated will process this opcode by

    // updating the counter and labeling the specified resource as a semaphore.

    // //Determine the GWS resource to work on

    // rid[5:0] = SH_SX_EXPCMD.gds_base[5:0] + offset0[5:0];

    // //Incr the state counter of the resource

    // state.counter[rid] = state.wave_in_queue;

    // state.type = SEMAPHORE;

    // return rd_done; //release calling wave

    // This action will release ALL queued waves; it will have no effect if no

    // ---  waves are present.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_GWS_SEMA_RELEASE_ALL::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_GWS_INIT class methods ---


    // Constructor for the "ds_gws_init" opcode: passes iFmt and the mnemonic
    // to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_GWS_INIT::Inst_DS__DS_GWS_INIT(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_gws_init")

    {

    } // Inst_DS__DS_GWS_INIT


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_GWS_INIT::~Inst_DS__DS_GWS_INIT()

    {

    } // ~Inst_DS__DS_GWS_INIT


    // --- description from .arch file ---

    // GDS Only: Initialize a barrier or semaphore resource.

    // //Determine the GWS resource to work on

    // rid[5:0] = SH_SX_EXPCMD.gds_base[5:0] + offset0[5:0];

    // //Get the value to use in init

    // index = find_first_valid(vector mask)

    // value = DATA[thread: index]

    // //Set the state of the resource

    // state.counter[rid] = lsb(value); //limit #waves

    // state.flag[rid] = 0;

    // return rd_done; //release calling wave

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_GWS_INIT::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_GWS_SEMA_V class methods ---


    // Constructor for the "ds_gws_sema_v" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_GWS_SEMA_V::Inst_DS__DS_GWS_SEMA_V(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_gws_sema_v")

    {

    } // Inst_DS__DS_GWS_SEMA_V


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_GWS_SEMA_V::~Inst_DS__DS_GWS_SEMA_V()

    {

    } // ~Inst_DS__DS_GWS_SEMA_V


    // --- description from .arch file ---

    // GDS Only: The GWS resource indicated will process this opcode by

    // updating the counter and labeling the resource as a semaphore.

    // //Determine the GWS resource to work on

    // rid[5:0] = SH_SX_EXPCMD.gds_base[5:0] + offset0[5:0];

    // //Incr the state counter of the resource

    // state.counter[rid]++;

    // state.type = SEMAPHORE;

    // return rd_done; //release calling wave

    // This action will release one wave if any are queued in this resource.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_GWS_SEMA_V::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_GWS_SEMA_BR class methods ---


    // Constructor for the "ds_gws_sema_br" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_GWS_SEMA_BR::Inst_DS__DS_GWS_SEMA_BR(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_gws_sema_br")

    {

    } // Inst_DS__DS_GWS_SEMA_BR


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_GWS_SEMA_BR::~Inst_DS__DS_GWS_SEMA_BR()

    {

    } // ~Inst_DS__DS_GWS_SEMA_BR


    // --- description from .arch file ---

    // GDS Only: The GWS resource indicated will process this opcode by

    // updating the counter by the bulk release delivered count and labeling

    // the resource as a semaphore.

    // //Determine the GWS resource to work on

    // rid[5:0] = SH_SX_EXPCMD.gds_base[5:0] + offset0[5:0];

    // index =  find first valid (vector mask)

    // count = DATA[thread: index];

    // //Add count to the resource state counter

    // state.counter[rid] += count;

    // state.type = SEMAPHORE;

    // return rd_done; //release calling wave

    // This action will release count number of waves, immediately if queued,

    // or as they arrive from the noted resource.

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_GWS_SEMA_BR::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_GWS_SEMA_P class methods ---


    // Constructor for the "ds_gws_sema_p" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_GWS_SEMA_P::Inst_DS__DS_GWS_SEMA_P(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_gws_sema_p")

    {

    } // Inst_DS__DS_GWS_SEMA_P


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_GWS_SEMA_P::~Inst_DS__DS_GWS_SEMA_P()

    {

    } // ~Inst_DS__DS_GWS_SEMA_P


    // --- description from .arch file ---

    // GDS Only: The GWS resource indicated will process this opcode by

    // queueing it until counter enables a release and then decrementing the

    // counter of the resource as a semaphore.

    // //Determine the GWS resource to work on

    // rid[5:0] = SH_SX_EXPCMD.gds_base[5:0] + offset0[5:0];

    // state.type = SEMAPHORE;

    // ENQUEUE until(state[rid].counter > 0)

    // state[rid].counter--;

    // return rd_done

    // Not implemented in this model: the body only calls panicUnimplemented().
    void


    Inst_DS__DS_GWS_SEMA_P::execute(GPUDynInstPtr gpuDynInst)

    {

        panicUnimplemented();

    } // execute


    // --- Inst_DS__DS_GWS_BARRIER class methods ---


    // Constructor for the "ds_gws_barrier" opcode: passes iFmt and the
    // mnemonic to the Inst_DS base class. The body is empty (no flags set).
    Inst_DS__DS_GWS_BARRIER::Inst_DS__DS_GWS_BARRIER(InFmt_DS *iFmt)

        : Inst_DS(iFmt, "ds_gws_barrier")

    {

    } // Inst_DS__DS_GWS_BARRIER


    // Destructor; the body is empty (no class-specific cleanup).
    Inst_DS__DS_GWS_BARRIER::~Inst_DS__DS_GWS_BARRIER()

    {

    } // ~Inst_DS__DS_GWS_BARRIER


    // --- description from .arch file ---

    // GDS Only: The GWS resource indicated will process this opcode by

    // queueing it until barrier is satisfied. The number of waves needed is

    // passed in as DATA of first valid thread.

    // //Determine the GWS resource to work on

    // rid[5:0] = SH_SX_EXPCMD.gds_base[5:0] + OFFSET0[5:0];

    // index =  find first valid (vector mask);

    // value = DATA[thread: index];

    // // Input Decision Machine

    // state.type[rid] = BARRIER;

    // if (state[rid].counter <= 0) {

    //     thread[rid].flag = state[rid].flag;

    //     ENQUEUE;

    //     state[rid].flag = !state.flag;

    //     state[rid].counter = value;

    //     return rd_done;

    // } else {

    //     state[rid].counter--;

    //     thread.flag = state[rid].flag;

    //     ENQUEUE;

    // }

    // Since the waves deliver the count for the next barrier, this function

    // can have a different size barrier for each occurrence.

    // // Release Machine

    // if (state.type == BARRIER) {

    //     if (state.flag != thread.flag) {

    //         return rd_done;

    //     }

    // }

    void
    Inst_DS__DS_GWS_BARRIER::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_CONSUME class methods ---


    // Forwards iFmt and the opcode string "ds_consume" to the Inst_DS
    // base; no flags are set in this constructor.
    Inst_DS__DS_CONSUME::Inst_DS__DS_CONSUME(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_consume")
    {
    } // Inst_DS__DS_CONSUME


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_CONSUME::~Inst_DS__DS_CONSUME()
    {
    } // ~Inst_DS__DS_CONSUME


    // --- description from .arch file ---

    // LDS & GDS. Subtract (count_bits(exec_mask)) from the value stored in DS

    // memory at (M0.base + instr_offset). Return the pre-operation value to

    // VGPRs.

    void
    Inst_DS__DS_CONSUME::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_APPEND class methods ---


    // Forwards iFmt and the opcode string "ds_append" to the Inst_DS
    // base; no flags are set in this constructor.
    Inst_DS__DS_APPEND::Inst_DS__DS_APPEND(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_append")
    {
    } // Inst_DS__DS_APPEND


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_APPEND::~Inst_DS__DS_APPEND()
    {
    } // ~Inst_DS__DS_APPEND


    // --- description from .arch file ---

    // LDS & GDS. Add (count_bits(exec_mask)) to the value stored in DS memory

    // at (M0.base + instr_offset). Return the pre-operation value to VGPRs.

    void
    Inst_DS__DS_APPEND::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_ORDERED_COUNT class methods ---


    // Forwards iFmt and the opcode string "ds_ordered_count" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_ORDERED_COUNT::Inst_DS__DS_ORDERED_COUNT(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_ordered_count")
    {
    } // Inst_DS__DS_ORDERED_COUNT


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_ORDERED_COUNT::~Inst_DS__DS_ORDERED_COUNT()
    {
    } // ~Inst_DS__DS_ORDERED_COUNT


    // --- description from .arch file ---

    // GDS-only. Add (count_bits(exec_mask)) to one of 4 dedicated

    // ordered-count counters (aka 'packers'). Additional bits of instr.offset

    // field are overloaded to hold packer-id, 'last'.

    void
    Inst_DS__DS_ORDERED_COUNT::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_ADD_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_add_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_ADD_SRC2_U64::Inst_DS__DS_ADD_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_add_src2_u64")
    {
    } // Inst_DS__DS_ADD_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_ADD_SRC2_U64::~Inst_DS__DS_ADD_SRC2_U64()
    {
    } // ~Inst_DS__DS_ADD_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] + MEM[B].

    void
    Inst_DS__DS_ADD_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_SUB_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_sub_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_SUB_SRC2_U64::Inst_DS__DS_SUB_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_sub_src2_u64")
    {
    } // Inst_DS__DS_SUB_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_SUB_SRC2_U64::~Inst_DS__DS_SUB_SRC2_U64()
    {
    } // ~Inst_DS__DS_SUB_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] - MEM[B].

    void
    Inst_DS__DS_SUB_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_RSUB_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_rsub_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_RSUB_SRC2_U64::Inst_DS__DS_RSUB_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_rsub_src2_u64")
    {
    } // Inst_DS__DS_RSUB_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_RSUB_SRC2_U64::~Inst_DS__DS_RSUB_SRC2_U64()
    {
    } // ~Inst_DS__DS_RSUB_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[B] - MEM[A].

    void
    Inst_DS__DS_RSUB_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_INC_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_inc_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_INC_SRC2_U64::Inst_DS__DS_INC_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_inc_src2_u64")
    {
    } // Inst_DS__DS_INC_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_INC_SRC2_U64::~Inst_DS__DS_INC_SRC2_U64()
    {
    } // ~Inst_DS__DS_INC_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[A] >= MEM[B] ? 0 : MEM[A] + 1).

    void
    Inst_DS__DS_INC_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_DEC_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_dec_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_DEC_SRC2_U64::Inst_DS__DS_DEC_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_dec_src2_u64")
    {
    } // Inst_DS__DS_DEC_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_DEC_SRC2_U64::~Inst_DS__DS_DEC_SRC2_U64()
    {
    } // ~Inst_DS__DS_DEC_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[A] == 0 || MEM[A] > MEM[B] ? MEM[B] : MEM[A] - 1).

    // Uint decrement.

    void
    Inst_DS__DS_DEC_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_SRC2_I64 class methods ---


    // Forwards iFmt and the opcode string "ds_min_src2_i64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_MIN_SRC2_I64::Inst_DS__DS_MIN_SRC2_I64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_src2_i64")
    {
    } // Inst_DS__DS_MIN_SRC2_I64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_MIN_SRC2_I64::~Inst_DS__DS_MIN_SRC2_I64()
    {
    } // ~Inst_DS__DS_MIN_SRC2_I64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = min(MEM[A], MEM[B]).

    void
    Inst_DS__DS_MIN_SRC2_I64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_SRC2_I64 class methods ---


    // Forwards iFmt and the opcode string "ds_max_src2_i64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_MAX_SRC2_I64::Inst_DS__DS_MAX_SRC2_I64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_src2_i64")
    {
    } // Inst_DS__DS_MAX_SRC2_I64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_MAX_SRC2_I64::~Inst_DS__DS_MAX_SRC2_I64()
    {
    } // ~Inst_DS__DS_MAX_SRC2_I64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = max(MEM[A], MEM[B]).

    void
    Inst_DS__DS_MAX_SRC2_I64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_min_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_MIN_SRC2_U64::Inst_DS__DS_MIN_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_src2_u64")
    {
    } // Inst_DS__DS_MIN_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_MIN_SRC2_U64::~Inst_DS__DS_MIN_SRC2_U64()
    {
    } // ~Inst_DS__DS_MIN_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = min(MEM[A], MEM[B]).

    void
    Inst_DS__DS_MIN_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_SRC2_U64 class methods ---


    // Forwards iFmt and the opcode string "ds_max_src2_u64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_MAX_SRC2_U64::Inst_DS__DS_MAX_SRC2_U64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_src2_u64")
    {
    } // Inst_DS__DS_MAX_SRC2_U64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_MAX_SRC2_U64::~Inst_DS__DS_MAX_SRC2_U64()
    {
    } // ~Inst_DS__DS_MAX_SRC2_U64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = max(MEM[A], MEM[B]).

    void
    Inst_DS__DS_MAX_SRC2_U64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_AND_SRC2_B64 class methods ---


    // Forwards iFmt and the opcode string "ds_and_src2_b64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_AND_SRC2_B64::Inst_DS__DS_AND_SRC2_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_and_src2_b64")
    {
    } // Inst_DS__DS_AND_SRC2_B64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_AND_SRC2_B64::~Inst_DS__DS_AND_SRC2_B64()
    {
    } // ~Inst_DS__DS_AND_SRC2_B64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] & MEM[B].

    void
    Inst_DS__DS_AND_SRC2_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_OR_SRC2_B64 class methods ---


    // Forwards iFmt and the opcode string "ds_or_src2_b64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_OR_SRC2_B64::Inst_DS__DS_OR_SRC2_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_or_src2_b64")
    {
    } // Inst_DS__DS_OR_SRC2_B64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_OR_SRC2_B64::~Inst_DS__DS_OR_SRC2_B64()
    {
    } // ~Inst_DS__DS_OR_SRC2_B64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] | MEM[B].

    void
    Inst_DS__DS_OR_SRC2_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_XOR_SRC2_B64 class methods ---


    // Forwards iFmt and the opcode string "ds_xor_src2_b64" to the
    // Inst_DS base; no flags are set in this constructor.
    Inst_DS__DS_XOR_SRC2_B64::Inst_DS__DS_XOR_SRC2_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_xor_src2_b64")
    {
    } // Inst_DS__DS_XOR_SRC2_B64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_XOR_SRC2_B64::~Inst_DS__DS_XOR_SRC2_B64()
    {
    } // ~Inst_DS__DS_XOR_SRC2_B64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[A] ^ MEM[B].

    void
    Inst_DS__DS_XOR_SRC2_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_WRITE_SRC2_B64 class methods ---


    // Forwards iFmt and the opcode string "ds_write_src2_b64" to the
    // Inst_DS base, then sets the MemoryRef and Store flags.
    Inst_DS__DS_WRITE_SRC2_B64::Inst_DS__DS_WRITE_SRC2_B64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_src2_b64")
    {
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_SRC2_B64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_WRITE_SRC2_B64::~Inst_DS__DS_WRITE_SRC2_B64()
    {
    } // ~Inst_DS__DS_WRITE_SRC2_B64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = MEM[B].

    // Write qword.

    void
    Inst_DS__DS_WRITE_SRC2_B64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MIN_SRC2_F64 class methods ---


    // Forwards iFmt and the opcode string "ds_min_src2_f64" to the
    // Inst_DS base, then sets the F64 flag.
    Inst_DS__DS_MIN_SRC2_F64::Inst_DS__DS_MIN_SRC2_F64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_min_src2_f64")
    {
        setFlag(F64);
    } // Inst_DS__DS_MIN_SRC2_F64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_MIN_SRC2_F64::~Inst_DS__DS_MIN_SRC2_F64()
    {
    } // ~Inst_DS__DS_MIN_SRC2_F64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[B] < MEM[A]) ? MEM[B] : MEM[A].

    // Float, handles NaN/INF/denorm.

    void
    Inst_DS__DS_MIN_SRC2_F64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_MAX_SRC2_F64 class methods ---


    // Forwards iFmt and the opcode string "ds_max_src2_f64" to the
    // Inst_DS base, then sets the F64 flag.
    Inst_DS__DS_MAX_SRC2_F64::Inst_DS__DS_MAX_SRC2_F64(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_max_src2_f64")
    {
        setFlag(F64);
    } // Inst_DS__DS_MAX_SRC2_F64


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_MAX_SRC2_F64::~Inst_DS__DS_MAX_SRC2_F64()
    {
    } // ~Inst_DS__DS_MAX_SRC2_F64


    // --- description from .arch file ---

    // 64b:

    // A = ADDR_BASE;

    // B = A + 4*(offset1[7] ? {A[31],A[31:17]} :

    // ---  {offset1[6],offset1[6:0],offset0});

    // MEM[A] = (MEM[B] > MEM[A]) ? MEM[B] : MEM[A].

    // Float, handles NaN/INF/denorm.

    void
    Inst_DS__DS_MAX_SRC2_F64::execute(GPUDynInstPtr gpuDynInst)
    {
        // Not implemented: gpuDynInst is unused and the only action is
        // the panicUnimplemented() call.
        panicUnimplemented();
    } // execute


    // --- Inst_DS__DS_WRITE_B96 class methods ---


    // Forwards iFmt and the opcode string "ds_write_b96" to the Inst_DS
    // base, then sets the MemoryRef and Store flags.
    Inst_DS__DS_WRITE_B96::Inst_DS__DS_WRITE_B96(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b96")
    {
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B96


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_WRITE_B96::~Inst_DS__DS_WRITE_B96()
    {
    } // ~Inst_DS__DS_WRITE_B96


    // --- description from .arch file ---

    // {MEM[ADDR + 8], MEM[ADDR + 4], MEM[ADDR]} = DATA[95:0].

    // Tri-dword write.

    void
    Inst_DS__DS_WRITE_B96::execute(GPUDynInstPtr gpuDynInst)
    {
        // Tie the instruction to its wavefront's execution unit and give
        // it a latency of 24 compute-unit cycles.
        Wavefront *wave = gpuDynInst->wavefront();
        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const Cycles issueLatency(24);
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(issueLatency));

        // Sources: the address register and the three consecutive data
        // registers starting at DATA0.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 dwordLo(gpuDynInst, extData.DATA0);
        ConstVecOperandU32 dwordMid(gpuDynInst, extData.DATA0 + 1);
        ConstVecOperandU32 dwordHi(gpuDynInst, extData.DATA0 + 2);

        addr.read();
        dwordLo.read();
        dwordMid.read();
        dwordHi.read();

        calcAddr(gpuDynInst, addr);

        // Stage the payload in d_data as three dwords per lane; lanes
        // masked off in exec_mask are left untouched.
        VecElemU32 *const staged =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }

            VecElemU32 *const slot = staged + lane * 3;
            slot[0] = dwordLo[lane];
            slot[1] = dwordMid[lane];
            slot[2] = dwordHi[lane];
        }

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_WRITE_B96::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The offset is OFFSET1 shifted left by 8, OR-ed with OFFSET0.
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;

        // Three-dword write at that offset.
        initMemWrite<3>(gpuDynInst, (upper << 8) | lower);
    } // initiateAcc


    void
    Inst_DS__DS_WRITE_B96::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: no completion work is done for this write.
    } // completeAcc


    // --- Inst_DS__DS_WRITE_B128 class methods ---


    // Forwards iFmt and the opcode string "ds_write_b128" to the Inst_DS
    // base, then sets the MemoryRef and Store flags.
    Inst_DS__DS_WRITE_B128::Inst_DS__DS_WRITE_B128(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_write_b128")
    {
        setFlag(MemoryRef);
        setFlag(Store);
    } // Inst_DS__DS_WRITE_B128


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_WRITE_B128::~Inst_DS__DS_WRITE_B128()
    {
    } // ~Inst_DS__DS_WRITE_B128


    // --- description from .arch file ---

    // {MEM[ADDR + 12], MEM[ADDR + 8], MEM[ADDR + 4], MEM[ADDR]} = DATA[127:0].

    // Quad-dword (128-bit) write.

    void
    Inst_DS__DS_WRITE_B128::execute(GPUDynInstPtr gpuDynInst)
    {
        // Tie the instruction to its wavefront's execution unit and give
        // it a latency of 24 compute-unit cycles.
        Wavefront *wave = gpuDynInst->wavefront();
        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const Cycles issueLatency(24);
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(issueLatency));

        // Sources: the address register and the four consecutive data
        // registers starting at DATA0.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        ConstVecOperandU32 dword0(gpuDynInst, extData.DATA0);
        ConstVecOperandU32 dword1(gpuDynInst, extData.DATA0 + 1);
        ConstVecOperandU32 dword2(gpuDynInst, extData.DATA0 + 2);
        ConstVecOperandU32 dword3(gpuDynInst, extData.DATA0 + 3);

        addr.read();
        dword0.read();
        dword1.read();
        dword2.read();
        dword3.read();

        calcAddr(gpuDynInst, addr);

        // Stage the payload in d_data as four dwords per lane; lanes
        // masked off in exec_mask are left untouched.
        VecElemU32 *const staged =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }

            VecElemU32 *const slot = staged + lane * 4;
            slot[0] = dword0[lane];
            slot[1] = dword1[lane];
            slot[2] = dword2[lane];
            slot[3] = dword3[lane];
        }

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_WRITE_B128::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The offset is OFFSET1 shifted left by 8, OR-ed with OFFSET0.
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;

        // Four-dword write at that offset.
        initMemWrite<4>(gpuDynInst, (upper << 8) | lower);
    } // initiateAcc


    void
    Inst_DS__DS_WRITE_B128::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Intentionally empty: no completion work is done for this write.
    } // completeAcc


    // --- Inst_DS__DS_READ_B96 class methods ---


    // Forwards iFmt and the opcode string "ds_read_b96" to the Inst_DS
    // base, then sets the MemoryRef and Load flags.
    Inst_DS__DS_READ_B96::Inst_DS__DS_READ_B96(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b96")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    } // Inst_DS__DS_READ_B96


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_READ_B96::~Inst_DS__DS_READ_B96()
    {
    } // ~Inst_DS__DS_READ_B96


    // --- description from .arch file ---

    // Tri-dword read.

    void
    Inst_DS__DS_READ_B96::execute(GPUDynInstPtr gpuDynInst)
    {
        // Tie the instruction to its wavefront's execution unit and give
        // it a latency of 24 compute-unit cycles.
        Wavefront *wave = gpuDynInst->wavefront();
        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const Cycles issueLatency(24);
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(issueLatency));

        // Read the address register and derive the per-lane addresses
        // before handing the request to the local memory pipeline.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        addr.read();
        calcAddr(gpuDynInst, addr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_READ_B96::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The offset is OFFSET1 shifted left by 8, OR-ed with OFFSET0.
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;

        // Three-dword read at that offset.
        initMemRead<3>(gpuDynInst, (upper << 8) | lower);
    } // initiateAcc


    void
    Inst_DS__DS_READ_B96::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Destinations: three consecutive registers starting at VDST.
        VecOperandU32 vdst0(gpuDynInst, extData.VDST);
        VecOperandU32 vdst1(gpuDynInst, extData.VDST + 1);
        VecOperandU32 vdst2(gpuDynInst, extData.VDST + 2);

        // d_data is read as three dwords per lane; only lanes enabled in
        // exec_mask are copied into the destination operands.
        const VecElemU32 *const loaded =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }

            const VecElemU32 *const slot = loaded + lane * 3;
            vdst0[lane] = slot[0];
            vdst1[lane] = slot[1];
            vdst2[lane] = slot[2];
        }

        vdst0.write();
        vdst1.write();
        vdst2.write();
    } // completeAcc


    // --- Inst_DS__DS_READ_B128 class methods ---


    // Forwards iFmt and the opcode string "ds_read_b128" to the Inst_DS
    // base, then sets the MemoryRef and Load flags.
    Inst_DS__DS_READ_B128::Inst_DS__DS_READ_B128(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b128")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    } // Inst_DS__DS_READ_B128


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_READ_B128::~Inst_DS__DS_READ_B128()
    {
    } // ~Inst_DS__DS_READ_B128


    // --- description from .arch file ---

    // Quad-dword (128-bit) read.

    void
    Inst_DS__DS_READ_B128::execute(GPUDynInstPtr gpuDynInst)
    {
        // Tie the instruction to its wavefront's execution unit and give
        // it a latency of 24 compute-unit cycles.
        Wavefront *wave = gpuDynInst->wavefront();
        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const Cycles issueLatency(24);
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(issueLatency));

        // Read the address register and derive the per-lane addresses
        // before handing the request to the local memory pipeline.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        addr.read();
        calcAddr(gpuDynInst, addr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_READ_B128::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The offset is OFFSET1 shifted left by 8, OR-ed with OFFSET0.
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;

        // Four-dword read at that offset.
        initMemRead<4>(gpuDynInst, (upper << 8) | lower);
    } // initiateAcc


    void
    Inst_DS__DS_READ_B128::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Destinations: four consecutive registers starting at VDST.
        VecOperandU32 vdst0(gpuDynInst, extData.VDST);
        VecOperandU32 vdst1(gpuDynInst, extData.VDST + 1);
        VecOperandU32 vdst2(gpuDynInst, extData.VDST + 2);
        VecOperandU32 vdst3(gpuDynInst, extData.VDST + 3);

        // d_data is read as four dwords per lane; only lanes enabled in
        // exec_mask are copied into the destination operands.
        const VecElemU32 *const loaded =
            reinterpret_cast<VecElemU32*>(gpuDynInst->d_data);

        for (int lane = 0; lane < NumVecElemPerVecReg; ++lane) {
            if (!gpuDynInst->exec_mask[lane]) {
                continue;
            }

            const VecElemU32 *const slot = loaded + lane * 4;
            vdst0[lane] = slot[0];
            vdst1[lane] = slot[1];
            vdst2[lane] = slot[2];
            vdst3[lane] = slot[3];
        }

        vdst0.write();
        vdst1.write();
        vdst2.write();
        vdst3.write();
    } // completeAcc


    // --- Inst_DS__DS_READ_B64_TR_B4 class methods ---


    // Forwards iFmt and the opcode string "ds_read_b64_tr_b4" to the
    // Inst_DS base, then sets the Load flag.
    // NOTE(review): the DS_READ_B96 / DS_READ_B128 constructors in this
    // file also set MemoryRef; it is not set here - confirm this is
    // intentional.
    Inst_DS__DS_READ_B64_TR_B4::Inst_DS__DS_READ_B64_TR_B4(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b64_tr_b4")
    {
        setFlag(Load);
    } // Inst_DS__DS_READ_B64_TR_B4


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_READ_B64_TR_B4::~Inst_DS__DS_READ_B64_TR_B4()
    {
    } // ~Inst_DS__DS_READ_B64_TR_B4


    void
    Inst_DS__DS_READ_B64_TR_B4::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // With no active lanes nothing is issued; only the wavefront's
        // LGKM issued-instruction count is decremented.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            return;
        }

        // Tie the instruction to its wavefront's execution unit and give
        // it a latency of 24 compute-unit cycles.
        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const Cycles issueLatency(24);
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(issueLatency));

        // Read the address register and derive the per-lane addresses
        // before handing the request to the local memory pipeline.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        addr.read();
        calcAddr(gpuDynInst, addr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_READ_B64_TR_B4::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The offset is OFFSET1 shifted left by 8, OR-ed with OFFSET0.
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;

        // One 64-bit element is read per lane at that offset.
        initMemRead<VecElemU64>(gpuDynInst, (upper << 8) | lower);
    } // initiateAcc


    void
    Inst_DS__DS_READ_B64_TR_B4::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        // Transposes 4-bit elements within each group of 16 lanes: the
        // i-th nibble (counted from the most significant end) of source
        // lane x becomes the x-th nibble of destination lane i. Every
        // lane in the four groups is written; exec_mask is not consulted
        // here.
        VecOperandU64 vdst(gpuDynInst, extData.VDST);

        // Geometry used below: 4 passes over 16 lanes each, with sixteen
        // 4-bit fields in every 64-bit lane value.
        constexpr int numPasses = 4;
        constexpr int lanesPerPass = 16;
        constexpr int elemsPerLane = 16;
        constexpr int elemBits = 4;

        // Operate on 16 threads per cycle. For simulation we do 4 passes.
        // +--------------+--------------+
        // | 16x16 pass 1 | 16x16 pass 2 |
        // +--------------+--------------+
        // | 16x16 pass 3 | 16x16 pass 4 |
        // +--------------+--------------+
        for (int pass = 0; pass < numPasses; ++pass) {
            const int firstLane = pass * lanesPerPass;

            // unpacked[x][e] holds element e of the x-th lane of this
            // pass, where element 0 is bits 63:60 and element 15 is
            // bits 3:0 of the lane's 64-bit value.
            uint8_t unpacked[lanesPerPass][elemsPerLane];

            for (int x = 0; x < lanesPerPass; ++x) {
                VecElemU64 qword = (reinterpret_cast<VecElemU64*>(
                    gpuDynInst->d_data))[firstLane + x];

                for (int e = 0; e < elemsPerLane; ++e) {
                    const int lsb = (elemsPerLane - 1 - e) * elemBits;
                    unpacked[x][e] = bits(qword, lsb + elemBits - 1, lsb);
                }
            }

            // Repack: destination lane i collects element i from each of
            // the 16 source lanes, with source lane 0 landing in bits
            // 63:60 and source lane 15 in bits 3:0.
            for (int i = 0; i < elemsPerLane; ++i) {
                const int dstLane = firstLane + i;
                vdst[dstLane] = 0;

                for (int src = 0; src < lanesPerPass; ++src) {
                    const int lsb = (lanesPerPass - 1 - src) * elemBits;
                    replaceBits(vdst[dstLane], lsb + elemBits - 1, lsb,
                                unpacked[src][i]);
                }
            }
        }

        vdst.write();
    } // completeAcc


    // --- Inst_DS__DS_READ_B96_TR_B6 class methods ---


    // Forwards iFmt and the opcode string "ds_read_b96_tr_b6" to the
    // Inst_DS base, then sets the Load flag.
    // NOTE(review): the DS_READ_B96 / DS_READ_B128 constructors in this
    // file also set MemoryRef; it is not set here - confirm this is
    // intentional.
    Inst_DS__DS_READ_B96_TR_B6::Inst_DS__DS_READ_B96_TR_B6(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b96_tr_b6")
    {
        setFlag(Load);
    } // Inst_DS__DS_READ_B96_TR_B6


    // Empty destructor: this class performs no cleanup of its own.
    Inst_DS__DS_READ_B96_TR_B6::~Inst_DS__DS_READ_B96_TR_B6()
    {
    } // ~Inst_DS__DS_READ_B96_TR_B6


    void
    Inst_DS__DS_READ_B96_TR_B6::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // With no active lanes nothing is issued; only the wavefront's
        // LGKM issued-instruction count is decremented.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            return;
        }

        // Tie the instruction to its wavefront's execution unit and give
        // it a latency of 24 compute-unit cycles.
        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(gpuDynInst->computeUnit());
        const Cycles issueLatency(24);
        gpuDynInst->latency.set(
                gpuDynInst->computeUnit()->cyclesToTicks(issueLatency));

        // Read the address register and derive the per-lane addresses
        // before handing the request to the local memory pipeline.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        addr.read();
        calcAddr(gpuDynInst, addr);

        gpuDynInst->computeUnit()->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    void
    Inst_DS__DS_READ_B96_TR_B6::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The offset is OFFSET1 shifted left by 8, OR-ed with OFFSET0.
        const Addr upper = instData.OFFSET1;
        const Addr lower = instData.OFFSET0;

        // Three-dword read at that offset.
        initMemRead<3>(gpuDynInst, (upper << 8) | lower);
    } // initiateAcc


    void


    Inst_DS__DS_READ_B96_TR_B6::completeAcc(GPUDynInstPtr gpuDynInst)

    {

        VecOperandU32 vdst0(gpuDynInst, extData.VDST + 0);

        VecOperandU32 vdst1(gpuDynInst, extData.VDST + 1);

        VecOperandU32 vdst2(gpuDynInst, extData.VDST + 2);


        // Operate on 16 threads per cycle. For simulation we do 4 passes.

        for (int pass = 0; pass < 4; ++pass) {

            // With 6-bit datatype and 96-bits per thread, there are at most

            // 1024 elements (e.g. 32x32 matrix).

            //

            // Pack into sixteen 16x 4-bit arrays to get memory-like layout

            // (a 8x16 matrix). Invert on each pass to 16x8 and get 32x16.

            // This looks like unpacked[0]  = 00h, 10h, 20h, ... f0h

            //                 unpacked[1]  = 01h, 11h, 21h, ... f1h

            //                 unpacked[2]  = 02h, 12h, 22h, ... f2h

            //                 unpacked[3]  = 03h, 13h, 23h, ... f3h

            //                 unpacked[4]  = 04h, 14h, 24h, ... f4h

            //                 unpacked[5]  = 05h, 15h, 25h, ... f5h

            //                                    ...

            //                 unpacked[15] = 0fh, 1fh, 2fh, ... ffh

            // 2nd pass has same values + 100h, 3rd pass has same + 200h and

            // 4th pass has same values + 300h.

            // +--------------+--------------+

            // | 16x16 pass 1 | 16x16 pass 2 |

            // +--------------+--------------+

            // | 16x16 pass 3 | 16x16 pass 4 |

            // +-------------+---------------+

            uint8_t unpacked[16][16];


            // 16 values per lane (64-bit read / 4-bit type).

            for (int x = 0; x < 16; ++x) {

                // 1 lane per column (16 values per lane and 16 rows)

                int lane = pass * 16 + x;

                VecElemU32 dword0 = (reinterpret_cast<VecElemU64*>(

                    gpuDynInst->d_data))[lane * 4 + 0];

                VecElemU32 dword1 = (reinterpret_cast<VecElemU64*>(

                    gpuDynInst->d_data))[lane * 4 + 1];

                VecElemU32 dword2 = (reinterpret_cast<VecElemU64*>(

                    gpuDynInst->d_data))[lane * 4 + 2];


                PackedReg<96, 6> tdword;

                tdword.setDword(0, dword0);

                tdword.setDword(1, dword1);

                tdword.setDword(2, dword2);


                unpacked[x][0]  = tdword.getElem(15);

                unpacked[x][1]  = tdword.getElem(14);

                unpacked[x][2]  = tdword.getElem(13);

                unpacked[x][3]  = tdword.getElem(12);

                unpacked[x][4]  = tdword.getElem(11);

                unpacked[x][5]  = tdword.getElem(10);

                unpacked[x][6]  = tdword.getElem(9);

                unpacked[x][7]  = tdword.getElem(8);

                unpacked[x][8]  = tdword.getElem(7);

                unpacked[x][9]  = tdword.getElem(6);

                unpacked[x][10] = tdword.getElem(5);

                unpacked[x][11] = tdword.getElem(4);

                unpacked[x][12] = tdword.getElem(3);

                unpacked[x][13] = tdword.getElem(2);

                unpacked[x][14] = tdword.getElem(1);

                unpacked[x][15] = tdword.getElem(0);

            }


            // Next repack these 16 6-bit values into 3 dwords for each lane.

            // Each lane is simply the values in the unpacked array, but some

            // value will span multiple dwords, so we use the PackedReg helper.

            // +--------+--------+

            // |  16x16 | 16x16  |

            // | pass 1 | pass 2 |

            // +--------+--------+

            // |  16x16 | 16x16  |

            // | pass 3 | pass 4 |

            // +--------+--------+

            for (int i = 0; i < 16; ++i) {

                PackedReg<96, 6> tdword;

                tdword.setDword(0, 0);

                tdword.setDword(1, 0);

                tdword.setDword(2, 0);


                tdword.setElem(15, unpacked[0][i]);

                tdword.setElem(14, unpacked[1][i]);

                tdword.setElem(13, unpacked[2][i]);

                tdword.setElem(12, unpacked[3][i]);

                tdword.setElem(11, unpacked[4][i]);

                tdword.setElem(10, unpacked[5][i]);

                tdword.setElem(9,  unpacked[6][i]);

                tdword.setElem(8,  unpacked[7][i]);

                tdword.setElem(7,  unpacked[8][i]);

                tdword.setElem(6,  unpacked[9][i]);

                tdword.setElem(5,  unpacked[10][i]);

                tdword.setElem(4,  unpacked[11][i]);

                tdword.setElem(3,  unpacked[12][i]);

                tdword.setElem(2,  unpacked[13][i]);

                tdword.setElem(1,  unpacked[14][i]);

                tdword.setElem(0,  unpacked[15][i]);

            }

        }


        vdst0.write();

        vdst1.write();

        vdst2.write();

    } // completeAcc


    // --- Inst_DS__DS_READ_B64_TR_B8 class methods ---


    // Construct the ds_read_b64_tr_b8 instruction. The format data is
    // forwarded to the Inst_DS base together with the opcode mnemonic.
    //
    // The instruction is flagged as a memory reference as well as a load:
    // execute() issues it to the local memory pipeline, and the DS memory
    // instruction at the top of this file (ds_add_u32) likewise sets
    // MemoryRef alongside its access-type flags.
    Inst_DS__DS_READ_B64_TR_B8::Inst_DS__DS_READ_B64_TR_B8(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b64_tr_b8")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    } // Inst_DS__DS_READ_B64_TR_B8


    // Destructor. The body is empty: this class performs no cleanup of
    // its own here.
    Inst_DS__DS_READ_B64_TR_B8::~Inst_DS__DS_READ_B64_TR_B8()

    {

    } // ~Inst_DS__DS_READ_B64_TR_B8


    // Issue ds_read_b64_tr_b8 to the compute unit's local memory pipeline.
    //
    // When no lane is enabled in the execution mask the instruction is not
    // issued; only the wavefront's LGKM issued count is decremented.
    // Otherwise the execution unit and a 24-cycle latency are recorded on
    // the dynamic instruction, the per-lane addresses are computed from the
    // ADDR operand, and the request is handed to the local memory pipeline.
    void
    Inst_DS__DS_READ_B64_TR_B8::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // Fully masked-off instruction: undo the LGKM accounting and stop.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        // Read the address VGPR and derive the per-lane addresses.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        addr.read();
        calcAddr(gpuDynInst, addr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    // Start the memory access: read one 64-bit element per lane at the
    // instruction's immediate offset.
    void
    Inst_DS__DS_READ_B64_TR_B8::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The immediate offset is OFFSET1 shifted left by 8 and OR'd with
        // OFFSET0.
        const Addr lowPart = instData.OFFSET0;
        const Addr highPart = instData.OFFSET1;

        initMemRead<VecElemU64>(gpuDynInst, (highPart << 8) | lowPart);
    } // initiateAcc


    // Finish ds_read_b64_tr_b8: transpose the loaded 8-bit elements and
    // write the result to the 64-bit destination register.
    void
    Inst_DS__DS_READ_B64_TR_B8::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU64 vdst(gpuDynInst, extData.VDST);

        // View of the loaded data as one 64-bit value per lane.
        const VecElemU64 *loaded =
            reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);

        // The 64 lanes are handled in four groups of 16 lanes. Each group
        // is transposed independently of the others:
        // +-------------+-------------+
        // | 8x16 pass 1 | 8x16 pass 2 |
        // +-------------+-------------+
        // | 8x16 pass 3 | 8x16 pass 4 |
        // +-------------+-------------+
        for (int pass = 0; pass < 4; ++pass) {
            const int laneBase = pass * 16;

            // Eight rows of sixteen bytes. Row r is filled from the two
            // consecutive lanes 2r and 2r+1 of this group, each lane
            // contributing its eight bytes from most to least significant.
            uint8_t unpacked[8][16];

            for (int row = 0; row < 8; ++row) {
                for (int half = 0; half < 2; ++half) {
                    const VecElemU64 qword =
                        loaded[laneBase + row * 2 + half];

                    for (int byte = 0; byte < 8; ++byte) {
                        const int msb = 63 - 8 * byte;
                        unpacked[row][half * 8 + byte] =
                            bits(qword, msb, msb - 7);
                    }
                }
            }

            // Output lane i of the group receives column i of the 8x16
            // array as a single 64-bit value, with row 0 in the most
            // significant byte and row 7 in the least significant byte.
            for (int col = 0; col < 16; ++col) {
                VecElemU64 packed = 0;

                for (int row = 0; row < 8; ++row) {
                    const int msb = 63 - 8 * row;
                    replaceBits(packed, msb, msb - 7, unpacked[row][col]);
                }

                vdst[laneBase + col] = packed;
            }
        }

        vdst.write();
    } // completeAcc


    // --- Inst_DS__DS_READ_B64_TR_B16 class methods ---


    // Construct the ds_read_b64_tr_b16 instruction. The format data is
    // forwarded to the Inst_DS base together with the opcode mnemonic.
    //
    // The instruction is flagged as a memory reference as well as a load:
    // execute() issues it to the local memory pipeline, and the DS memory
    // instruction at the top of this file (ds_add_u32) likewise sets
    // MemoryRef alongside its access-type flags.
    Inst_DS__DS_READ_B64_TR_B16::Inst_DS__DS_READ_B64_TR_B16(InFmt_DS *iFmt)
        : Inst_DS(iFmt, "ds_read_b64_tr_b16")
    {
        setFlag(MemoryRef);
        setFlag(Load);
    } // Inst_DS__DS_READ_B64_TR_B16


    // Destructor. The body is empty: this class performs no cleanup of
    // its own here.
    Inst_DS__DS_READ_B64_TR_B16::~Inst_DS__DS_READ_B64_TR_B16()

    {

    } // ~Inst_DS__DS_READ_B64_TR_B16


    // Issue ds_read_b64_tr_b16 to the compute unit's local memory pipeline.
    //
    // When no lane is enabled in the execution mask the instruction is not
    // issued; only the wavefront's LGKM issued count is decremented.
    // Otherwise the execution unit and a 24-cycle latency are recorded on
    // the dynamic instruction, the per-lane addresses are computed from the
    // ADDR operand, and the request is handed to the local memory pipeline.
    void
    Inst_DS__DS_READ_B64_TR_B16::execute(GPUDynInstPtr gpuDynInst)
    {
        Wavefront *wave = gpuDynInst->wavefront();

        // Fully masked-off instruction: undo the LGKM accounting and stop.
        if (gpuDynInst->exec_mask.none()) {
            wave->decLGKMInstsIssued();
            return;
        }

        auto cu = gpuDynInst->computeUnit();

        gpuDynInst->execUnitId = wave->execUnitId;
        gpuDynInst->latency.init(cu);
        gpuDynInst->latency.set(cu->cyclesToTicks(Cycles(24)));

        // Read the address VGPR and derive the per-lane addresses.
        ConstVecOperandU32 addr(gpuDynInst, extData.ADDR);
        addr.read();
        calcAddr(gpuDynInst, addr);

        cu->localMemoryPipe.issueRequest(gpuDynInst);
    } // execute


    // Start the memory access: read one 64-bit element per lane at the
    // instruction's immediate offset.
    void
    Inst_DS__DS_READ_B64_TR_B16::initiateAcc(GPUDynInstPtr gpuDynInst)
    {
        // The immediate offset is OFFSET1 shifted left by 8 and OR'd with
        // OFFSET0.
        const Addr lowPart = instData.OFFSET0;
        const Addr highPart = instData.OFFSET1;

        initMemRead<VecElemU64>(gpuDynInst, (highPart << 8) | lowPart);
    } // initiateAcc


    // Finish ds_read_b64_tr_b16: transpose the loaded 16-bit elements and
    // write the result to the 64-bit destination register.
    void
    Inst_DS__DS_READ_B64_TR_B16::completeAcc(GPUDynInstPtr gpuDynInst)
    {
        VecOperandU64 vdst(gpuDynInst, extData.VDST);

        // View of the loaded data as one 64-bit value per lane.
        const VecElemU64 *loaded =
            reinterpret_cast<VecElemU64*>(gpuDynInst->d_data);

        // The 64 lanes are handled in four groups of 16 lanes. Each group
        // is transposed independently of the others.
        for (int pass = 0; pass < 4; ++pass) {
            const int laneBase = pass * 16;

            // Four rows of sixteen 16-bit values. Row r is filled from the
            // four consecutive lanes 4r .. 4r+3 of this group, each lane
            // contributing its four halfwords from most to least
            // significant.
            uint16_t unpacked[4][16];

            for (int row = 0; row < 4; ++row) {
                for (int quarter = 0; quarter < 4; ++quarter) {
                    const VecElemU64 qword =
                        loaded[laneBase + row * 4 + quarter];

                    for (int half = 0; half < 4; ++half) {
                        const int msb = 63 - 16 * half;
                        unpacked[row][quarter * 4 + half] =
                            bits(qword, msb, msb - 15);
                    }
                }
            }

            // Output lane i of the group receives column i of the 4x16
            // array as a single 64-bit value, with row 0 in bits 63:48 and
            // row 3 in bits 15:0. All 64 bits are overwritten, so the
            // previous register contents do not affect the result.
            for (int col = 0; col < 16; ++col) {
                VecElemU64 packed = 0;

                for (int row = 0; row < 4; ++row) {
                    const int msb = 63 - 16 * row;
                    packed = insertBits(packed, msb, msb - 15,
                                        unpacked[row][col]);
                }

                vdst[laneBase + col] = packed;
            }
        }

        vdst.write();
    } // completeAcc


} // namespace VegaISA

} // namespace gem5

data
const char data[]
Definition circlebuf.test.cc:48

gem5::ComputeUnit::vrf
std::vector< VectorRegisterFile * > vrf
Definition compute_unit.hh:297

gem5::Cycles
Cycles is a wrapper class for representing cycle counts, i.e.
Definition types.hh:79

gem5::GPUStaticInst::setFlag
void setFlag(Flags flag)
Definition gpu_static_inst.hh:251

gem5::RiscvISA::Load
Definition mem.hh:57

gem5::RiscvISA::Store
Definition mem.hh:66

gem5::SparcISA::Nop
Nop class.
Definition nop.hh:49

gem5::VegaISA::Inst_DS__DS_ADD_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:749

gem5::VegaISA::Inst_DS__DS_ADD_F32::initiateAcc
void initiateAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:782

gem5::VegaISA::Inst_DS__DS_ADD_F32::Inst_DS__DS_ADD_F32
Inst_DS__DS_ADD_F32(InFmt_DS *)
Definition ds.cc:730

gem5::VegaISA::Inst_DS__DS_ADD_F32::~Inst_DS__DS_ADD_F32
~Inst_DS__DS_ADD_F32()
Definition ds.cc:740

gem5::VegaISA::Inst_DS__DS_ADD_F32::completeAcc
void completeAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:792

gem5::VegaISA::Inst_DS__DS_ADD_RTN_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1576

gem5::VegaISA::Inst_DS__DS_ADD_RTN_F32::~Inst_DS__DS_ADD_RTN_F32
~Inst_DS__DS_ADD_RTN_F32()
Definition ds.cc:1565

gem5::VegaISA::Inst_DS__DS_ADD_RTN_F32::Inst_DS__DS_ADD_RTN_F32
Inst_DS__DS_ADD_RTN_F32(InFmt_DS *)
Definition ds.cc:1559

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U32::~Inst_DS__DS_ADD_RTN_U32
~Inst_DS__DS_ADD_RTN_U32()
Definition ds.cc:994

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1004

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1036

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U32::Inst_DS__DS_ADD_RTN_U32
Inst_DS__DS_ADD_RTN_U32(InFmt_DS *)
Definition ds.cc:986

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1046

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U64::~Inst_DS__DS_ADD_RTN_U64
~Inst_DS__DS_ADD_RTN_U64()
Definition ds.cc:3072

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3082

gem5::VegaISA::Inst_DS__DS_ADD_RTN_U64::Inst_DS__DS_ADD_RTN_U64
Inst_DS__DS_ADD_RTN_U64(InFmt_DS *)
Definition ds.cc:3067

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_F32::~Inst_DS__DS_ADD_SRC2_F32
~Inst_DS__DS_ADD_SRC2_F32()
Definition ds.cc:4069

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_F32::Inst_DS__DS_ADD_SRC2_F32
Inst_DS__DS_ADD_SRC2_F32(InFmt_DS *)
Definition ds.cc:4063

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4081

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3741

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_U32::~Inst_DS__DS_ADD_SRC2_U32
~Inst_DS__DS_ADD_SRC2_U32()
Definition ds.cc:3730

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_U32::Inst_DS__DS_ADD_SRC2_U32
Inst_DS__DS_ADD_SRC2_U32(InFmt_DS *)
Definition ds.cc:3725

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4344

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_U64::Inst_DS__DS_ADD_SRC2_U64
Inst_DS__DS_ADD_SRC2_U64(InFmt_DS *)
Definition ds.cc:4328

gem5::VegaISA::Inst_DS__DS_ADD_SRC2_U64::~Inst_DS__DS_ADD_SRC2_U64
~Inst_DS__DS_ADD_SRC2_U64()
Definition ds.cc:4333

gem5::VegaISA::Inst_DS__DS_ADD_U32::Inst_DS__DS_ADD_U32
Inst_DS__DS_ADD_U32(InFmt_DS *)
Definition ds.cc:41

gem5::VegaISA::Inst_DS__DS_ADD_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:58

gem5::VegaISA::Inst_DS__DS_ADD_U32::~Inst_DS__DS_ADD_U32
~Inst_DS__DS_ADD_U32()
Definition ds.cc:50

gem5::VegaISA::Inst_DS__DS_ADD_U32::completeAcc
void completeAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:101

gem5::VegaISA::Inst_DS__DS_ADD_U32::initiateAcc
void initiateAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:91

gem5::VegaISA::Inst_DS__DS_ADD_U64::completeAcc
void completeAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:2502

gem5::VegaISA::Inst_DS__DS_ADD_U64::~Inst_DS__DS_ADD_U64
~Inst_DS__DS_ADD_U64()
Definition ds.cc:2451

gem5::VegaISA::Inst_DS__DS_ADD_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2459

gem5::VegaISA::Inst_DS__DS_ADD_U64::initiateAcc
void initiateAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:2492

gem5::VegaISA::Inst_DS__DS_ADD_U64::Inst_DS__DS_ADD_U64
Inst_DS__DS_ADD_U64(InFmt_DS *)
Definition ds.cc:2442

gem5::VegaISA::Inst_DS__DS_AND_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:290

gem5::VegaISA::Inst_DS__DS_AND_B32::~Inst_DS__DS_AND_B32
~Inst_DS__DS_AND_B32()
Definition ds.cc:280

gem5::VegaISA::Inst_DS__DS_AND_B32::Inst_DS__DS_AND_B32
Inst_DS__DS_AND_B32(InFmt_DS *)
Definition ds.cc:275

gem5::VegaISA::Inst_DS__DS_AND_B64::Inst_DS__DS_AND_B64
Inst_DS__DS_AND_B64(InFmt_DS *)
Definition ds.cc:2677

gem5::VegaISA::Inst_DS__DS_AND_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2692

gem5::VegaISA::Inst_DS__DS_AND_B64::~Inst_DS__DS_AND_B64
~Inst_DS__DS_AND_B64()
Definition ds.cc:2682

gem5::VegaISA::Inst_DS__DS_AND_RTN_B32::~Inst_DS__DS_AND_RTN_B32
~Inst_DS__DS_AND_RTN_B32()
Definition ds.cc:1235

gem5::VegaISA::Inst_DS__DS_AND_RTN_B32::Inst_DS__DS_AND_RTN_B32
Inst_DS__DS_AND_RTN_B32(InFmt_DS *)
Definition ds.cc:1230

gem5::VegaISA::Inst_DS__DS_AND_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1245

gem5::VegaISA::Inst_DS__DS_AND_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3273

gem5::VegaISA::Inst_DS__DS_AND_RTN_B64::~Inst_DS__DS_AND_RTN_B64
~Inst_DS__DS_AND_RTN_B64()
Definition ds.cc:3263

gem5::VegaISA::Inst_DS__DS_AND_RTN_B64::Inst_DS__DS_AND_RTN_B64
Inst_DS__DS_AND_RTN_B64(InFmt_DS *)
Definition ds.cc:3258

gem5::VegaISA::Inst_DS__DS_AND_SRC2_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3940

gem5::VegaISA::Inst_DS__DS_AND_SRC2_B32::~Inst_DS__DS_AND_SRC2_B32
~Inst_DS__DS_AND_SRC2_B32()
Definition ds.cc:3929

gem5::VegaISA::Inst_DS__DS_AND_SRC2_B32::Inst_DS__DS_AND_SRC2_B32
Inst_DS__DS_AND_SRC2_B32(InFmt_DS *)
Definition ds.cc:3924

gem5::VegaISA::Inst_DS__DS_AND_SRC2_B64::~Inst_DS__DS_AND_SRC2_B64
~Inst_DS__DS_AND_SRC2_B64()
Definition ds.cc:4532

gem5::VegaISA::Inst_DS__DS_AND_SRC2_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4543

gem5::VegaISA::Inst_DS__DS_AND_SRC2_B64::Inst_DS__DS_AND_SRC2_B64
Inst_DS__DS_AND_SRC2_B64(InFmt_DS *)
Definition ds.cc:4527

gem5::VegaISA::Inst_DS__DS_APPEND::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4302

gem5::VegaISA::Inst_DS__DS_APPEND::~Inst_DS__DS_APPEND
~Inst_DS__DS_APPEND()
Definition ds.cc:4294

gem5::VegaISA::Inst_DS__DS_APPEND::Inst_DS__DS_APPEND
Inst_DS__DS_APPEND(InFmt_DS *)
Definition ds.cc:4289

gem5::VegaISA::Inst_DS__DS_BPERMUTE_B32::~Inst_DS__DS_BPERMUTE_B32
~Inst_DS__DS_BPERMUTE_B32()
Definition ds.cc:2364

gem5::VegaISA::Inst_DS__DS_BPERMUTE_B32::Inst_DS__DS_BPERMUTE_B32
Inst_DS__DS_BPERMUTE_B32(InFmt_DS *)
Definition ds.cc:2352

gem5::VegaISA::Inst_DS__DS_BPERMUTE_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2371

gem5::VegaISA::Inst_DS__DS_CMPST_B32::Inst_DS__DS_CMPST_B32
Inst_DS__DS_CMPST_B32(InFmt_DS *)
Definition ds.cc:605

gem5::VegaISA::Inst_DS__DS_CMPST_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:625

gem5::VegaISA::Inst_DS__DS_CMPST_B32::~Inst_DS__DS_CMPST_B32
~Inst_DS__DS_CMPST_B32()
Definition ds.cc:610

gem5::VegaISA::Inst_DS__DS_CMPST_B64::~Inst_DS__DS_CMPST_B64
~Inst_DS__DS_CMPST_B64()
Definition ds.cc:2967

gem5::VegaISA::Inst_DS__DS_CMPST_B64::Inst_DS__DS_CMPST_B64
Inst_DS__DS_CMPST_B64(InFmt_DS *)
Definition ds.cc:2962

gem5::VegaISA::Inst_DS__DS_CMPST_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2982

gem5::VegaISA::Inst_DS__DS_CMPST_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:652

gem5::VegaISA::Inst_DS__DS_CMPST_F32::~Inst_DS__DS_CMPST_F32
~Inst_DS__DS_CMPST_F32()
Definition ds.cc:637

gem5::VegaISA::Inst_DS__DS_CMPST_F32::Inst_DS__DS_CMPST_F32
Inst_DS__DS_CMPST_F32(InFmt_DS *)
Definition ds.cc:631

gem5::VegaISA::Inst_DS__DS_CMPST_F64::~Inst_DS__DS_CMPST_F64
~Inst_DS__DS_CMPST_F64()
Definition ds.cc:2994

gem5::VegaISA::Inst_DS__DS_CMPST_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3009

gem5::VegaISA::Inst_DS__DS_CMPST_F64::Inst_DS__DS_CMPST_F64
Inst_DS__DS_CMPST_F64(InFmt_DS *)
Definition ds.cc:2988

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1445

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B32::Inst_DS__DS_CMPST_RTN_B32
Inst_DS__DS_CMPST_RTN_B32(InFmt_DS *)
Definition ds.cc:1373

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B32::~Inst_DS__DS_CMPST_RTN_B32
~Inst_DS__DS_CMPST_RTN_B32()
Definition ds.cc:1381

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1396

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1435

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B64::~Inst_DS__DS_CMPST_RTN_B64
~Inst_DS__DS_CMPST_RTN_B64()
Definition ds.cc:3406

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B64::Inst_DS__DS_CMPST_RTN_B64
Inst_DS__DS_CMPST_RTN_B64(InFmt_DS *)
Definition ds.cc:3401

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3421

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1481

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_F32::~Inst_DS__DS_CMPST_RTN_F32
~Inst_DS__DS_CMPST_RTN_F32()
Definition ds.cc:1466

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_F32::Inst_DS__DS_CMPST_RTN_F32
Inst_DS__DS_CMPST_RTN_F32(InFmt_DS *)
Definition ds.cc:1460

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3448

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_F64::~Inst_DS__DS_CMPST_RTN_F64
~Inst_DS__DS_CMPST_RTN_F64()
Definition ds.cc:3433

gem5::VegaISA::Inst_DS__DS_CMPST_RTN_F64::Inst_DS__DS_CMPST_RTN_F64
Inst_DS__DS_CMPST_RTN_F64(InFmt_DS *)
Definition ds.cc:3427

gem5::VegaISA::Inst_DS__DS_CONDXCHG32_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3719

gem5::VegaISA::Inst_DS__DS_CONDXCHG32_RTN_B64::~Inst_DS__DS_CONDXCHG32_RTN_B64
~Inst_DS__DS_CONDXCHG32_RTN_B64()
Definition ds.cc:3712

gem5::VegaISA::Inst_DS__DS_CONDXCHG32_RTN_B64::Inst_DS__DS_CONDXCHG32_RTN_B64
Inst_DS__DS_CONDXCHG32_RTN_B64(InFmt_DS *)
Definition ds.cc:3706

gem5::VegaISA::Inst_DS__DS_CONSUME::~Inst_DS__DS_CONSUME
~Inst_DS__DS_CONSUME()
Definition ds.cc:4274

gem5::VegaISA::Inst_DS__DS_CONSUME::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4283

gem5::VegaISA::Inst_DS__DS_CONSUME::Inst_DS__DS_CONSUME
Inst_DS__DS_CONSUME(InFmt_DS *)
Definition ds.cc:4269

gem5::VegaISA::Inst_DS__DS_DEC_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1140

gem5::VegaISA::Inst_DS__DS_DEC_RTN_U32::Inst_DS__DS_DEC_RTN_U32
Inst_DS__DS_DEC_RTN_U32(InFmt_DS *)
Definition ds.cc:1125

gem5::VegaISA::Inst_DS__DS_DEC_RTN_U32::~Inst_DS__DS_DEC_RTN_U32
~Inst_DS__DS_DEC_RTN_U32()
Definition ds.cc:1130

gem5::VegaISA::Inst_DS__DS_DEC_RTN_U64::~Inst_DS__DS_DEC_RTN_U64
~Inst_DS__DS_DEC_RTN_U64()
Definition ds.cc:3157

gem5::VegaISA::Inst_DS__DS_DEC_RTN_U64::Inst_DS__DS_DEC_RTN_U64
Inst_DS__DS_DEC_RTN_U64(InFmt_DS *)
Definition ds.cc:3152

gem5::VegaISA::Inst_DS__DS_DEC_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3168

gem5::VegaISA::Inst_DS__DS_DEC_SRC2_U32::Inst_DS__DS_DEC_SRC2_U32
Inst_DS__DS_DEC_SRC2_U32(InFmt_DS *)
Definition ds.cc:3813

gem5::VegaISA::Inst_DS__DS_DEC_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3830

gem5::VegaISA::Inst_DS__DS_DEC_SRC2_U32::~Inst_DS__DS_DEC_SRC2_U32
~Inst_DS__DS_DEC_SRC2_U32()
Definition ds.cc:3818

gem5::VegaISA::Inst_DS__DS_DEC_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4433

gem5::VegaISA::Inst_DS__DS_DEC_SRC2_U64::Inst_DS__DS_DEC_SRC2_U64
Inst_DS__DS_DEC_SRC2_U64(InFmt_DS *)
Definition ds.cc:4416

gem5::VegaISA::Inst_DS__DS_DEC_SRC2_U64::~Inst_DS__DS_DEC_SRC2_U64
~Inst_DS__DS_DEC_SRC2_U64()
Definition ds.cc:4421

gem5::VegaISA::Inst_DS__DS_DEC_U32::~Inst_DS__DS_DEC_U32
~Inst_DS__DS_DEC_U32()
Definition ds.cc:175

gem5::VegaISA::Inst_DS__DS_DEC_U32::Inst_DS__DS_DEC_U32
Inst_DS__DS_DEC_U32(InFmt_DS *)
Definition ds.cc:170

gem5::VegaISA::Inst_DS__DS_DEC_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:185

gem5::VegaISA::Inst_DS__DS_DEC_U64::~Inst_DS__DS_DEC_U64
~Inst_DS__DS_DEC_U64()
Definition ds.cc:2576

gem5::VegaISA::Inst_DS__DS_DEC_U64::Inst_DS__DS_DEC_U64
Inst_DS__DS_DEC_U64(InFmt_DS *)
Definition ds.cc:2571

gem5::VegaISA::Inst_DS__DS_DEC_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2587

gem5::VegaISA::Inst_DS__DS_GWS_BARRIER::Inst_DS__DS_GWS_BARRIER
Inst_DS__DS_GWS_BARRIER(InFmt_DS *)
Definition ds.cc:4224

gem5::VegaISA::Inst_DS__DS_GWS_BARRIER::~Inst_DS__DS_GWS_BARRIER
~Inst_DS__DS_GWS_BARRIER()
Definition ds.cc:4229

gem5::VegaISA::Inst_DS__DS_GWS_BARRIER::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4263

gem5::VegaISA::Inst_DS__DS_GWS_INIT::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4136

gem5::VegaISA::Inst_DS__DS_GWS_INIT::Inst_DS__DS_GWS_INIT
Inst_DS__DS_GWS_INIT(InFmt_DS *)
Definition ds.cc:4115

gem5::VegaISA::Inst_DS__DS_GWS_INIT::~Inst_DS__DS_GWS_INIT
~Inst_DS__DS_GWS_INIT()
Definition ds.cc:4120

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_BR::Inst_DS__DS_GWS_SEMA_BR
Inst_DS__DS_GWS_SEMA_BR(InFmt_DS *)
Definition ds.cc:4168

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_BR::~Inst_DS__DS_GWS_SEMA_BR
~Inst_DS__DS_GWS_SEMA_BR()
Definition ds.cc:4173

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_BR::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4192

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_P::Inst_DS__DS_GWS_SEMA_P
Inst_DS__DS_GWS_SEMA_P(InFmt_DS *)
Definition ds.cc:4198

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_P::~Inst_DS__DS_GWS_SEMA_P
~Inst_DS__DS_GWS_SEMA_P()
Definition ds.cc:4203

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_P::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4218

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_RELEASE_ALL::Inst_DS__DS_GWS_SEMA_RELEASE_ALL
Inst_DS__DS_GWS_SEMA_RELEASE_ALL(InFmt_DS *)
Definition ds.cc:4087

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_RELEASE_ALL::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4109

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_RELEASE_ALL::~Inst_DS__DS_GWS_SEMA_RELEASE_ALL
~Inst_DS__DS_GWS_SEMA_RELEASE_ALL()
Definition ds.cc:4093

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_V::Inst_DS__DS_GWS_SEMA_V
Inst_DS__DS_GWS_SEMA_V(InFmt_DS *)
Definition ds.cc:4142

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_V::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4162

gem5::VegaISA::Inst_DS__DS_GWS_SEMA_V::~Inst_DS__DS_GWS_SEMA_V
~Inst_DS__DS_GWS_SEMA_V()
Definition ds.cc:4147

gem5::VegaISA::Inst_DS__DS_INC_RTN_U32::Inst_DS__DS_INC_RTN_U32
Inst_DS__DS_INC_RTN_U32(InFmt_DS *)
Definition ds.cc:1104

gem5::VegaISA::Inst_DS__DS_INC_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1119

gem5::VegaISA::Inst_DS__DS_INC_RTN_U32::~Inst_DS__DS_INC_RTN_U32
~Inst_DS__DS_INC_RTN_U32()
Definition ds.cc:1109

gem5::VegaISA::Inst_DS__DS_INC_RTN_U64::~Inst_DS__DS_INC_RTN_U64
~Inst_DS__DS_INC_RTN_U64()
Definition ds.cc:3136

gem5::VegaISA::Inst_DS__DS_INC_RTN_U64::Inst_DS__DS_INC_RTN_U64
Inst_DS__DS_INC_RTN_U64(InFmt_DS *)
Definition ds.cc:3131

gem5::VegaISA::Inst_DS__DS_INC_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3146

gem5::VegaISA::Inst_DS__DS_INC_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3807

gem5::VegaISA::Inst_DS__DS_INC_SRC2_U32::~Inst_DS__DS_INC_SRC2_U32
~Inst_DS__DS_INC_SRC2_U32()
Definition ds.cc:3796

gem5::VegaISA::Inst_DS__DS_INC_SRC2_U32::Inst_DS__DS_INC_SRC2_U32
Inst_DS__DS_INC_SRC2_U32(InFmt_DS *)
Definition ds.cc:3791

gem5::VegaISA::Inst_DS__DS_INC_SRC2_U64::Inst_DS__DS_INC_SRC2_U64
Inst_DS__DS_INC_SRC2_U64(InFmt_DS *)
Definition ds.cc:4394

gem5::VegaISA::Inst_DS__DS_INC_SRC2_U64::~Inst_DS__DS_INC_SRC2_U64
~Inst_DS__DS_INC_SRC2_U64()
Definition ds.cc:4399

gem5::VegaISA::Inst_DS__DS_INC_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4410

gem5::VegaISA::Inst_DS__DS_INC_U32::Inst_DS__DS_INC_U32
Inst_DS__DS_INC_U32(InFmt_DS *)
Definition ds.cc:149

gem5::VegaISA::Inst_DS__DS_INC_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:164

gem5::VegaISA::Inst_DS__DS_INC_U32::~Inst_DS__DS_INC_U32
~Inst_DS__DS_INC_U32()
Definition ds.cc:154

gem5::VegaISA::Inst_DS__DS_INC_U64::~Inst_DS__DS_INC_U64
~Inst_DS__DS_INC_U64()
Definition ds.cc:2555

gem5::VegaISA::Inst_DS__DS_INC_U64::Inst_DS__DS_INC_U64
Inst_DS__DS_INC_U64(InFmt_DS *)
Definition ds.cc:2550

gem5::VegaISA::Inst_DS__DS_INC_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2565

gem5::VegaISA::Inst_DS__DS_MAX_F32::~Inst_DS__DS_MAX_F32
~Inst_DS__DS_MAX_F32()
Definition ds.cc:690

gem5::VegaISA::Inst_DS__DS_MAX_F32::Inst_DS__DS_MAX_F32
Inst_DS__DS_MAX_F32(InFmt_DS *)
Definition ds.cc:684

gem5::VegaISA::Inst_DS__DS_MAX_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:704

gem5::VegaISA::Inst_DS__DS_MAX_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3061

gem5::VegaISA::Inst_DS__DS_MAX_F64::~Inst_DS__DS_MAX_F64
~Inst_DS__DS_MAX_F64()
Definition ds.cc:3047

gem5::VegaISA::Inst_DS__DS_MAX_F64::Inst_DS__DS_MAX_F64
Inst_DS__DS_MAX_F64(InFmt_DS *)
Definition ds.cc:3041

gem5::VegaISA::Inst_DS__DS_MAX_I32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:227

gem5::VegaISA::Inst_DS__DS_MAX_I32::Inst_DS__DS_MAX_I32
Inst_DS__DS_MAX_I32(InFmt_DS *)
Definition ds.cc:212

gem5::VegaISA::Inst_DS__DS_MAX_I32::~Inst_DS__DS_MAX_I32
~Inst_DS__DS_MAX_I32()
Definition ds.cc:217

gem5::VegaISA::Inst_DS__DS_MAX_I64::Inst_DS__DS_MAX_I64
Inst_DS__DS_MAX_I64(InFmt_DS *)
Definition ds.cc:2614

gem5::VegaISA::Inst_DS__DS_MAX_I64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2629

gem5::VegaISA::Inst_DS__DS_MAX_I64::~Inst_DS__DS_MAX_I64
~Inst_DS__DS_MAX_I64()
Definition ds.cc:2619

gem5::VegaISA::Inst_DS__DS_MAX_RTN_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1533

gem5::VegaISA::Inst_DS__DS_MAX_RTN_F32::~Inst_DS__DS_MAX_RTN_F32
~Inst_DS__DS_MAX_RTN_F32()
Definition ds.cc:1519

gem5::VegaISA::Inst_DS__DS_MAX_RTN_F32::Inst_DS__DS_MAX_RTN_F32
Inst_DS__DS_MAX_RTN_F32(InFmt_DS *)
Definition ds.cc:1513

gem5::VegaISA::Inst_DS__DS_MAX_RTN_F64::Inst_DS__DS_MAX_RTN_F64
Inst_DS__DS_MAX_RTN_F64(InFmt_DS *)
Definition ds.cc:3480

gem5::VegaISA::Inst_DS__DS_MAX_RTN_F64::~Inst_DS__DS_MAX_RTN_F64
~Inst_DS__DS_MAX_RTN_F64()
Definition ds.cc:3486

gem5::VegaISA::Inst_DS__DS_MAX_RTN_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3500

gem5::VegaISA::Inst_DS__DS_MAX_RTN_I32::~Inst_DS__DS_MAX_RTN_I32
~Inst_DS__DS_MAX_RTN_I32()
Definition ds.cc:1172

gem5::VegaISA::Inst_DS__DS_MAX_RTN_I32::Inst_DS__DS_MAX_RTN_I32
Inst_DS__DS_MAX_RTN_I32(InFmt_DS *)
Definition ds.cc:1167

gem5::VegaISA::Inst_DS__DS_MAX_RTN_I32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1182

gem5::VegaISA::Inst_DS__DS_MAX_RTN_I64::Inst_DS__DS_MAX_RTN_I64
Inst_DS__DS_MAX_RTN_I64(InFmt_DS *)
Definition ds.cc:3195

gem5::VegaISA::Inst_DS__DS_MAX_RTN_I64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3210

gem5::VegaISA::Inst_DS__DS_MAX_RTN_I64::~Inst_DS__DS_MAX_RTN_I64
~Inst_DS__DS_MAX_RTN_I64()
Definition ds.cc:3200

gem5::VegaISA::Inst_DS__DS_MAX_RTN_U32::~Inst_DS__DS_MAX_RTN_U32
~Inst_DS__DS_MAX_RTN_U32()
Definition ds.cc:1214

gem5::VegaISA::Inst_DS__DS_MAX_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1224

gem5::VegaISA::Inst_DS__DS_MAX_RTN_U32::Inst_DS__DS_MAX_RTN_U32
Inst_DS__DS_MAX_RTN_U32(InFmt_DS *)
Definition ds.cc:1209

gem5::VegaISA::Inst_DS__DS_MAX_RTN_U64::~Inst_DS__DS_MAX_RTN_U64
~Inst_DS__DS_MAX_RTN_U64()
Definition ds.cc:3242

gem5::VegaISA::Inst_DS__DS_MAX_RTN_U64::Inst_DS__DS_MAX_RTN_U64
Inst_DS__DS_MAX_RTN_U64(InFmt_DS *)
Definition ds.cc:3237

gem5::VegaISA::Inst_DS__DS_MAX_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3252

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_F32::~Inst_DS__DS_MAX_SRC2_F32
~Inst_DS__DS_MAX_SRC2_F32()
Definition ds.cc:4045

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4057

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_F32::Inst_DS__DS_MAX_SRC2_F32
Inst_DS__DS_MAX_SRC2_F32(InFmt_DS *)
Definition ds.cc:4039

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_F64::Inst_DS__DS_MAX_SRC2_F64
Inst_DS__DS_MAX_SRC2_F64(InFmt_DS *)
Definition ds.cc:4642

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_F64::~Inst_DS__DS_MAX_SRC2_F64
~Inst_DS__DS_MAX_SRC2_F64()
Definition ds.cc:4648

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4660

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_I32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3874

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_I32::Inst_DS__DS_MAX_SRC2_I32
Inst_DS__DS_MAX_SRC2_I32(InFmt_DS *)
Definition ds.cc:3858

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_I32::~Inst_DS__DS_MAX_SRC2_I32
~Inst_DS__DS_MAX_SRC2_I32()
Definition ds.cc:3863

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_I64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4477

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_I64::~Inst_DS__DS_MAX_SRC2_I64
~Inst_DS__DS_MAX_SRC2_I64()
Definition ds.cc:4466

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_I64::Inst_DS__DS_MAX_SRC2_I64
Inst_DS__DS_MAX_SRC2_I64(InFmt_DS *)
Definition ds.cc:4461

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3918

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_U32::~Inst_DS__DS_MAX_SRC2_U32
~Inst_DS__DS_MAX_SRC2_U32()
Definition ds.cc:3907

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_U32::Inst_DS__DS_MAX_SRC2_U32
Inst_DS__DS_MAX_SRC2_U32(InFmt_DS *)
Definition ds.cc:3902

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_U64::~Inst_DS__DS_MAX_SRC2_U64
~Inst_DS__DS_MAX_SRC2_U64()
Definition ds.cc:4510

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4521

gem5::VegaISA::Inst_DS__DS_MAX_SRC2_U64::Inst_DS__DS_MAX_SRC2_U64
Inst_DS__DS_MAX_SRC2_U64(InFmt_DS *)
Definition ds.cc:4505

gem5::VegaISA::Inst_DS__DS_MAX_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:269

gem5::VegaISA::Inst_DS__DS_MAX_U32::~Inst_DS__DS_MAX_U32
~Inst_DS__DS_MAX_U32()
Definition ds.cc:259

gem5::VegaISA::Inst_DS__DS_MAX_U32::Inst_DS__DS_MAX_U32
Inst_DS__DS_MAX_U32(InFmt_DS *)
Definition ds.cc:254

gem5::VegaISA::Inst_DS__DS_MAX_U64::~Inst_DS__DS_MAX_U64
~Inst_DS__DS_MAX_U64()
Definition ds.cc:2661

gem5::VegaISA::Inst_DS__DS_MAX_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2671

gem5::VegaISA::Inst_DS__DS_MAX_U64::Inst_DS__DS_MAX_U64
Inst_DS__DS_MAX_U64(InFmt_DS *)
Definition ds.cc:2656

gem5::VegaISA::Inst_DS__DS_MIN_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:678

gem5::VegaISA::Inst_DS__DS_MIN_F32::Inst_DS__DS_MIN_F32
Inst_DS__DS_MIN_F32(InFmt_DS *)
Definition ds.cc:658

gem5::VegaISA::Inst_DS__DS_MIN_F32::~Inst_DS__DS_MIN_F32
~Inst_DS__DS_MIN_F32()
Definition ds.cc:664

gem5::VegaISA::Inst_DS__DS_MIN_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3035

gem5::VegaISA::Inst_DS__DS_MIN_F64::~Inst_DS__DS_MIN_F64
~Inst_DS__DS_MIN_F64()
Definition ds.cc:3021

gem5::VegaISA::Inst_DS__DS_MIN_F64::Inst_DS__DS_MIN_F64
Inst_DS__DS_MIN_F64(InFmt_DS *)
Definition ds.cc:3015

gem5::VegaISA::Inst_DS__DS_MIN_I32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:206

gem5::VegaISA::Inst_DS__DS_MIN_I32::Inst_DS__DS_MIN_I32
Inst_DS__DS_MIN_I32(InFmt_DS *)
Definition ds.cc:191

gem5::VegaISA::Inst_DS__DS_MIN_I32::~Inst_DS__DS_MIN_I32
~Inst_DS__DS_MIN_I32()
Definition ds.cc:196

gem5::VegaISA::Inst_DS__DS_MIN_I64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2608

gem5::VegaISA::Inst_DS__DS_MIN_I64::Inst_DS__DS_MIN_I64
Inst_DS__DS_MIN_I64(InFmt_DS *)
Definition ds.cc:2593

gem5::VegaISA::Inst_DS__DS_MIN_I64::~Inst_DS__DS_MIN_I64
~Inst_DS__DS_MIN_I64()
Definition ds.cc:2598

gem5::VegaISA::Inst_DS__DS_MIN_RTN_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1507

gem5::VegaISA::Inst_DS__DS_MIN_RTN_F32::~Inst_DS__DS_MIN_RTN_F32
~Inst_DS__DS_MIN_RTN_F32()
Definition ds.cc:1493

gem5::VegaISA::Inst_DS__DS_MIN_RTN_F32::Inst_DS__DS_MIN_RTN_F32
Inst_DS__DS_MIN_RTN_F32(InFmt_DS *)
Definition ds.cc:1487

gem5::VegaISA::Inst_DS__DS_MIN_RTN_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3474

gem5::VegaISA::Inst_DS__DS_MIN_RTN_F64::Inst_DS__DS_MIN_RTN_F64
Inst_DS__DS_MIN_RTN_F64(InFmt_DS *)
Definition ds.cc:3454

gem5::VegaISA::Inst_DS__DS_MIN_RTN_F64::~Inst_DS__DS_MIN_RTN_F64
~Inst_DS__DS_MIN_RTN_F64()
Definition ds.cc:3460

gem5::VegaISA::Inst_DS__DS_MIN_RTN_I32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1161

gem5::VegaISA::Inst_DS__DS_MIN_RTN_I32::~Inst_DS__DS_MIN_RTN_I32
~Inst_DS__DS_MIN_RTN_I32()
Definition ds.cc:1151

gem5::VegaISA::Inst_DS__DS_MIN_RTN_I32::Inst_DS__DS_MIN_RTN_I32
Inst_DS__DS_MIN_RTN_I32(InFmt_DS *)
Definition ds.cc:1146

gem5::VegaISA::Inst_DS__DS_MIN_RTN_I64::~Inst_DS__DS_MIN_RTN_I64
~Inst_DS__DS_MIN_RTN_I64()
Definition ds.cc:3179

gem5::VegaISA::Inst_DS__DS_MIN_RTN_I64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3189

gem5::VegaISA::Inst_DS__DS_MIN_RTN_I64::Inst_DS__DS_MIN_RTN_I64
Inst_DS__DS_MIN_RTN_I64(InFmt_DS *)
Definition ds.cc:3174

gem5::VegaISA::Inst_DS__DS_MIN_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1203

gem5::VegaISA::Inst_DS__DS_MIN_RTN_U32::Inst_DS__DS_MIN_RTN_U32
Inst_DS__DS_MIN_RTN_U32(InFmt_DS *)
Definition ds.cc:1188

gem5::VegaISA::Inst_DS__DS_MIN_RTN_U32::~Inst_DS__DS_MIN_RTN_U32
~Inst_DS__DS_MIN_RTN_U32()
Definition ds.cc:1193

gem5::VegaISA::Inst_DS__DS_MIN_RTN_U64::Inst_DS__DS_MIN_RTN_U64
Inst_DS__DS_MIN_RTN_U64(InFmt_DS *)
Definition ds.cc:3216

gem5::VegaISA::Inst_DS__DS_MIN_RTN_U64::~Inst_DS__DS_MIN_RTN_U64
~Inst_DS__DS_MIN_RTN_U64()
Definition ds.cc:3221

gem5::VegaISA::Inst_DS__DS_MIN_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3231

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_F32::Inst_DS__DS_MIN_SRC2_F32
Inst_DS__DS_MIN_SRC2_F32(InFmt_DS *)
Definition ds.cc:4015

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_F32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4033

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_F32::~Inst_DS__DS_MIN_SRC2_F32
~Inst_DS__DS_MIN_SRC2_F32()
Definition ds.cc:4021

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_F64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4636

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_F64::~Inst_DS__DS_MIN_SRC2_F64
~Inst_DS__DS_MIN_SRC2_F64()
Definition ds.cc:4624

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_F64::Inst_DS__DS_MIN_SRC2_F64
Inst_DS__DS_MIN_SRC2_F64(InFmt_DS *)
Definition ds.cc:4618

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_I32::~Inst_DS__DS_MIN_SRC2_I32
~Inst_DS__DS_MIN_SRC2_I32()
Definition ds.cc:3841

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_I32::Inst_DS__DS_MIN_SRC2_I32
Inst_DS__DS_MIN_SRC2_I32(InFmt_DS *)
Definition ds.cc:3836

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_I32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3852

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_I64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4455

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_I64::Inst_DS__DS_MIN_SRC2_I64
Inst_DS__DS_MIN_SRC2_I64(InFmt_DS *)
Definition ds.cc:4439

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_I64::~Inst_DS__DS_MIN_SRC2_I64
~Inst_DS__DS_MIN_SRC2_I64()
Definition ds.cc:4444

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_U32::Inst_DS__DS_MIN_SRC2_U32
Inst_DS__DS_MIN_SRC2_U32(InFmt_DS *)
Definition ds.cc:3880

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3896

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_U32::~Inst_DS__DS_MIN_SRC2_U32
~Inst_DS__DS_MIN_SRC2_U32()
Definition ds.cc:3885

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_U64::Inst_DS__DS_MIN_SRC2_U64
Inst_DS__DS_MIN_SRC2_U64(InFmt_DS *)
Definition ds.cc:4483

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_U64::~Inst_DS__DS_MIN_SRC2_U64
~Inst_DS__DS_MIN_SRC2_U64()
Definition ds.cc:4488

gem5::VegaISA::Inst_DS__DS_MIN_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4499

gem5::VegaISA::Inst_DS__DS_MIN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:248

gem5::VegaISA::Inst_DS__DS_MIN_U32::Inst_DS__DS_MIN_U32
Inst_DS__DS_MIN_U32(InFmt_DS *)
Definition ds.cc:233

gem5::VegaISA::Inst_DS__DS_MIN_U32::~Inst_DS__DS_MIN_U32
~Inst_DS__DS_MIN_U32()
Definition ds.cc:238

gem5::VegaISA::Inst_DS__DS_MIN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2650

gem5::VegaISA::Inst_DS__DS_MIN_U64::~Inst_DS__DS_MIN_U64
~Inst_DS__DS_MIN_U64()
Definition ds.cc:2640

gem5::VegaISA::Inst_DS__DS_MIN_U64::Inst_DS__DS_MIN_U64
Inst_DS__DS_MIN_U64(InFmt_DS *)
Definition ds.cc:2635

gem5::VegaISA::Inst_DS__DS_MSKOR_B32::~Inst_DS__DS_MSKOR_B32
~Inst_DS__DS_MSKOR_B32()
Definition ds.cc:388

gem5::VegaISA::Inst_DS__DS_MSKOR_B32::Inst_DS__DS_MSKOR_B32
Inst_DS__DS_MSKOR_B32(InFmt_DS *)
Definition ds.cc:383

gem5::VegaISA::Inst_DS__DS_MSKOR_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:399

gem5::VegaISA::Inst_DS__DS_MSKOR_B64::~Inst_DS__DS_MSKOR_B64
~Inst_DS__DS_MSKOR_B64()
Definition ds.cc:2745

gem5::VegaISA::Inst_DS__DS_MSKOR_B64::Inst_DS__DS_MSKOR_B64
Inst_DS__DS_MSKOR_B64(InFmt_DS *)
Definition ds.cc:2740

gem5::VegaISA::Inst_DS__DS_MSKOR_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2756

gem5::VegaISA::Inst_DS__DS_MSKOR_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1309

gem5::VegaISA::Inst_DS__DS_MSKOR_RTN_B32::Inst_DS__DS_MSKOR_RTN_B32
Inst_DS__DS_MSKOR_RTN_B32(InFmt_DS *)
Definition ds.cc:1293

gem5::VegaISA::Inst_DS__DS_MSKOR_RTN_B32::~Inst_DS__DS_MSKOR_RTN_B32
~Inst_DS__DS_MSKOR_RTN_B32()
Definition ds.cc:1298

gem5::VegaISA::Inst_DS__DS_MSKOR_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3337

gem5::VegaISA::Inst_DS__DS_MSKOR_RTN_B64::~Inst_DS__DS_MSKOR_RTN_B64
~Inst_DS__DS_MSKOR_RTN_B64()
Definition ds.cc:3326

gem5::VegaISA::Inst_DS__DS_MSKOR_RTN_B64::Inst_DS__DS_MSKOR_RTN_B64
Inst_DS__DS_MSKOR_RTN_B64(InFmt_DS *)
Definition ds.cc:3321

gem5::VegaISA::Inst_DS__DS_NOP::Inst_DS__DS_NOP
Inst_DS__DS_NOP(InFmt_DS *)
Definition ds.cc:710

gem5::VegaISA::Inst_DS__DS_NOP::~Inst_DS__DS_NOP
~Inst_DS__DS_NOP()
Definition ds.cc:716

gem5::VegaISA::Inst_DS__DS_NOP::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:723

gem5::VegaISA::Inst_DS__DS_ORDERED_COUNT::~Inst_DS__DS_ORDERED_COUNT
~Inst_DS__DS_ORDERED_COUNT()
Definition ds.cc:4313

gem5::VegaISA::Inst_DS__DS_ORDERED_COUNT::Inst_DS__DS_ORDERED_COUNT
Inst_DS__DS_ORDERED_COUNT(InFmt_DS *)
Definition ds.cc:4308

gem5::VegaISA::Inst_DS__DS_ORDERED_COUNT::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4322

gem5::VegaISA::Inst_DS__DS_OR_B32::completeAcc
void completeAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:356

gem5::VegaISA::Inst_DS__DS_OR_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:313

gem5::VegaISA::Inst_DS__DS_OR_B32::~Inst_DS__DS_OR_B32
~Inst_DS__DS_OR_B32()
Definition ds.cc:305

gem5::VegaISA::Inst_DS__DS_OR_B32::initiateAcc
void initiateAcc(GPUDynInstPtr gpuDynInst) override
Definition ds.cc:346

gem5::VegaISA::Inst_DS__DS_OR_B32::Inst_DS__DS_OR_B32
Inst_DS__DS_OR_B32(InFmt_DS *)
Definition ds.cc:296

gem5::VegaISA::Inst_DS__DS_OR_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2713

gem5::VegaISA::Inst_DS__DS_OR_B64::Inst_DS__DS_OR_B64
Inst_DS__DS_OR_B64(InFmt_DS *)
Definition ds.cc:2698

gem5::VegaISA::Inst_DS__DS_OR_B64::~Inst_DS__DS_OR_B64
~Inst_DS__DS_OR_B64()
Definition ds.cc:2703

gem5::VegaISA::Inst_DS__DS_OR_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1266

gem5::VegaISA::Inst_DS__DS_OR_RTN_B32::Inst_DS__DS_OR_RTN_B32
Inst_DS__DS_OR_RTN_B32(InFmt_DS *)
Definition ds.cc:1251

gem5::VegaISA::Inst_DS__DS_OR_RTN_B32::~Inst_DS__DS_OR_RTN_B32
~Inst_DS__DS_OR_RTN_B32()
Definition ds.cc:1256

gem5::VegaISA::Inst_DS__DS_OR_RTN_B64::Inst_DS__DS_OR_RTN_B64
Inst_DS__DS_OR_RTN_B64(InFmt_DS *)
Definition ds.cc:3279

gem5::VegaISA::Inst_DS__DS_OR_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3294

gem5::VegaISA::Inst_DS__DS_OR_RTN_B64::~Inst_DS__DS_OR_RTN_B64
~Inst_DS__DS_OR_RTN_B64()
Definition ds.cc:3284

gem5::VegaISA::Inst_DS__DS_OR_SRC2_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3962

gem5::VegaISA::Inst_DS__DS_OR_SRC2_B32::Inst_DS__DS_OR_SRC2_B32
Inst_DS__DS_OR_SRC2_B32(InFmt_DS *)
Definition ds.cc:3946

gem5::VegaISA::Inst_DS__DS_OR_SRC2_B32::~Inst_DS__DS_OR_SRC2_B32
~Inst_DS__DS_OR_SRC2_B32()
Definition ds.cc:3951

gem5::VegaISA::Inst_DS__DS_OR_SRC2_B64::Inst_DS__DS_OR_SRC2_B64
Inst_DS__DS_OR_SRC2_B64(InFmt_DS *)
Definition ds.cc:4549

gem5::VegaISA::Inst_DS__DS_OR_SRC2_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4565

gem5::VegaISA::Inst_DS__DS_OR_SRC2_B64::~Inst_DS__DS_OR_SRC2_B64
~Inst_DS__DS_OR_SRC2_B64()
Definition ds.cc:4554

gem5::VegaISA::Inst_DS__DS_PERMUTE_B32::Inst_DS__DS_PERMUTE_B32
Inst_DS__DS_PERMUTE_B32(InFmt_DS *)
Definition ds.cc:2263

gem5::VegaISA::Inst_DS__DS_PERMUTE_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2282

gem5::VegaISA::Inst_DS__DS_PERMUTE_B32::~Inst_DS__DS_PERMUTE_B32
~Inst_DS__DS_PERMUTE_B32()
Definition ds.cc:2275

gem5::VegaISA::Inst_DS__DS_READ2ST64_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1730

gem5::VegaISA::Inst_DS__DS_READ2ST64_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1763

gem5::VegaISA::Inst_DS__DS_READ2ST64_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1754

gem5::VegaISA::Inst_DS__DS_READ2ST64_B32::Inst_DS__DS_READ2ST64_B32
Inst_DS__DS_READ2ST64_B32(InFmt_DS *)
Definition ds.cc:1714

gem5::VegaISA::Inst_DS__DS_READ2ST64_B32::~Inst_DS__DS_READ2ST64_B32
~Inst_DS__DS_READ2ST64_B32()
Definition ds.cc:1721

gem5::VegaISA::Inst_DS__DS_READ2ST64_B64::~Inst_DS__DS_READ2ST64_B64
~Inst_DS__DS_READ2ST64_B64()
Definition ds.cc:3645

gem5::VegaISA::Inst_DS__DS_READ2ST64_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3654

gem5::VegaISA::Inst_DS__DS_READ2ST64_B64::Inst_DS__DS_READ2ST64_B64
Inst_DS__DS_READ2ST64_B64(InFmt_DS *)
Definition ds.cc:3638

gem5::VegaISA::Inst_DS__DS_READ2ST64_B64::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:3678

gem5::VegaISA::Inst_DS__DS_READ2ST64_B64::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:3687

gem5::VegaISA::Inst_DS__DS_READ2_B32::Inst_DS__DS_READ2_B32
Inst_DS__DS_READ2_B32(InFmt_DS *)
Definition ds.cc:1646

gem5::VegaISA::Inst_DS__DS_READ2_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1695

gem5::VegaISA::Inst_DS__DS_READ2_B32::~Inst_DS__DS_READ2_B32
~Inst_DS__DS_READ2_B32()
Definition ds.cc:1653

gem5::VegaISA::Inst_DS__DS_READ2_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1686

gem5::VegaISA::Inst_DS__DS_READ2_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1662

gem5::VegaISA::Inst_DS__DS_READ2_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3586

gem5::VegaISA::Inst_DS__DS_READ2_B64::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:3610

gem5::VegaISA::Inst_DS__DS_READ2_B64::~Inst_DS__DS_READ2_B64
~Inst_DS__DS_READ2_B64()
Definition ds.cc:3577

gem5::VegaISA::Inst_DS__DS_READ2_B64::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:3619

gem5::VegaISA::Inst_DS__DS_READ2_B64::Inst_DS__DS_READ2_B64
Inst_DS__DS_READ2_B64(InFmt_DS *)
Definition ds.cc:3570

gem5::VegaISA::Inst_DS__DS_READ_B128::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:4903

gem5::VegaISA::Inst_DS__DS_READ_B128::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:4893

gem5::VegaISA::Inst_DS__DS_READ_B128::~Inst_DS__DS_READ_B128
~Inst_DS__DS_READ_B128()
Definition ds.cc:4869

gem5::VegaISA::Inst_DS__DS_READ_B128::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4876

gem5::VegaISA::Inst_DS__DS_READ_B128::Inst_DS__DS_READ_B128
Inst_DS__DS_READ_B128(InFmt_DS *)
Definition ds.cc:4862

gem5::VegaISA::Inst_DS__DS_READ_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1631

gem5::VegaISA::Inst_DS__DS_READ_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1597

gem5::VegaISA::Inst_DS__DS_READ_B32::Inst_DS__DS_READ_B32
Inst_DS__DS_READ_B32(InFmt_DS *)
Definition ds.cc:1582

gem5::VegaISA::Inst_DS__DS_READ_B32::~Inst_DS__DS_READ_B32
~Inst_DS__DS_READ_B32()
Definition ds.cc:1589

gem5::VegaISA::Inst_DS__DS_READ_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1621

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B16::~Inst_DS__DS_READ_B64_TR_B16
~Inst_DS__DS_READ_B64_TR_B16()
Definition ds.cc:5331

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B16::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:5336

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B16::Inst_DS__DS_READ_B64_TR_B16
Inst_DS__DS_READ_B64_TR_B16(InFmt_DS *)
Definition ds.cc:5325

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B16::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:5359

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B16::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:5369

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B4::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:4964

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B4::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4941

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B4::Inst_DS__DS_READ_B64_TR_B4
Inst_DS__DS_READ_B64_TR_B4(InFmt_DS *)
Definition ds.cc:4930

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B4::~Inst_DS__DS_READ_B64_TR_B4
~Inst_DS__DS_READ_B64_TR_B4()
Definition ds.cc:4936

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B4::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:4974

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B8::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:5253

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B8::~Inst_DS__DS_READ_B64_TR_B8
~Inst_DS__DS_READ_B64_TR_B8()
Definition ds.cc:5215

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B8::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:5220

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B8::Inst_DS__DS_READ_B64_TR_B8
Inst_DS__DS_READ_B64_TR_B8(InFmt_DS *)
Definition ds.cc:5209

gem5::VegaISA::Inst_DS__DS_READ_B64_TR_B8::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:5243

gem5::VegaISA::Inst_DS__DS_READ_B64::Inst_DS__DS_READ_B64
Inst_DS__DS_READ_B64(InFmt_DS *)
Definition ds.cc:3506

gem5::VegaISA::Inst_DS__DS_READ_B64::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:3555

gem5::VegaISA::Inst_DS__DS_READ_B64::~Inst_DS__DS_READ_B64
~Inst_DS__DS_READ_B64()
Definition ds.cc:3513

gem5::VegaISA::Inst_DS__DS_READ_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3521

gem5::VegaISA::Inst_DS__DS_READ_B64::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:3545

gem5::VegaISA::Inst_DS__DS_READ_B96_TR_B6::Inst_DS__DS_READ_B96_TR_B6
Inst_DS__DS_READ_B96_TR_B6(InFmt_DS *)
Definition ds.cc:5060

gem5::VegaISA::Inst_DS__DS_READ_B96_TR_B6::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:5071

gem5::VegaISA::Inst_DS__DS_READ_B96_TR_B6::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:5094

gem5::VegaISA::Inst_DS__DS_READ_B96_TR_B6::~Inst_DS__DS_READ_B96_TR_B6
~Inst_DS__DS_READ_B96_TR_B6()
Definition ds.cc:5066

gem5::VegaISA::Inst_DS__DS_READ_B96_TR_B6::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:5104

gem5::VegaISA::Inst_DS__DS_READ_B96::~Inst_DS__DS_READ_B96
~Inst_DS__DS_READ_B96()
Definition ds.cc:4805

gem5::VegaISA::Inst_DS__DS_READ_B96::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:4829

gem5::VegaISA::Inst_DS__DS_READ_B96::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:4839

gem5::VegaISA::Inst_DS__DS_READ_B96::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4812

gem5::VegaISA::Inst_DS__DS_READ_B96::Inst_DS__DS_READ_B96
Inst_DS__DS_READ_B96(InFmt_DS *)
Definition ds.cc:4798

gem5::VegaISA::Inst_DS__DS_READ_I16::~Inst_DS__DS_READ_I16
~Inst_DS__DS_READ_I16()
Definition ds.cc:1917

gem5::VegaISA::Inst_DS__DS_READ_I16::Inst_DS__DS_READ_I16
Inst_DS__DS_READ_I16(InFmt_DS *)
Definition ds.cc:1910

gem5::VegaISA::Inst_DS__DS_READ_I16::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1925

gem5::VegaISA::Inst_DS__DS_READ_I8::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1797

gem5::VegaISA::Inst_DS__DS_READ_I8::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1831

gem5::VegaISA::Inst_DS__DS_READ_I8::~Inst_DS__DS_READ_I8
~Inst_DS__DS_READ_I8()
Definition ds.cc:1789

gem5::VegaISA::Inst_DS__DS_READ_I8::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1821

gem5::VegaISA::Inst_DS__DS_READ_I8::Inst_DS__DS_READ_I8
Inst_DS__DS_READ_I8(InFmt_DS *)
Definition ds.cc:1782

gem5::VegaISA::Inst_DS__DS_READ_U16_D16_HI::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2075

gem5::VegaISA::Inst_DS__DS_READ_U16_D16_HI::~Inst_DS__DS_READ_U16_D16_HI
~Inst_DS__DS_READ_U16_D16_HI()
Definition ds.cc:2067

gem5::VegaISA::Inst_DS__DS_READ_U16_D16_HI::Inst_DS__DS_READ_U16_D16_HI
Inst_DS__DS_READ_U16_D16_HI(InFmt_DS *)
Definition ds.cc:2060

gem5::VegaISA::Inst_DS__DS_READ_U16_D16_HI::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:2098

gem5::VegaISA::Inst_DS__DS_READ_U16_D16_HI::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:2108

gem5::VegaISA::Inst_DS__DS_READ_U16_D16::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:2043

gem5::VegaISA::Inst_DS__DS_READ_U16_D16::Inst_DS__DS_READ_U16_D16
Inst_DS__DS_READ_U16_D16(InFmt_DS *)
Definition ds.cc:1995

gem5::VegaISA::Inst_DS__DS_READ_U16_D16::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2010

gem5::VegaISA::Inst_DS__DS_READ_U16_D16::~Inst_DS__DS_READ_U16_D16
~Inst_DS__DS_READ_U16_D16()
Definition ds.cc:2002

gem5::VegaISA::Inst_DS__DS_READ_U16_D16::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:2033

gem5::VegaISA::Inst_DS__DS_READ_U16::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1979

gem5::VegaISA::Inst_DS__DS_READ_U16::~Inst_DS__DS_READ_U16
~Inst_DS__DS_READ_U16()
Definition ds.cc:1938

gem5::VegaISA::Inst_DS__DS_READ_U16::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1969

gem5::VegaISA::Inst_DS__DS_READ_U16::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1946

gem5::VegaISA::Inst_DS__DS_READ_U16::Inst_DS__DS_READ_U16
Inst_DS__DS_READ_U16(InFmt_DS *)
Definition ds.cc:1931

gem5::VegaISA::Inst_DS__DS_READ_U8::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1861

gem5::VegaISA::Inst_DS__DS_READ_U8::Inst_DS__DS_READ_U8
Inst_DS__DS_READ_U8(InFmt_DS *)
Definition ds.cc:1846

gem5::VegaISA::Inst_DS__DS_READ_U8::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:1895

gem5::VegaISA::Inst_DS__DS_READ_U8::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:1885

gem5::VegaISA::Inst_DS__DS_READ_U8::~Inst_DS__DS_READ_U8
~Inst_DS__DS_READ_U8()
Definition ds.cc:1853

gem5::VegaISA::Inst_DS__DS_RSUB_RTN_U32::Inst_DS__DS_RSUB_RTN_U32
Inst_DS__DS_RSUB_RTN_U32(InFmt_DS *)
Definition ds.cc:1082

gem5::VegaISA::Inst_DS__DS_RSUB_RTN_U32::~Inst_DS__DS_RSUB_RTN_U32
~Inst_DS__DS_RSUB_RTN_U32()
Definition ds.cc:1087

gem5::VegaISA::Inst_DS__DS_RSUB_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1098

gem5::VegaISA::Inst_DS__DS_RSUB_RTN_U64::~Inst_DS__DS_RSUB_RTN_U64
~Inst_DS__DS_RSUB_RTN_U64()
Definition ds.cc:3114

gem5::VegaISA::Inst_DS__DS_RSUB_RTN_U64::Inst_DS__DS_RSUB_RTN_U64
Inst_DS__DS_RSUB_RTN_U64(InFmt_DS *)
Definition ds.cc:3109

gem5::VegaISA::Inst_DS__DS_RSUB_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3125

gem5::VegaISA::Inst_DS__DS_RSUB_SRC2_U32::Inst_DS__DS_RSUB_SRC2_U32
Inst_DS__DS_RSUB_SRC2_U32(InFmt_DS *)
Definition ds.cc:3769

gem5::VegaISA::Inst_DS__DS_RSUB_SRC2_U32::~Inst_DS__DS_RSUB_SRC2_U32
~Inst_DS__DS_RSUB_SRC2_U32()
Definition ds.cc:3774

gem5::VegaISA::Inst_DS__DS_RSUB_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3785

gem5::VegaISA::Inst_DS__DS_RSUB_SRC2_U64::Inst_DS__DS_RSUB_SRC2_U64
Inst_DS__DS_RSUB_SRC2_U64(InFmt_DS *)
Definition ds.cc:4372

gem5::VegaISA::Inst_DS__DS_RSUB_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4388

gem5::VegaISA::Inst_DS__DS_RSUB_SRC2_U64::~Inst_DS__DS_RSUB_SRC2_U64
~Inst_DS__DS_RSUB_SRC2_U64()
Definition ds.cc:4377

gem5::VegaISA::Inst_DS__DS_RSUB_U32::~Inst_DS__DS_RSUB_U32
~Inst_DS__DS_RSUB_U32()
Definition ds.cc:132

gem5::VegaISA::Inst_DS__DS_RSUB_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:143

gem5::VegaISA::Inst_DS__DS_RSUB_U32::Inst_DS__DS_RSUB_U32
Inst_DS__DS_RSUB_U32(InFmt_DS *)
Definition ds.cc:127

gem5::VegaISA::Inst_DS__DS_RSUB_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2544

gem5::VegaISA::Inst_DS__DS_RSUB_U64::Inst_DS__DS_RSUB_U64
Inst_DS__DS_RSUB_U64(InFmt_DS *)
Definition ds.cc:2528

gem5::VegaISA::Inst_DS__DS_RSUB_U64::~Inst_DS__DS_RSUB_U64
~Inst_DS__DS_RSUB_U64()
Definition ds.cc:2533

gem5::VegaISA::Inst_DS__DS_SUB_RTN_U32::Inst_DS__DS_SUB_RTN_U32
Inst_DS__DS_SUB_RTN_U32(InFmt_DS *)
Definition ds.cc:1061

gem5::VegaISA::Inst_DS__DS_SUB_RTN_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1076

gem5::VegaISA::Inst_DS__DS_SUB_RTN_U32::~Inst_DS__DS_SUB_RTN_U32
~Inst_DS__DS_SUB_RTN_U32()
Definition ds.cc:1066

gem5::VegaISA::Inst_DS__DS_SUB_RTN_U64::Inst_DS__DS_SUB_RTN_U64
Inst_DS__DS_SUB_RTN_U64(InFmt_DS *)
Definition ds.cc:3088

gem5::VegaISA::Inst_DS__DS_SUB_RTN_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3103

gem5::VegaISA::Inst_DS__DS_SUB_RTN_U64::~Inst_DS__DS_SUB_RTN_U64
~Inst_DS__DS_SUB_RTN_U64()
Definition ds.cc:3093

gem5::VegaISA::Inst_DS__DS_SUB_SRC2_U32::~Inst_DS__DS_SUB_SRC2_U32
~Inst_DS__DS_SUB_SRC2_U32()
Definition ds.cc:3752

gem5::VegaISA::Inst_DS__DS_SUB_SRC2_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3763

gem5::VegaISA::Inst_DS__DS_SUB_SRC2_U32::Inst_DS__DS_SUB_SRC2_U32
Inst_DS__DS_SUB_SRC2_U32(InFmt_DS *)
Definition ds.cc:3747

gem5::VegaISA::Inst_DS__DS_SUB_SRC2_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4366

gem5::VegaISA::Inst_DS__DS_SUB_SRC2_U64::~Inst_DS__DS_SUB_SRC2_U64
~Inst_DS__DS_SUB_SRC2_U64()
Definition ds.cc:4355

gem5::VegaISA::Inst_DS__DS_SUB_SRC2_U64::Inst_DS__DS_SUB_SRC2_U64
Inst_DS__DS_SUB_SRC2_U64(InFmt_DS *)
Definition ds.cc:4350

gem5::VegaISA::Inst_DS__DS_SUB_U32::Inst_DS__DS_SUB_U32
Inst_DS__DS_SUB_U32(InFmt_DS *)
Definition ds.cc:106

gem5::VegaISA::Inst_DS__DS_SUB_U32::~Inst_DS__DS_SUB_U32
~Inst_DS__DS_SUB_U32()
Definition ds.cc:111

gem5::VegaISA::Inst_DS__DS_SUB_U32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:121

gem5::VegaISA::Inst_DS__DS_SUB_U64::Inst_DS__DS_SUB_U64
Inst_DS__DS_SUB_U64(InFmt_DS *)
Definition ds.cc:2507

gem5::VegaISA::Inst_DS__DS_SUB_U64::~Inst_DS__DS_SUB_U64
~Inst_DS__DS_SUB_U64()
Definition ds.cc:2512

gem5::VegaISA::Inst_DS__DS_SUB_U64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2522

gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::~Inst_DS__DS_SWIZZLE_B32
~Inst_DS__DS_SWIZZLE_B32()
Definition ds.cc:2136

gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::Inst_DS__DS_SWIZZLE_B32
Inst_DS__DS_SWIZZLE_B32(InFmt_DS *)
Definition ds.cc:2124

gem5::VegaISA::Inst_DS__DS_SWIZZLE_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2145

gem5::VegaISA::Inst_DS__DS_WRAP_RTN_B32::~Inst_DS__DS_WRAP_RTN_B32
~Inst_DS__DS_WRAP_RTN_B32()
Definition ds.cc:1544

gem5::VegaISA::Inst_DS__DS_WRAP_RTN_B32::Inst_DS__DS_WRAP_RTN_B32
Inst_DS__DS_WRAP_RTN_B32(InFmt_DS *)
Definition ds.cc:1539

gem5::VegaISA::Inst_DS__DS_WRAP_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1553

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B32::~Inst_DS__DS_WRITE2ST64_B32
~Inst_DS__DS_WRITE2ST64_B32()
Definition ds.cc:544

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:591

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:554

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B32::Inst_DS__DS_WRITE2ST64_B32
Inst_DS__DS_WRITE2ST64_B32(InFmt_DS *)
Definition ds.cc:537

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:600

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2911

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B64::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:2957

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B64::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:2948

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B64::Inst_DS__DS_WRITE2ST64_B64
Inst_DS__DS_WRITE2ST64_B64(InFmt_DS *)
Definition ds.cc:2894

gem5::VegaISA::Inst_DS__DS_WRITE2ST64_B64::~Inst_DS__DS_WRITE2ST64_B64
~Inst_DS__DS_WRITE2ST64_B64()
Definition ds.cc:2901

gem5::VegaISA::Inst_DS__DS_WRITE2_B32::Inst_DS__DS_WRITE2_B32
Inst_DS__DS_WRITE2_B32(InFmt_DS *)
Definition ds.cc:469

gem5::VegaISA::Inst_DS__DS_WRITE2_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:523

gem5::VegaISA::Inst_DS__DS_WRITE2_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:486

gem5::VegaISA::Inst_DS__DS_WRITE2_B32::~Inst_DS__DS_WRITE2_B32
~Inst_DS__DS_WRITE2_B32()
Definition ds.cc:476

gem5::VegaISA::Inst_DS__DS_WRITE2_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:532

gem5::VegaISA::Inst_DS__DS_WRITE2_B64::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:2880

gem5::VegaISA::Inst_DS__DS_WRITE2_B64::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:2889

gem5::VegaISA::Inst_DS__DS_WRITE2_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2843

gem5::VegaISA::Inst_DS__DS_WRITE2_B64::~Inst_DS__DS_WRITE2_B64
~Inst_DS__DS_WRITE2_B64()
Definition ds.cc:2833

gem5::VegaISA::Inst_DS__DS_WRITE2_B64::Inst_DS__DS_WRITE2_B64
Inst_DS__DS_WRITE2_B64(InFmt_DS *)
Definition ds.cc:2826

gem5::VegaISA::Inst_DS__DS_WRITE_B128::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4745

gem5::VegaISA::Inst_DS__DS_WRITE_B128::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:4783

gem5::VegaISA::Inst_DS__DS_WRITE_B128::Inst_DS__DS_WRITE_B128
Inst_DS__DS_WRITE_B128(InFmt_DS *)
Definition ds.cc:4730

gem5::VegaISA::Inst_DS__DS_WRITE_B128::~Inst_DS__DS_WRITE_B128
~Inst_DS__DS_WRITE_B128()
Definition ds.cc:4737

gem5::VegaISA::Inst_DS__DS_WRITE_B128::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:4793

gem5::VegaISA::Inst_DS__DS_WRITE_B16::Inst_DS__DS_WRITE_B16
Inst_DS__DS_WRITE_B16(InFmt_DS *)
Definition ds.cc:923

gem5::VegaISA::Inst_DS__DS_WRITE_B16::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:938

gem5::VegaISA::Inst_DS__DS_WRITE_B16::~Inst_DS__DS_WRITE_B16
~Inst_DS__DS_WRITE_B16()
Definition ds.cc:930

gem5::VegaISA::Inst_DS__DS_WRITE_B16::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:981

gem5::VegaISA::Inst_DS__DS_WRITE_B16::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:971

gem5::VegaISA::Inst_DS__DS_WRITE_B32::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:454

gem5::VegaISA::Inst_DS__DS_WRITE_B32::Inst_DS__DS_WRITE_B32
Inst_DS__DS_WRITE_B32(InFmt_DS *)
Definition ds.cc:405

gem5::VegaISA::Inst_DS__DS_WRITE_B32::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:464

gem5::VegaISA::Inst_DS__DS_WRITE_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:421

gem5::VegaISA::Inst_DS__DS_WRITE_B32::~Inst_DS__DS_WRITE_B32
~Inst_DS__DS_WRITE_B32()
Definition ds.cc:412

gem5::VegaISA::Inst_DS__DS_WRITE_B64::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:2811

gem5::VegaISA::Inst_DS__DS_WRITE_B64::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:2821

gem5::VegaISA::Inst_DS__DS_WRITE_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2778

gem5::VegaISA::Inst_DS__DS_WRITE_B64::~Inst_DS__DS_WRITE_B64
~Inst_DS__DS_WRITE_B64()
Definition ds.cc:2769

gem5::VegaISA::Inst_DS__DS_WRITE_B64::Inst_DS__DS_WRITE_B64
Inst_DS__DS_WRITE_B64(InFmt_DS *)
Definition ds.cc:2762

gem5::VegaISA::Inst_DS__DS_WRITE_B8_D16_HI::~Inst_DS__DS_WRITE_B8_D16_HI
~Inst_DS__DS_WRITE_B8_D16_HI()
Definition ds.cc:867

gem5::VegaISA::Inst_DS__DS_WRITE_B8_D16_HI::Inst_DS__DS_WRITE_B8_D16_HI
Inst_DS__DS_WRITE_B8_D16_HI(InFmt_DS *)
Definition ds.cc:860

gem5::VegaISA::Inst_DS__DS_WRITE_B8_D16_HI::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:918

gem5::VegaISA::Inst_DS__DS_WRITE_B8_D16_HI::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:908

gem5::VegaISA::Inst_DS__DS_WRITE_B8_D16_HI::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:875

gem5::VegaISA::Inst_DS__DS_WRITE_B8::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:845

gem5::VegaISA::Inst_DS__DS_WRITE_B8::~Inst_DS__DS_WRITE_B8
~Inst_DS__DS_WRITE_B8()
Definition ds.cc:804

gem5::VegaISA::Inst_DS__DS_WRITE_B8::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:812

gem5::VegaISA::Inst_DS__DS_WRITE_B8::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:855

gem5::VegaISA::Inst_DS__DS_WRITE_B8::Inst_DS__DS_WRITE_B8
Inst_DS__DS_WRITE_B8(InFmt_DS *)
Definition ds.cc:797

gem5::VegaISA::Inst_DS__DS_WRITE_B96::~Inst_DS__DS_WRITE_B96
~Inst_DS__DS_WRITE_B96()
Definition ds.cc:4673

gem5::VegaISA::Inst_DS__DS_WRITE_B96::Inst_DS__DS_WRITE_B96
Inst_DS__DS_WRITE_B96(InFmt_DS *)
Definition ds.cc:4666

gem5::VegaISA::Inst_DS__DS_WRITE_B96::initiateAcc
void initiateAcc(GPUDynInstPtr) override
Definition ds.cc:4715

gem5::VegaISA::Inst_DS__DS_WRITE_B96::completeAcc
void completeAcc(GPUDynInstPtr) override
Definition ds.cc:4725

gem5::VegaISA::Inst_DS__DS_WRITE_B96::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4681

gem5::VegaISA::Inst_DS__DS_WRITE_SRC2_B32::Inst_DS__DS_WRITE_SRC2_B32
Inst_DS__DS_WRITE_SRC2_B32(InFmt_DS *)
Definition ds.cc:3990

gem5::VegaISA::Inst_DS__DS_WRITE_SRC2_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4009

gem5::VegaISA::Inst_DS__DS_WRITE_SRC2_B32::~Inst_DS__DS_WRITE_SRC2_B32
~Inst_DS__DS_WRITE_SRC2_B32()
Definition ds.cc:3997

gem5::VegaISA::Inst_DS__DS_WRITE_SRC2_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4612

gem5::VegaISA::Inst_DS__DS_WRITE_SRC2_B64::~Inst_DS__DS_WRITE_SRC2_B64
~Inst_DS__DS_WRITE_SRC2_B64()
Definition ds.cc:4600

gem5::VegaISA::Inst_DS__DS_WRITE_SRC2_B64::Inst_DS__DS_WRITE_SRC2_B64
Inst_DS__DS_WRITE_SRC2_B64(InFmt_DS *)
Definition ds.cc:4593

gem5::VegaISA::Inst_DS__DS_WRXCHG2ST64_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1367

gem5::VegaISA::Inst_DS__DS_WRXCHG2ST64_RTN_B32::Inst_DS__DS_WRXCHG2ST64_RTN_B32
Inst_DS__DS_WRXCHG2ST64_RTN_B32(InFmt_DS *)
Definition ds.cc:1354

gem5::VegaISA::Inst_DS__DS_WRXCHG2ST64_RTN_B32::~Inst_DS__DS_WRXCHG2ST64_RTN_B32
~Inst_DS__DS_WRXCHG2ST64_RTN_B32()
Definition ds.cc:1360

gem5::VegaISA::Inst_DS__DS_WRXCHG2ST64_RTN_B64::Inst_DS__DS_WRXCHG2ST64_RTN_B64
Inst_DS__DS_WRXCHG2ST64_RTN_B64(InFmt_DS *)
Definition ds.cc:3382

gem5::VegaISA::Inst_DS__DS_WRXCHG2ST64_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3395

gem5::VegaISA::Inst_DS__DS_WRXCHG2ST64_RTN_B64::~Inst_DS__DS_WRXCHG2ST64_RTN_B64
~Inst_DS__DS_WRXCHG2ST64_RTN_B64()
Definition ds.cc:3388

gem5::VegaISA::Inst_DS__DS_WRXCHG2_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1348

gem5::VegaISA::Inst_DS__DS_WRXCHG2_RTN_B32::~Inst_DS__DS_WRXCHG2_RTN_B32
~Inst_DS__DS_WRXCHG2_RTN_B32()
Definition ds.cc:1341

gem5::VegaISA::Inst_DS__DS_WRXCHG2_RTN_B32::Inst_DS__DS_WRXCHG2_RTN_B32
Inst_DS__DS_WRXCHG2_RTN_B32(InFmt_DS *)
Definition ds.cc:1336

gem5::VegaISA::Inst_DS__DS_WRXCHG2_RTN_B64::~Inst_DS__DS_WRXCHG2_RTN_B64
~Inst_DS__DS_WRXCHG2_RTN_B64()
Definition ds.cc:3369

gem5::VegaISA::Inst_DS__DS_WRXCHG2_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3376

gem5::VegaISA::Inst_DS__DS_WRXCHG2_RTN_B64::Inst_DS__DS_WRXCHG2_RTN_B64
Inst_DS__DS_WRXCHG2_RTN_B64(InFmt_DS *)
Definition ds.cc:3364

gem5::VegaISA::Inst_DS__DS_WRXCHG_RTN_B32::~Inst_DS__DS_WRXCHG_RTN_B32
~Inst_DS__DS_WRXCHG_RTN_B32()
Definition ds.cc:1320

gem5::VegaISA::Inst_DS__DS_WRXCHG_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1330

gem5::VegaISA::Inst_DS__DS_WRXCHG_RTN_B32::Inst_DS__DS_WRXCHG_RTN_B32
Inst_DS__DS_WRXCHG_RTN_B32(InFmt_DS *)
Definition ds.cc:1315

gem5::VegaISA::Inst_DS__DS_WRXCHG_RTN_B64::Inst_DS__DS_WRXCHG_RTN_B64
Inst_DS__DS_WRXCHG_RTN_B64(InFmt_DS *)
Definition ds.cc:3343

gem5::VegaISA::Inst_DS__DS_WRXCHG_RTN_B64::~Inst_DS__DS_WRXCHG_RTN_B64
~Inst_DS__DS_WRXCHG_RTN_B64()
Definition ds.cc:3348

gem5::VegaISA::Inst_DS__DS_WRXCHG_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3358

gem5::VegaISA::Inst_DS__DS_XOR_B32::~Inst_DS__DS_XOR_B32
~Inst_DS__DS_XOR_B32()
Definition ds.cc:367

gem5::VegaISA::Inst_DS__DS_XOR_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:377

gem5::VegaISA::Inst_DS__DS_XOR_B32::Inst_DS__DS_XOR_B32
Inst_DS__DS_XOR_B32(InFmt_DS *)
Definition ds.cc:362

gem5::VegaISA::Inst_DS__DS_XOR_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:2734

gem5::VegaISA::Inst_DS__DS_XOR_B64::Inst_DS__DS_XOR_B64
Inst_DS__DS_XOR_B64(InFmt_DS *)
Definition ds.cc:2719

gem5::VegaISA::Inst_DS__DS_XOR_B64::~Inst_DS__DS_XOR_B64
~Inst_DS__DS_XOR_B64()
Definition ds.cc:2724

gem5::VegaISA::Inst_DS__DS_XOR_RTN_B32::~Inst_DS__DS_XOR_RTN_B32
~Inst_DS__DS_XOR_RTN_B32()
Definition ds.cc:1277

gem5::VegaISA::Inst_DS__DS_XOR_RTN_B32::Inst_DS__DS_XOR_RTN_B32
Inst_DS__DS_XOR_RTN_B32(InFmt_DS *)
Definition ds.cc:1272

gem5::VegaISA::Inst_DS__DS_XOR_RTN_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:1287

gem5::VegaISA::Inst_DS__DS_XOR_RTN_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3315

gem5::VegaISA::Inst_DS__DS_XOR_RTN_B64::Inst_DS__DS_XOR_RTN_B64
Inst_DS__DS_XOR_RTN_B64(InFmt_DS *)
Definition ds.cc:3300

gem5::VegaISA::Inst_DS__DS_XOR_RTN_B64::~Inst_DS__DS_XOR_RTN_B64
~Inst_DS__DS_XOR_RTN_B64()
Definition ds.cc:3305

gem5::VegaISA::Inst_DS__DS_XOR_SRC2_B32::~Inst_DS__DS_XOR_SRC2_B32
~Inst_DS__DS_XOR_SRC2_B32()
Definition ds.cc:3973

gem5::VegaISA::Inst_DS__DS_XOR_SRC2_B32::Inst_DS__DS_XOR_SRC2_B32
Inst_DS__DS_XOR_SRC2_B32(InFmt_DS *)
Definition ds.cc:3968

gem5::VegaISA::Inst_DS__DS_XOR_SRC2_B32::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:3984

gem5::VegaISA::Inst_DS__DS_XOR_SRC2_B64::Inst_DS__DS_XOR_SRC2_B64
Inst_DS__DS_XOR_SRC2_B64(InFmt_DS *)
Definition ds.cc:4571

gem5::VegaISA::Inst_DS__DS_XOR_SRC2_B64::execute
void execute(GPUDynInstPtr) override
Definition ds.cc:4587

gem5::VegaISA::Inst_DS__DS_XOR_SRC2_B64::~Inst_DS__DS_XOR_SRC2_B64
~Inst_DS__DS_XOR_SRC2_B64()
Definition ds.cc:4576

gem5::VegaISA::Inst_DS::instData
InFmt_DS instData
Definition op_encodings.hh:1016

gem5::VegaISA::Inst_DS::extData
InFmt_DS_1 extData
Definition op_encodings.hh:1018

gem5::VegaISA::Inst_DS::initMemRead
void initMemRead(GPUDynInstPtr gpuDynInst, Addr offset)
Definition op_encodings.hh:878

gem5::VegaISA::Inst_DS::initDualMemRead
void initDualMemRead(GPUDynInstPtr gpuDynInst, Addr offset0, Addr offset1)
Definition op_encodings.hh:913

gem5::VegaISA::Inst_DS::initMemWrite
void initMemWrite(GPUDynInstPtr gpuDynInst, Addr offset)
Definition op_encodings.hh:932

gem5::VegaISA::Inst_DS::Inst_DS
Inst_DS(InFmt_DS *, const std::string &opcode)
Definition op_encodings.cc:1339

gem5::VegaISA::Inst_DS::calcAddr
void calcAddr(GPUDynInstPtr gpuDynInst, ConstVecOperandU32 &addr)
Definition op_encodings.hh:1004

gem5::VegaISA::Inst_DS::initAtomicAccess
void initAtomicAccess(GPUDynInstPtr gpuDynInst, Addr offset)
Definition op_encodings.hh:984

gem5::VegaISA::Inst_DS::initDualMemWrite
void initDualMemWrite(GPUDynInstPtr gpuDynInst, Addr offset0, Addr offset1)
Definition op_encodings.hh:966

gem5::VegaISA::PackedReg
Definition operand.hh:860

gem5::VegaISA::PackedReg::getElem
uint32_t getElem(int elem)
Definition operand.hh:892

gem5::VegaISA::PackedReg::setDword
void setDword(int dw, uint32_t value)
Definition operand.hh:878

gem5::VegaISA::PackedReg::setElem
void setElem(int elem, uint32_t value)
Definition operand.hh:933

gem5::VegaISA::VEGAGPUStaticInst::panicUnimplemented
void panicUnimplemented() const
Definition gpu_static_inst.cc:54

gem5::VegaISA::VecOperand::read
void read() override
read from the vrf.
Definition operand.hh:148

gem5::VegaISA::VecOperand::write
void write() override
write to the vrf.
Definition operand.hh:203

gem5::Wavefront
Definition wavefront.hh:62

gem5::Wavefront::rdLmReqsInPipe
int rdLmReqsInPipe
Definition wavefront.hh:190

gem5::Wavefront::simdId
const int simdId
Definition wavefront.hh:102

gem5::Wavefront::computeUnit
ComputeUnit * computeUnit
Definition wavefront.hh:109

gem5::Wavefront::execUnitId
int execUnitId
Definition wavefront.hh:105

gem5::Wavefront::untrackLGKMInst
void untrackLGKMInst(GPUDynInstPtr gpu_dyn_inst)
Definition wavefront.cc:1529

gem5::Wavefront::decLGKMInstsIssued
void decLGKMInstsIssued()
Definition wavefront.cc:1464

gem5::Wavefront::execMask
VectorMask & execMask()
Definition wavefront.cc:1581

gem5::bits
constexpr T bits(T val, unsigned first, unsigned last)
Extract the bitfield from position 'first' to 'last' (inclusive) from 'val' and right justify it.
Definition bitfield.hh:79

gem5::insertBits
constexpr T insertBits(T val, unsigned first, unsigned last, B bit_val)
Returns val with bits first to last set to the LSBs of bit_val.
Definition bitfield.hh:185

gem5::sext
constexpr uint64_t sext(uint64_t val)
Sign-extend an N-bit value to 64 bits.
Definition bitfield.hh:129

gem5::replaceBits
constexpr void replaceBits(T &val, unsigned first, unsigned last, B bit_val)
A convenience function to replace bits first to last of val with bit_val in place.
Definition bitfield.hh:216

panic_if
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
Definition logging.hh:246

instructions.hh

gem5::ArmISA::i
Bitfield< 7 > i
Definition misc_types.hh:67

gem5::ArmISA::offset
Bitfield< 23, 0 > offset
Definition types.hh:144

gem5::MipsISA::index
Bitfield< 30, 0 > index
Definition pra_constants.hh:47

gem5::VegaISA
classes that represent vector/scalar operands in VEGA ISA.
Definition faults.cc:39

gem5::VegaISA::ConstVecOperandF32
VecOperand< VecElemF32, true > ConstVecOperandF32
Definition operand.hh:846

gem5::VegaISA::VecOperandU32
VecOperand< VecElemU32, false > VecOperandU32
Definition operand.hh:829

gem5::VegaISA::x
Bitfield< 4 > x
Definition pagetable.hh:61

gem5::VegaISA::ConstVecOperandU8
VecOperand< VecElemU8, true, 1 > ConstVecOperandU8
Definition operand.hh:840

gem5::VegaISA::ConstVecOperandU32
VecOperand< VecElemU32, true > ConstVecOperandU32
Definition operand.hh:844

gem5::VegaISA::VecElemU16
uint16_t VecElemU16
Definition gpu_registers.hh:163

gem5::VegaISA::VecElemU32
uint32_t VecElemU32
Definition gpu_registers.hh:165

gem5::VegaISA::VecElemI8
int8_t VecElemI8
Definition gpu_registers.hh:162

gem5::VegaISA::ConstVecOperandU16
VecOperand< VecElemU16, true, 1 > ConstVecOperandU16
Definition operand.hh:842

gem5::VegaISA::VecElemF32
float VecElemF32
Definition gpu_registers.hh:167

gem5::VegaISA::NumVecElemPerVecReg
const int NumVecElemPerVecReg(64)

gem5::VegaISA::VecElemU8
uint8_t VecElemU8
Definition gpu_registers.hh:161

gem5::VegaISA::VecElemU64
uint64_t VecElemU64
Definition gpu_registers.hh:168

gem5::VegaISA::VecOperandU64
VecOperand< VecElemU64, false > VecOperandU64
Definition operand.hh:832

gem5::VegaISA::ConstVecOperandU64
VecOperand< VecElemU64, true > ConstVecOperandU64
Definition operand.hh:847

gem5::X86ISA::addr
Bitfield< 3 > addr
Definition types.hh:84

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::GPUDynInstPtr
std::shared_ptr< GPUDynInst > GPUDynInstPtr
Definition misc.hh:49

gem5::Addr
uint64_t Addr
Address type. This will probably be moved somewhere else in the near future.
Definition types.hh:147

gem5::VegaISA::InFmt_DS
Definition gpu_decoder.hh:1780