release/current/gpu__command__processor_8hh_source.html

/*

 * Copyright (c) 2018 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#ifndef __DEV_HSA_GPU_COMMAND_PROCESSOR_HH__

#define __DEV_HSA_GPU_COMMAND_PROCESSOR_HH__


#include <cstdint>

#include <functional>


#include "arch/amdgpu/vega/gpu_registers.hh"

#include "base/logging.hh"

#include "base/trace.hh"

#include "base/types.hh"

#include "debug/GPUCommandProc.hh"

#include "dev/dma_virt_device.hh"

#include "dev/hsa/hsa_packet_processor.hh"

#include "dev/hsa/hsa_signal.hh"

#include "gpu-compute/dispatcher.hh"

#include "gpu-compute/gpu_compute_driver.hh"

#include "gpu-compute/hsa_queue_entry.hh"

#include "params/GPUCommandProcessor.hh"

#include "sim/full_system.hh"


namespace gem5

{


struct GPUCommandProcessorParams;

class GPUComputeDriver;

class GPUDispatcher;

class Shader;


class GPUCommandProcessor : public DmaVirtDevice

{

  public:

    typedef GPUCommandProcessorParams Params;

    typedef std::function<void(const uint64_t &)> HsaSignalCallbackFunction;


    GPUCommandProcessor() = delete;

    GPUCommandProcessor(const Params &p);


    HSAPacketProcessor& hsaPacketProc();

    RequestorID vramRequestorId();


    void setGPUDevice(AMDGPUDevice *gpu_device);

    void setShader(Shader *shader);

    Shader* shader();

    GPUComputeDriver* driver();


    struct KernelDispatchData

    {

        AMDKernelCode *akc;

        void *raw_pkt;

        uint32_t queue_id;

        Addr host_pkt_addr;

        PacketPtr readPkt;

    };

    struct KernelDispatchData {…};


    std::list<struct KernelDispatchData> kernelDispatchList;


    enum AgentCmd

    {

      Nop = 0,

      Steal = 1

    };

    enum AgentCmd {…};


    void performTimingRead(PacketPtr pkt);


    void completeTimingRead();


    void submitAgentDispatchPkt(void *raw_pkt, uint32_t queue_id,

                           Addr host_pkt_addr);

    void submitDispatchPkt(void *raw_pkt, uint32_t queue_id,

                           Addr host_pkt_addr);

    void submitVendorPkt(void *raw_pkt, uint32_t queue_id,

                         Addr host_pkt_addr);

    void attachDriver(GPUComputeDriver *driver);


    void dispatchKernelObject(AMDKernelCode *akc, void *raw_pkt,

                              uint32_t queue_id, Addr host_pkt_addr);

    void dispatchPkt(HSAQueueEntry *task);

    void signalWakeupEvent(uint32_t event_id);


    Tick write(PacketPtr pkt) override { return 0; }

    Tick read(PacketPtr pkt) override { return 0; }

    AddrRangeList getAddrRanges() const override;

    System *system();


    void sendCompletionSignal(Addr signal_handle);

    void updateHsaSignal(Addr signal_handle, uint64_t signal_value,

                         HsaSignalCallbackFunction function =

                            [] (const uint64_t &) { });

    void updateHsaSignalAsync(Addr signal_handle, int64_t diff);

    void updateHsaSignalData(Addr value_addr, int64_t diff,

                             uint64_t *prev_value);

    void updateHsaSignalDone(uint64_t *signal_value);

    void updateHsaMailboxData(Addr signal_handle, uint64_t *mailbox_value);

    void updateHsaEventData(Addr signal_handle, uint64_t *event_value);

    void updateHsaEventTs(Addr signal_handle, amd_event_t *event_value);


    uint64_t functionalReadHsaSignal(Addr signal_handle);


    Addr getHsaSignalValueAddr(Addr signal_handle)

    {

        return signal_handle + offsetof(amd_signal_t, value);

    }

    Addr getHsaSignalValueAddr(Addr signal_handle) {…}


    Addr getHsaSignalMailboxAddr(Addr signal_handle)

    {

        return signal_handle + offsetof(amd_signal_t, event_mailbox_ptr);

    }

    Addr getHsaSignalMailboxAddr(Addr signal_handle) {…}


    Addr getHsaSignalEventAddr(Addr signal_handle)

    {

        return signal_handle + offsetof(amd_signal_t, event_id);

    }

    Addr getHsaSignalEventAddr(Addr signal_handle) {…}


  private:

    Shader *_shader;

    GPUDispatcher &dispatcher;

    GPUComputeDriver *_driver;

    AMDGPUDevice *gpuDevice;

    VegaISA::Walker *walker;


    // Typedefing dmaRead and dmaWrite function pointer

    typedef void (DmaDevice::*DmaFnPtr)(Addr, int, Event*, uint8_t*, Tick);

    void initABI(HSAQueueEntry *task);

    void sanityCheckAKC(AMDKernelCode *akc);

    HSAPacketProcessor *hsaPP;

    TranslationGenPtr translate(Addr vaddr, Addr size) override;


    // Running counter of dispatched tasks

    int dynamic_task_id = 0;


    // Running counter of dispatched user (non-blit) kernels

    int non_blit_kernel_id = 0;


    // Skip all user (non-blit) kernels until reaching this kernel

    int target_non_blit_kernel_id = 0;


    // Keep track of start times for task dispatches.

    std::unordered_map<Addr, Tick> dispatchStartTime;


    void


    ReadDispIdOffsetDmaEvent(HSAQueueEntry *task,

                             const uint32_t &readDispIdOffset)

    {

        task->hostAMDQueueAddr = hsaPP->getQueueDesc(

            task->queueId())->hostReadIndexPtr - readDispIdOffset;


        auto *mqdDmaEvent = new DmaVirtCallback<int>(

            [ = ] (const int &) { MQDDmaEvent(task); });


        dmaReadVirt(task->hostAMDQueueAddr,

                    sizeof(_amd_queue_t), mqdDmaEvent, &task->amdQueue);

    }

    ReadDispIdOffsetDmaEvent(HSAQueueEntry *task, {…}


     void


     MQDDmaEvent(HSAQueueEntry *task)

     {

        if ((task->privMemPerItem() * VegaISA::NumVecElemPerVecReg) >

            task->amdQueue.compute_tmpring_size_wavesize * 1024) {

            // TODO: Raising this signal will potentially nuke scratch

            // space for in-flight kernels that were launched from this

            // queue.  We need to drain all kernels and deschedule the

            // queue before raising this signal. For now, just assert if

            // there are any in-flight kernels and tell the user that this

            // feature still needs to be implemented.

            fatal_if(hsaPP->inFlightPkts(task->queueId()) > 1,

                        "Needed more scratch, but kernels are in flight for "

                        "this queue and it is unsafe to reallocate scratch. "

                        "We need to implement additional intelligence in the "

                        "hardware scheduling logic to support CP-driven "

                        "queue draining and scheduling.");

            DPRINTF(GPUCommandProc, "Not enough scratch space to launch "

                    "kernel (%x available, %x requested bytes per "

                    "workitem). Asking host runtime to allocate more "

                    "space.\n",

                    task->amdQueue.compute_tmpring_size_wavesize * 1024,

                    task->privMemPerItem());


            updateHsaSignal(task->amdQueue.queue_inactive_signal.handle, 1,

                            [ = ] (const uint64_t &dma_buffer)

                                { WaitScratchDmaEvent(task, dma_buffer); });


        } else {

            DPRINTF(GPUCommandProc, "Sufficient scratch space, launching "

                    "kernel (%x available, %x requested bytes per "

                    "workitem).\n",

                    task->amdQueue.compute_tmpring_size_wavesize * 1024,

                    task->privMemPerItem());

            dispatchPkt(task);

        }

    }

     MQDDmaEvent(HSAQueueEntry *task) {…}


    void


    WaitScratchDmaEvent(HSAQueueEntry *task, const uint64_t &dmaBuffer)

    {

        if (dmaBuffer == 0) {

            DPRINTF(GPUCommandProc, "Host scratch allocation complete. "

                    "Attempting to re-read MQD\n");

            auto cb = new DmaVirtCallback<int>(

                [ = ] (const int &) { MQDDmaEvent(task); });


            dmaReadVirt(task->hostAMDQueueAddr, sizeof(_amd_queue_t), cb,

                        &task->amdQueue);

        } else {

            Addr value_addr = getHsaSignalValueAddr(

                task->amdQueue.queue_inactive_signal.handle);

            DPRINTF(GPUCommandProc, "Polling queue inactive signal at "

                    "%p.\n", value_addr);

            auto cb = new DmaVirtCallback<uint64_t>(

                [ = ] (const uint64_t &dma_buffer)

                { WaitScratchDmaEvent(task, dma_buffer); } );


            dmaReadVirt(value_addr, sizeof(Addr), cb, &cb->dmaBuffer, 1e9);

        }

    }

    WaitScratchDmaEvent(HSAQueueEntry *task, const uint64_t &dmaBuffer) {…}

};

class GPUCommandProcessor : public DmaVirtDevice {…};


} // namespace gem5


#endif // __DEV_HSA_GPU_COMMAND_PROCESSOR_HH__

trace.hh

DPRINTF
#define DPRINTF(x,...)
Definition trace.hh:209

types.hh
Defines global host-dependent types: Counter, Tick, and (indirectly) {int,uint}{8,...

gem5::AMDGPUDevice
Device model for an AMD GPU.
Definition amdgpu_device.hh:64

gem5::DmaDevice
Definition dma_device.hh:219

gem5::DmaVirtDevice::DmaVirtCallback
Wraps a std::function object in a DmaCallback.
Definition dma_virt_device.hh:52

gem5::DmaVirtDevice
Definition dma_virt_device.hh:42

gem5::DmaVirtDevice::dmaReadVirt
void dmaReadVirt(Addr host_addr, unsigned size, DmaCallback *cb, void *data, Tick delay=0)
Initiate a DMA read from virtual address host_addr.
Definition dma_virt_device.cc:38

gem5::Event
Definition eventq.hh:255

gem5::GPUCommandProcessor
Definition gpu_command_processor.hh:72

gem5::GPUCommandProcessor::completeTimingRead
void completeTimingRead()
Definition gpu_command_processor.cc:125

gem5::GPUCommandProcessor::sendCompletionSignal
void sendCompletionSignal(Addr signal_handle)
Definition gpu_command_processor.cc:387

gem5::GPUCommandProcessor::submitDispatchPkt
void submitDispatchPkt(void *raw_pkt, uint32_t queue_id, Addr host_pkt_addr)
submitDispatchPkt() is the entry point into the CP from the HSAPP and is only meant to be used with A...
Definition gpu_command_processor.cc:153

gem5::GPUCommandProcessor::ReadDispIdOffsetDmaEvent
void ReadDispIdOffsetDmaEvent(HSAQueueEntry *task, const uint32_t &readDispIdOffset)
Perform a DMA read of the read_dispatch_id_field_base_byte_offset field, which follows directly after...
Definition gpu_command_processor.hh:195

gem5::GPUCommandProcessor::vramRequestorId
RequestorID vramRequestorId()
Forward the VRAM requestor ID needed for device memory from GPU device.
Definition gpu_command_processor.cc:80

gem5::GPUCommandProcessor::dynamic_task_id
int dynamic_task_id
Definition gpu_command_processor.hh:171

gem5::GPUCommandProcessor::driver
GPUComputeDriver * driver()
Definition gpu_command_processor.cc:591

gem5::GPUCommandProcessor::getHsaSignalMailboxAddr
Addr getHsaSignalMailboxAddr(Addr signal_handle)
Definition gpu_command_processor.hh:146

gem5::GPUCommandProcessor::GPUCommandProcessor
GPUCommandProcessor()=delete

gem5::GPUCommandProcessor::DmaFnPtr
void(DmaDevice::* DmaFnPtr)(Addr, int, Event *, uint8_t *, Tick)
Definition gpu_command_processor.hh:164

gem5::GPUCommandProcessor::setGPUDevice
void setGPUDevice(AMDGPUDevice *gpu_device)
Definition gpu_command_processor.cc:836

gem5::GPUCommandProcessor::translate
TranslationGenPtr translate(Addr vaddr, Addr size) override
Function used to translate a range of addresses from virtual to physical addresses.
Definition gpu_command_processor.cc:86

gem5::GPUCommandProcessor::signalWakeupEvent
void signalWakeupEvent(uint32_t event_id)
Definition gpu_command_processor.cc:690

gem5::GPUCommandProcessor::updateHsaSignal
void updateHsaSignal(Addr signal_handle, uint64_t signal_value, HsaSignalCallbackFunction function=[](const uint64_t &) { })
Definition gpu_command_processor.cc:536

gem5::GPUCommandProcessor::updateHsaSignalDone
void updateHsaSignalDone(uint64_t *signal_value)
Definition gpu_command_processor.cc:521

gem5::GPUCommandProcessor::_driver
GPUComputeDriver * _driver
Definition gpu_command_processor.hh:159

gem5::GPUCommandProcessor::setShader
void setShader(Shader *shader)
Definition gpu_command_processor.cc:843

gem5::GPUCommandProcessor::hsaPacketProc
HSAPacketProcessor & hsaPacketProc()
Definition gpu_command_processor.cc:71

gem5::GPUCommandProcessor::target_non_blit_kernel_id
int target_non_blit_kernel_id
Definition gpu_command_processor.hh:177

gem5::GPUCommandProcessor::submitAgentDispatchPkt
void submitAgentDispatchPkt(void *raw_pkt, uint32_t queue_id, Addr host_pkt_addr)
submitAgentDispatchPkt() is for accepting agent dispatch packets.
Definition gpu_command_processor.cc:637

gem5::GPUCommandProcessor::kernelDispatchList
std::list< struct KernelDispatchData > kernelDispatchList
Definition gpu_command_processor.hh:97

gem5::GPUCommandProcessor::getHsaSignalValueAddr
Addr getHsaSignalValueAddr(Addr signal_handle)
Definition gpu_command_processor.hh:141

gem5::GPUCommandProcessor::updateHsaEventTs
void updateHsaEventTs(Addr signal_handle, amd_event_t *event_value)
Definition gpu_command_processor.cc:489

gem5::GPUCommandProcessor::hsaPP
HSAPacketProcessor * hsaPP
Definition gpu_command_processor.hh:167

gem5::GPUCommandProcessor::_shader
Shader * _shader
Definition gpu_command_processor.hh:157

gem5::GPUCommandProcessor::dispatchKernelObject
void dispatchKernelObject(AMDKernelCode *akc, void *raw_pkt, uint32_t queue_id, Addr host_pkt_addr)
Definition gpu_command_processor.cc:290

gem5::GPUCommandProcessor::MQDDmaEvent
void MQDDmaEvent(HSAQueueEntry *task)
Perform a DMA read of the MQD that corresponds to a hardware queue descriptor (HQD).
Definition gpu_command_processor.hh:227

gem5::GPUCommandProcessor::attachDriver
void attachDriver(GPUComputeDriver *driver)
Definition gpu_command_processor.cc:581

gem5::GPUCommandProcessor::initABI
void initABI(HSAQueueEntry *task)
The CP is responsible for traversing all HSA-ABI-related data structures from memory and initializing...
Definition gpu_command_processor.cc:702

gem5::GPUCommandProcessor::updateHsaSignalAsync
void updateHsaSignalAsync(Addr signal_handle, int64_t diff)
Definition gpu_command_processor.cc:414

gem5::GPUCommandProcessor::non_blit_kernel_id
int non_blit_kernel_id
Definition gpu_command_processor.hh:174

gem5::GPUCommandProcessor::dispatchStartTime
std::unordered_map< Addr, Tick > dispatchStartTime
Definition gpu_command_processor.hh:180

gem5::GPUCommandProcessor::getHsaSignalEventAddr
Addr getHsaSignalEventAddr(Addr signal_handle)
Definition gpu_command_processor.hh:151

gem5::GPUCommandProcessor::getAddrRanges
AddrRangeList getAddrRanges() const override
Every PIO device is obliged to provide an implementation that returns the address ranges the device r...
Definition gpu_command_processor.cc:829

gem5::GPUCommandProcessor::shader
Shader * shader()
Definition gpu_command_processor.cc:849

gem5::GPUCommandProcessor::submitVendorPkt
void submitVendorPkt(void *raw_pkt, uint32_t queue_id, Addr host_pkt_addr)
submitVendorPkt() is for accepting vendor-specific packets from the HSAPP.
Definition gpu_command_processor.cc:615

gem5::GPUCommandProcessor::sanityCheckAKC
void sanityCheckAKC(AMDKernelCode *akc)
Definition gpu_command_processor.cc:716

gem5::GPUCommandProcessor::dispatcher
GPUDispatcher & dispatcher
Definition gpu_command_processor.hh:158

gem5::GPUCommandProcessor::write
Tick write(PacketPtr pkt) override
Pure virtual function that the device must implement.
Definition gpu_command_processor.hh:122

gem5::GPUCommandProcessor::Params
GPUCommandProcessorParams Params
Definition gpu_command_processor.hh:74

gem5::GPUCommandProcessor::AgentCmd
AgentCmd
Definition gpu_command_processor.hh:100

gem5::GPUCommandProcessor::Steal
@ Steal
Definition gpu_command_processor.hh:102

gem5::GPUCommandProcessor::dispatchPkt
void dispatchPkt(HSAQueueEntry *task)
Once the CP has finished extracting all relevant information about a task and has initialized the ABI...
Definition gpu_command_processor.cc:684

gem5::GPUCommandProcessor::read
Tick read(PacketPtr pkt) override
Pure virtual function that the device must implement.
Definition gpu_command_processor.hh:123

gem5::GPUCommandProcessor::gpuDevice
AMDGPUDevice * gpuDevice
Definition gpu_command_processor.hh:160

gem5::GPUCommandProcessor::updateHsaMailboxData
void updateHsaMailboxData(Addr signal_handle, uint64_t *mailbox_value)
Definition gpu_command_processor.cc:427

gem5::GPUCommandProcessor::performTimingRead
void performTimingRead(PacketPtr pkt)
Definition gpu_command_processor.cc:105

gem5::GPUCommandProcessor::updateHsaEventData
void updateHsaEventData(Addr signal_handle, uint64_t *event_value)
Definition gpu_command_processor.cc:461

gem5::GPUCommandProcessor::HsaSignalCallbackFunction
std::function< void(const uint64_t &)> HsaSignalCallbackFunction
Definition gpu_command_processor.hh:75

gem5::GPUCommandProcessor::system
System * system()
Definition gpu_command_processor.cc:823

gem5::GPUCommandProcessor::functionalReadHsaSignal
uint64_t functionalReadHsaSignal(Addr signal_handle)
Definition gpu_command_processor.cc:527

gem5::GPUCommandProcessor::WaitScratchDmaEvent
void WaitScratchDmaEvent(HSAQueueEntry *task, const uint64_t &dmaBuffer)
Poll on queue_inactive signal until the runtime can get around to taking care of our lack of scratch ...
Definition gpu_command_processor.hh:281

gem5::GPUCommandProcessor::updateHsaSignalData
void updateHsaSignalData(Addr value_addr, int64_t diff, uint64_t *prev_value)
Definition gpu_command_processor.cc:507

gem5::GPUCommandProcessor::walker
VegaISA::Walker * walker
Definition gpu_command_processor.hh:161

gem5::GPUComputeDriver
Definition gpu_compute_driver.hh:63

gem5::GPUDispatcher
Definition dispatcher.hh:63

gem5::HSAPacketProcessor
Definition hsa_packet_processor.hh:240

gem5::HSAPacketProcessor::inFlightPkts
uint64_t inFlightPkts(uint32_t queId)
Definition hsa_packet_processor.hh:326

gem5::HSAPacketProcessor::getQueueDesc
HSAQueueDescriptor * getQueueDesc(uint32_t queId)
Definition hsa_packet_processor.hh:315

gem5::HSAQueueDescriptor::hostReadIndexPtr
uint64_t hostReadIndexPtr
Definition hsa_packet_processor.hh:86

gem5::HSAQueueEntry
Definition hsa_queue_entry.hh:61

gem5::HSAQueueEntry::amdQueue
_amd_queue_t amdQueue
Keep a copy of the AMD HSA queue because we need info from some of its fields to initialize register ...
Definition hsa_queue_entry.hh:333

gem5::HSAQueueEntry::queueId
uint32_t queueId() const
Definition hsa_queue_entry.hh:173

gem5::HSAQueueEntry::hostAMDQueueAddr
Addr hostAMDQueueAddr
Host-side addr of the amd_queue_t on which this task was queued.
Definition hsa_queue_entry.hh:326

gem5::HSAQueueEntry::privMemPerItem
int privMemPerItem() const
Definition hsa_queue_entry.hh:220

gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295

gem5::Shader
Definition shader.hh:84

gem5::SparcISA::Nop
Nop class.
Definition nop.hh:49

gem5::System
Definition system.hh:75

gem5::VegaISA::Walker
Definition pagetable_walker.hh:55

std::list
STL list class.
Definition stl.hh:51

dispatcher.hh
The GPUDispatcher is the component of the shader that is responsible for creating and dispatching WGs...

dma_virt_device.hh

full_system.hh

gpu_compute_driver.hh
The GPUComputeDriver implements an HSADriver for an HSA AMD GPU agent.

gpu_registers.hh

fatal_if
#define fatal_if(cond,...)
Conditional fatal macro that checks the supplied condition and only causes a fatal error if the condi...
Definition logging.hh:236

hsa_packet_processor.hh

hsa_queue_entry.hh
HSAQueuEntry is the simulator's internal representation of an AQL queue entry (task).

hsa_signal.hh

logging.hh

gem5::MipsISA::vaddr
vaddr
Definition pra_constants.hh:278

gem5::MipsISA::p
Bitfield< 0 > p
Definition pra_constants.hh:326

gem5::VegaISA::NumVecElemPerVecReg
const int NumVecElemPerVecReg(64)

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition types.hh:147

gem5::Tick
uint64_t Tick
Tick count type.
Definition types.hh:58

gem5::RequestorID
uint16_t RequestorID
Definition request.hh:95

gem5::TranslationGenPtr
std::unique_ptr< TranslationGen > TranslationGenPtr
Definition translation_gen.hh:131

gem5::GEM5_PACKED
PM4 packets.
Definition pm4_defines.hh:78

gem5::GPUCommandProcessor::KernelDispatchData
Definition gpu_command_processor.hh:89

gem5::GPUCommandProcessor::KernelDispatchData::readPkt
PacketPtr readPkt
Definition gpu_command_processor.hh:94

gem5::GPUCommandProcessor::KernelDispatchData::host_pkt_addr
Addr host_pkt_addr
Definition gpu_command_processor.hh:93

gem5::GPUCommandProcessor::KernelDispatchData::akc
AMDKernelCode * akc
Definition gpu_command_processor.hh:90

gem5::GPUCommandProcessor::KernelDispatchData::queue_id
uint32_t queue_id
Definition gpu_command_processor.hh:92

gem5::GPUCommandProcessor::KernelDispatchData::raw_pkt
void * raw_pkt
Definition gpu_command_processor.hh:91

gem5::_amd_queue_t
Definition hsa_queue.hh:65

gem5::_amd_queue_t::queue_inactive_signal
_hsa_signal_t queue_inactive_signal
Definition hsa_queue.hh:87

gem5::_amd_queue_t::compute_tmpring_size_wavesize
uint32_t compute_tmpring_size_wavesize
Definition hsa_queue.hh:79

gem5::_hsa_signal_t::handle
uint64_t handle
Definition hsa_queue.hh:48

gem5::amd_signal_s
Definition hsa_signal.hh:51