release/current/hsa__packet__processor_8hh_source.html

/*

 * Copyright (c) 2015-2018 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#ifndef __DEV_HSA_HSA_PACKET_PROCESSOR__

#define __DEV_HSA_HSA_PACKET_PROCESSOR__


#include <algorithm>

#include <cstdint>

#include <vector>


#include "base/types.hh"

#include "debug/HSAPacketProcessor.hh"

#include "dev/dma_virt_device.hh"

#include "dev/hsa/hsa.h"

#include "dev/hsa/hsa_queue.hh"

#include "enums/GfxVersion.hh"

#include "params/HSAPacketProcessor.hh"

#include "sim/eventq.hh"


// Size of one AQL packet slot. objSize() of both HSAQueueDescriptor and
// AQLRingBuffer returns this value (presumably bytes: it is used as an
// address stride in HSAQueueDescriptor::ptr()).
#define AQL_PACKET_SIZE 64

// NOTE(review): not referenced anywhere else in this header.
#define PAGE_SIZE 4096

// Only used in this header to derive DMA_BUF_SIZE.
#define NUM_DMA_BUFS 16

// Room for NUM_DMA_BUFS packets of AQL_PACKET_SIZE each.
#define DMA_BUF_SIZE (AQL_PACKET_SIZE * NUM_DMA_BUFS)

// HSA runtime supports only 5 signals per barrier packet

// SignalState::values is sized with this constant.
#define NumSignalsPerBarrier 5


namespace gem5

{


class AMDGPUDevice;


// Ideally, each queue should store this status and

// the processPkt() should make decisions based on that

// status variable.


/**
 * Blocking state of a queue. This is the return type of
 * HSAPacketProcessor::processPkt().
 */
enum Q_STATE
{
    /** Unblocked queue, can submit packets. */
    UNBLOCKED = 0,

    /**
     * Queue blocked by barrier bit. Packets can be submitted again after
     * the previous packet completes.
     */
    BLOCKED_BBIT = 1,

    /**
     * Queue blocked by barrier packet. Packets can be submitted again
     * after the barrier packet completes.
     */
    BLOCKED_BPKT = 2,
};

enum Q_STATE {…};


class GPUCommandProcessor;

class HWScheduler;


/**
 * Our internal representation of an HSA queue.
 *
 * Stores the queue's base, doorbell and host-read-index addresses together
 * with its read/write indices. Occupancy is the plain difference
 * writeIndex - readIndex; an index is only wrapped (modulo numElts) when
 * ptr() turns it into a slot address.
 */
class HSAQueueDescriptor
{
    public:
        uint64_t     basePointer;
        uint64_t     doorbellPointer;
        uint64_t     writeIndex;
        uint64_t     readIndex;
        uint32_t     numElts;
        uint64_t     hostReadIndexPtr;
        bool         stalledOnDmaBufAvailability;
        bool         dmaInProgress;
        GfxVersion   gfxVersion;

        /**
         * @param base_ptr   stored as basePointer
         * @param db_ptr     stored as doorbellPointer
         * @param hri_ptr    stored as hostReadIndexPtr
         * @param size       queue size; numElts becomes
         *                   size / AQL_PACKET_SIZE (integer division)
         * @param gfxVersion stored as-is
         *
         * Both indices start at 0 and both status flags start out false.
         */
        HSAQueueDescriptor(uint64_t base_ptr, uint64_t db_ptr,
                           uint64_t hri_ptr, uint32_t size,
                           GfxVersion gfxVersion)
          : basePointer(base_ptr), doorbellPointer(db_ptr),
            writeIndex(0), readIndex(0),
            numElts(size / AQL_PACKET_SIZE), hostReadIndexPtr(hri_ptr),
            stalledOnDmaBufAvailability(false),
            dmaInProgress(false), gfxVersion(gfxVersion)
        {  }

        /** Slots still free: numElts minus the slots in use. */
        uint64_t spaceRemaining() const { return numElts - spaceUsed(); }

        /** Slots in use: writeIndex - readIndex. */
        uint64_t spaceUsed() const { return writeIndex - readIndex; }

        /** Size of one slot (AQL_PACKET_SIZE). */
        uint32_t objSize() const { return AQL_PACKET_SIZE; }

        /** Number of slots in the queue. */
        uint32_t numObjs() const { return numElts; }

        bool isFull() const { return spaceRemaining() == 0; }
        bool isEmpty() const { return spaceRemaining() == numElts; }

        /**
         * Address of the slot that index ix maps to.
         *
         * @param ix queue index; wrapped with modulo numElts.
         * @return basePointer + (ix % numElts) * objSize()
         *
         * numElts must be non-zero: a descriptor built with
         * size < AQL_PACKET_SIZE has numElts == 0 and the modulo below
         * would be undefined.
         */
        uint64_t
        ptr(uint64_t ix) const
        {
            /*
             * Based on ROCm Documentation:
             * - https://github.com/RadeonOpenCompute/ROCm_Documentation/blob/
                     10ca0a99bbd0252f5bf6f08d1503e59f1129df4a/ROCm_Libraries/
                     rocr/src/core/runtime/amd_aql_queue.cpp#L99
             * - https://github.com/RadeonOpenCompute/ROCm_Documentation/blob/
                     10ca0a99bbd0252f5bf6f08d1503e59f1129df4a/ROCm_Libraries/
                     rocr/src/core/runtime/amd_aql_queue.cpp#L624
             *
             */
            const uint64_t retAddr =
                basePointer + ((ix % numElts) * objSize());
            // The trace label says "gfx9" regardless of gfxVersion; the
            // computation itself does not depend on gfxVersion.
            DPRINTF(HSAPacketProcessor, "ptr() gfx9: base: 0x%x, "
                    "index: 0x%x, numElts: 0x%x, objSize: 0x%x, "
                    "retAddr: 0x%x\n", basePointer, ix, numElts, objSize(),
                    retAddr);
            return retAddr;
        }
};

class HSAQueueDescriptor {…};


class AQLRingBuffer

{

   private:

     std::vector<hsa_kernel_dispatch_packet_t> _aqlBuf;

     std::string _name;

     std::vector<Addr> _hostDispAddresses;

     std::vector<bool> _aqlComplete;

     uint64_t _wrIdx;   // Points to next write location

     uint64_t _rdIdx;   // Read pointer of AQL buffer

     uint64_t _dispIdx; // Dispatch pointer of AQL buffer


  public:

     std::string name() {return _name;}

     AQLRingBuffer(uint32_t size, const std::string name);

     int allocEntry(uint32_t nBufReq);

     bool freeEntry(void *pkt);


     void


     saveHostDispAddr(Addr host_pkt_addr, int num_pkts, int ix)

     {

         for (int i = 0; i < num_pkts; ++i) {

            _hostDispAddresses[ix % numObjs()] = host_pkt_addr + i * objSize();

            ++ix;

         }

     }

     saveHostDispAddr(Addr host_pkt_addr, int num_pkts, int ix) {…}


     Addr


     hostDispAddr() const

     {

         return _hostDispAddresses[dispIdx() % numObjs()];

     }

     hostDispAddr() const {…}


     bool


     dispPending() const

     {

         int packet_type = (_aqlBuf[_dispIdx % _aqlBuf.size()].header

             >> HSA_PACKET_HEADER_TYPE) &

             ((1 << HSA_PACKET_HEADER_WIDTH_TYPE) - 1);

         return (_dispIdx < _wrIdx) && packet_type != HSA_PACKET_TYPE_INVALID;

     }

     dispPending() const {…}


     bool


     isLastOutstandingPkt() const

     {

       for (int i = _rdIdx + 1; i < _dispIdx; i++) {

         if (!_aqlComplete[i % _aqlBuf.size()]) {

           return false;

         }

       }

       return !_aqlComplete[_rdIdx % _aqlBuf.size()] && _rdIdx != _dispIdx;

     }

     isLastOutstandingPkt() const {…}


     uint32_t nFree() const { return _aqlBuf.size() - (_wrIdx - _rdIdx); }

     void *ptr(uint32_t ix) { return _aqlBuf.data() + (ix % _aqlBuf.size()); }

     uint32_t numObjs() const { return _aqlBuf.size(); };

     uint32_t objSize() const { return AQL_PACKET_SIZE; }

     uint64_t dispIdx() const { return _dispIdx; }

     uint64_t wrIdx() const { return _wrIdx; }

     uint64_t rdIdx() const { return _rdIdx; }

     uint64_t* rdIdxPtr() { return &_rdIdx; }

     void incRdIdx(uint64_t value) { _rdIdx += value; }

     void incWrIdx(uint64_t value) { _wrIdx += value; }

     void incDispIdx(uint64_t value) { _dispIdx += value; }

     uint64_t compltnPending() { return (_dispIdx - _rdIdx); }

     void setRdIdx(uint64_t value);

     void setWrIdx(uint64_t value);

     void setDispIdx(uint64_t value);

};

class AQLRingBuffer {…};


struct QCntxt

{

    HSAQueueDescriptor* qDesc;

    AQLRingBuffer* aqlBuf;

    // used for HSA packets that enforce synchronization with barrier bit

    bool barrierBit;


    QCntxt(HSAQueueDescriptor* q_desc, AQLRingBuffer* aql_buf) :

        qDesc(q_desc), aqlBuf(aql_buf), barrierBit(false)

    {}

    QCntxt(HSAQueueDescriptor* q_desc, AQLRingBuffer* aql_buf) : {…}

    QCntxt() : qDesc(NULL), aqlBuf(NULL), barrierBit(false) {}

};

struct QCntxt {…};


/**
 * Packet processor device, derived from DmaVirtDevice. It keeps the list
 * of registered queues (regdQList) and declares the PIO read/write
 * interface together with the packet processing, scheduling and
 * completion entry points.
 */
class HSAPacketProcessor: public DmaVirtDevice

{

    // HWScheduler may access the protected members below.
    friend class HWScheduler;

  protected:

    // Pointer to a DmaDevice member function taking
    // (Addr, int, Event*, uint8_t*, Tick).
    typedef void (DmaDevice::*DmaFnPtr)(Addr, int, Event*, uint8_t*, Tick);

    // NOTE(review): presumably assigned by setDevice() -- confirm in the
    // .cc file. Easy to confuse with gpuDevice below, which has a
    // different type.
    GPUCommandProcessor *gpu_device;

    // Returned by hwScheduler().
    HWScheduler *hwSchdlr;

    // NOTE(review): presumably assigned by setGPUDevice() -- confirm.
    AMDGPUDevice *gpuDevice;

    // NOTE(review): VegaISA::Walker is not declared in the visible part
    // of this header; it has to come from one of the includes.
    VegaISA::Walker *walker;


    /**
     * Structure to store the read values of dependency signals
     * from shared memory. Also used for tracking the status of
     * those reads while they are in progress.
     */
    class SignalState
    {
      public:
        /**
         * Starts with no pending reads, both flags false and
         * NumSignalsPerBarrier value-initialized entries in values.
         */
        SignalState()
            : pendingReads(0), allRead(false), discardRead(false),
              values(NumSignalsPerBarrier)
        {}

        // Defined out of line.
        void handleReadDMA();

        int pendingReads;
        bool allRead;
        // If this queue is unmapped when there are pending reads, then
        // the pending reads has to be discarded.
        bool discardRead;
        // values stores the value of already read dependency signal
        std::vector<hsa_signal_value_t> values;

        /** Set every stored signal value to 1. */
        void
        resetSigVals()
        {
            std::fill(values.begin(), values.end(), 1);
        }
    };

    class SignalState {…};


    class QueueProcessEvent : public Event

    {

      private:

        HSAPacketProcessor *hsaPP;

        uint32_t rqIdx;

      public:


        QueueProcessEvent(HSAPacketProcessor *_hsaPP, uint32_t _rqIdx)

            : Event(Default_Pri), hsaPP(_hsaPP), rqIdx(_rqIdx)

        {}

        QueueProcessEvent(HSAPacketProcessor *_hsaPP, uint32_t _rqIdx) {…}

        virtual void process();

        virtual const char *description() const;

    };

    class QueueProcessEvent : public Event {…};


    /**
     * Registered queue list entry; each entry has one queueDescriptor and
     * associated AQL buffer.
     *
     * The constructor leaves qCntxt default-constructed, i.e. with null
     * qDesc/aqlBuf pointers. The accessors that go through qCntxt.aqlBuf
     * must not be called before those pointers have been filled in.
     */
    class RQLEntry
    {
      public:
        /**
         * @param hsaPP packet processor handed to aqlProcessEvent
         * @param rqIdx registered-queue index handed to aqlProcessEvent
         */
        RQLEntry(HSAPacketProcessor *hsaPP, uint32_t rqIdx)
            : aqlProcessEvent(hsaPP, rqIdx) {}

        QCntxt qCntxt;

        /** Forwards to the AQL buffer's dispPending(). */
        bool dispPending() const { return qCntxt.aqlBuf->dispPending(); }

        /** Forwards to the AQL buffer's compltnPending(). */
        uint64_t
        compltnPending() const
        {
            return qCntxt.aqlBuf->compltnPending();
        }

        SignalState depSignalRdState;
        QueueProcessEvent aqlProcessEvent;

        void setBarrierBit(bool set_val) { qCntxt.barrierBit = set_val; }
        bool getBarrierBit() const { return qCntxt.barrierBit; }

        /** Forwards to the AQL buffer's isLastOutstandingPkt(). */
        bool
        isLastOutstandingPkt() const
        {
            return qCntxt.aqlBuf->isLastOutstandingPkt();
        }
    };

    class RQLEntry {…};

    // Keeps track of queueDescriptors of registered queues

    // Indexed by queue id: getQueueDesc(), getRegdListEntry() and
    // inFlightPkts() all go through regdQList.at(queId). Entries are raw
    // pointers; NOTE(review): ownership is not visible in this header.
    std::vector<class RQLEntry *> regdQList;


    // Defined out of line; reports a Q_STATE for the packet at pkt.
    Q_STATE processPkt(void* pkt, uint32_t rl_idx, Addr host_pkt_addr);

    // Defined out of line.
    void displayQueueDescriptor(int pid, uint32_t rl_idx);


  public:

    /**
     * Queue descriptor of a registered queue.
     *
     * @param queId index into regdQList; std::vector::at() throws
     *              std::out_of_range when it is not a valid index.
     * @return the qDesc pointer stored in that entry's queue context.
     */
    HSAQueueDescriptor*
    getQueueDesc(uint32_t queId)
    {
        RQLEntry *entry = regdQList.at(queId);
        return entry->qCntxt.qDesc;
    }

    getQueueDesc(uint32_t queId) {…}

    /**
     * Registered-queue-list entry for a queue.
     *
     * @param queId index into regdQList; std::vector::at() throws
     *              std::out_of_range when it is not a valid index.
     * @return the pointer stored in regdQList at that index.
     */
    class RQLEntry*
    getRegdListEntry(uint32_t queId)
    {
        class RQLEntry *entry = regdQList.at(queId);
        return entry;
    }

    getRegdListEntry(uint32_t queId) {…}


    uint64_t


    inFlightPkts(uint32_t queId)

    {

        auto aqlBuf = regdQList.at(queId)->qCntxt.aqlBuf;

        return aqlBuf->dispIdx() - aqlBuf->rdIdx();

    }

    inFlightPkts(uint32_t queId) {…}


    // Public data members. None of them is initialized in this header;
    // NOTE(review): presumably set from Params in the constructor.
    int numHWQueues;

    Addr pioAddr;

    Addr pioSize;

    Tick pioDelay;

    // const member: has to be set in the constructor's initializer list.
    const Tick pktProcessDelay;


    typedef HSAPacketProcessorParams Params;

    HSAPacketProcessor(const Params &p);

    ~HSAPacketProcessor();

    // Translates a range of addresses from virtual to physical addresses.
    TranslationGenPtr translate(Addr vaddr, Addr size) override;

    // offset and rd_idx default to 0, so callers may omit them.
    void setDeviceQueueDesc(uint64_t hostReadIndexPointer,

                            uint64_t basePointer,

                            uint64_t queue_id,

                            uint32_t size, int doorbellSize,

                            GfxVersion gfxVersion,

                            Addr offset = 0, uint64_t rd_idx = 0);

    void unsetDeviceQueueDesc(uint64_t queue_id, int doorbellSize);

    void setDevice(GPUCommandProcessor * dev);

    // Note: the parameter is named gpu_device, the same as the
    // GPUCommandProcessor* member, although its type matches the
    // gpuDevice member.
    void setGPUDevice(AMDGPUDevice *gpu_device);

    // Parameters are unnamed here; see the definition for their meaning.
    void updateReadIndex(int, uint32_t);

    void getCommandsFromHost(int pid, uint32_t rl_idx);

    // Plain accessor for hwSchdlr.
    HWScheduler *hwScheduler() { return hwSchdlr; }


    // PIO interface

    virtual Tick read(Packet*) override;

    virtual Tick write(Packet*) override;

    // Returns the address ranges this PIO device is obliged to report.
    virtual AddrRangeList getAddrRanges() const override;

    void finishPkt(void *pkt, uint32_t rl_idx);

    // Convenience overload: forwards with rl_idx fixed to 0.
    void finishPkt(void *pkt) { finishPkt(pkt, 0); }

    void schedAQLProcessing(uint32_t rl_idx);

    // Same as above with an explicit delay argument.
    void schedAQLProcessing(uint32_t rl_idx, Tick delay);


    void sendAgentDispatchCompletionSignal(void *pkt,

                                           hsa_signal_value_t signal);

    void sendCompletionSignal(hsa_signal_value_t signal);


    /**
     * Bookkeeping for one series of packet DMAs. A pointer to it is
     * passed to cmdQueueCmdDma().
     *
     * pkts_ttl and pkts_2_go are stored separately because dma ops can
     * complete out of issue order. NOTE(review): presumably pkts_2_go is
     * counted down as transfers finish while pkts_ttl keeps the total --
     * confirm against the .cc file.
     */
    struct dma_series_ctx
    {
        // deal with the fact dma ops can complete out of issue order
        uint32_t pkts_ttl;
        uint32_t pkts_2_go;
        uint32_t start_ix;
        uint32_t rl_idx;

        /**
         * @param _pkts_ttl  stored as pkts_ttl
         * @param _pkts_2_go stored as pkts_2_go
         * @param _start_ix  stored as start_ix
         * @param _rl_idx    stored as rl_idx
         */
        dma_series_ctx(uint32_t _pkts_ttl,
                       uint32_t _pkts_2_go,
                       uint32_t _start_ix,
                       uint32_t _rl_idx)
            // pkts_ttl used to be initialized from _pkts_2_go, which
            // silently ignored the _pkts_ttl argument.
            : pkts_ttl(_pkts_ttl), pkts_2_go(_pkts_2_go),
              start_ix(_start_ix), rl_idx(_rl_idx)
        {}

        ~dma_series_ctx() {}
    };

    struct dma_series_ctx {…};


    // Used to update the read_disp_id field (the read pointer) of the MQD.
    // Defined out of line.
    void updateReadDispIdDma();

    // Defined out of line. series_ctx carries the dma_series_ctx
    // bookkeeping for the transfer.
    // NOTE(review): dest_4debug looks like a debug-only destination
    // pointer -- confirm against the definition.
    void cmdQueueCmdDma(HSAPacketProcessor *hsaPP, int pid, bool isRead,

            uint32_t ix_start, unsigned num_pkts,

            dma_series_ctx *series_ctx, void *dest_4debug);

    // NOTE(review): SignalState also declares a handleReadDMA(); check
    // that this class-level declaration actually has a definition.
    void handleReadDMA();

};

class HSAPacketProcessor: public DmaVirtDevice {…};


} // namespace gem5


#endif // __DEV_HSA_HSA_PACKET_PROCESSOR__

DPRINTF
#define DPRINTF(x,...)
Definition trace.hh:209

types.hh
Defines global host-dependent types: Counter, Tick, and (indirectly) {int,uint}{8,...

gem5::AMDGPUDevice
Device model for an AMD GPU.
Definition amdgpu_device.hh:64

gem5::AQLRingBuffer
Internal ring buffer which is used to prefetch/store copies of the in-memory HSA ring buffer.
Definition hsa_packet_processor.hh:142

gem5::AQLRingBuffer::setRdIdx
void setRdIdx(uint64_t value)
Definition hsa_packet_processor.cc:604

gem5::AQLRingBuffer::_aqlComplete
std::vector< bool > _aqlComplete
Definition hsa_packet_processor.hh:147

gem5::AQLRingBuffer::name
std::string name()
Definition hsa_packet_processor.hh:153

gem5::AQLRingBuffer::ptr
void * ptr(uint32_t ix)
Definition hsa_packet_processor.hh:211

gem5::AQLRingBuffer::allocEntry
int allocEntry(uint32_t nBufReq)
Definition hsa_packet_processor.cc:648

gem5::AQLRingBuffer::incDispIdx
void incDispIdx(uint64_t value)
Definition hsa_packet_processor.hh:220

gem5::AQLRingBuffer::setDispIdx
void setDispIdx(uint64_t value)
Definition hsa_packet_processor.cc:616

gem5::AQLRingBuffer::dispIdx
uint64_t dispIdx() const
Definition hsa_packet_processor.hh:214

gem5::AQLRingBuffer::_rdIdx
uint64_t _rdIdx
Definition hsa_packet_processor.hh:149

gem5::AQLRingBuffer::dispPending
bool dispPending() const
Definition hsa_packet_processor.hh:183

gem5::AQLRingBuffer::saveHostDispAddr
void saveHostDispAddr(Addr host_pkt_addr, int num_pkts, int ix)
the kernel may try to read from the dispatch packet, so we need to keep the host address that corresp...
Definition hsa_packet_processor.hh:168

gem5::AQLRingBuffer::rdIdxPtr
uint64_t * rdIdxPtr()
Definition hsa_packet_processor.hh:217

gem5::AQLRingBuffer::_name
std::string _name
Definition hsa_packet_processor.hh:145

gem5::AQLRingBuffer::setWrIdx
void setWrIdx(uint64_t value)
Definition hsa_packet_processor.cc:610

gem5::AQLRingBuffer::isLastOutstandingPkt
bool isLastOutstandingPkt() const
Packets aren't guaranteed to be completed in-order, and we need to know when the last packet is finis...
Definition hsa_packet_processor.hh:200

gem5::AQLRingBuffer::hostDispAddr
Addr hostDispAddr() const
Definition hsa_packet_processor.hh:177

gem5::AQLRingBuffer::compltnPending
uint64_t compltnPending()
Definition hsa_packet_processor.hh:221

gem5::AQLRingBuffer::numObjs
uint32_t numObjs() const
Definition hsa_packet_processor.hh:212

gem5::AQLRingBuffer::rdIdx
uint64_t rdIdx() const
Definition hsa_packet_processor.hh:216

gem5::AQLRingBuffer::objSize
uint32_t objSize() const
Definition hsa_packet_processor.hh:213

gem5::AQLRingBuffer::_aqlBuf
std::vector< hsa_kernel_dispatch_packet_t > _aqlBuf
Definition hsa_packet_processor.hh:144

gem5::AQLRingBuffer::incWrIdx
void incWrIdx(uint64_t value)
Definition hsa_packet_processor.hh:219

gem5::AQLRingBuffer::_hostDispAddresses
std::vector< Addr > _hostDispAddresses
Definition hsa_packet_processor.hh:146

gem5::AQLRingBuffer::wrIdx
uint64_t wrIdx() const
Definition hsa_packet_processor.hh:215

gem5::AQLRingBuffer::_wrIdx
uint64_t _wrIdx
Definition hsa_packet_processor.hh:148

gem5::AQLRingBuffer::freeEntry
bool freeEntry(void *pkt)
Definition hsa_packet_processor.cc:622

gem5::AQLRingBuffer::_dispIdx
uint64_t _dispIdx
Definition hsa_packet_processor.hh:150

gem5::AQLRingBuffer::nFree
uint32_t nFree() const
Definition hsa_packet_processor.hh:210

gem5::AQLRingBuffer::incRdIdx
void incRdIdx(uint64_t value)
Definition hsa_packet_processor.hh:218

gem5::DmaDevice
Definition dma_device.hh:219

gem5::DmaVirtDevice
Definition dma_virt_device.hh:42

gem5::Event
Definition eventq.hh:255

gem5::GPUCommandProcessor
Definition gpu_command_processor.hh:72

gem5::HSAPacketProcessor::QueueProcessEvent
Definition hsa_packet_processor.hh:276

gem5::HSAPacketProcessor::QueueProcessEvent::hsaPP
HSAPacketProcessor * hsaPP
Definition hsa_packet_processor.hh:278

gem5::HSAPacketProcessor::QueueProcessEvent::QueueProcessEvent
QueueProcessEvent(HSAPacketProcessor *_hsaPP, uint32_t _rqIdx)
Definition hsa_packet_processor.hh:281

gem5::HSAPacketProcessor::QueueProcessEvent::description
virtual const char * description() const
Return a C string describing the event.

gem5::HSAPacketProcessor::QueueProcessEvent::process
virtual void process()
Definition hsa_packet_processor.cc:431

gem5::HSAPacketProcessor::QueueProcessEvent::rqIdx
uint32_t rqIdx
Definition hsa_packet_processor.hh:279

gem5::HSAPacketProcessor::RQLEntry
Definition hsa_packet_processor.hh:291

gem5::HSAPacketProcessor::RQLEntry::aqlProcessEvent
QueueProcessEvent aqlProcessEvent
Definition hsa_packet_processor.hh:299

gem5::HSAPacketProcessor::RQLEntry::setBarrierBit
void setBarrierBit(bool set_val)
Definition hsa_packet_processor.hh:300

gem5::HSAPacketProcessor::RQLEntry::dispPending
bool dispPending()
Definition hsa_packet_processor.hh:296

gem5::HSAPacketProcessor::RQLEntry::RQLEntry
RQLEntry(HSAPacketProcessor *hsaPP, uint32_t rqIdx)
Definition hsa_packet_processor.hh:293

gem5::HSAPacketProcessor::RQLEntry::getBarrierBit
bool getBarrierBit() const
Definition hsa_packet_processor.hh:301

gem5::HSAPacketProcessor::RQLEntry::depSignalRdState
SignalState depSignalRdState
Definition hsa_packet_processor.hh:298

gem5::HSAPacketProcessor::RQLEntry::isLastOutstandingPkt
bool isLastOutstandingPkt() const
Definition hsa_packet_processor.hh:302

gem5::HSAPacketProcessor::RQLEntry::qCntxt
QCntxt qCntxt
Definition hsa_packet_processor.hh:295

gem5::HSAPacketProcessor::RQLEntry::compltnPending
uint64_t compltnPending()
Definition hsa_packet_processor.hh:297

gem5::HSAPacketProcessor::SignalState
Definition hsa_packet_processor.hh:253

gem5::HSAPacketProcessor::SignalState::values
std::vector< hsa_signal_value_t > values
Definition hsa_packet_processor.hh:267

gem5::HSAPacketProcessor::SignalState::SignalState
SignalState()
Definition hsa_packet_processor.hh:255

gem5::HSAPacketProcessor::SignalState::handleReadDMA
void handleReadDMA()
Definition hsa_packet_processor.cc:483

gem5::HSAPacketProcessor::SignalState::pendingReads
int pendingReads
Definition hsa_packet_processor.hh:261

gem5::HSAPacketProcessor::SignalState::discardRead
bool discardRead
Definition hsa_packet_processor.hh:265

gem5::HSAPacketProcessor::SignalState::allRead
bool allRead
Definition hsa_packet_processor.hh:262

gem5::HSAPacketProcessor::SignalState::resetSigVals
void resetSigVals()
Definition hsa_packet_processor.hh:269

gem5::HSAPacketProcessor
Definition hsa_packet_processor.hh:240

gem5::HSAPacketProcessor::sendAgentDispatchCompletionSignal
void sendAgentDispatchCompletionSignal(void *pkt, hsa_signal_value_t signal)
Definition hsa_packet_processor.cc:709

gem5::HSAPacketProcessor::numHWQueues
int numHWQueues
Definition hsa_packet_processor.hh:332

gem5::HSAPacketProcessor::regdQList
std::vector< class RQLEntry * > regdQList
Definition hsa_packet_processor.hh:308

gem5::HSAPacketProcessor::updateReadIndex
void updateReadIndex(int, uint32_t)
Definition hsa_packet_processor.cc:208

gem5::HSAPacketProcessor::write
virtual Tick write(Packet *) override
Definition hsa_packet_processor.cc:140

gem5::HSAPacketProcessor::cmdQueueCmdDma
void cmdQueueCmdDma(HSAPacketProcessor *hsaPP, int pid, bool isRead, uint32_t ix_start, unsigned num_pkts, dma_series_ctx *series_ctx, void *dest_4debug)
Definition hsa_packet_processor.cc:232

gem5::HSAPacketProcessor::DmaFnPtr
void(DmaDevice::* DmaFnPtr)(Addr, int, Event *, uint8_t *, Tick)
Definition hsa_packet_processor.hh:243

gem5::HSAPacketProcessor::inFlightPkts
uint64_t inFlightPkts(uint32_t queId)
Definition hsa_packet_processor.hh:326

gem5::HSAPacketProcessor::hwScheduler
HWScheduler * hwScheduler()
Definition hsa_packet_processor.hh:353

gem5::HSAPacketProcessor::sendCompletionSignal
void sendCompletionSignal(hsa_signal_value_t signal)
Definition hsa_packet_processor.cc:739

gem5::HSAPacketProcessor::gpu_device
GPUCommandProcessor * gpu_device
Definition hsa_packet_processor.hh:244

gem5::HSAPacketProcessor::updateReadDispIdDma
void updateReadDispIdDma()
this event is used to update the read_disp_id field (the read pointer) of the MQD,...
Definition hsa_packet_processor.cc:202

gem5::HSAPacketProcessor::pioSize
Addr pioSize
Definition hsa_packet_processor.hh:334

gem5::HSAPacketProcessor::hwSchdlr
HWScheduler * hwSchdlr
Definition hsa_packet_processor.hh:245

gem5::HSAPacketProcessor::setGPUDevice
void setGPUDevice(AMDGPUDevice *gpu_device)
Definition hsa_packet_processor.cc:97

gem5::HSAPacketProcessor::Params
HSAPacketProcessorParams Params
Definition hsa_packet_processor.hh:338

gem5::HSAPacketProcessor::getCommandsFromHost
void getCommandsFromHost(int pid, uint32_t rl_idx)
Definition hsa_packet_processor.cc:496

gem5::HSAPacketProcessor::pioDelay
Tick pioDelay
Definition hsa_packet_processor.hh:335

gem5::HSAPacketProcessor::translate
TranslationGenPtr translate(Addr vaddr, Addr size) override
Function used to translate a range of addresses from virtual to physical addresses.
Definition hsa_packet_processor.cc:178

gem5::HSAPacketProcessor::handleReadDMA
void handleReadDMA()

gem5::HSAPacketProcessor::finishPkt
void finishPkt(void *pkt)
Definition hsa_packet_processor.hh:360

gem5::HSAPacketProcessor::getRegdListEntry
class RQLEntry * getRegdListEntry(uint32_t queId)
Definition hsa_packet_processor.hh:320

gem5::HSAPacketProcessor::~HSAPacketProcessor
~HSAPacketProcessor()
Definition hsa_packet_processor.cc:89

gem5::HSAPacketProcessor::walker
VegaISA::Walker * walker
Definition hsa_packet_processor.hh:247

gem5::HSAPacketProcessor::setDeviceQueueDesc
void setDeviceQueueDesc(uint64_t hostReadIndexPointer, uint64_t basePointer, uint64_t queue_id, uint32_t size, int doorbellSize, GfxVersion gfxVersion, Addr offset=0, uint64_t rd_idx=0)
Definition hsa_packet_processor.cc:112

gem5::HSAPacketProcessor::displayQueueDescriptor
void displayQueueDescriptor(int pid, uint32_t rl_idx)
Definition hsa_packet_processor.cc:578

gem5::HSAPacketProcessor::pioAddr
Addr pioAddr
Definition hsa_packet_processor.hh:333

gem5::HSAPacketProcessor::getQueueDesc
HSAQueueDescriptor * getQueueDesc(uint32_t queId)
Definition hsa_packet_processor.hh:315

gem5::HSAPacketProcessor::processPkt
Q_STATE processPkt(void *pkt, uint32_t rl_idx, Addr host_pkt_addr)
Definition hsa_packet_processor.cc:283

gem5::HSAPacketProcessor::gpuDevice
AMDGPUDevice * gpuDevice
Definition hsa_packet_processor.hh:246

gem5::HSAPacketProcessor::finishPkt
void finishPkt(void *pkt, uint32_t rl_idx)
Definition hsa_packet_processor.cc:667

gem5::HSAPacketProcessor::getAddrRanges
virtual AddrRangeList getAddrRanges() const override
Every PIO device is obliged to provide an implementation that returns the address ranges the device r...
Definition hsa_packet_processor.cc:128

gem5::HSAPacketProcessor::unsetDeviceQueueDesc
void unsetDeviceQueueDesc(uint64_t queue_id, int doorbellSize)
Definition hsa_packet_processor.cc:106

gem5::HSAPacketProcessor::schedAQLProcessing
void schedAQLProcessing(uint32_t rl_idx)
Definition hsa_packet_processor.cc:277

gem5::HSAPacketProcessor::setDevice
void setDevice(GPUCommandProcessor *dev)
Definition hsa_packet_processor.cc:642

gem5::HSAPacketProcessor::pktProcessDelay
const Tick pktProcessDelay
Definition hsa_packet_processor.hh:336

gem5::HSAPacketProcessor::read
virtual Tick read(Packet *) override
Definition hsa_packet_processor.cc:170

gem5::HSAQueueDescriptor
Definition hsa_packet_processor.hh:79

gem5::HSAQueueDescriptor::HSAQueueDescriptor
HSAQueueDescriptor(uint64_t base_ptr, uint64_t db_ptr, uint64_t hri_ptr, uint32_t size, GfxVersion gfxVersion)
Definition hsa_packet_processor.hh:91

gem5::HSAQueueDescriptor::gfxVersion
GfxVersion gfxVersion
Definition hsa_packet_processor.hh:89

gem5::HSAQueueDescriptor::ptr
uint64_t ptr(uint64_t ix)
Definition hsa_packet_processor.hh:107

gem5::HSAQueueDescriptor::writeIndex
uint64_t writeIndex
Definition hsa_packet_processor.hh:83

gem5::HSAQueueDescriptor::spaceRemaining
uint64_t spaceRemaining()
Definition hsa_packet_processor.hh:100

gem5::HSAQueueDescriptor::readIndex
uint64_t readIndex
Definition hsa_packet_processor.hh:84

gem5::HSAQueueDescriptor::numObjs
uint32_t numObjs()
Definition hsa_packet_processor.hh:103

gem5::HSAQueueDescriptor::basePointer
uint64_t basePointer
Definition hsa_packet_processor.hh:81

gem5::HSAQueueDescriptor::objSize
uint32_t objSize()
Definition hsa_packet_processor.hh:102

gem5::HSAQueueDescriptor::isEmpty
bool isEmpty()
Definition hsa_packet_processor.hh:105

gem5::HSAQueueDescriptor::dmaInProgress
bool dmaInProgress
Definition hsa_packet_processor.hh:88

gem5::HSAQueueDescriptor::numElts
uint32_t numElts
Definition hsa_packet_processor.hh:85

gem5::HSAQueueDescriptor::doorbellPointer
uint64_t doorbellPointer
Definition hsa_packet_processor.hh:82

gem5::HSAQueueDescriptor::isFull
bool isFull()
Definition hsa_packet_processor.hh:104

gem5::HSAQueueDescriptor::hostReadIndexPtr
uint64_t hostReadIndexPtr
Definition hsa_packet_processor.hh:86

gem5::HSAQueueDescriptor::stalledOnDmaBufAvailability
bool stalledOnDmaBufAvailability
Definition hsa_packet_processor.hh:87

gem5::HSAQueueDescriptor::spaceUsed
uint64_t spaceUsed()
Definition hsa_packet_processor.hh:101

gem5::HWScheduler
Definition hw_scheduler.hh:51

gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295

gem5::VegaISA::Walker
Definition pagetable_walker.hh:55

std::list< AddrRange >

std::vector
STL vector class.
Definition stl.hh:37

dma_virt_device.hh

eventq.hh

gem5::EventBase::Default_Pri
static const Priority Default_Pri
Default is zero for historical reasons.
Definition eventq.hh:182

HSA_PACKET_HEADER_TYPE
@ HSA_PACKET_HEADER_TYPE
Packet type.
Definition hsa.h:2816

HSA_PACKET_TYPE_INVALID
@ HSA_PACKET_TYPE_INVALID
The packet has been processed in the past, but has not been reassigned to the packet processor.
Definition hsa.h:2756

HSA_PACKET_HEADER_WIDTH_TYPE
@ HSA_PACKET_HEADER_WIDTH_TYPE
Definition hsa.h:2858

hsa_signal_value_t
int32_t hsa_signal_value_t
Signal value.
Definition hsa.h:1322

hsa.h

NumSignalsPerBarrier
#define NumSignalsPerBarrier
Definition hsa_packet_processor.hh:53

AQL_PACKET_SIZE
#define AQL_PACKET_SIZE
Definition hsa_packet_processor.hh:48

hsa_queue.hh

gem5::ArmISA::i
Bitfield< 7 > i
Definition misc_types.hh:67

gem5::ArmISA::offset
Bitfield< 23, 0 > offset
Definition types.hh:144

gem5::MipsISA::vaddr
vaddr
Definition pra_constants.hh:278

gem5::MipsISA::p
Bitfield< 0 > p
Definition pra_constants.hh:326

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition types.hh:147

gem5::Q_STATE
Q_STATE
Definition hsa_packet_processor.hh:64

gem5::BLOCKED_BBIT
@ BLOCKED_BBIT
Definition hsa_packet_processor.hh:66

gem5::BLOCKED_BPKT
@ BLOCKED_BPKT
Definition hsa_packet_processor.hh:69

gem5::UNBLOCKED
@ UNBLOCKED
Definition hsa_packet_processor.hh:65

gem5::Tick
uint64_t Tick
Tick count type.
Definition types.hh:58

gem5::TranslationGenPtr
std::unique_ptr< TranslationGen > TranslationGenPtr
Definition translation_gen.hh:131

gem5::HSAPacketProcessor::dma_series_ctx
Calls getCurrentEntry once the queueEntry has been dmaRead.
Definition hsa_packet_processor.hh:372

gem5::HSAPacketProcessor::dma_series_ctx::pkts_ttl
uint32_t pkts_ttl
Definition hsa_packet_processor.hh:374

gem5::HSAPacketProcessor::dma_series_ctx::rl_idx
uint32_t rl_idx
Definition hsa_packet_processor.hh:377

gem5::HSAPacketProcessor::dma_series_ctx::pkts_2_go
uint32_t pkts_2_go
Definition hsa_packet_processor.hh:375

gem5::HSAPacketProcessor::dma_series_ctx::start_ix
uint32_t start_ix
Definition hsa_packet_processor.hh:376

gem5::HSAPacketProcessor::dma_series_ctx::~dma_series_ctx
~dma_series_ctx()
Definition hsa_packet_processor.hh:386

gem5::HSAPacketProcessor::dma_series_ctx::dma_series_ctx
dma_series_ctx(uint32_t _pkts_ttl, uint32_t _pkts_2_go, uint32_t _start_ix, uint32_t _rl_idx)
Definition hsa_packet_processor.hh:379

gem5::QCntxt
Definition hsa_packet_processor.hh:228

gem5::QCntxt::QCntxt
QCntxt()
Definition hsa_packet_processor.hh:236

gem5::QCntxt::barrierBit
bool barrierBit
Definition hsa_packet_processor.hh:232

gem5::QCntxt::QCntxt
QCntxt(HSAQueueDescriptor *q_desc, AQLRingBuffer *aql_buf)
Definition hsa_packet_processor.hh:233

gem5::QCntxt::aqlBuf
AQLRingBuffer * aqlBuf
Definition hsa_packet_processor.hh:230

gem5::QCntxt::qDesc
HSAQueueDescriptor * qDesc
Definition hsa_packet_processor.hh:229