gem5  v22.0.0.2
pm4_packet_processor.hh
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2021 Advanced Micro Devices, Inc.
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are met:
7  *
8  * 1. Redistributions of source code must retain the above copyright notice,
9  * this list of conditions and the following disclaimer.
10  *
11  * 2. Redistributions in binary form must reproduce the above copyright notice,
12  * this list of conditions and the following disclaimer in the documentation
13  * and/or other materials provided with the distribution.
14  *
15  * 3. Neither the name of the copyright holder nor the names of its
16  * contributors may be used to endorse or promote products derived from this
17  * software without specific prior written permission.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
20  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
23  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29  * POSSIBILITY OF SUCH DAMAGE.
30  *
31  */
32 
33 #ifndef __DEV_AMDGPU_PM4_PACKET_PROCESSOR__
34 #define __DEV_AMDGPU_PM4_PACKET_PROCESSOR__
35 
36 #include <unordered_map>
37 
40 #include "dev/amdgpu/pm4_queues.hh"
41 #include "dev/dma_virt_device.hh"
42 #include "params/PM4PacketProcessor.hh"
43 
44 namespace gem5
45 {
46 
47 class AMDGPUDevice;
48 
49 
50 
51 
53 {
55  /* First graphics queue */
57  /* First compute queue */
59 
60  /* All PM4 queues, indexed by VMID */
61  std::unordered_map<uint16_t, PM4Queue *> queues;
62  /* A map of PM4 queues based on doorbell offset */
63  std::unordered_map<uint32_t, PM4Queue *> queuesMap;
64  public:
65  PM4PacketProcessor(const PM4PacketProcessorParams &p);
66 
67  void setGPUDevice(AMDGPUDevice *gpu_device);
68 
72  Tick write(PacketPtr pkt) override { return 0; }
73  Tick read(PacketPtr pkt) override { return 0; }
74  AddrRangeList getAddrRanges() const override;
75  void serialize(CheckpointOut &cp) const override;
76  void unserialize(CheckpointIn &cp) override;
77 
81  TranslationGenPtr translate(Addr vaddr, Addr size) override;
82 
83  uint32_t getKiqDoorbellOffset() { return kiq.doorbell & 0x1ffffffc; }
84  uint32_t getPqDoorbellOffset() { return pq.doorbellOffset; }
85 
86  Addr getGARTAddr(Addr addr) const;
87 
92  PM4Queue* getQueue(Addr offset, bool gfx = false);
98  void mapPq(Addr offset);
104  void mapKiq(Addr offset);
109  void newQueue(QueueDesc *q, Addr offset, PM4MapQueues *pkt = nullptr,
110  int id = -1);
111 
116  void process(PM4Queue *q, Addr wptrOffset);
117 
124  void updateReadIndex(Addr offset, uint64_t rd_idx);
125 
129  void decodeNext(PM4Queue *q);
135 
136  /* Methods that implement PM4 packets */
137  void writeData(PM4Queue *q, PM4WriteData *pkt);
139  void mapQueues(PM4Queue *q, PM4MapQueues *pkt);
140  void unmapQueues(PM4Queue *q, PM4UnmapQueues *pkt);
141  void doneMQDWrite(Addr mqdAddr, Addr addr);
142  void mapProcess(PM4Queue *q, PM4MapProcess *pkt);
143  void processMQD(PM4MapQueues *pkt, PM4Queue *q, Addr addr, QueueDesc *mqd,
144  uint16_t vmid);
146  SDMAQueueDesc *mqd, uint16_t vmid);
147  void releaseMem(PM4Queue *q, PM4ReleaseMem *pkt);
149  void runList(PM4Queue *q, PM4RunList *pkt);
151  void switchBuffer(PM4Queue *q, PM4SwitchBuf *pkt);
153  void waitRegMem(PM4Queue *q, PM4WaitRegMem *pkt);
154  void queryStatus(PM4Queue *q, PM4QueryStatus *pkt);
156 
157  /* Methods that implement MMIO regs */
158  void writeMMIO(PacketPtr pkt, Addr mmio_offset);
159 
160  void setHqdVmid(uint32_t data);
161  void setHqdActive(uint32_t data);
162  void setHqdPqBase(uint32_t data);
163  void setHqdPqBaseHi(uint32_t data);
164  void setHqdPqDoorbellCtrl(uint32_t data);
165  void setHqdPqPtr(uint32_t data);
166  void setHqdPqWptrLo(uint32_t data);
167  void setHqdPqWptrHi(uint32_t data);
168  void setHqdPqRptrReportAddr(uint32_t data);
169  void setHqdPqRptrReportAddrHi(uint32_t data);
170  void setHqdPqWptrPollAddr(uint32_t data);
171  void setHqdPqWptrPollAddrHi(uint32_t data);
172  void setHqdIbCtrl(uint32_t data);
173  void setRbVmid(uint32_t data);
174  void setRbCntl(uint32_t data);
175  void setRbWptrLo(uint32_t data);
176  void setRbWptrHi(uint32_t data);
177  void setRbRptrAddrLo(uint32_t data);
178  void setRbRptrAddrHi(uint32_t data);
179  void setRbWptrPollAddrLo(uint32_t data);
180  void setRbWptrPollAddrHi(uint32_t data);
181  void setRbBaseLo(uint32_t data);
182  void setRbBaseHi(uint32_t data);
183  void setRbDoorbellCntrl(uint32_t data);
184  void setRbDoorbellRangeLo(uint32_t data);
185  void setRbDoorbellRangeHi(uint32_t data);
186 };
187 
188 } // namespace gem5
189 
190 #endif //__DEV_AMDGPU_PM4_PACKET_PROCESSOR__
gem5::PM4PacketProcessor::mapPq
void mapPq(Addr offset)
The first graphics queue, the Primary Queue a.k.a.
Definition: pm4_packet_processor.cc:121
gem5::PM4PacketProcessor::setRbRptrAddrLo
void setRbRptrAddrLo(uint32_t data)
Definition: pm4_packet_processor.cc:924
gem5::PM4PacketProcessor::decodeNext
void decodeNext(PM4Queue *q)
This method decodes the next packet in a PM4Queue.
Definition: pm4_packet_processor.cc:163
gem5::GEM5_PACKED
PM4 packets.
Definition: pm4_defines.hh:77
gem5::PM4PacketProcessor::queuesMap
std::unordered_map< uint32_t, PM4Queue * > queuesMap
Definition: pm4_packet_processor.hh:63
gem5::PM4PacketProcessor::mapProcess
void mapProcess(PM4Queue *q, PM4MapProcess *pkt)
Definition: pm4_packet_processor.cc:608
data
const char data[]
Definition: circlebuf.test.cc:48
gem5::PM4PacketProcessor::setRbWptrLo
void setRbWptrLo(uint32_t data)
Definition: pm4_packet_processor.cc:912
gem5::PM4PacketProcessor::queryStatusDone
void queryStatusDone(PM4Queue *q, PM4QueryStatus *pkt)
Definition: pm4_packet_processor.cc:722
gem5::PM4PacketProcessor::writeMMIO
void writeMMIO(PacketPtr pkt, Addr mmio_offset)
Definition: pm4_packet_processor.cc:731
gem5::CheckpointIn
Definition: serialize.hh:68
gem5::PM4PacketProcessor::setRbCntl
void setRbCntl(uint32_t data)
Definition: pm4_packet_processor.cc:906
gem5::PM4Queue
Class defining a PM4 queue.
Definition: pm4_queues.hh:361
gem5::PM4PacketProcessor::read
Tick read(PacketPtr pkt) override
Pure virtual function that the device must implement.
Definition: pm4_packet_processor.hh:73
header
output header
Definition: nop.cc:36
gem5::PM4PacketProcessor::setRbDoorbellCntrl
void setRbDoorbellCntrl(uint32_t data)
Definition: pm4_packet_processor.cc:960
gem5::PM4PacketProcessor::setRbDoorbellRangeHi
void setRbDoorbellRangeHi(uint32_t data)
Definition: pm4_packet_processor.cc:973
gem5::PM4PacketProcessor::serialize
void serialize(CheckpointOut &cp) const override
Serialize an object.
Definition: pm4_packet_processor.cc:979
gem5::PM4PacketProcessor::setHqdPqRptrReportAddr
void setHqdPqRptrReportAddr(uint32_t data)
Definition: pm4_packet_processor.cc:870
gem5::PM4PacketProcessor::process
void process(PM4Queue *q, Addr wptrOffset)
This method starts processing a PM4Queue from the current read pointer to the newly communicated write...
Definition: pm4_packet_processor.cc:152
gem5::PM4PacketProcessor::getKiqDoorbellOffset
uint32_t getKiqDoorbellOffset()
Definition: pm4_packet_processor.hh:83
gem5::PM4PacketProcessor::newQueue
void newQueue(QueueDesc *q, Addr offset, PM4MapQueues *pkt=nullptr, int id=-1)
This method creates a new PM4Queue based on a queue descriptor and an offset.
Definition: pm4_packet_processor.cc:128
gem5::PM4PacketProcessor::setUconfigReg
void setUconfigReg(PM4Queue *q, PM4SetUconfigReg *pkt)
Definition: pm4_packet_processor.cc:668
gem5::PM4PacketProcessor::releaseMemDone
void releaseMemDone(PM4Queue *q, PM4ReleaseMem *pkt, Addr addr)
Definition: pm4_packet_processor.cc:487
gem5::PM4PacketProcessor::setRbBaseLo
void setRbBaseLo(uint32_t data)
Definition: pm4_packet_processor.cc:948
gem5::PM4PacketProcessor::switchBuffer
void switchBuffer(PM4Queue *q, PM4SwitchBuf *pkt)
Definition: pm4_packet_processor.cc:656
gem5::PM4PacketProcessor::releaseMem
void releaseMem(PM4Queue *q, PM4ReleaseMem *pkt)
Definition: pm4_packet_processor.cc:463
gem5::PM4PacketProcessor::mapKiq
void mapKiq(Addr offset)
The first compute queue, the Kernel Interface Queue a.k.a.
Definition: pm4_packet_processor.cc:114
gem5::PrimaryQueue
Definition: pm4_queues.hh:333
gem5::PM4PacketProcessor::setHqdVmid
void setHqdVmid(uint32_t data)
Definition: pm4_packet_processor.cc:822
gem5::PM4PacketProcessor::setHqdPqRptrReportAddrHi
void setHqdPqRptrReportAddrHi(uint32_t data)
Definition: pm4_packet_processor.cc:876
gem5::VegaISA::p
Bitfield< 54 > p
Definition: pagetable.hh:70
gem5::PM4PacketProcessor::setRbWptrPollAddrHi
void setRbWptrPollAddrHi(uint32_t data)
Definition: pm4_packet_processor.cc:942
gem5::PM4PacketProcessor::setGPUDevice
void setGPUDevice(AMDGPUDevice *gpu_device)
Definition: pm4_packet_processor.cc:84
amdgpu_device.hh
gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition: packet.hh:291
gem5::Tick
uint64_t Tick
Tick count type.
Definition: types.hh:58
gem5::PM4PacketProcessor
Definition: pm4_packet_processor.hh:52
gem5::PM4PacketProcessor::setHqdPqPtr
void setHqdPqPtr(uint32_t data)
Definition: pm4_packet_processor.cc:852
gem5::PM4PacketProcessor::writeDataDone
void writeDataDone(PM4Queue *q, PM4WriteData *pkt, Addr addr)
Definition: pm4_packet_processor.cc:344
gem5::PM4PacketProcessor::write
Tick write(PacketPtr pkt) override
Inherited methods.
Definition: pm4_packet_processor.hh:72
gem5::PM4PacketProcessor::translate
TranslationGenPtr translate(Addr vaddr, Addr size) override
Method for functional translation.
Definition: pm4_packet_processor.cc:62
gem5::PM4PacketProcessor::setHqdPqWptrPollAddrHi
void setHqdPqWptrPollAddrHi(uint32_t data)
Definition: pm4_packet_processor.cc:888
gem5::PM4PacketProcessor::pq
PrimaryQueue pq
Definition: pm4_packet_processor.hh:56
gem5::ArmISA::offset
Bitfield< 23, 0 > offset
Definition: types.hh:144
gem5::PM4PacketProcessor::doneMQDWrite
void doneMQDWrite(Addr mqdAddr, Addr addr)
Definition: pm4_packet_processor.cc:602
gem5::PM4PacketProcessor::processSDMAMQD
void processSDMAMQD(PM4MapQueues *pkt, PM4Queue *q, Addr addr, SDMAQueueDesc *mqd, uint16_t vmid)
Definition: pm4_packet_processor.cc:439
gem5::AMDGPUDevice
Device model for an AMD GPU.
Definition: amdgpu_device.hh:60
pm4_queues.hh
gem5::PM4PacketProcessor::setHqdActive
void setHqdActive(uint32_t data)
Definition: pm4_packet_processor.cc:828
gem5::PM4PacketProcessor::setRbWptrHi
void setRbWptrHi(uint32_t data)
Definition: pm4_packet_processor.cc:918
gem5::Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition: types.hh:147
gem5::PM4PacketProcessor::queryStatus
void queryStatus(PM4Queue *q, PM4QueryStatus *pkt)
Definition: pm4_packet_processor.cc:697
gem5::PrimaryQueue::doorbellOffset
uint32_t doorbellOffset
Definition: pm4_queues.hh:353
gem5::PM4PacketProcessor::runList
void runList(PM4Queue *q, PM4RunList *pkt)
Definition: pm4_packet_processor.cc:624
gem5::PM4PacketProcessor::setHqdPqWptrLo
void setHqdPqWptrLo(uint32_t data)
Definition: pm4_packet_processor.cc:858
gem5::PM4PacketProcessor::setHqdPqBase
void setHqdPqBase(uint32_t data)
Definition: pm4_packet_processor.cc:834
gem5::GEM5_PACKED::doorbell
uint32_t doorbell
Definition: pm4_queues.hh:128
gem5::PM4PacketProcessor::decodeHeader
void decodeHeader(PM4Queue *q, PM4Header header)
This method calls other PM4 packet processing methods based on the header of a PM4 packet.
Definition: pm4_packet_processor.cc:190
gem5::PM4PacketProcessor::processMQD
void processMQD(PM4MapQueues *pkt, PM4Queue *q, Addr addr, QueueDesc *mqd, uint16_t vmid)
Definition: pm4_packet_processor.cc:405
gem5::PM4PacketProcessor::setHqdPqDoorbellCtrl
void setHqdPqDoorbellCtrl(uint32_t data)
Definition: pm4_packet_processor.cc:846
gem5::PM4PacketProcessor::indirectBuffer
void indirectBuffer(PM4Queue *q, PM4IndirectBuf *pkt)
Definition: pm4_packet_processor.cc:641
gem5::ArmISA::q
Bitfield< 27 > q
Definition: misc_types.hh:55
gem5::PM4PacketProcessor::PM4PacketProcessor
PM4PacketProcessor(const PM4PacketProcessorParams &p)
Definition: pm4_packet_processor.cc:49
gem5::PM4PacketProcessor::setRbWptrPollAddrLo
void setRbWptrPollAddrLo(uint32_t data)
Definition: pm4_packet_processor.cc:936
gem5::PM4PacketProcessor::setHqdPqBaseHi
void setHqdPqBaseHi(uint32_t data)
Definition: pm4_packet_processor.cc:840
gem5::PM4PacketProcessor::setHqdPqWptrHi
void setHqdPqWptrHi(uint32_t data)
Definition: pm4_packet_processor.cc:864
gem5::PM4PacketProcessor::getQueue
PM4Queue * getQueue(Addr offset, bool gfx=false)
Based on an offset communicated through doorbell write, the PM4PacketProcessor identifies which queue...
Definition: pm4_packet_processor.cc:100
gem5::PM4PacketProcessor::queues
std::unordered_map< uint16_t, PM4Queue * > queues
Definition: pm4_packet_processor.hh:61
gem5::PM4PacketProcessor::getAddrRanges
AddrRangeList getAddrRanges() const override
Every PIO device is obliged to provide an implementation that returns the address ranges the device r...
Definition: pm4_packet_processor.cc:77
gem5::PM4PacketProcessor::updateReadIndex
void updateReadIndex(Addr offset, uint64_t rd_idx)
Update read index on doorbell rings.
Definition: pm4_packet_processor.cc:508
gem5::CheckpointOut
std::ostream CheckpointOut
Definition: serialize.hh:66
pm4_defines.hh
dma_virt_device.hh
gem5::DmaVirtDevice
Definition: dma_virt_device.hh:41
gem5::PM4PacketProcessor::writeData
void writeData(PM4Queue *q, PM4WriteData *pkt)
Definition: pm4_packet_processor.cc:326
gem5::MipsISA::vaddr
vaddr
Definition: pra_constants.hh:278
std::list< AddrRange >
gem5::PM4PacketProcessor::mapQueues
void mapQueues(PM4Queue *q, PM4MapQueues *pkt)
Definition: pm4_packet_processor.cc:356
gem5::PM4PacketProcessor::setRbVmid
void setRbVmid(uint32_t data)
Definition: pm4_packet_processor.cc:900
gem5::PM4PacketProcessor::waitRegMem
void waitRegMem(PM4Queue *q, PM4WaitRegMem *pkt)
Definition: pm4_packet_processor.cc:681
gem5::PM4PacketProcessor::getPqDoorbellOffset
uint32_t getPqDoorbellOffset()
Definition: pm4_packet_processor.hh:84
gem5::PM4PacketProcessor::setRbRptrAddrHi
void setRbRptrAddrHi(uint32_t data)
Definition: pm4_packet_processor.cc:930
gem5
Reference material can be found at the JEDEC website: UFS standard http://www.jedec....
Definition: gpu_translation_state.hh:37
gem5::PM4PacketProcessor::setHqdPqWptrPollAddr
void setHqdPqWptrPollAddr(uint32_t data)
Definition: pm4_packet_processor.cc:882
gem5::PM4PacketProcessor::getGARTAddr
Addr getGARTAddr(Addr addr) const
Definition: pm4_packet_processor.cc:90
gem5::PM4PacketProcessor::unserialize
void unserialize(CheckpointIn &cp) override
Unserialize an object.
Definition: pm4_packet_processor.cc:1033
gem5::PM4PacketProcessor::setRbBaseHi
void setRbBaseHi(uint32_t data)
Definition: pm4_packet_processor.cc:954
gem5::PM4PacketProcessor::unmapQueues
void unmapQueues(PM4Queue *q, PM4UnmapQueues *pkt)
Definition: pm4_packet_processor.cc:515
gem5::PM4PacketProcessor::kiq
QueueDesc kiq
Definition: pm4_packet_processor.hh:58
gem5::PM4PacketProcessor::gpuDevice
AMDGPUDevice * gpuDevice
Definition: pm4_packet_processor.hh:54
gem5::TranslationGenPtr
std::unique_ptr< TranslationGen > TranslationGenPtr
Definition: translation_gen.hh:128
gem5::PM4PacketProcessor::setRbDoorbellRangeLo
void setRbDoorbellRangeLo(uint32_t data)
Definition: pm4_packet_processor.cc:967
gem5::X86ISA::addr
Bitfield< 3 > addr
Definition: types.hh:84
gem5::PM4PacketProcessor::setHqdIbCtrl
void setHqdIbCtrl(uint32_t data)
Definition: pm4_packet_processor.cc:894

Generated on Thu Jul 28 2022 13:32:30 for gem5 by doxygen 1.8.17