gem5 v23.0.0.0
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
amdgpu_vm.hh
Go to the documentation of this file.
1/*
2 * Copyright (c) 2021 Advanced Micro Devices, Inc.
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * 1. Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 *
11 * 2. Redistributions in binary form must reproduce the above copyright notice,
12 * this list of conditions and the following disclaimer in the documentation
13 * and/or other materials provided with the distribution.
14 *
15 * 3. Neither the name of the copyright holder nor the names of its
16 * contributors may be used to endorse or promote products derived from this
17 * software without specific prior written permission.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
20 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
23 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
30 */
31
32#ifndef __DEV_AMDGPU_AMDGPU_VM_HH__
33#define __DEV_AMDGPU_AMDGPU_VM_HH__
34
35#include <vector>
36
38#include "base/intmath.hh"
40#include "mem/packet.hh"
42#include "sim/serialize.hh"
43
54#define mmVM_INVALIDATE_ENG17_ACK 0x08c6
55#define mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32 0x08eb
56#define mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32 0x08ec
57#define mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_LO32 0x090b
58#define mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_HI32 0x090c
59#define mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_LO32 0x092b
60#define mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_HI32 0x092c
61
62#define mmMC_VM_FB_OFFSET 0x096b
63#define mmMC_VM_FB_LOCATION_BASE 0x0980
64#define mmMC_VM_FB_LOCATION_TOP 0x0981
65#define mmMC_VM_AGP_TOP 0x0982
66#define mmMC_VM_AGP_BOT 0x0983
67#define mmMC_VM_AGP_BASE 0x0984
68#define mmMC_VM_SYSTEM_APERTURE_LOW_ADDR 0x0985
69#define mmMC_VM_SYSTEM_APERTURE_HIGH_ADDR 0x0986
70
71#define mmMMHUB_VM_INVALIDATE_ENG17_SEM 0x06e2
72#define mmMMHUB_VM_INVALIDATE_ENG17_REQ 0x06f4
73#define mmMMHUB_VM_INVALIDATE_ENG17_ACK 0x0706
74#define mmMMHUB_VM_FB_LOCATION_BASE 0x082c
75#define mmMMHUB_VM_FB_LOCATION_TOP 0x082d
76
77#define VEGA10_FB_LOCATION_BASE 0x6a0b0
78#define VEGA10_FB_LOCATION_TOP 0x6a0b4
79
80#define MI100_MEM_SIZE_REG 0x0378c
81#define MI100_FB_LOCATION_BASE 0x6ac00
82#define MI100_FB_LOCATION_TOP 0x6ac04
83
84#define MI200_MEM_SIZE_REG 0x0378c
85#define MI200_FB_LOCATION_BASE 0x6b300
86#define MI200_FB_LOCATION_TOP 0x6b304
87
88// AMD GPUs support 16 different virtual address spaces
89static constexpr int AMDGPU_VM_COUNT = 16;
90
91// These apertures have a fixed page size
92static constexpr int AMDGPU_AGP_PAGE_SIZE = 4096;
93static constexpr int AMDGPU_GART_PAGE_SIZE = 4096;
94static constexpr int AMDGPU_MMHUB_PAGE_SIZE = 4096;
95
96// Vega page size can be any power of 2 between 4kB and 1GB.
97static constexpr int AMDGPU_USER_PAGE_SIZE = 4096;
98
99namespace gem5
100{
101
102class AMDGPUVM : public Serializable
103{
104 private:
105 typedef struct GEM5_PACKED
106 {
107 // Page table addresses: from (Base + Start) to (End)
108 union
109 {
110 struct
111 {
112 uint32_t ptBaseL;
113 uint32_t ptBaseH;
114 };
116 };
117 union
118 {
119 struct
120 {
121 uint32_t ptStartL;
122 uint32_t ptStartH;
123 };
125 };
126 union
127 {
128 struct
129 {
130 uint32_t ptEndL;
131 uint32_t ptEndH;
132 };
134 };
136
138 {
147 } AMDGPUSysVMContext;
148
151
152 // MMHUB aperture. These addresses mirror the framebuffer, so addresses
153 // can be calculated by subtracting the base address.
154 uint64_t mmhubBase = 0x0;
155 uint64_t mmhubTop = 0x0;
156
162
163 public:
164 AMDGPUVM();
165
169 Addr gartBase();
173 Addr gartSize();
174
179 std::unordered_map<uint64_t, uint64_t> gartTable;
180
181 void readMMIO(PacketPtr pkt, Addr offset);
182 void writeMMIO(PacketPtr pkt, Addr offset);
183
187 bool
189 {
190 return ((vaddr >= vmContext0.agpBot) && (vaddr <= vmContext0.agpTop));
191 }
192
196
197 bool
199 {
200 return ((vaddr >= getMMHUBBase()) && (vaddr <= getMMHUBTop()));
201 }
202
205
208
209 bool
211 {
212 return ((vaddr >= vmContext0.fbBase) && (vaddr <= vmContext0.fbTop));
213 }
214
218
219 bool
221 {
222 return ((vaddr >= vmContext0.sysAddrL) &&
224 }
225
228
229 Addr
231 {
232 // Aperture ranges:
233 // NBIO 0x0 - 0x4280
234 // IH 0x4280 - 0x4980
235 // SDMA0 0x4980 - 0x5180
236 // SDMA1 0x5180 - 0x5980
237 // GRBM 0x8000 - 0xD000
238 // GFX 0x28000 - 0x3F000
239 // MMHUB 0x68000 - 0x6a120
240
241 if (IH_BASE <= addr && addr < IH_BASE + IH_SIZE)
242 return IH_BASE;
243 else if (SDMA0_BASE <= addr && addr < SDMA0_BASE + SDMA_SIZE)
244 return SDMA0_BASE;
245 else if (SDMA1_BASE <= addr && addr < SDMA1_BASE + SDMA_SIZE)
246 return SDMA1_BASE;
247 else if (GRBM_BASE <= addr && addr < GRBM_BASE + GRBM_SIZE)
248 return GRBM_BASE;
249 else if (GFX_BASE <= addr && addr < GFX_BASE + GFX_SIZE)
250 return GFX_BASE;
251 else if (MMHUB_BASE <= addr && addr < MMHUB_BASE + MMHUB_SIZE)
252 return MMHUB_BASE;
253 else {
254 warn_once("Accessing unsupported MMIO aperture! Assuming NBIO\n");
255 return NBIO_BASE;
256 }
257
258 }
259
260 // Gettig mapped aperture base addresses
261 Addr
263 {
264 if (addr < gartBase()) {
265 warn_once("Accessing unsupported frame apperture!\n");
266 return ~0;
267 } else if (gartBase() <= addr && addr < (gartBase() + gartSize())) {
268 return gartBase();
269 } else {
270 warn_once("Accessing unsupported frame apperture!\n");
271 return ~0;
272 }
273
274 }
275
279 void
280 setPageTableBase(uint16_t vmid, Addr ptBase)
281 {
282 vmContexts[vmid].ptBase = ptBase;
283 }
284
285 Addr
286 getPageTableBase(uint16_t vmid)
287 {
288 assert(vmid > 0 && vmid < vmContexts.size());
289 return vmContexts[vmid].ptBase;
290 }
291
292 Addr
293 getPageTableStart(uint16_t vmid)
294 {
295 assert(vmid > 0 && vmid < vmContexts.size());
296 return vmContexts[vmid].ptStart;
297 }
298
303 void invalidateTLBs();
304
305
306 void serialize(CheckpointOut &cp) const override;
307 void unserialize(CheckpointIn &cp) override;
308
317 {
318 private:
320
321 void translate(Range &range) const override;
322
323 public:
325 : TranslationGen(vaddr, size), vm(_vm)
326 {}
327 };
328
330 {
331 private:
333
334 void translate(Range &range) const override;
335
336 public:
338 : TranslationGen(vaddr, size), vm(_vm)
339 {}
340 };
341
343 {
344 private:
346
347 void translate(Range &range) const override;
348
349 public:
351 : TranslationGen(vaddr, size), vm(_vm)
352 {}
353 };
354
356 {
357 private:
360 int vmid;
361
362 void translate(Range &range) const override;
363
364 public:
365 UserTranslationGen(AMDGPUVM *_vm, VegaISA::Walker *_walker, int _vmid,
367 : TranslationGen(vaddr, size), vm(_vm), walker(_walker),
368 vmid(_vmid)
369 {}
370 };
371};
372
373} // namespace gem5
374
375#endif // __DEV_AMDGPU_AMDGPU_VM_HH__
static constexpr int AMDGPU_VM_COUNT
Definition amdgpu_vm.hh:89
static constexpr int AMDGPU_MMHUB_PAGE_SIZE
Definition amdgpu_vm.hh:94
static constexpr int AMDGPU_GART_PAGE_SIZE
Definition amdgpu_vm.hh:93
static constexpr int AMDGPU_USER_PAGE_SIZE
Definition amdgpu_vm.hh:97
static constexpr int AMDGPU_AGP_PAGE_SIZE
Definition amdgpu_vm.hh:92
Translation range generators.
Definition amdgpu_vm.hh:317
AGPTranslationGen(AMDGPUVM *_vm, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:324
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:285
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:301
GARTTranslationGen(AMDGPUVM *_vm, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:337
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:337
MMHUBTranslationGen(AMDGPUVM *_vm, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:350
UserTranslationGen(AMDGPUVM *_vm, VegaISA::Walker *_walker, int _vmid, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:365
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:353
uint64_t mmhubBase
Definition amdgpu_vm.hh:154
Addr getSysAddrRangeHigh()
Definition amdgpu_vm.hh:227
std::vector< AMDGPUVMContext > vmContexts
Definition amdgpu_vm.hh:150
void setMMHUBBase(Addr base)
Definition amdgpu_vm.hh:206
void invalidateTLBs()
Definition amdgpu_vm.cc:174
struct gem5::AMDGPUVM::GEM5_PACKED AMDGPUVMContext
Addr getSysAddrRangeLow()
Definition amdgpu_vm.hh:226
std::unordered_map< uint64_t, uint64_t > gartTable
Copy of GART table.
Definition amdgpu_vm.hh:179
bool inAGP(Addr vaddr)
Methods for resolving apertures.
Definition amdgpu_vm.hh:188
std::vector< VegaISA::GpuTLB * > gpu_tlbs
List of TLBs associated with the GPU device.
Definition amdgpu_vm.hh:161
void readMMIO(PacketPtr pkt, Addr offset)
Definition amdgpu_vm.cc:69
Addr getMMHUBTop()
Definition amdgpu_vm.hh:204
Addr getMmioAperture(Addr addr)
Definition amdgpu_vm.hh:230
Addr getFBOffset()
Definition amdgpu_vm.hh:217
void writeMMIO(PacketPtr pkt, Addr offset)
Definition amdgpu_vm.cc:105
uint64_t mmhubTop
Definition amdgpu_vm.hh:155
bool inFB(Addr vaddr)
Definition amdgpu_vm.hh:210
Addr getFrameAperture(Addr addr)
Definition amdgpu_vm.hh:262
AMDGPUSysVMContext vmContext0
Definition amdgpu_vm.hh:149
void setPageTableBase(uint16_t vmid, Addr ptBase)
Page table base/start accessors for user VMIDs.
Definition amdgpu_vm.hh:280
Addr getMMHUBBase()
Definition amdgpu_vm.hh:203
Addr getPageTableBase(uint16_t vmid)
Definition amdgpu_vm.hh:286
Addr gartBase()
Return base address of GART table in framebuffer.
Definition amdgpu_vm.cc:57
Addr getPageTableStart(uint16_t vmid)
Definition amdgpu_vm.hh:293
void unserialize(CheckpointIn &cp) override
Unserialize an object.
Definition amdgpu_vm.cc:235
bool inMMHUB(Addr vaddr)
Definition amdgpu_vm.hh:198
Addr gartSize()
Return size of GART in number of PTEs.
Definition amdgpu_vm.cc:63
void serialize(CheckpointOut &cp) const override
Serialize an object.
Definition amdgpu_vm.cc:184
Addr getAGPBase()
Definition amdgpu_vm.hh:195
void registerTLB(VegaISA::GpuTLB *tlb)
Control methods for TLBs associated with the GPU device.
Definition amdgpu_vm.cc:167
void setMMHUBTop(Addr top)
Definition amdgpu_vm.hh:207
bool inSys(Addr vaddr)
Definition amdgpu_vm.hh:220
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295
Basic support for object serialization.
Definition serialize.hh:170
TranslationGen is a base class for a generator object which returns information about address transla...
STL vector class.
Definition stl.hh:37
Definition test.h:63
#define warn_once(...)
Definition logging.hh:260
Bitfield< 23, 0 > offset
Definition types.hh:144
Bitfield< 59, 56 > tlb
Bitfield< 51, 12 > base
Definition pagetable.hh:141
Bitfield< 3 > addr
Definition types.hh:84
Reference material can be found at the JEDEC website: UFS standard http://www.jedec....
static constexpr uint32_t MMHUB_SIZE
static constexpr uint32_t SDMA_SIZE
static constexpr uint32_t GFX_BASE
std::ostream CheckpointOut
Definition serialize.hh:66
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition types.hh:147
static constexpr uint32_t MMHUB_BASE
static constexpr uint32_t SDMA0_BASE
static constexpr uint32_t GRBM_BASE
static constexpr uint32_t SDMA1_BASE
static constexpr uint32_t IH_BASE
static constexpr uint32_t GRBM_SIZE
static constexpr uint32_t NBIO_BASE
static constexpr uint32_t GFX_SIZE
static constexpr uint32_t IH_SIZE
Declaration of the Packet class.
This structure represents a single, contiguous translation, or carries information about whatever fau...

Generated on Mon Jul 10 2023 14:24:30 for gem5 by doxygen 1.9.7