gem5 [DEVELOP-FOR-25.1]
Loading...
Searching...
No Matches
amdgpu_vm.hh
Go to the documentation of this file.
1/*
2 * Copyright (c) 2021 Advanced Micro Devices, Inc.
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 * 1. Redistributions of source code must retain the above copyright notice,
9 * this list of conditions and the following disclaimer.
10 *
11 * 2. Redistributions in binary form must reproduce the above copyright notice,
12 * this list of conditions and the following disclaimer in the documentation
13 * and/or other materials provided with the distribution.
14 *
15 * 3. Neither the name of the copyright holder nor the names of its
16 * contributors may be used to endorse or promote products derived from this
17 * software without specific prior written permission.
18 *
19 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
20 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
23 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
24 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
25 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
26 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
27 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
28 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
29 * POSSIBILITY OF SUCH DAMAGE.
30 */
31
32#ifndef __DEV_AMDGPU_AMDGPU_VM_HH__
33#define __DEV_AMDGPU_AMDGPU_VM_HH__
34
35#include <vector>
36
38#include "base/intmath.hh"
40#include "mem/packet.hh"
42#include "sim/serialize.hh"
43
53
54#define mmVM_INVALIDATE_ENG17_ACK 0x08c6
55#define mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32 0x08eb
56#define mmVM_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32 0x08ec
57#define mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_LO32 0x090b
58#define mmVM_CONTEXT0_PAGE_TABLE_START_ADDR_HI32 0x090c
59#define mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_LO32 0x092b
60#define mmVM_CONTEXT0_PAGE_TABLE_END_ADDR_HI32 0x092c
61
62#define MI300X_CONTEXT0_PAGE_TABLE_BASE_ADDR_LO32 0x08cb
63#define MI300X_CONTEXT0_PAGE_TABLE_BASE_ADDR_HI32 0x08cc
64#define MI300X_CONTEXT0_PAGE_TABLE_START_ADDR_LO32 0x08eb
65#define MI300X_CONTEXT0_PAGE_TABLE_START_ADDR_HI32 0x08ec
66#define MI300X_CONTEXT0_PAGE_TABLE_END_ADDR_LO32 0x090b
67#define MI300X_CONTEXT0_PAGE_TABLE_END_ADDR_HI32 0x090c
68
69#define mmMC_VM_FB_OFFSET 0x096b
70#define mmMC_VM_FB_LOCATION_BASE 0x0980
71#define mmMC_VM_FB_LOCATION_TOP 0x0981
72#define mmMC_VM_AGP_TOP 0x0982
73#define mmMC_VM_AGP_BOT 0x0983
74#define mmMC_VM_AGP_BASE 0x0984
75#define mmMC_VM_SYSTEM_APERTURE_LOW_ADDR 0x0985
76#define mmMC_VM_SYSTEM_APERTURE_HIGH_ADDR 0x0986
77
78#define MI300X_VM_FB_OFFSET 0x0947
79#define MI300X_VM_FB_LOCATION_BASE 0x095c
80#define MI300X_VM_FB_LOCATION_TOP 0x095d
81#define MI300X_VM_AGP_TOP 0x095e
82#define MI300X_VM_AGP_BOT 0x095f
83#define MI300X_VM_AGP_BASE 0x0960
84#define MI300X_VM_SYSTEM_APERTURE_LOW_ADDR 0x0961
85#define MI300X_VM_SYSTEM_APERTURE_HIGH_ADDR 0x0962
86
87#define mmMMHUB_VM_INVALIDATE_ENG17_SEM 0x06e2
88#define mmMMHUB_VM_INVALIDATE_ENG17_REQ 0x06f4
89#define mmMMHUB_VM_INVALIDATE_ENG17_ACK 0x0706
90#define mmMMHUB_VM_FB_LOCATION_BASE 0x082c
91#define mmMMHUB_VM_FB_LOCATION_TOP 0x082d
92
93#define VEGA10_FB_LOCATION_BASE 0x6a0b0
94#define VEGA10_FB_LOCATION_TOP 0x6a0b4
95
96#define MI100_MEM_SIZE_REG 0x0378c
97#define MI100_FB_LOCATION_BASE 0x6ac00
98#define MI100_FB_LOCATION_TOP 0x6ac04
99
100#define MI200_MEM_SIZE_REG 0x0378c
101#define MI200_FB_LOCATION_BASE 0x6b300
102#define MI200_FB_LOCATION_TOP 0x6b304
103
104#define MI300X_MEM_SIZE_REG 0x0378c
105#define MI300X_FB_LOCATION_BASE 0x63270
106#define MI300X_FB_LOCATION_TOP 0x63274
107#define MI300X_VM_INVALIDATE_ENG17_ACK 0x08a6
108
109// AMD GPUs support 16 different virtual address spaces
110static constexpr int AMDGPU_VM_COUNT = 16;
111
112// These apertures have a fixed page size
113static constexpr int AMDGPU_AGP_PAGE_SIZE = 4096;
114static constexpr int AMDGPU_GART_PAGE_SIZE = 4096;
115static constexpr int AMDGPU_MMHUB_PAGE_SIZE = 4096;
116
117// Vega page size can be any power of 2 between 4kB and 1GB.
118static constexpr int AMDGPU_USER_PAGE_SIZE = 4096;
119
120namespace gem5
121{
122
133
134class AMDGPUDevice;
135
136class AMDGPUVM : public Serializable
137{
138 private:
140
141 typedef struct GEM5_PACKED
142 {
143 // Page table addresses: from (Base + Start) to (End)
144 union
145 {
146 struct
147 {
148 uint32_t ptBaseL;
149 uint32_t ptBaseH;
150 };
152 };
153 union
154 {
155 struct
156 {
157 uint32_t ptStartL;
158 uint32_t ptStartH;
159 };
161 };
162 union
163 {
164 struct
165 {
166 uint32_t ptEndL;
167 uint32_t ptEndH;
168 };
170 };
172
184
187
188 // MMHUB aperture. These addresses mirror the framebuffer, so addresses
189 // can be calculated by subtracting the base address.
190 uint64_t mmhubBase = 0x0;
191 uint64_t mmhubTop = 0x0;
192
198
205
206 std::array<AddrRange, NUM_MMIO_RANGES> mmioRanges;
207
208 public:
209 AMDGPUVM();
210
211 void setGPUDevice(AMDGPUDevice *gpu_device) { gpuDevice = gpu_device; }
212
216 Addr gartBase();
220 Addr gartSize();
221
222 bool
224 {
225 return ((paddr >= gartBase()) && (paddr <= (gartBase() + gartSize())));
226 }
227
232 std::unordered_map<uint64_t, uint64_t> gartTable;
233
234 void readMMIO(PacketPtr pkt, Addr offset);
235 void writeMMIO(PacketPtr pkt, Addr offset);
236
240 bool
242 {
243 return ((vaddr >= vmContext0.agpBot) && (vaddr <= vmContext0.agpTop));
244 }
245
246 Addr getAGPBot() { return vmContext0.agpBot; }
247 Addr getAGPTop() { return vmContext0.agpTop; }
248 Addr getAGPBase() { return vmContext0.agpBase; }
249
250 bool
252 {
253 return ((vaddr >= getMMHUBBase()) && (vaddr <= getMMHUBTop()));
254 }
255
258
261
262 bool
264 {
265 return ((vaddr >= vmContext0.fbBase) && (vaddr <= vmContext0.fbTop));
266 }
267
268 Addr getFBBase() { return vmContext0.fbBase; }
269 Addr getFBTop() { return vmContext0.fbTop; }
270 Addr getFBOffset() { return vmContext0.fbOffset; }
271
272 bool
274 {
275 return ((vaddr >= vmContext0.sysAddrL) &&
276 (vaddr <= vmContext0.sysAddrH));
277 }
278
279 Addr getSysAddrRangeLow () { return vmContext0.sysAddrL; }
280 Addr getSysAddrRangeHigh () { return vmContext0.sysAddrH; }
281
282 void setMMIOAperture(mmio_range_t mmio_aperture, AddrRange range);
284 AddrRange getMMIORange(mmio_range_t mmio_aperture);
285
286 // Getting mapped aperture base addresses
287 Addr
289 {
290 if (addr < gartBase()) {
291 warn_once("Accessing unsupported frame apperture!\n");
292 return ~0;
293 } else if (gartBase() <= addr && addr < (gartBase() + gartSize())) {
294 return gartBase();
295 } else {
296 warn_once("Accessing unsupported frame apperture!\n");
297 return ~0;
298 }
299
300 }
301
305 void
306 setPageTableBase(uint16_t vmid, Addr ptBase)
307 {
308 vmContexts[vmid].ptBase = ptBase;
309 }
310
311 void
312 setPageTableBaseL(uint16_t vmid, uint32_t ptBaseL)
313 {
314 vmContexts[vmid].ptBaseL = ptBaseL;
315 }
316
317 void
318 setPageTableBaseH(uint16_t vmid, uint32_t ptBaseH)
319 {
320 vmContexts[vmid].ptBaseH = ptBaseH;
321 }
322
323 Addr
324 getPageTableBase(uint16_t vmid)
325 {
326 assert(vmid > 0 && vmid < vmContexts.size());
327 return vmContexts[vmid].ptBase;
328 }
329
330 void
331 setPageTableStart(uint16_t vmid, Addr ptStart)
332 {
333 vmContexts[vmid].ptStart = ptStart;
334 }
335
336 void
337 setPageTableStartL(uint16_t vmid, uint32_t ptStartL)
338 {
339 vmContexts[vmid].ptStartL = ptStartL;
340 }
341
342 void
343 setPageTableStartH(uint16_t vmid, uint32_t ptStartH)
344 {
345 vmContexts[vmid].ptStartH = ptStartH;
346 }
347
348 Addr
349 getPageTableStart(uint16_t vmid)
350 {
351 assert(vmid > 0 && vmid < vmContexts.size());
352 return vmContexts[vmid].ptStart;
353 }
354
355 void
356 setPageTableEnd(uint16_t vmid, Addr ptEnd)
357 {
358 vmContexts[vmid].ptEnd = ptEnd;
359 }
360
361 void
362 setPageTableEndL(uint16_t vmid, uint32_t ptEndL)
363 {
364 vmContexts[vmid].ptEndL = ptEndL;
365 }
366
367 void
368 setPageTableEndH(uint16_t vmid, uint32_t ptEndH)
369 {
370 vmContexts[vmid].ptEndH = ptEndH;
371 }
372
377 void invalidateTLBs();
378
379
380 void serialize(CheckpointOut &cp) const override;
381 void unserialize(CheckpointIn &cp) override;
382
391 {
392 private:
394
395 void translate(Range &range) const override;
396
397 public:
401 };
402
404 {
405 private:
407
408 void translate(Range &range) const override;
409
410 public:
414 };
415
417 {
418 private:
420
421 void translate(Range &range) const override;
422
423 public:
427 };
428
430 {
431 private:
434 int vmid;
435
436 void translate(Range &range) const override;
437
438 public:
439 UserTranslationGen(AMDGPUVM *_vm, VegaISA::Walker *_walker, int _vmid,
441 : TranslationGen(vaddr, size), vm(_vm), walker(_walker),
442 vmid(_vmid)
443 {}
444 };
445};
446
447} // namespace gem5
448
449#endif // __DEV_AMDGPU_AMDGPU_VM_HH__
static constexpr int AMDGPU_VM_COUNT
Definition amdgpu_vm.hh:110
static constexpr int AMDGPU_MMHUB_PAGE_SIZE
Definition amdgpu_vm.hh:115
static constexpr int AMDGPU_GART_PAGE_SIZE
Definition amdgpu_vm.hh:114
static constexpr int AMDGPU_USER_PAGE_SIZE
Definition amdgpu_vm.hh:118
static constexpr int AMDGPU_AGP_PAGE_SIZE
Definition amdgpu_vm.hh:113
Device model for an AMD GPU.
AGPTranslationGen(AMDGPUVM *_vm, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:398
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:393
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:409
GARTTranslationGen(AMDGPUVM *_vm, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:411
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:445
MMHUBTranslationGen(AMDGPUVM *_vm, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:424
UserTranslationGen(AMDGPUVM *_vm, VegaISA::Walker *_walker, int _vmid, Addr vaddr, Addr size)
Definition amdgpu_vm.hh:439
void translate(Range &range) const override
Subclasses implement this function to complete TranslationGen.
Definition amdgpu_vm.cc:461
uint64_t mmhubBase
Definition amdgpu_vm.hh:190
void writeMMIOGfx900(PacketPtr pkt, Addr offset)
Different MMIO implements for different GFX versions with overlapping MMIO addresses.
Definition amdgpu_vm.cc:136
void setPageTableEndH(uint16_t vmid, uint32_t ptEndH)
Definition amdgpu_vm.hh:368
Addr getSysAddrRangeHigh()
Definition amdgpu_vm.hh:280
void setMMIOAperture(mmio_range_t mmio_aperture, AddrRange range)
Definition amdgpu_vm.cc:62
std::vector< AMDGPUVMContext > vmContexts
Definition amdgpu_vm.hh:186
void setPageTableStart(uint16_t vmid, Addr ptStart)
Definition amdgpu_vm.hh:331
std::array< AddrRange, NUM_MMIO_RANGES > mmioRanges
Definition amdgpu_vm.hh:206
void setMMHUBBase(Addr base)
Definition amdgpu_vm.hh:259
AddrRange getMMIORange(mmio_range_t mmio_aperture)
Definition amdgpu_vm.cc:68
void invalidateTLBs()
Definition amdgpu_vm.cc:282
struct gem5::AMDGPUVM::GEM5_PACKED AMDGPUVMContext
Addr getSysAddrRangeLow()
Definition amdgpu_vm.hh:279
void setPageTableEndL(uint16_t vmid, uint32_t ptEndL)
Definition amdgpu_vm.hh:362
std::unordered_map< uint64_t, uint64_t > gartTable
Copy of GART table.
Definition amdgpu_vm.hh:232
bool inAGP(Addr vaddr)
Methods for resolving apertures.
Definition amdgpu_vm.hh:241
std::vector< VegaISA::GpuTLB * > gpu_tlbs
List of TLBs associated with the GPU device.
Definition amdgpu_vm.hh:197
void readMMIO(PacketPtr pkt, Addr offset)
Definition amdgpu_vm.cc:99
void setPageTableStartL(uint16_t vmid, uint32_t ptStartL)
Definition amdgpu_vm.hh:337
void setPageTableBaseH(uint16_t vmid, uint32_t ptBaseH)
Definition amdgpu_vm.hh:318
Addr getMMHUBTop()
Definition amdgpu_vm.hh:257
const AddrRange & getMMIOAperture(Addr addr)
Definition amdgpu_vm.cc:74
void setPageTableBaseL(uint16_t vmid, uint32_t ptBaseL)
Definition amdgpu_vm.hh:312
gem5::AMDGPUVM::AMDGPUSysVMContext AMDGPUSysVMContext
Addr getFBOffset()
Definition amdgpu_vm.hh:270
void setGPUDevice(AMDGPUDevice *gpu_device)
Definition amdgpu_vm.hh:211
void writeMMIO(PacketPtr pkt, Addr offset)
Definition amdgpu_vm.cc:260
uint64_t mmhubTop
Definition amdgpu_vm.hh:191
bool inFB(Addr vaddr)
Definition amdgpu_vm.hh:263
Addr getFrameAperture(Addr addr)
Definition amdgpu_vm.hh:288
AMDGPUSysVMContext vmContext0
Definition amdgpu_vm.hh:185
void setPageTableBase(uint16_t vmid, Addr ptBase)
Page table base/start accessors for user VMIDs.
Definition amdgpu_vm.hh:306
Addr getMMHUBBase()
Definition amdgpu_vm.hh:256
AMDGPUDevice * gpuDevice
Definition amdgpu_vm.hh:139
Addr getPageTableBase(uint16_t vmid)
Definition amdgpu_vm.hh:324
Addr gartBase()
Return base address of GART table in framebuffer.
Definition amdgpu_vm.cc:87
void setPageTableEnd(uint16_t vmid, Addr ptEnd)
Definition amdgpu_vm.hh:356
Addr getPageTableStart(uint16_t vmid)
Definition amdgpu_vm.hh:349
void writeMMIOGfx940(PacketPtr pkt, Addr offset)
Definition amdgpu_vm.cc:198
bool inGARTRange(Addr paddr)
Definition amdgpu_vm.hh:223
void unserialize(CheckpointIn &cp) override
Unserialize an object.
Definition amdgpu_vm.cc:343
bool inMMHUB(Addr vaddr)
Definition amdgpu_vm.hh:251
void setPageTableStartH(uint16_t vmid, uint32_t ptStartH)
Definition amdgpu_vm.hh:343
Addr gartSize()
Return size of GART in number of PTEs.
Definition amdgpu_vm.cc:93
void serialize(CheckpointOut &cp) const override
Serialize an object.
Definition amdgpu_vm.cc:292
Addr getAGPBase()
Definition amdgpu_vm.hh:248
void registerTLB(VegaISA::GpuTLB *tlb)
Control methods for TLBs associated with the GPU device.
Definition amdgpu_vm.cc:275
void setMMHUBTop(Addr top)
Definition amdgpu_vm.hh:260
bool inSys(Addr vaddr)
Definition amdgpu_vm.hh:273
The AddrRange class encapsulates an address range, and supports a number of tests to check if two ran...
Definition addr_range.hh:82
TranslationGen(Addr new_start, Addr new_size)
The starting virtual address and the size of the entire region being translated.
STL vector class.
Definition stl.hh:37
Definition test.h:63
#define warn_once(...)
Definition logging.hh:292
Bitfield< 23, 0 > offset
Definition types.hh:144
Bitfield< 59, 56 > tlb
Bitfield< 3 > addr
Definition types.hh:84
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36
std::ostream CheckpointOut
Definition serialize.hh:66
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition types.hh:147
Packet * PacketPtr
mmio_range_t
Definition amdgpu_vm.hh:124
@ GRBM_MMIO_RANGE
Definition amdgpu_vm.hh:128
@ GFX_MMIO_RANGE
Definition amdgpu_vm.hh:127
@ IH_MMIO_RANGE
Definition amdgpu_vm.hh:129
@ MMHUB_MMIO_RANGE
Definition amdgpu_vm.hh:126
@ SMU_MMIO_RANGE
Definition amdgpu_vm.hh:130
@ NUM_MMIO_RANGES
Definition amdgpu_vm.hh:131
@ NBIO_MMIO_RANGE
Definition amdgpu_vm.hh:125
Declaration of the Packet class.
This structure represents a single, contiguous translation, or carries information about whatever fau...

Generated on Mon Oct 27 2025 04:13:01 for gem5 by doxygen 1.14.0