gem5
[DEVELOP-FOR-23.0]
|
Device model for an AMD GPU. More...
#include <amdgpu_device.hh>
Public Member Functions | |
AMDGPUDevice (const AMDGPUDeviceParams &p) | |
void | intrPost () |
Methods inherited from PciDevice. More... | |
Tick | writeConfig (PacketPtr pkt) override |
Write to the PCI config space data that is stored locally. More... | |
Tick | readConfig (PacketPtr pkt) override |
Read from the PCI config space data that is stored locally. More... | |
Tick | read (PacketPtr pkt) override |
Pure virtual function that the device must implement. More... | |
Tick | write (PacketPtr pkt) override |
Pure virtual function that the device must implement. More... | |
AddrRangeList | getAddrRanges () const override |
Every PIO device is obliged to provide an implementation that returns the address ranges the device responds to. More... | |
void | serialize (CheckpointOut &cp) const override |
Checkpoint support. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
AMDGPUInterruptHandler * | getIH () |
Get handles to GPU blocks. More... | |
SDMAEngine * | getSDMAById (int id) |
SDMAEngine * | getSDMAEngine (Addr offset) |
AMDGPUVM & | getVM () |
AMDGPUMemoryManager * | getMemMgr () |
GPUCommandProcessor * | CP () |
void | setDoorbellType (uint32_t offset, QueueType qt) |
Set handles to GPU blocks. More... | |
void | setSDMAEngine (Addr offset, SDMAEngine *eng) |
bool | haveRegVal (uint32_t addr) |
Register value getter/setter. More... | |
uint32_t | getRegVal (uint32_t addr) |
void | setRegVal (uint32_t addr, uint32_t value) |
RequestorID | vramRequestorId () |
Methods related to translations and system/device memory. More... | |
uint16_t | lastVMID () |
uint16_t | allocateVMID (uint16_t pasid) |
void | deallocateVmid (uint16_t vmid) |
void | deallocatePasid (uint16_t pasid) |
void | deallocateAllQueues () |
void | mapDoorbellToVMID (Addr doorbell, uint16_t vmid) |
uint16_t | getVMID (Addr doorbell) |
std::unordered_map< uint16_t, std::set< int > > & | getUsedVMIDs () |
void | insertQId (uint16_t vmid, int id) |
GfxVersion | getGfxVersion () const |
![]() | |
Addr | pciToDma (Addr pci_addr) const |
void | intrPost () |
void | intrClear () |
uint8_t | interruptLine () const |
AddrRangeList | getAddrRanges () const override |
Determine the address ranges that this device responds to. More... | |
PciDevice (const PciDeviceParams &params) | |
Constructor for PCI Dev. More... | |
void | serialize (CheckpointOut &cp) const override |
Serialize this object to the given output stream. More... | |
void | unserialize (CheckpointIn &cp) override |
Reconstruct the state of this object from a checkpoint. More... | |
const PciBusAddr & | busAddr () const |
![]() | |
DmaDevice (const Params &p) | |
virtual | ~DmaDevice ()=default |
void | dmaWrite (Addr addr, int size, Event *event, uint8_t *data, uint32_t sid, uint32_t ssid, Tick delay=0) |
void | dmaWrite (Addr addr, int size, Event *event, uint8_t *data, Tick delay=0) |
void | dmaRead (Addr addr, int size, Event *event, uint8_t *data, uint32_t sid, uint32_t ssid, Tick delay=0) |
void | dmaRead (Addr addr, int size, Event *event, uint8_t *data, Tick delay=0) |
bool | dmaPending () const |
void | init () override |
init() is called after all C++ SimObjects have been created and all ports are connected. More... | |
unsigned int | cacheBlockSize () const |
Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) override |
Get a port with a given name and index. More... | |
![]() | |
PioDevice (const Params &p) | |
virtual | ~PioDevice () |
void | init () override |
init() is called after all C++ SimObjects have been created and all ports are connected. More... | |
Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) override |
Get a port with a given name and index. More... | |
![]() | |
ClockedObject (const ClockedObjectParams &p) | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
![]() | |
const Params & | params () const |
SimObject (const Params &p) | |
virtual | ~SimObject () |
virtual void | loadState (CheckpointIn &cp) |
loadState() is called on each SimObject when restoring from a checkpoint. More... | |
virtual void | initState () |
initState() is called on each SimObject when not restoring from a checkpoint. More... | |
virtual void | regProbePoints () |
Register probe points for this object. More... | |
virtual void | regProbeListeners () |
Register probe listeners for this object. More... | |
ProbeManager * | getProbeManager () |
Get the probe manager for this object. More... | |
virtual void | startup () |
startup() is the final initialization call before simulation. More... | |
DrainState | drain () override |
Provide a default implementation of the drain interface for objects that don't need draining. More... | |
virtual void | memWriteback () |
Write back dirty buffers to memory using functional writes. More... | |
virtual void | memInvalidate () |
Invalidate the contents of memory buffers. More... | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. More... | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. More... | |
![]() | |
EventQueue * | eventQueue () const |
void | schedule (Event &event, Tick when) |
void | deschedule (Event &event) |
void | reschedule (Event &event, Tick when, bool always=false) |
void | schedule (Event *event, Tick when) |
void | deschedule (Event *event) |
void | reschedule (Event *event, Tick when, bool always=false) |
void | wakeupEventQueue (Tick when=(Tick) -1) |
This function is not needed by the usual gem5 event loop but may be necessary in derived EventQueues which host gem5 on other schedulers. More... | |
void | setCurTick (Tick newVal) |
EventManager (EventManager &em) | |
Event manager manages events in the event queue. More... | |
EventManager (EventManager *em) | |
EventManager (EventQueue *eq) | |
![]() | |
Serializable () | |
virtual | ~Serializable () |
void | serializeSection (CheckpointOut &cp, const char *name) const |
Serialize an object into a new section. More... | |
void | serializeSection (CheckpointOut &cp, const std::string &name) const |
void | unserializeSection (CheckpointIn &cp, const char *name) |
Unserialize a child object. More... | |
void | unserializeSection (CheckpointIn &cp, const std::string &name) |
![]() | |
DrainState | drainState () const |
Return the current drain state of an object. More... | |
virtual void | notifyFork () |
Notify a child process of a fork. More... | |
![]() | |
Group (Group *parent, const char *name=nullptr) | |
Construct a new statistics group. More... | |
virtual | ~Group () |
virtual void | regStats () |
Callback to set stat parameters. More... | |
virtual void | resetStats () |
Callback to reset stats. More... | |
virtual void | preDumpStats () |
Callback before stats are dumped. More... | |
void | addStat (statistics::Info *info) |
Register a stat with this group. More... | |
const std::map< std::string, Group * > & | getStatGroups () const |
Get all child groups associated with this object. More... | |
const std::vector< Info * > & | getStats () const |
Get all stats associated with this object. More... | |
void | addStatGroup (const char *name, Group *block) |
Add a stat block as a child of this block. More... | |
const Info * | resolveStat (std::string name) const |
Resolve a stat by its name within this group. More... | |
void | mergeStatGroup (Group *block) |
Merge the contents (stats & children) of a block to this block. More... | |
Group ()=delete | |
Group (const Group &)=delete | |
Group & | operator= (const Group &)=delete |
![]() | |
Named (const std::string &name_) | |
virtual | ~Named ()=default |
virtual std::string | name () const |
![]() | |
void | updateClockPeriod () |
Update the tick to the current tick. More... | |
Tick | clockEdge (Cycles cycles=Cycles(0)) const |
Determine the tick when a cycle begins, by default the current one, but the argument also enables the caller to determine a future cycle. More... | |
Cycles | curCycle () const |
Determine the current cycle, corresponding to a tick aligned to a clock edge. More... | |
Tick | nextCycle () const |
Based on the clock of the object, determine the start tick of the first cycle that is at least one cycle in the future. More... | |
uint64_t | frequency () const |
Tick | clockPeriod () const |
double | voltage () const |
Cycles | ticksToCycles (Tick t) const |
Tick | cyclesToTicks (Cycles c) const |
Private Types | |
using | GPURegMap = std::unordered_map< uint32_t, uint64_t > |
Structures to hold registers, doorbells, and some frame memory. More... | |
typedef void(SDMAEngine::* | sdmaFuncPtr) (uint32_t) |
Private Member Functions | |
void | dispatchAccess (PacketPtr pkt, bool read) |
Convert a PCI packet into a response. More... | |
void | readFrame (PacketPtr pkt, Addr offset) |
Helper methods to handle specific BAR read/writes. More... | |
void | readDoorbell (PacketPtr pkt, Addr offset) |
void | readMMIO (PacketPtr pkt, Addr offset) |
void | writeFrame (PacketPtr pkt, Addr offset) |
void | writeDoorbell (PacketPtr pkt, Addr offset) |
void | writeMMIO (PacketPtr pkt, Addr offset) |
bool | isROM (Addr addr) const |
void | readROM (PacketPtr pkt) |
void | writeROM (PacketPtr pkt) |
Private Attributes | |
GPURegMap | regs |
std::unordered_map< uint32_t, QueueType > | doorbells |
AddrRange | romRange |
VGA ROM methods. More... | |
std::array< uint8_t, ROM_SIZE > | rom |
AMDMMIOReader | mmioReader |
MMIO reader to populate device registers map. More... | |
AMDGPUNbio | nbio |
Blocks of the GPU. More... | |
AMDGPUMemoryManager * | gpuMemMgr |
AMDGPUInterruptHandler * | deviceIH |
AMDGPUVM | gpuvm |
PM4PacketProcessor * | pm4PktProc |
GPUCommandProcessor * | cp |
std::unordered_map< uint32_t, SDMAEngine * > | sdmaEngs |
std::unordered_map< uint32_t, SDMAEngine * > | sdmaIds |
std::unordered_map< uint32_t, AddrRange > | sdmaMmios |
std::unordered_map< uint32_t, sdmaFuncPtr > | sdmaFunc |
bool | checkpoint_before_mmios |
Initial checkpoint support variables. More... | |
int | init_interrupt_count |
std::unordered_map< uint16_t, uint16_t > | idMap |
std::unordered_map< Addr, uint16_t > | doorbellVMIDMap |
std::unordered_map< uint16_t, std::set< int > > | usedVMIDs |
uint16_t | _lastVMID |
memory::PhysicalMemory | deviceMem |
GfxVersion | gfx_version = GfxVersion::gfx900 |
Additional Inherited Members | |
![]() | |
typedef DmaDeviceParams | Params |
![]() | |
using | Params = PioDeviceParams |
![]() | |
using | Params = ClockedObjectParams |
Parameters of ClockedObject. More... | |
![]() | |
typedef SimObjectParams | Params |
![]() | |
static void | serializeAll (const std::string &cpt_dir) |
Create a checkpoint by serializing all SimObjects in the system. More... | |
static SimObject * | find (const char *name) |
Find the SimObject with the given name and return a pointer to it. More... | |
static void | setSimObjectResolver (SimObjectResolver *resolver) |
There is a single object name resolver, and it is only set when simulation is restoring from checkpoints. More... | |
static SimObjectResolver * | getSimObjectResolver () |
There is a single object name resolver, and it is only set when simulation is restoring from checkpoints. More... | |
![]() | |
static const std::string & | currentSection () |
Gets the fully-qualified name of the active section. More... | |
static void | generateCheckpointOut (const std::string &cpt_dir, std::ofstream &outstream) |
Generate a checkpoint file so that the serialization can be routed to it. More... | |
![]() | |
PowerState * | powerState |
![]() | |
bool | getBAR (Addr addr, int &num, Addr &offs) |
Which base address register (if any) maps the given address? More... | |
![]() | |
Drainable () | |
virtual | ~Drainable () |
virtual void | drainResume () |
Resume execution after a successful drain. More... | |
void | signalDrainDone () const |
Signal that an object is drained. More... | |
![]() | |
Clocked (ClockDomain &clk_domain) | |
Create a clocked object and set the clock domain based on the parameters. More... | |
Clocked (Clocked &)=delete | |
Clocked & | operator= (Clocked &)=delete |
virtual | ~Clocked () |
Virtual destructor due to inheritance. More... | |
void | resetClock () const |
Reset the object's clock using the current global tick value. More... | |
virtual void | clockPeriodUpdated () |
A hook subclasses can implement so they can do any extra work that's needed when the clock rate is changed. More... | |
![]() | |
const PciBusAddr | _busAddr |
PCIConfig | config |
The current config space. More... | |
std::vector< MSIXTable > | msix_table |
MSIX Table and PBA Structures. More... | |
std::vector< MSIXPbaEntry > | msix_pba |
std::array< PciBar *, 6 > | BARs {} |
PciHost::DeviceInterface | hostInterface |
Tick | pioDelay |
Tick | configDelay |
const int | PMCAP_BASE |
The capability list structures and base addresses. More... | |
const int | PMCAP_ID_OFFSET |
const int | PMCAP_PC_OFFSET |
const int | PMCAP_PMCS_OFFSET |
PMCAP | pmcap |
const int | MSICAP_BASE |
MSICAP | msicap |
const int | MSIXCAP_BASE |
const int | MSIXCAP_ID_OFFSET |
const int | MSIXCAP_MXC_OFFSET |
const int | MSIXCAP_MTAB_OFFSET |
const int | MSIXCAP_MPBA_OFFSET |
int | MSIX_TABLE_OFFSET |
int | MSIX_TABLE_END |
int | MSIX_PBA_OFFSET |
int | MSIX_PBA_END |
MSIXCAP | msixcap |
const int | PXCAP_BASE |
PXCAP | pxcap |
![]() | |
DmaPort | dmaPort |
![]() | |
System * | sys |
PioPort< PioDevice > | pioPort |
The pioPort that handles the requests for us and provides us requests that it sees. More... | |
![]() | |
const SimObjectParams & | _params |
Cached copy of the object parameters. More... | |
![]() | |
EventQueue * | eventq |
A pointer to this object's event queue. More... | |
Device model for an AMD GPU.
This models the interface between the PCI bus and the various IP blocks behind it. It translates requests to the various BARs and sends them to the appropriate IP block. BAR0 requests are VRAM requests that go to device memory; BAR2 requests are doorbells, which are decoded and sent to the corresponding IP block; BAR5 is the MMIO interface, which writes data values to registers controlling the IP blocks.
Definition at line 62 of file amdgpu_device.hh.
|
private |
Structures to hold registers, doorbells, and some frame memory.
Definition at line 89 of file amdgpu_device.hh.
|
private |
Definition at line 125 of file amdgpu_device.hh.
gem5::AMDGPUDevice::AMDGPUDevice | ( | const AMDGPUDeviceParams & | p | ) |
Definition at line 55 of file amdgpu_device.cc.
References AMDGPU_MP0_SMN_C2PMSG_33, gem5::PciDevice::config, cp, deviceIH, DPRINTF, gem5::AMDGPUMemoryManager::getRequestorID(), gfx_version, gpuMemMgr, gpuvm, gem5::GPUCommandProcessor::hsaPacketProc(), gem5::VegaISA::m, MI100_FB_LOCATION_BASE, MI100_FB_LOCATION_TOP, MI100_MEM_SIZE_REG, MI200_FB_LOCATION_BASE, MI200_FB_LOCATION_TOP, MI200_MEM_SIZE_REG, mmioReader, nbio, gem5::VegaISA::p, panic, pm4PktProc, gem5::RangeSize(), gem5::PioDevice::read(), gem5::AMDMMIOReader::readMMIOTrace(), rom, gem5::ROM_SIZE, romRange, gem5::VegaISA::s, sdmaFunc, sdmaIds, sdmaMmios, gem5::SDMAEngine::setGfxBaseHi(), gem5::SDMAEngine::setGfxBaseLo(), gem5::SDMAEngine::setGfxDoorbellLo(), gem5::SDMAEngine::setGfxDoorbellOffsetLo(), gem5::SDMAEngine::setGfxRptrHi(), gem5::SDMAEngine::setGfxRptrLo(), gem5::SDMAEngine::setGfxSize(), gem5::SDMAEngine::setGfxWptrHi(), gem5::SDMAEngine::setGfxWptrLo(), gem5::PM4PacketProcessor::setGPUDevice(), gem5::GPUCommandProcessor::setGPUDevice(), gem5::AMDGPUNbio::setGPUDevice(), gem5::AMDGPUInterruptHandler::setGPUDevice(), gem5::HSAPacketProcessor::setGPUDevice(), gem5::AMDGPUVM::setMMHUBBase(), gem5::AMDGPUVM::setMMHUBTop(), gem5::SDMAEngine::setPageBaseLo(), gem5::SDMAEngine::setPageDoorbellLo(), gem5::SDMAEngine::setPageDoorbellOffsetLo(), gem5::SDMAEngine::setPageRptrHi(), gem5::SDMAEngine::setPageRptrLo(), gem5::SDMAEngine::setPageSize(), gem5::SDMAEngine::setPageWptrLo(), setRegVal(), sc_dt::to_string(), VEGA10_FB_LOCATION_BASE, VEGA10_FB_LOCATION_TOP, and gem5::VGA_ROM_DEFAULT.
uint16_t gem5::AMDGPUDevice::allocateVMID | ( | uint16_t | pasid | ) |
Definition at line 714 of file amdgpu_device.cc.
References _lastVMID, gem5::AMDGPU_VM_COUNT, idMap, panic, and usedVMIDs.
Referenced by gem5::PM4PacketProcessor::mapProcess().
|
inline |
Definition at line 182 of file amdgpu_device.hh.
References cp.
Referenced by gem5::PM4PacketProcessor::mapProcess(), gem5::PM4PacketProcessor::processMQD(), and gem5::PM4PacketProcessor::unmapQueues().
void gem5::AMDGPUDevice::deallocateAllQueues | ( | ) |
Definition at line 747 of file amdgpu_device.cc.
References idMap, sdmaEngs, and usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
void gem5::AMDGPUDevice::deallocatePasid | ( | uint16_t | pasid | ) |
Definition at line 735 of file amdgpu_device.cc.
References idMap, and usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
void gem5::AMDGPUDevice::deallocateVmid | ( | uint16_t | vmid | ) |
Definition at line 729 of file amdgpu_device.cc.
References usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
|
private |
Convert a PCI packet into a response.
Definition at line 256 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Packet::makeAtomicResponse(), and read().
|
overridevirtual |
Every PIO device is obliged to provide an implementation that returns the address ranges the device responds to.
Implements gem5::PioDevice.
Definition at line 198 of file amdgpu_device.cc.
References gem5::PciDevice::getAddrRanges(), gem5::VegaISA::r, and romRange.
|
inline |
Definition at line 215 of file amdgpu_device.hh.
References gfx_version.
Referenced by gem5::PM4PacketProcessor::decodeHeader(), and gem5::GPUCommandProcessor::submitDispatchPkt().
|
inline |
Get handles to GPU blocks.
Definition at line 177 of file amdgpu_device.hh.
References deviceIH.
Referenced by gem5::PM4PacketProcessor::releaseMemDone(), and gem5::SDMAEngine::trap().
|
inline |
Definition at line 181 of file amdgpu_device.hh.
References gpuMemMgr.
Referenced by gem5::SDMAEngine::copy(), gem5::SDMAEngine::copyReadData(), gem5::SDMAEngine::ptePde(), and gem5::SDMAEngine::writeReadData().
uint32_t gem5::AMDGPUDevice::getRegVal | ( | uint32_t | addr | ) |
Definition at line 539 of file amdgpu_device.cc.
References gem5::X86ISA::addr, DPRINTF, and regs.
Referenced by gem5::AMDGPUNbio::readMMIO().
SDMAEngine * gem5::AMDGPUDevice::getSDMAById | ( | int | id | ) |
PM4 packets select SDMAs using an integer ID. This method simply maps the integer ID to a pointer to the SDMA and checks for invalid IDs.
Definition at line 568 of file amdgpu_device.cc.
References gem5::ArmISA::id, and sdmaIds.
Referenced by gem5::PM4PacketProcessor::processSDMAMQD(), and writeMMIO().
SDMAEngine * gem5::AMDGPUDevice::getSDMAEngine | ( | Addr | offset | ) |
Definition at line 580 of file amdgpu_device.cc.
References gem5::ArmISA::offset, and sdmaEngs.
Referenced by writeDoorbell().
std::unordered_map< uint16_t, std::set< int > > & gem5::AMDGPUDevice::getUsedVMIDs | ( | ) |
Definition at line 764 of file amdgpu_device.cc.
References usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
|
inline |
Definition at line 180 of file amdgpu_device.hh.
References gpuvm.
Referenced by gem5::PM4PacketProcessor::decodeHeader(), gem5::SDMAEngine::getDeviceAddress(), gem5::PM4PacketProcessor::getGARTAddr(), gem5::SDMAEngine::getGARTAddr(), gem5::PM4PacketProcessor::mapProcess(), gem5::SDMAEngine::ptePde(), gem5::GPUCommandProcessor::submitDispatchPkt(), gem5::PM4PacketProcessor::translate(), gem5::GPUCommandProcessor::translate(), gem5::SDMAEngine::translate(), gem5::HSAPacketProcessor::translate(), gem5::VegaISA::GpuTLB::translationReturn(), gem5::AMDGPUNbio::writeFrame(), gem5::AMDGPUNbio::writeMMIO(), and gem5::SDMAEngine::writeReadData().
|
inline |
Definition at line 210 of file amdgpu_device.hh.
References doorbellVMIDMap.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
bool gem5::AMDGPUDevice::haveRegVal | ( | uint32_t | addr | ) |
Register value getter/setter.
Used by other GPU blocks to change values from incoming driver/user packets.
Definition at line 533 of file amdgpu_device.cc.
References gem5::X86ISA::addr, and regs.
Referenced by gem5::AMDGPUNbio::readMMIO().
void gem5::AMDGPUDevice::insertQId | ( | uint16_t | vmid, |
int | id | ||
) |
Definition at line 770 of file amdgpu_device.cc.
References usedVMIDs.
Referenced by gem5::PM4PacketProcessor::processMQD().
void gem5::AMDGPUDevice::intrPost | ( | ) |
Methods inherited from PciDevice.
Definition at line 586 of file amdgpu_device.cc.
References gem5::PciDevice::intrPost().
Referenced by gem5::AMDGPUInterruptHandler::intrPost().
|
inlineprivate |
Definition at line 97 of file amdgpu_device.hh.
References gem5::X86ISA::addr, gem5::AddrRange::contains(), and romRange.
Referenced by read(), write(), and writeROM().
|
inline |
Definition at line 204 of file amdgpu_device.hh.
References _lastVMID.
Referenced by gem5::PM4PacketProcessor::mapQueues().
void gem5::AMDGPUDevice::mapDoorbellToVMID | ( | Addr | doorbell, |
uint16_t | vmid | ||
) |
Definition at line 758 of file amdgpu_device.cc.
References doorbellVMIDMap.
Referenced by gem5::PM4PacketProcessor::mapQueues().
Pure virtual function that the device must implement.
Called when a read command is received by the port.
pkt | Packet describing this request |
Implements gem5::PioDevice.
Definition at line 463 of file amdgpu_device.cc.
References dispatchAccess(), gem5::DOORBELL_BAR, gem5::FRAMEBUFFER_BAR, gem5::Packet::getAddr(), gem5::PciDevice::getBAR(), isROM(), gem5::MMIO_BAR, gem5::ArmISA::offset, panic, gem5::PciDevice::pioDelay, readDoorbell(), readFrame(), readMMIO(), and readROM().
Referenced by dispatchAccess().
Read from the PCI config space data that is stored locally.
This may be overridden by the device but at some point it will eventually call this for normal operations that it does not need to override.
pkt | packet containing the read and the offset into config space |
Reimplemented from gem5::PciDevice.
Definition at line 217 of file amdgpu_device.cc.
References checkpoint_before_mmios, gem5::PciDevice::config, gem5::curTick(), DPRINTF, gem5::exitSimLoop(), gem5::Packet::getAddr(), gem5::Packet::getSize(), init_interrupt_count, gem5::ArmISA::offset, PCI0_INTERRUPT_PIN, PCI_CONFIG_SIZE, and gem5::PciDevice::readConfig().
Definition at line 297 of file amdgpu_device.cc.
References gem5::DOORBELL_BAR, DPRINTF, mmioReader, gem5::ArmISA::offset, and gem5::AMDMMIOReader::readFromTrace().
Referenced by read().
Helper methods to handle specific BAR read/writes.
Offset is the address of the packet - base address of the BAR.
read/writeFrame are used for BAR0 requests; read/writeDoorbell are used for BAR2 requests; read/writeMMIO are used for BAR5 requests.
Definition at line 266 of file amdgpu_device.cc.
References cp, gem5::Packet::createRead(), gem5::Packet::dataDynamic(), DPRINTF, gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Shader::gpuCmdProc, nbio, gem5::ArmISA::offset, gem5::AMDGPUNbio::readFrame(), gem5::Packet::setUintX(), gem5::GPUCommandProcessor::shader(), gem5::GPUCommandProcessor::system(), gem5::X86ISA::system, and vramRequestorId().
Referenced by read().
Definition at line 304 of file amdgpu_device.cc.
References DPRINTF, gem5::AMDGPUVM::getMmioAperture(), gpuvm, gem5::GRBM_BASE, gem5::GRBM_OFFSET_SHIFT, gem5::MMHUB_BASE, gem5::MMHUB_OFFSET_SHIFT, gem5::MMIO_BAR, mmioReader, nbio, gem5::NBIO_BASE, gem5::ArmISA::offset, gem5::AMDMMIOReader::readFromTrace(), gem5::AMDGPUNbio::readMMIO(), gem5::AMDGPUVM::readMMIO(), regs, and gem5::Packet::setUintX().
Referenced by read().
|
private |
Definition at line 171 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), rom, gem5::ROM_SIZE, and gem5::Packet::setUintX().
Referenced by read().
|
overridevirtual |
Checkpoint support.
Implements gem5::Serializable.
Definition at line 592 of file amdgpu_device.cc.
References cp, deviceMem, doorbells, gpuvm, regs, sdmaEngs, gem5::PciDevice::serialize(), SERIALIZE_ARRAY, SERIALIZE_SCALAR, and gem5::Serializable::serializeSection().
void gem5::AMDGPUDevice::setDoorbellType | ( | uint32_t | offset, |
QueueType | qt | ||
) |
Set handles to GPU blocks.
Definition at line 555 of file amdgpu_device.cc.
References doorbells, DPRINTF, and gem5::ArmISA::offset.
Referenced by gem5::PM4PacketProcessor::newQueue(), gem5::PM4PacketProcessor::processSDMAMQD(), gem5::SDMAEngine::setGfxDoorbellOffsetLo(), gem5::SDMAEngine::setPageDoorbellOffsetLo(), gem5::PM4PacketProcessor::writeMMIO(), gem5::AMDGPUInterruptHandler::writeMMIO(), and gem5::SDMAEngine::writeMMIO().
void gem5::AMDGPUDevice::setRegVal | ( | uint32_t | addr, |
uint32_t | value | ||
) |
Definition at line 547 of file amdgpu_device.cc.
References gem5::X86ISA::addr, DPRINTF, and regs.
Referenced by AMDGPUDevice(), gem5::PM4PacketProcessor::setUconfigReg(), and gem5::AMDGPUNbio::writeMMIO().
void gem5::AMDGPUDevice::setSDMAEngine | ( | Addr | offset, |
SDMAEngine * | eng | ||
) |
Definition at line 562 of file amdgpu_device.cc.
References gem5::ArmISA::offset, and sdmaEngs.
Referenced by gem5::PM4PacketProcessor::processSDMAMQD(), gem5::SDMAEngine::setGfxDoorbellOffsetLo(), gem5::SDMAEngine::setPageDoorbellOffsetLo(), and gem5::SDMAEngine::writeMMIO().
|
overridevirtual |
Unserialize an object.
Read an object's state from the current checkpoint section.
cp | Checkpoint state |
Implements gem5::Serializable.
Definition at line 650 of file amdgpu_device.cc.
References cp, deviceMem, doorbells, gpuvm, regs, sdmaEngs, sdmaIds, gem5::PciDevice::unserialize(), UNSERIALIZE_ARRAY, UNSERIALIZE_SCALAR, and gem5::Serializable::unserializeSection().
|
inline |
Methods related to translations and system/device memory.
Definition at line 201 of file amdgpu_device.hh.
References gem5::AMDGPUMemoryManager::getRequestorID(), and gpuMemMgr.
Referenced by readFrame(), gem5::GPUCommandProcessor::setGPUDevice(), gem5::SDMAEngine::setGPUDevice(), gem5::HSAPacketProcessor::setGPUDevice(), gem5::VegaISA::GpuTLB::translationReturn(), gem5::GPUCommandProcessor::vramRequestorId(), and writeFrame().
Pure virtual function that the device must implement.
Called when a write command is received by the port.
pkt | Packet describing this request |
Implements gem5::PioDevice.
Definition at line 492 of file amdgpu_device.cc.
References data, dispatchAccess(), gem5::DOORBELL_BAR, DPRINTF, gem5::FRAMEBUFFER_BAR, gem5::Packet::getAddr(), gem5::PciDevice::getBAR(), gem5::Packet::getUintX(), isROM(), gem5::MMIO_BAR, gem5::ArmISA::offset, panic, gem5::PciDevice::pioDelay, writeDoorbell(), writeFrame(), writeMMIO(), and writeROM().
Write to the PCI config space data that is stored locally.
This may be overridden by the device but at some point it will eventually call this for normal operations that it does not need to override.
pkt | packet containing the write and the offset into config space |
Reimplemented from gem5::PciDevice.
Definition at line 245 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::ArmISA::offset, PCI_CONFIG_SIZE, and gem5::PciDevice::writeConfig().
Definition at line 371 of file amdgpu_device.cc.
References gem5::Compute, gem5::ComputeAQL, cp, deviceIH, doorbells, DPRINTF, gem5::Packet::getLE(), gem5::PM4PacketProcessor::getQueue(), getSDMAEngine(), gem5::Gfx, gem5::GPUCommandProcessor::hsaPacketProc(), gem5::HSAPacketProcessor::hwScheduler(), gem5::InterruptHandler, gem5::ArmISA::offset, panic, pm4PktProc, gem5::PM4PacketProcessor::process(), gem5::SDMAEngine::processGfx(), gem5::SDMAEngine::processPage(), gem5::SDMAEngine::processRLC(), gem5::RLC, gem5::SDMAGfx, gem5::SDMAPage, gem5::PM4PacketProcessor::updateReadIndex(), gem5::AMDGPUInterruptHandler::updateRptr(), warn, and gem5::HWScheduler::write().
Referenced by write().
Definition at line 337 of file amdgpu_device.cc.
References cp, gem5::Packet::createWrite(), gem5::Packet::dataDynamic(), DPRINTF, gem5::AMDGPUVM::gartBase(), gem5::AMDGPUVM::gartTable, gem5::AMDGPUVM::getFrameAperture(), gem5::Packet::getPtr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Shader::gpuCmdProc, gpuvm, nbio, gem5::ArmISA::offset, gem5::GPUCommandProcessor::shader(), gem5::GPUCommandProcessor::system(), gem5::X86ISA::system, vramRequestorId(), and gem5::AMDGPUNbio::writeFrame().
Referenced by write().
Definition at line 417 of file amdgpu_device.cc.
References deviceIH, DPRINTF, gem5::Packet::getLE(), gem5::AMDGPUVM::getMmioAperture(), getSDMAById(), gpuvm, gem5::GRBM_BASE, gem5::GRBM_OFFSET_SHIFT, gem5::IH_BASE, gem5::IH_OFFSET_SHIFT, nbio, gem5::NBIO_BASE, gem5::ArmISA::offset, pm4PktProc, sdmaFunc, sdmaIds, sdmaMmios, gem5::AMDGPUNbio::writeMMIO(), gem5::PM4PacketProcessor::writeMMIO(), gem5::AMDGPUInterruptHandler::writeMMIO(), and gem5::AMDGPUVM::writeMMIO().
Referenced by write().
|
private |
Definition at line 184 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), isROM(), rom, romRange, and gem5::AddrRange::start().
Referenced by write().
|
private |
Definition at line 142 of file amdgpu_device.hh.
Referenced by allocateVMID(), and lastVMID().
|
private |
Initial checkpoint support variables.
Definition at line 131 of file amdgpu_device.hh.
Referenced by readConfig().
|
private |
Definition at line 116 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), CP(), readFrame(), serialize(), unserialize(), writeDoorbell(), and writeFrame().
|
private |
Definition at line 113 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getIH(), writeDoorbell(), and writeMMIO().
|
private |
Definition at line 147 of file amdgpu_device.hh.
Referenced by serialize(), and unserialize().
|
private |
Definition at line 91 of file amdgpu_device.hh.
Referenced by serialize(), setDoorbellType(), unserialize(), and writeDoorbell().
|
private |
Definition at line 138 of file amdgpu_device.hh.
Referenced by getVMID(), and mapDoorbellToVMID().
|
private |
Definition at line 150 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and getGfxVersion().
|
private |
Definition at line 112 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getMemMgr(), and vramRequestorId().
|
private |
Definition at line 114 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getVM(), readMMIO(), serialize(), unserialize(), writeFrame(), and writeMMIO().
|
private |
Definition at line 136 of file amdgpu_device.hh.
Referenced by allocateVMID(), deallocateAllQueues(), and deallocatePasid().
|
private |
Definition at line 132 of file amdgpu_device.hh.
Referenced by readConfig().
|
private |
MMIO reader to populate device registers map.
Definition at line 106 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), readDoorbell(), and readMMIO().
|
private |
Blocks of the GPU.
Definition at line 111 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), readFrame(), readMMIO(), writeFrame(), and writeMMIO().
|
private |
Definition at line 115 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), writeDoorbell(), and writeMMIO().
|
private |
Definition at line 90 of file amdgpu_device.hh.
Referenced by getRegVal(), haveRegVal(), readMMIO(), serialize(), setRegVal(), and unserialize().
|
private |
Definition at line 101 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), readROM(), and writeROM().
|
private |
VGA ROM methods.
Definition at line 96 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getAddrRanges(), isROM(), and writeROM().
|
private |
Definition at line 119 of file amdgpu_device.hh.
Referenced by deallocateAllQueues(), getSDMAEngine(), serialize(), setSDMAEngine(), and unserialize().
|
private |
Definition at line 126 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and writeMMIO().
|
private |
Definition at line 121 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getSDMAById(), unserialize(), and writeMMIO().
|
private |
Definition at line 123 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and writeMMIO().
|
private |
Definition at line 140 of file amdgpu_device.hh.
Referenced by allocateVMID(), deallocateAllQueues(), deallocatePasid(), deallocateVmid(), getUsedVMIDs(), and insertQId().