gem5 v24.1.0.1
|
Device model for an AMD GPU. More...
#include <amdgpu_device.hh>
Classes | |
struct | AddrRangeHasher |
Public Member Functions | |
AMDGPUDevice (const AMDGPUDeviceParams &p) | |
void | intrPost () |
Methods inherited from PciDevice. | |
Tick | writeConfig (PacketPtr pkt) override |
Write to the PCI config space data that is stored locally. | |
Tick | readConfig (PacketPtr pkt) override |
Read from the PCI config space data that is stored locally. | |
Tick | read (PacketPtr pkt) override |
Pure virtual function that the device must implement. | |
Tick | write (PacketPtr pkt) override |
Pure virtual function that the device must implement. | |
AddrRangeList | getAddrRanges () const override |
Every PIO device is obliged to provide an implementation that returns the address ranges the device responds to. | |
void | serialize (CheckpointOut &cp) const override |
Checkpoint support. | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. | |
AMDGPUInterruptHandler * | getIH () |
Get handles to GPU blocks. | |
SDMAEngine * | getSDMAById (int id) |
SDMAEngine * | getSDMAEngine (Addr offset) |
AMDGPUVM & | getVM () |
AMDGPUMemoryManager * | getMemMgr () |
GPUCommandProcessor * | CP () |
void | setDoorbellType (uint32_t offset, QueueType qt, int ip_id=0) |
Set handles to GPU blocks. | |
void | unsetDoorbell (uint32_t offset) |
void | processPendingDoorbells (uint32_t offset) |
void | setSDMAEngine (Addr offset, SDMAEngine *eng) |
uint32_t | getRegVal (uint64_t addr) |
Register value getter/setter. | |
void | setRegVal (uint64_t addr, uint32_t value) |
RequestorID | vramRequestorId () |
Methods related to translations and system/device memory. | |
uint16_t | lastVMID () |
uint16_t | allocateVMID (uint16_t pasid) |
void | deallocateVmid (uint16_t vmid) |
void | deallocatePasid (uint16_t pasid) |
void | deallocateAllQueues (bool unmap_static) |
void | mapDoorbellToVMID (Addr doorbell, uint16_t vmid) |
uint16_t | getVMID (Addr doorbell) |
std::unordered_map< uint16_t, std::set< int > > & | getUsedVMIDs () |
void | insertQId (uint16_t vmid, int id) |
GfxVersion | getGfxVersion () const |
![]() | |
Addr | pciToDma (Addr pci_addr) const |
void | intrPost () |
void | intrClear () |
uint8_t | interruptLine () const |
AddrRangeList | getAddrRanges () const override |
Determine the address ranges that this device responds to. | |
PciDevice (const PciDeviceParams ¶ms) | |
Constructor for PCI Dev. | |
void | serialize (CheckpointOut &cp) const override |
Serialize this object to the given output stream. | |
void | unserialize (CheckpointIn &cp) override |
Reconstruct the state of this object from a checkpoint. | |
const PciBusAddr & | busAddr () const |
![]() | |
DmaDevice (const Params &p) | |
virtual | ~DmaDevice ()=default |
void | dmaWrite (Addr addr, int size, Event *event, uint8_t *data, uint32_t sid, uint32_t ssid, Tick delay=0) |
void | dmaWrite (Addr addr, int size, Event *event, uint8_t *data, Tick delay=0) |
void | dmaRead (Addr addr, int size, Event *event, uint8_t *data, uint32_t sid, uint32_t ssid, Tick delay=0) |
void | dmaRead (Addr addr, int size, Event *event, uint8_t *data, Tick delay=0) |
bool | dmaPending () const |
void | init () override |
init() is called after all C++ SimObjects have been created and all ports are connected. | |
Addr | cacheBlockSize () const |
Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) override |
Get a port with a given name and index. | |
![]() | |
PioDevice (const Params &p) | |
virtual | ~PioDevice () |
void | init () override |
init() is called after all C++ SimObjects have been created and all ports are connected. | |
Port & | getPort (const std::string &if_name, PortID idx=InvalidPortID) override |
Get a port with a given name and index. | |
![]() | |
ClockedObject (const ClockedObjectParams &p) | |
![]() | |
const Params & | params () const |
SimObject (const Params &p) | |
virtual | ~SimObject () |
virtual void | loadState (CheckpointIn &cp) |
loadState() is called on each SimObject when restoring from a checkpoint. | |
virtual void | initState () |
initState() is called on each SimObject when not restoring from a checkpoint. | |
virtual void | regProbePoints () |
Register probe points for this object. | |
virtual void | regProbeListeners () |
Register probe listeners for this object. | |
ProbeManager * | getProbeManager () |
Get the probe manager for this object. | |
virtual void | startup () |
startup() is the final initialization call before simulation. | |
DrainState | drain () override |
Provide a default implementation of the drain interface for objects that don't need draining. | |
virtual void | memWriteback () |
Write back dirty buffers to memory using functional writes. | |
virtual void | memInvalidate () |
Invalidate the contents of memory buffers. | |
void | serialize (CheckpointOut &cp) const override |
Serialize an object. | |
void | unserialize (CheckpointIn &cp) override |
Unserialize an object. | |
![]() | |
EventQueue * | eventQueue () const |
void | schedule (Event &event, Tick when) |
void | deschedule (Event &event) |
void | reschedule (Event &event, Tick when, bool always=false) |
void | schedule (Event *event, Tick when) |
void | deschedule (Event *event) |
void | reschedule (Event *event, Tick when, bool always=false) |
void | wakeupEventQueue (Tick when=(Tick) -1) |
This function is not needed by the usual gem5 event loop but may be necessary in derived EventQueues which host gem5 on other schedulers. | |
void | setCurTick (Tick newVal) |
EventManager (EventManager &em) | |
Event manger manages events in the event queue. | |
EventManager (EventManager *em) | |
EventManager (EventQueue *eq) | |
![]() | |
Serializable () | |
virtual | ~Serializable () |
void | serializeSection (CheckpointOut &cp, const char *name) const |
Serialize an object into a new section. | |
void | serializeSection (CheckpointOut &cp, const std::string &name) const |
void | unserializeSection (CheckpointIn &cp, const char *name) |
Unserialize an a child object. | |
void | unserializeSection (CheckpointIn &cp, const std::string &name) |
![]() | |
DrainState | drainState () const |
Return the current drain state of an object. | |
virtual void | notifyFork () |
Notify a child process of a fork. | |
![]() | |
Group (Group *parent, const char *name=nullptr) | |
Construct a new statistics group. | |
virtual | ~Group () |
virtual void | regStats () |
Callback to set stat parameters. | |
virtual void | resetStats () |
Callback to reset stats. | |
virtual void | preDumpStats () |
Callback before stats are dumped. | |
void | addStat (statistics::Info *info) |
Register a stat with this group. | |
const std::map< std::string, Group * > & | getStatGroups () const |
Get all child groups associated with this object. | |
const std::vector< Info * > & | getStats () const |
Get all stats associated with this object. | |
void | addStatGroup (const char *name, Group *block) |
Add a stat block as a child of this block. | |
const Info * | resolveStat (std::string name) const |
Resolve a stat by its name within this group. | |
void | mergeStatGroup (Group *block) |
Merge the contents (stats & children) of a block to this block. | |
Group (const Group &)=delete | |
Group & | operator= (const Group &)=delete |
![]() | |
Named (const std::string &name_) | |
virtual | ~Named ()=default |
virtual std::string | name () const |
![]() | |
void | updateClockPeriod () |
Update the tick to the current tick. | |
Tick | clockEdge (Cycles cycles=Cycles(0)) const |
Determine the tick when a cycle begins, by default the current one, but the argument also enables the caller to determine a future cycle. | |
Cycles | curCycle () const |
Determine the current cycle, corresponding to a tick aligned to a clock edge. | |
Tick | nextCycle () const |
Based on the clock of the object, determine the start tick of the first cycle that is at least one cycle in the future. | |
uint64_t | frequency () const |
Tick | clockPeriod () const |
double | voltage () const |
Cycles | ticksToCycles (Tick t) const |
Tick | cyclesToTicks (Cycles c) const |
Private Types | |
typedef void(SDMAEngine::* | sdmaFuncPtr) (uint32_t) |
Private Member Functions | |
void | dispatchAccess (PacketPtr pkt, bool read) |
Convert a PCI packet into a response. | |
void | readFrame (PacketPtr pkt, Addr offset) |
Helper methods to handle specific BAR read/writes. | |
void | readDoorbell (PacketPtr pkt, Addr offset) |
void | readMMIO (PacketPtr pkt, Addr offset) |
void | writeFrame (PacketPtr pkt, Addr offset) |
void | writeDoorbell (PacketPtr pkt, Addr offset) |
void | writeMMIO (PacketPtr pkt, Addr offset) |
bool | isROM (Addr addr) const |
void | readROM (PacketPtr pkt) |
void | writeROM (PacketPtr pkt) |
Private Attributes | |
std::unordered_map< uint32_t, DoorbellInfo > | doorbells |
Structures to hold registers, doorbells, and some frame memory. | |
std::unordered_map< uint32_t, PacketPtr > | pendingDoorbellPkts |
AddrRange | romRange |
VGA ROM methods. | |
std::array< uint8_t, ROM_SIZE > | rom |
AMDMMIOReader | mmioReader |
MMIO reader to populate device registers map. | |
AMDGPUNbio | nbio |
Blocks of the GPU. | |
AMDGPUGfx | gfx |
AMDGPUMemoryManager * | gpuMemMgr |
AMDGPUInterruptHandler * | deviceIH |
AMDGPUVM | gpuvm |
GPUCommandProcessor * | cp |
std::unordered_map< int, PM4PacketProcessor * > | pm4PktProcs |
std::unordered_map< AddrRange, PM4PacketProcessor *, AddrRangeHasher > | pm4Ranges |
std::unordered_map< uint32_t, SDMAEngine * > | sdmaEngs |
std::unordered_map< uint32_t, SDMAEngine * > | sdmaIds |
std::unordered_map< uint32_t, AddrRange > | sdmaMmios |
std::unordered_map< uint32_t, sdmaFuncPtr > | sdmaFunc |
bool | checkpoint_before_mmios |
Initial checkpoint support variables. | |
int | init_interrupt_count |
std::unordered_map< uint16_t, uint16_t > | idMap |
std::unordered_map< Addr, uint16_t > | doorbellVMIDMap |
std::unordered_map< uint16_t, std::set< int > > | usedVMIDs |
uint16_t | _lastVMID |
memory::PhysicalMemory | deviceMem |
GfxVersion | gfx_version = GfxVersion::gfx900 |
Additional Inherited Members | |
![]() | |
typedef DmaDeviceParams | Params |
![]() | |
using | Params = PioDeviceParams |
![]() | |
using | Params = ClockedObjectParams |
Parameters of ClockedObject. | |
![]() | |
typedef SimObjectParams | Params |
![]() | |
static void | serializeAll (const std::string &cpt_dir) |
Create a checkpoint by serializing all SimObjects in the system. | |
static SimObject * | find (const char *name) |
Find the SimObject with the given name and return a pointer to it. | |
static void | setSimObjectResolver (SimObjectResolver *resolver) |
There is a single object name resolver, and it is only set when simulation is restoring from checkpoints. | |
static SimObjectResolver * | getSimObjectResolver () |
There is a single object name resolver, and it is only set when simulation is restoring from checkpoints. | |
![]() | |
static const std::string & | currentSection () |
Gets the fully-qualified name of the active section. | |
static void | generateCheckpointOut (const std::string &cpt_dir, std::ofstream &outstream) |
Generate a checkpoint file so that the serialization can be routed to it. | |
![]() | |
PowerState * | powerState |
![]() | |
bool | getBAR (Addr addr, int &num, Addr &offs) |
Which base address register (if any) maps the given address? | |
![]() | |
Drainable () | |
virtual | ~Drainable () |
virtual void | drainResume () |
Resume execution after a successful drain. | |
void | signalDrainDone () const |
Signal that an object is drained. | |
![]() | |
Clocked (ClockDomain &clk_domain) | |
Create a clocked object and set the clock domain based on the parameters. | |
Clocked (Clocked &)=delete | |
Clocked & | operator= (Clocked &)=delete |
virtual | ~Clocked () |
Virtual destructor due to inheritance. | |
void | resetClock () const |
Reset the object's clock using the current global tick value. | |
virtual void | clockPeriodUpdated () |
A hook subclasses can implement so they can do any extra work that's needed when the clock rate is changed. | |
![]() | |
const PciBusAddr | _busAddr |
PCIConfig | config |
The current config space. | |
std::vector< MSIXTable > | msix_table |
MSIX Table and PBA Structures. | |
std::vector< MSIXPbaEntry > | msix_pba |
std::array< PciBar *, 6 > | BARs {} |
PciHost::DeviceInterface | hostInterface |
Tick | pioDelay |
Tick | configDelay |
const int | PMCAP_BASE |
The capability list structures and base addresses. | |
const int | PMCAP_ID_OFFSET |
const int | PMCAP_PC_OFFSET |
const int | PMCAP_PMCS_OFFSET |
PMCAP | pmcap |
const int | MSICAP_BASE |
MSICAP | msicap |
const int | MSIXCAP_BASE |
const int | MSIXCAP_ID_OFFSET |
const int | MSIXCAP_MXC_OFFSET |
const int | MSIXCAP_MTAB_OFFSET |
const int | MSIXCAP_MPBA_OFFSET |
int | MSIX_TABLE_OFFSET |
int | MSIX_TABLE_END |
int | MSIX_PBA_OFFSET |
int | MSIX_PBA_END |
MSIXCAP | msixcap |
const int | PXCAP_BASE |
PXCAP | pxcap |
![]() | |
DmaPort | dmaPort |
![]() | |
System * | sys |
PioPort< PioDevice > | pioPort |
The pioPort that handles the requests for us and provides us requests that it sees. | |
![]() | |
const SimObjectParams & | _params |
Cached copy of the object parameters. | |
![]() | |
EventQueue * | eventq |
A pointer to this object's event queue. | |
Device model for an AMD GPU.
This models the interface between the PCI bus and the various IP blocks behind it. It translates requests to the various BARs and sends them to the appropriate IP block. BAR0 requests are VRAM requests that go to device memory, BAR2 are doorbells which are decoded and sent to the corresponding IP block. BAR5 is the MMIO interface which writes data values to registers controlling the IP blocks.
Definition at line 63 of file amdgpu_device.hh.
|
private |
Definition at line 136 of file amdgpu_device.hh.
gem5::AMDGPUDevice::AMDGPUDevice | ( | const AMDGPUDeviceParams & | p | ) |
Definition at line 55 of file amdgpu_device.cc.
References AMDGPU_MP0_SMN_C2PMSG_33, gem5::PciDevice::config, cp, deviceIH, DPRINTF, fatal_if, gem5::AMDGPUMemoryManager::getRequestorID(), gem5::GFX_MMIO_RANGE, gfx_version, gpuMemMgr, gpuvm, gem5::GRBM_MMIO_RANGE, gem5::GPUCommandProcessor::hsaPacketProc(), gem5::IH_MMIO_RANGE, gem5::ArmISA::m, MI100_FB_LOCATION_BASE, MI100_FB_LOCATION_TOP, MI100_MEM_SIZE_REG, MI200_FB_LOCATION_BASE, MI200_FB_LOCATION_TOP, MI200_MEM_SIZE_REG, gem5::MMHUB_MMIO_RANGE, nbio, gem5::NBIO_MMIO_RANGE, gem5::MipsISA::p, panic, pm4PktProcs, pm4Ranges, gem5::RangeSize(), gem5::ROM_SIZE, romRange, gem5::ArmISA::s, sdmaFunc, sdmaIds, sdmaMmios, gem5::SDMAEngine::setGfxBaseHi(), gem5::SDMAEngine::setGfxBaseLo(), gem5::SDMAEngine::setGfxDoorbellLo(), gem5::SDMAEngine::setGfxDoorbellOffsetLo(), gem5::SDMAEngine::setGfxRptrHi(), gem5::SDMAEngine::setGfxRptrLo(), gem5::SDMAEngine::setGfxSize(), gem5::SDMAEngine::setGfxWptrHi(), gem5::SDMAEngine::setGfxWptrLo(), gem5::AMDGPUNbio::setGPUDevice(), gem5::AMDGPUInterruptHandler::setGPUDevice(), gem5::HSAPacketProcessor::setGPUDevice(), gem5::GPUCommandProcessor::setGPUDevice(), gem5::AMDGPUVM::setMMHUBBase(), gem5::AMDGPUVM::setMMHUBTop(), gem5::AMDGPUVM::setMMIOAperture(), gem5::SDMAEngine::setPageBaseLo(), gem5::SDMAEngine::setPageDoorbellLo(), gem5::SDMAEngine::setPageDoorbellOffsetLo(), gem5::SDMAEngine::setPageRptrHi(), gem5::SDMAEngine::setPageRptrLo(), gem5::SDMAEngine::setPageSize(), gem5::SDMAEngine::setPageWptrLo(), setRegVal(), VEGA10_FB_LOCATION_BASE, VEGA10_FB_LOCATION_TOP, and gem5::VGA_ROM_DEFAULT.
uint16_t gem5::AMDGPUDevice::allocateVMID | ( | uint16_t | pasid | ) |
Definition at line 915 of file amdgpu_device.cc.
References _lastVMID, gem5::AMDGPU_VM_COUNT, idMap, panic, gem5::pasid, and usedVMIDs.
Referenced by gem5::PM4PacketProcessor::mapProcess().
|
inline |
Definition at line 193 of file amdgpu_device.hh.
References cp.
Referenced by gem5::SDMAEngine::copyDone(), gem5::PM4PacketProcessor::mapProcess(), gem5::PM4PacketProcessor::processMQD(), gem5::SDMAEngine::ptePdeDone(), gem5::PM4PacketProcessor::unmapAllQueues(), gem5::PM4PacketProcessor::unserialize(), gem5::SDMAEngine::writeDone(), and writeFrame().
void gem5::AMDGPUDevice::deallocateAllQueues | ( | bool | unmap_static | ) |
Definition at line 948 of file amdgpu_device.cc.
References doorbells, doorbellVMIDMap, idMap, gem5::ArmISA::offset, sdmaEngs, and usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
void gem5::AMDGPUDevice::deallocatePasid | ( | uint16_t | pasid | ) |
Definition at line 936 of file amdgpu_device.cc.
References idMap, gem5::pasid, and usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
void gem5::AMDGPUDevice::deallocateVmid | ( | uint16_t | vmid | ) |
Definition at line 930 of file amdgpu_device.cc.
References usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
|
private |
Convert a PCI packet into a response.
Definition at line 339 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Packet::makeAtomicResponse(), and read().
|
overridevirtual |
Every PIO device is obliged to provide an implementation that returns the address ranges the device responds to.
Implements gem5::PioDevice.
Definition at line 228 of file amdgpu_device.cc.
References gem5::PciDevice::getAddrRanges(), gem5::MipsISA::r, and romRange.
|
inline |
Definition at line 227 of file amdgpu_device.hh.
References gfx_version.
Referenced by gem5::PM4PacketProcessor::decodeHeader(), gem5::GPUCommandProcessor::dispatchKernelObject(), and gem5::AMDGPUNbio::readMMIO().
|
inline |
Get handles to GPU blocks.
Definition at line 188 of file amdgpu_device.hh.
References deviceIH.
Referenced by gem5::PM4PacketProcessor::releaseMemDone(), and gem5::SDMAEngine::trap().
|
inline |
Definition at line 192 of file amdgpu_device.hh.
References gpuMemMgr.
Referenced by gem5::SDMAEngine::constFill(), gem5::SDMAEngine::copy(), gem5::SDMAEngine::copyReadData(), gem5::SDMAEngine::ptePde(), and gem5::SDMAEngine::writeReadData().
uint32_t gem5::AMDGPUDevice::getRegVal | ( | uint64_t | addr | ) |
Register value getter/setter.
Used by other GPU blocks to change values from incoming driver/user packets.
Definition at line 671 of file amdgpu_device.cc.
References gem5::X86ISA::addr, gem5::bits(), gem5::Packet::createRead(), gem5::Packet::dataStatic(), DPRINTF, gem5::Packet::getLE(), readMMIO(), and vramRequestorId().
Referenced by gem5::AMDGPUNbio::readMMIO().
SDMAEngine * gem5::AMDGPUDevice::getSDMAById | ( | int | id | ) |
PM4 packets selected SDMAs using an integer ID. This method simply maps the integer ID to a pointer to the SDMA and checks for invalid IDs.
Definition at line 730 of file amdgpu_device.cc.
References gem5::ArmISA::id, and sdmaIds.
Referenced by gem5::PM4PacketProcessor::processSDMAMQD(), and writeMMIO().
SDMAEngine * gem5::AMDGPUDevice::getSDMAEngine | ( | Addr | offset | ) |
Definition at line 742 of file amdgpu_device.cc.
References gem5::ArmISA::offset, and sdmaEngs.
Referenced by writeDoorbell().
std::unordered_map< uint16_t, std::set< int > > & gem5::AMDGPUDevice::getUsedVMIDs | ( | ) |
Definition at line 973 of file amdgpu_device.cc.
References usedVMIDs.
Referenced by gem5::PM4PacketProcessor::unmapAllQueues().
|
inline |
Definition at line 191 of file amdgpu_device.hh.
References gpuvm.
Referenced by gem5::SDMAEngine::copy(), gem5::SDMAEngine::copyReadData(), gem5::PM4PacketProcessor::decodeHeader(), gem5::SDMAEngine::getDeviceAddress(), gem5::PM4PacketProcessor::getGARTAddr(), gem5::SDMAEngine::getGARTAddr(), gem5::PM4PacketProcessor::mapProcess(), gem5::SDMAEngine::ptePde(), gem5::GPUCommandProcessor::submitDispatchPkt(), gem5::PM4PacketProcessor::translate(), gem5::SDMAEngine::translate(), gem5::HSAPacketProcessor::translate(), gem5::GPUCommandProcessor::translate(), gem5::VegaISA::GpuTLB::translationReturn(), gem5::AMDGPUNbio::writeFrame(), gem5::AMDGPUNbio::writeMMIO(), and gem5::SDMAEngine::writeReadData().
|
inline |
Definition at line 222 of file amdgpu_device.hh.
References doorbellVMIDMap.
Referenced by gem5::PM4PacketProcessor::unmapQueues().
void gem5::AMDGPUDevice::insertQId | ( | uint16_t | vmid, |
int | id | ||
) |
Definition at line 979 of file amdgpu_device.cc.
References usedVMIDs.
Referenced by gem5::PM4PacketProcessor::processMQD().
void gem5::AMDGPUDevice::intrPost | ( | ) |
Methods inherited from PciDevice.
Definition at line 748 of file amdgpu_device.cc.
References gem5::PciDevice::intrPost().
Referenced by gem5::AMDGPUInterruptHandler::intrPost().
|
inlineprivate |
Definition at line 97 of file amdgpu_device.hh.
References gem5::X86ISA::addr, gem5::AddrRange::contains(), and romRange.
Referenced by read(), write(), and writeROM().
|
inline |
Definition at line 216 of file amdgpu_device.hh.
References _lastVMID.
Referenced by gem5::PM4PacketProcessor::mapQueues().
void gem5::AMDGPUDevice::mapDoorbellToVMID | ( | Addr | doorbell, |
uint16_t | vmid | ||
) |
Definition at line 967 of file amdgpu_device.cc.
References doorbellVMIDMap.
Referenced by gem5::PM4PacketProcessor::mapQueues().
void gem5::AMDGPUDevice::processPendingDoorbells | ( | uint32_t | offset | ) |
Definition at line 660 of file amdgpu_device.cc.
References DPRINTF, gem5::ArmISA::offset, pendingDoorbellPkts, and writeDoorbell().
Referenced by gem5::PM4PacketProcessor::processMQD(), and gem5::PM4PacketProcessor::processSDMAMQD().
Pure virtual function that the device must implement.
Called when a read command is recieved by the port.
pkt | Packet describing this request |
Implements gem5::PioDevice.
Definition at line 590 of file amdgpu_device.cc.
References dispatchAccess(), gem5::DOORBELL_BAR, gem5::FRAMEBUFFER_BAR, gem5::Packet::getAddr(), gem5::PciDevice::getBAR(), isROM(), gem5::MMIO_BAR, gem5::ArmISA::offset, panic, gem5::PciDevice::pioDelay, readDoorbell(), readFrame(), readMMIO(), and readROM().
Referenced by dispatchAccess().
Read from the PCI config space data that is stored locally.
This may be overridden by the device but at some point it will eventually call this for normal operations that it does not need to override.
pkt | packet containing the write the offset into config space |
Reimplemented from gem5::PciDevice.
Definition at line 247 of file amdgpu_device.cc.
References gem5::PciDevice::_busAddr, checkpoint_before_mmios, gem5::PciDevice::configDelay, gem5::curTick(), PXCAP::data, gem5::PciBusAddr::dev, DPRINTF, gem5::exitSimLoop(), gem5::PciBusAddr::func, gem5::Packet::getAddr(), gem5::Packet::getLE(), gem5::Packet::getSize(), init_interrupt_count, gem5::Packet::makeAtomicResponse(), gem5::ArmISA::offset, panic, PCI0_INTERRUPT_PIN, PCI_CONFIG_SIZE, PCI_DEVICE_SPECIFIC, gem5::PciDevice::pxcap, gem5::PciDevice::PXCAP_BASE, gem5::PciDevice::readConfig(), gem5::Packet::setLE(), and warn.
Definition at line 394 of file amdgpu_device.cc.
References gem5::DOORBELL_BAR, DPRINTF, mmioReader, gem5::ArmISA::offset, and gem5::AMDMMIOReader::readFromTrace().
Referenced by read().
Helper methods to handle specific BAR read/writes.
Offset is the address of the packet - base address of the BAR.
read/writeFrame are used for BAR0 requests read/writeDoorbell are used for BAR2 requests read/writeMMIO are used for BAR5 requests
Definition at line 349 of file amdgpu_device.cc.
References gem5::memory::AbstractMemory::access(), gem5::Packet::cmd, cp, gem5::Packet::createRead(), gem5::Shader::cuList, gem5::Packet::dataDynamic(), DPRINTF, gem5::MemCmd::FunctionalReadError, gem5::System::getDeviceMemory(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Shader::gpuCmdProc, nbio, gem5::ArmISA::offset, gem5::AMDGPUNbio::readFrame(), gem5::MemCmd::ReadReq, gem5::Packet::req, gem5::Packet::setSuppressFuncError(), gem5::Packet::setUintX(), gem5::GPUCommandProcessor::shader(), gem5::X86ISA::system, gem5::GPUCommandProcessor::system(), and vramRequestorId().
Referenced by read().
Definition at line 401 of file amdgpu_device.cc.
References DPRINTF, gem5::AMDGPUVM::getMMIOAperture(), gem5::AMDGPUVM::getMMIORange(), gfx, gem5::GFX_MMIO_RANGE, gpuvm, gem5::GRBM_MMIO_RANGE, gem5::GRBM_OFFSET_SHIFT, gem5::MMHUB_MMIO_RANGE, gem5::MMHUB_OFFSET_SHIFT, gem5::MMIO_BAR, mmioReader, nbio, gem5::NBIO_MMIO_RANGE, gem5::ArmISA::offset, gem5::AMDMMIOReader::readFromTrace(), gem5::AMDGPUGfx::readMMIO(), gem5::AMDGPUNbio::readMMIO(), gem5::AMDGPUVM::readMMIO(), and gem5::AddrRange::start().
Referenced by getRegVal(), and read().
|
private |
Definition at line 201 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), rom, gem5::ROM_SIZE, and gem5::Packet::setUintX().
Referenced by read().
|
overridevirtual |
Checkpoint support.
Implements gem5::Serializable.
Definition at line 754 of file amdgpu_device.cc.
References cp, deviceMem, doorbells, gpuvm, sdmaEngs, gem5::PciDevice::serialize(), SERIALIZE_ARRAY, SERIALIZE_SCALAR, gem5::Serializable::serializeSection(), and usedVMIDs.
void gem5::AMDGPUDevice::setDoorbellType | ( | uint32_t | offset, |
QueueType | qt, | ||
int | ip_id = 0 |
||
) |
Set handles to GPU blocks.
Definition at line 710 of file amdgpu_device.cc.
References doorbells, DPRINTF, and gem5::ArmISA::offset.
Referenced by gem5::PM4PacketProcessor::newQueue(), gem5::PM4PacketProcessor::processSDMAMQD(), gem5::SDMAEngine::setGfxDoorbellOffsetLo(), gem5::SDMAEngine::setPageDoorbellOffsetLo(), gem5::AMDGPUInterruptHandler::writeMMIO(), gem5::PM4PacketProcessor::writeMMIO(), and gem5::SDMAEngine::writeMMIO().
void gem5::AMDGPUDevice::setRegVal | ( | uint64_t | addr, |
uint32_t | value | ||
) |
Definition at line 695 of file amdgpu_device.cc.
References gem5::X86ISA::addr, gem5::Packet::createWrite(), gem5::Packet::dataStatic(), DPRINTF, vramRequestorId(), and writeMMIO().
Referenced by AMDGPUDevice(), gem5::PM4PacketProcessor::setUconfigReg(), gem5::SDMAEngine::srbmWrite(), gem5::PM4PacketProcessor::writeData(), and gem5::AMDGPUNbio::writeMMIO().
void gem5::AMDGPUDevice::setSDMAEngine | ( | Addr | offset, |
SDMAEngine * | eng | ||
) |
Definition at line 724 of file amdgpu_device.cc.
References gem5::ArmISA::offset, and sdmaEngs.
Referenced by gem5::PM4PacketProcessor::processSDMAMQD(), gem5::SDMAEngine::setGfxDoorbellOffsetLo(), gem5::SDMAEngine::setPageDoorbellOffsetLo(), and gem5::SDMAEngine::writeMMIO().
|
overridevirtual |
Unserialize an object.
Read an object's state from the current checkpoint section.
cp | Checkpoint state |
Implements gem5::Serializable.
Definition at line 834 of file amdgpu_device.cc.
References cp, deviceMem, doorbells, gpuvm, sdmaEngs, sdmaIds, gem5::PciDevice::unserialize(), UNSERIALIZE_ARRAY, UNSERIALIZE_SCALAR, gem5::Serializable::unserializeSection(), and usedVMIDs.
void gem5::AMDGPUDevice::unsetDoorbell | ( | uint32_t | offset | ) |
Definition at line 718 of file amdgpu_device.cc.
References doorbells, and gem5::ArmISA::offset.
Referenced by gem5::SDMAEngine::unregisterRLCQueue().
|
inline |
Methods related to translations and system/device memory.
Definition at line 213 of file amdgpu_device.hh.
References gem5::AMDGPUMemoryManager::getRequestorID(), and gpuMemMgr.
Referenced by getRegVal(), readFrame(), gem5::SDMAEngine::setGPUDevice(), gem5::HSAPacketProcessor::setGPUDevice(), gem5::GPUCommandProcessor::setGPUDevice(), setRegVal(), gem5::VegaISA::GpuTLB::translationReturn(), gem5::GPUCommandProcessor::vramRequestorId(), and writeFrame().
Pure virtual function that the device must implement.
Called when a write command is recieved by the port.
pkt | Packet describing this request |
Implements gem5::PioDevice.
Definition at line 619 of file amdgpu_device.cc.
References data, dispatchAccess(), gem5::DOORBELL_BAR, DPRINTF, gem5::FRAMEBUFFER_BAR, gem5::Packet::getAddr(), gem5::PciDevice::getBAR(), gem5::Packet::getUintX(), isROM(), gem5::MMIO_BAR, gem5::ArmISA::offset, panic, gem5::PciDevice::pioDelay, writeDoorbell(), writeFrame(), writeMMIO(), and writeROM().
Write to the PCI config space data that is stored locally.
This may be overridden by the device but at some point it will eventually call this for normal operations that it does not need to override.
pkt | packet containing the write the offset into config space |
Reimplemented from gem5::PciDevice.
Definition at line 311 of file amdgpu_device.cc.
References gem5::PciDevice::configDelay, PXCAP::data, DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getConstPtr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Packet::makeAtomicResponse(), gem5::ArmISA::offset, PCI_CONFIG_SIZE, PCI_DEVICE_SPECIFIC, gem5::PciDevice::pxcap, gem5::PciDevice::PXCAP_BASE, and gem5::PciDevice::writeConfig().
Definition at line 470 of file amdgpu_device.cc.
References gem5::Compute, gem5::ComputeAQL, cp, gem5::Packet::createWrite(), gem5::Packet::dataDynamic(), deviceIH, doorbells, DPRINTF, gem5::Packet::getLE(), gem5::Packet::getPtr(), getSDMAEngine(), gem5::Packet::getSize(), gem5::Gfx, gem5::GPUCommandProcessor::hsaPacketProc(), gem5::HSAPacketProcessor::hwScheduler(), gem5::InterruptHandler, gem5::ArmISA::offset, panic, pendingDoorbellPkts, pm4PktProcs, gem5::SDMAEngine::processGfx(), gem5::SDMAEngine::processPage(), gem5::SDMAEngine::processRLC(), gem5::Packet::req, gem5::RLC, gem5::SDMAGfx, gem5::SDMAPage, gem5::AMDGPUInterruptHandler::updateRptr(), warn, and gem5::HWScheduler::write().
Referenced by processPendingDoorbells(), and write().
Definition at line 429 of file amdgpu_device.cc.
References gem5::memory::AbstractMemory::access(), cp, CP(), gem5::Packet::createWrite(), gem5::Shader::cuList, gem5::Packet::dataDynamic(), DPRINTF, gem5::AMDGPUVM::gartBase(), gem5::AMDGPUVM::gartTable, gem5::AMDGPUMemoryManager::getCacheLineSize(), gem5::System::getDeviceMemory(), gem5::AMDGPUVM::getFrameAperture(), gem5::Packet::getPtr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), gem5::Shader::gpuCmdProc, gpuMemMgr, gpuvm, nbio, gem5::ArmISA::offset, gem5::GPUCommandProcessor::shader(), gem5::X86ISA::system, gem5::GPUCommandProcessor::system(), vramRequestorId(), and gem5::AMDGPUNbio::writeFrame().
Referenced by write().
Definition at line 536 of file amdgpu_device.cc.
References deviceIH, DPRINTF, gem5::Packet::getLE(), gem5::AMDGPUVM::getMMIOAperture(), gem5::AMDGPUVM::getMMIORange(), getSDMAById(), gfx, gem5::GFX_MMIO_RANGE, gpuvm, gem5::GRBM_MMIO_RANGE, gem5::GRBM_OFFSET_SHIFT, gem5::IH_MMIO_RANGE, gem5::IH_OFFSET_SHIFT, nbio, gem5::NBIO_MMIO_RANGE, gem5::ArmISA::offset, pm4Ranges, sdmaFunc, sdmaIds, sdmaMmios, gem5::AddrRange::start(), gem5::AMDGPUInterruptHandler::writeMMIO(), gem5::AMDGPUGfx::writeMMIO(), gem5::AMDGPUNbio::writeMMIO(), and gem5::AMDGPUVM::writeMMIO().
Referenced by setRegVal(), and write().
|
private |
Definition at line 214 of file amdgpu_device.cc.
References DPRINTF, gem5::Packet::getAddr(), gem5::Packet::getSize(), gem5::Packet::getUintX(), isROM(), rom, romRange, and gem5::AddrRange::start().
Referenced by write().
|
private |
Definition at line 153 of file amdgpu_device.hh.
Referenced by allocateVMID(), and lastVMID().
|
private |
Initial checkpoint support variables.
Definition at line 142 of file amdgpu_device.hh.
Referenced by readConfig().
|
private |
Definition at line 116 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), CP(), readFrame(), serialize(), unserialize(), writeDoorbell(), and writeFrame().
|
private |
Definition at line 114 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getIH(), writeDoorbell(), and writeMMIO().
|
private |
Definition at line 158 of file amdgpu_device.hh.
Referenced by serialize(), and unserialize().
|
private |
Structures to hold registers, doorbells, and some frame memory.
Definition at line 90 of file amdgpu_device.hh.
Referenced by deallocateAllQueues(), serialize(), setDoorbellType(), unserialize(), unsetDoorbell(), and writeDoorbell().
|
private |
Definition at line 149 of file amdgpu_device.hh.
Referenced by deallocateAllQueues(), getVMID(), and mapDoorbellToVMID().
|
private |
Definition at line 112 of file amdgpu_device.hh.
Referenced by readMMIO(), and writeMMIO().
|
private |
Definition at line 161 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and getGfxVersion().
|
private |
Definition at line 113 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getMemMgr(), vramRequestorId(), and writeFrame().
|
private |
Definition at line 115 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getVM(), readMMIO(), serialize(), unserialize(), writeFrame(), and writeMMIO().
|
private |
Definition at line 147 of file amdgpu_device.hh.
Referenced by allocateVMID(), deallocateAllQueues(), and deallocatePasid().
|
private |
Definition at line 143 of file amdgpu_device.hh.
Referenced by readConfig().
|
private |
MMIO reader to populate device registers map.
Definition at line 106 of file amdgpu_device.hh.
Referenced by readDoorbell(), and readMMIO().
|
private |
Blocks of the GPU.
Definition at line 111 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), readFrame(), readMMIO(), writeFrame(), and writeMMIO().
|
private |
Definition at line 91 of file amdgpu_device.hh.
Referenced by processPendingDoorbells(), and writeDoorbell().
|
private |
Definition at line 125 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and writeDoorbell().
|
private |
Definition at line 127 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and writeMMIO().
|
private |
Definition at line 101 of file amdgpu_device.hh.
Referenced by readROM(), and writeROM().
|
private |
VGA ROM methods.
Definition at line 96 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getAddrRanges(), isROM(), and writeROM().
|
private |
Definition at line 130 of file amdgpu_device.hh.
Referenced by deallocateAllQueues(), getSDMAEngine(), serialize(), setSDMAEngine(), and unserialize().
|
private |
Definition at line 137 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and writeMMIO().
|
private |
Definition at line 132 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), getSDMAById(), unserialize(), and writeMMIO().
|
private |
Definition at line 134 of file amdgpu_device.hh.
Referenced by AMDGPUDevice(), and writeMMIO().
|
private |
Definition at line 151 of file amdgpu_device.hh.
Referenced by allocateVMID(), deallocateAllQueues(), deallocatePasid(), deallocateVmid(), getUsedVMIDs(), insertQId(), serialize(), and unserialize().