release/current/shader_8hh_source.html

/*

 * Copyright (c) 2011-2015 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#ifndef __SHADER_HH__

#define __SHADER_HH__


#include <cstdint>
#include <functional>
#include <map>
#include <string>
#include <tuple>
#include <unordered_map>
#include <vector>

#include "arch/gpu_isa.hh"
#include "base/statistics.hh"
#include "base/stats/group.hh"
#include "base/types.hh"
#include "cpu/simple/atomic.hh"
#include "cpu/simple/timing.hh"
#include "cpu/simple_thread.hh"
#include "cpu/thread_context.hh"
#include "cpu/thread_state.hh"
#include "dev/amdgpu/system_hub.hh"
#include "gpu-compute/compute_unit.hh"
#include "gpu-compute/gpu_dyn_inst.hh"
#include "gpu-compute/hsa_queue_entry.hh"
#include "gpu-compute/lds_state.hh"
#include "mem/page_table.hh"
#include "mem/port.hh"
#include "mem/request.hh"
#include "params/Shader.hh"
#include "sim/faults.hh"
#include "sim/process.hh"
#include "sim/sim_object.hh"


namespace gem5

{


// Forward declarations. GPUCommandProcessor and GPUDispatcher are only used
// by reference in this header, so their full definitions are not required
// here. BaseTLB is not referenced by any declaration visible in this header.
class BaseTLB;

class GPUCommandProcessor;

class GPUDispatcher;


// LDS size constant: 65536 (64 * 1024). Presumably a size in bytes -- the
// unit is not established by this header; confirm against the users.
static constexpr int LDS_SIZE = 64 * 1024;


/**
 * Aperture (APE) registers define the base/limit pair for the ATC mapped
 * memory space. Currently the only APEs we consider are for
 * GPUVM/LDS/scratch. The APEs are registered with unique values on a
 * per-device basis.
 *
 * Both fields default to zero so that an aperture which has not been
 * programmed yet never exposes indeterminate bounds.
 */
struct ApertureRegister
{
    // First address covered by the aperture.
    Addr base = 0;

    // Last address covered by the aperture. The Shader::is*Ape() range
    // checks compare with <=, i.e. they treat the limit as inclusive.
    Addr limit = 0;
};


// Class Shader: This describes a single shader instance. Most

// configurations will only have a single shader.


class Shader : public ClockedObject

{

  private:

    ApertureRegister _gpuVmApe;

    ApertureRegister _ldsApe;

    ApertureRegister _scratchApe;

    Addr shHiddenPrivateBaseVmid;


    // Hardware regs accessed by getreg/setreg instructions, set by queues

    std::unordered_map<int, uint32_t> hwRegs;


    // Number of active Cus attached to this shader

    int _activeCus;


    // Last tick that all CUs attached to this shader were inactive

    Tick _lastInactiveTick;


    // If a kernel-based exit event was requested, wait for all CUs in the

    // shader to complete before actually exiting so that stats are updated.

    bool kernelExitRequested = false;


    // Set to true by the dispatcher if the current kernel is a blit kernel

    bool blitKernel = false;


    // Number of pending non-instruction invalidates outstanding. The shader

    // should wait for these to be done to ensure correctness.

    int num_outstanding_invl2s = 0;

    std::vector<std::tuple<void *, uint32_t, Addr>> deferred_dispatches;


  public:

    typedef ShaderParams Params;

    enum hsail_mode_e {SIMT,VECTOR_SCALAR};


    GPUDispatcher &dispatcher();

    void sampleLoad(const Tick accessTime);

    void sampleStore(const Tick accessTime);

    void sampleInstRoundTrip(std::vector<Tick> roundTripTime);

    void sampleLineRoundTrip(const std::map<Addr,

        std::vector<Tick>> &roundTripTime);


    SimpleThread *cpuThread;

    ThreadContext *gpuTc;

    BaseCPU *cpuPointer;


    void


    setHwReg(int regIdx, uint32_t val)

    {

        hwRegs[regIdx] = val;

    }

    setHwReg(int regIdx, uint32_t val) {…}


    uint32_t


    getHwReg(int regIdx)

    {

        return hwRegs[regIdx];

    }

    getHwReg(int regIdx) {…}


    const ApertureRegister&


    gpuVmApe() const

    {

        return _gpuVmApe;

    }

    gpuVmApe() const {…}


    const ApertureRegister&


    ldsApe() const

    {

        return _ldsApe;

    }

    ldsApe() const {…}


    void


    setLdsApe(Addr base, Addr limit)

    {

        _ldsApe.base = base;

        _ldsApe.limit = limit;

    }

    setLdsApe(Addr base, Addr limit) {…}


    const ApertureRegister&


    scratchApe() const

    {

        return _scratchApe;

    }

    scratchApe() const {…}


    void


    setScratchApe(Addr base, Addr limit)

    {

        _scratchApe.base = base;

        _scratchApe.limit = limit;

    }

    setScratchApe(Addr base, Addr limit) {…}


    bool


    isGpuVmApe(Addr addr) const

    {

        bool is_gpu_vm = addr >= _gpuVmApe.base && addr <= _gpuVmApe.limit;


        return is_gpu_vm;

    }

    isGpuVmApe(Addr addr) const {…}


    bool


    isLdsApe(Addr addr) const

    {

        bool is_lds = addr >= _ldsApe.base && addr <= _ldsApe.limit;


        return is_lds;

    }

    isLdsApe(Addr addr) const {…}


    bool


    isScratchApe(Addr addr) const

    {

        bool is_scratch

            = addr >= _scratchApe.base && addr <= _scratchApe.limit;


        return is_scratch;

    }

    isScratchApe(Addr addr) const {…}


    Addr


    getScratchBase()

    {

        return _scratchApe.base;

    }

    getScratchBase() {…}


    Addr


    getHiddenPrivateBase()

    {

        return shHiddenPrivateBaseVmid;

    }

    getHiddenPrivateBase() {…}


    void


    initShHiddenPrivateBase(Addr queueBase, uint32_t offset)

    {

        Addr sh_hidden_base_new = queueBase - offset;


        // We are initializing sh_hidden_private_base_vmid from the

        // amd queue descriptor from the first queue.

        // The sh_hidden_private_base_vmid is supposed to be same for

        // all the queues from the same process

        if (shHiddenPrivateBaseVmid != sh_hidden_base_new) {

            // Do not panic if shHiddenPrivateBaseVmid == 0,

            // that is if it is uninitialized. Panic only

            // if the value is initilized and we get

            // a differnt base later.

            panic_if(shHiddenPrivateBaseVmid != 0,

                     "Currently we support only single process\n");

        }

        shHiddenPrivateBaseVmid = sh_hidden_base_new;

    }

    initShHiddenPrivateBase(Addr queueBase, uint32_t offset) {…}


    RequestorID vramRequestorId();


    EventFunctionWrapper tickEvent;


    // is this simulation going to be timing mode in the memory?

    bool timingSim;

    hsail_mode_e hsail_mode;


    // If set, issue acq packet @ kernel launch

    int impl_kern_launch_acq;

    // If set, issue rel packet @ kernel end

    int impl_kern_end_rel;

    // If set, fetch returns may be coissued with instructions

    int coissue_return;

    // If set, always dump all 64 gprs to trace

    int trace_vgpr_all;

    // Number of cu units in the shader

    int n_cu;

    // Number of wavefront slots per SIMD per CU

    int n_wf;

    //Number of cu units per sqc in the shader

    int n_cu_per_sqc;


    // The size of global memory

    int globalMemSize;


    // Tracks CU that rr dispatcher should attempt scheduling

    int nextSchedCu;


    // Size of scheduled add queue

    uint32_t sa_n;


    // Pointer to value to be increments

    std::vector<int*> sa_val;

    // When to do the increment

    std::vector<uint64_t> sa_when;

    // Amount to increment by

    std::vector<int32_t> sa_x;


    // List of Compute Units (CU's)

    std::vector<ComputeUnit*> cuList;


    GPUCommandProcessor &gpuCmdProc;

    GPUDispatcher &_dispatcher;

    AMDGPUSystemHub *systemHub;


    int64_t max_valu_insts;

    int64_t total_valu_insts;


    Shader(const Params &p);

    ~Shader();

    virtual void init();


    // Run shader scheduled adds

    void execScheduledAdds();


    // Schedule a 32-bit value to be incremented some time in the future

    void ScheduleAdd(int *val, Tick when, int x);

    bool processTimingPacket(PacketPtr pkt);


    void AccessMem(uint64_t address, void *ptr, uint32_t size, int cu_id,

                   MemCmd cmd, bool suppress_func_errors);


    void ReadMem(uint64_t address, void *ptr, uint32_t sz, int cu_id);


    void ReadMem(uint64_t address, void *ptr, uint32_t sz, int cu_id,

                 bool suppress_func_errors);


    void WriteMem(uint64_t address, void *ptr, uint32_t sz, int cu_id);


    void WriteMem(uint64_t address, void *ptr, uint32_t sz, int cu_id,

                  bool suppress_func_errors);


    void doFunctionalAccess(const RequestPtr &req, MemCmd cmd, void *data,

                            bool suppress_func_errors, int cu_id);


    void


    registerCU(int cu_id, ComputeUnit *compute_unit)

    {

        cuList[cu_id] = compute_unit;

    }

    registerCU(int cu_id, ComputeUnit *compute_unit) {…}


    void prepareInvalidate(HSAQueueEntry *task);

    void prepareFlush(GPUDynInstPtr gpuDynInst);


    bool dispatchWorkgroups(HSAQueueEntry *task);

    Addr mmap(int length);

    void functionalTLBAccess(PacketPtr pkt, int cu_id, BaseMMU::Mode mode);

    void updateContext(int cid);

    void notifyCuSleep();


    void


    incVectorInstSrcOperand(int num_operands)

    {

        stats.vectorInstSrcOperand[num_operands]++;

    }

    incVectorInstSrcOperand(int num_operands) {…}


    void


    incVectorInstDstOperand(int num_operands)

    {

        stats.vectorInstDstOperand[num_operands]++;

    }

    incVectorInstDstOperand(int num_operands) {…}


    void


    requestKernelExitEvent(bool is_blit_kernel)

    {

        kernelExitRequested = true;

        blitKernel = is_blit_kernel;

    }

    requestKernelExitEvent(bool is_blit_kernel) {…}


    void decNumOutstandingInvL2s();

    void incNumOutstandingInvL2s() { num_outstanding_invl2s++; };

    int getNumOutstandingInvL2s() const { return num_outstanding_invl2s; };


    void addDeferredDispatch(void *raw_pkt, uint32_t queue_id,

                             Addr host_pkt_addr);


  protected:


    struct ShaderStats : public statistics::Group

    {

        ShaderStats(statistics::Group *parent, int wf_size);


        // some stats for measuring latency

        statistics::Distribution allLatencyDist;

        statistics::Distribution loadLatencyDist;

        statistics::Distribution storeLatencyDist;


        // average ticks from vmem inst initiateAcc to coalescer issue,

        statistics::Distribution initToCoalesceLatency;


        // average ticks from coalescer issue to coalescer hit callback,

        statistics::Distribution rubyNetworkLatency;


        // average ticks from coalescer hit callback to GM pipe enqueue,

        statistics::Distribution gmEnqueueLatency;


        // average ticks spent in GM pipe's ordered resp buffer.

        statistics::Distribution gmToCompleteLatency;


        // average number of cache blocks requested by vmem inst

        statistics::Distribution coalsrLineAddresses;


        // average ticks for cache blocks to main memory for the Nth

        // cache block generated by a vmem inst.

        statistics::Distribution *cacheBlockRoundTrip;


        statistics::Scalar shaderActiveTicks;

        statistics::Vector vectorInstSrcOperand;

        statistics::Vector vectorInstDstOperand;

    } stats;

    struct ShaderStats : public statistics::Group {…};

};

class Shader : public ClockedObject {…};


} // namespace gem5


#endif // __SHADER_HH__

types.hh
Defines global host-dependent types: Counter, Tick, and (indirectly) {int,uint}{8,...

data
const char data[]
Definition circlebuf.test.cc:48

gem5::AMDGPUSystemHub
This class handles reads from the system/host memory space from the shader.
Definition system_hub.hh:51

gem5::BaseCPU
Definition base.hh:106

gem5::BaseMMU::Mode
Mode
Definition mmu.hh:56

gem5::ClockedObject
The ClockedObject class extends the SimObject with a clock and accessor functions to relate ticks to ...
Definition clocked_object.hh:235

gem5::ComputeUnit
Definition compute_unit.hh:203

gem5::EventFunctionWrapper
Definition eventq.hh:1137

gem5::GPUCommandProcessor
Definition gpu_command_processor.hh:72

gem5::GPUDispatcher
Definition dispatcher.hh:63

gem5::HSAQueueEntry
Definition hsa_queue_entry.hh:61

gem5::MemCmd
Definition packet.hh:77

gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e....
Definition packet.hh:295

gem5::Shader
Definition shader.hh:84

gem5::Shader::kernelExitRequested
bool kernelExitRequested
Definition shader.hh:102

gem5::Shader::timingSim
bool timingSim
Definition shader.hh:233

gem5::Shader::mmap
Addr mmap(int length)
Definition shader.cc:117

gem5::Shader::prepareInvalidate
void prepareInvalidate(HSAQueueEntry *task)
Definition shader.cc:203

gem5::Shader::AccessMem
void AccessMem(uint64_t address, void *ptr, uint32_t size, int cu_id, MemCmd cmd, bool suppress_func_errors)
Definition shader.cc:399

gem5::Shader::blitKernel
bool blitKernel
Definition shader.hh:105

gem5::Shader::notifyCuSleep
void notifyCuSleep()
Definition shader.cc:540

gem5::Shader::setLdsApe
void setLdsApe(Addr base, Addr limit)
Definition shader.hh:152

gem5::Shader::doFunctionalAccess
void doFunctionalAccess(const RequestPtr &req, MemCmd cmd, void *data, bool suppress_func_errors, int cu_id)
Definition shader.cc:307

gem5::Shader::execScheduledAdds
void execScheduledAdds()
Definition shader.cc:173

gem5::Shader::total_valu_insts
int64_t total_valu_insts
Definition shader.hh:275

gem5::Shader::_scratchApe
ApertureRegister _scratchApe
Definition shader.hh:88

gem5::Shader::hsail_mode_e
hsail_mode_e
Definition shader.hh:114

gem5::Shader::VECTOR_SCALAR
@ VECTOR_SCALAR
Definition shader.hh:114

gem5::Shader::SIMT
@ SIMT
Definition shader.hh:114

gem5::Shader::setScratchApe
void setScratchApe(Addr base, Addr limit)
Definition shader.hh:165

gem5::Shader::hsail_mode
hsail_mode_e hsail_mode
Definition shader.hh:234

gem5::Shader::tickEvent
EventFunctionWrapper tickEvent
Definition shader.hh:230

gem5::Shader::hwRegs
std::unordered_map< int, uint32_t > hwRegs
Definition shader.hh:92

gem5::Shader::cuList
std::vector< ComputeUnit * > cuList
Definition shader.hh:268

gem5::Shader::_ldsApe
ApertureRegister _ldsApe
Definition shader.hh:87

gem5::Shader::_gpuVmApe
ApertureRegister _gpuVmApe
Definition shader.hh:86

gem5::Shader::scratchApe
const ApertureRegister & scratchApe() const
Definition shader.hh:159

gem5::Shader::addDeferredDispatch
void addDeferredDispatch(void *raw_pkt, uint32_t queue_id, Addr host_pkt_addr)
Definition shader.cc:575

gem5::Shader::nextSchedCu
int nextSchedCu
Definition shader.hh:255

gem5::Shader::incNumOutstandingInvL2s
void incNumOutstandingInvL2s()
Definition shader.hh:339

gem5::Shader::registerCU
void registerCU(int cu_id, ComputeUnit *compute_unit)
Definition shader.hh:305

gem5::Shader::ScheduleAdd
void ScheduleAdd(int *val, Tick when, int x)
Definition shader.cc:380

gem5::Shader::_dispatcher
GPUDispatcher & _dispatcher
Definition shader.hh:271

gem5::Shader::sa_n
uint32_t sa_n
Definition shader.hh:258

gem5::Shader::trace_vgpr_all
int trace_vgpr_all
Definition shader.hh:243

gem5::Shader::Params
ShaderParams Params
Definition shader.hh:113

gem5::Shader::sampleLineRoundTrip
void sampleLineRoundTrip(const std::map< Addr, std::vector< Tick > > &roundTripTime)
Definition shader.cc:511

gem5::Shader::sa_when
std::vector< uint64_t > sa_when
Definition shader.hh:263

gem5::Shader::processTimingPacket
bool processTimingPacket(PacketPtr pkt)

gem5::Shader::getNumOutstandingInvL2s
int getNumOutstandingInvL2s() const
Definition shader.hh:340

gem5::Shader::init
virtual void init()
init() is called after all C++ SimObjects have been created and all ports are connected.
Definition shader.cc:150

gem5::Shader::isScratchApe
bool isScratchApe(Addr addr) const
Definition shader.hh:188

gem5::Shader::coissue_return
int coissue_return
Definition shader.hh:241

gem5::Shader::sa_x
std::vector< int32_t > sa_x
Definition shader.hh:265

gem5::Shader::ReadMem
void ReadMem(uint64_t address, void *ptr, uint32_t sz, int cu_id)
Definition shader.cc:417

gem5::Shader::stats
gem5::Shader::ShaderStats stats

gem5::Shader::ldsApe
const ApertureRegister & ldsApe() const
Definition shader.hh:146

gem5::Shader::deferred_dispatches
std::vector< std::tuple< void *, uint32_t, Addr > > deferred_dispatches
Definition shader.hh:110

gem5::Shader::isLdsApe
bool isLdsApe(Addr addr) const
Definition shader.hh:180

gem5::Shader::gpuTc
ThreadContext * gpuTc
Definition shader.hh:124

gem5::Shader::n_wf
int n_wf
Definition shader.hh:247

gem5::Shader::isGpuVmApe
bool isGpuVmApe(Addr addr) const
Definition shader.hh:172

gem5::Shader::dispatchWorkgroups
bool dispatchWorkgroups(HSAQueueEntry *task)
Definition shader.cc:258

gem5::Shader::dispatcher
GPUDispatcher & dispatcher()
Definition shader.cc:111

gem5::Shader::getScratchBase
Addr getScratchBase()
Definition shader.hh:197

gem5::Shader::decNumOutstandingInvL2s
void decNumOutstandingInvL2s()
Definition shader.cc:560

gem5::Shader::initShHiddenPrivateBase
void initShHiddenPrivateBase(Addr queueBase, uint32_t offset)
Definition shader.hh:209

gem5::Shader::impl_kern_launch_acq
int impl_kern_launch_acq
Definition shader.hh:237

gem5::Shader::incVectorInstDstOperand
void incVectorInstDstOperand(int num_operands)
Definition shader.hh:326

gem5::Shader::vramRequestorId
RequestorID vramRequestorId()
Forward the VRAM requestor ID needed for device memory from CP.
Definition shader.cc:586

gem5::Shader::systemHub
AMDGPUSystemHub * systemHub
Definition shader.hh:272

gem5::Shader::setHwReg
void setHwReg(int regIdx, uint32_t val)
Definition shader.hh:128

gem5::Shader::cpuThread
SimpleThread * cpuThread
Definition shader.hh:123

gem5::Shader::updateContext
void updateContext(int cid)
Definition shader.cc:165

gem5::Shader::n_cu_per_sqc
int n_cu_per_sqc
Definition shader.hh:249

gem5::Shader::max_valu_insts
int64_t max_valu_insts
Definition shader.hh:274

gem5::Shader::WriteMem
void WriteMem(uint64_t address, void *ptr, uint32_t sz, int cu_id)
Definition shader.cc:431

gem5::Shader::globalMemSize
int globalMemSize
Definition shader.hh:252

gem5::Shader::requestKernelExitEvent
void requestKernelExitEvent(bool is_blit_kernel)
Definition shader.hh:332

gem5::Shader::impl_kern_end_rel
int impl_kern_end_rel
Definition shader.hh:239

gem5::Shader::getHwReg
uint32_t getHwReg(int regIdx)
Definition shader.hh:134

gem5::Shader::prepareFlush
void prepareFlush(GPUDynInstPtr gpuDynInst)
dispatcher/shader arranges flush requests to the CUs
Definition shader.cc:245

gem5::Shader::sampleInstRoundTrip
void sampleInstRoundTrip(std::vector< Tick > roundTripTime)
Definition shader.cc:491

gem5::Shader::sampleLoad
void sampleLoad(const Tick accessTime)
Definition shader.cc:484

gem5::Shader::~Shader
~Shader()
Definition shader.cc:158

gem5::Shader::gpuVmApe
const ApertureRegister & gpuVmApe() const
Definition shader.hh:140

gem5::Shader::incVectorInstSrcOperand
void incVectorInstSrcOperand(int num_operands)
Definition shader.hh:320

gem5::Shader::functionalTLBAccess
void functionalTLBAccess(PacketPtr pkt, int cu_id, BaseMMU::Mode mode)
Definition shader.cc:450

gem5::Shader::num_outstanding_invl2s
int num_outstanding_invl2s
Definition shader.hh:109

gem5::Shader::sampleStore
void sampleStore(const Tick accessTime)
Definition shader.cc:474

gem5::Shader::cpuPointer
BaseCPU * cpuPointer
Definition shader.hh:125

gem5::Shader::gpuCmdProc
GPUCommandProcessor & gpuCmdProc
Definition shader.hh:270

gem5::Shader::n_cu
int n_cu
Definition shader.hh:245

gem5::Shader::shHiddenPrivateBaseVmid
Addr shHiddenPrivateBaseVmid
Definition shader.hh:89

gem5::Shader::_lastInactiveTick
Tick _lastInactiveTick
Definition shader.hh:98

gem5::Shader::sa_val
std::vector< int * > sa_val
Definition shader.hh:261

gem5::Shader::getHiddenPrivateBase
Addr getHiddenPrivateBase()
Definition shader.hh:203

gem5::Shader::_activeCus
int _activeCus
Definition shader.hh:95

gem5::SimpleThread
The SimpleThread object provides a combination of the ThreadState object and the ThreadContext interf...
Definition simple_thread.hh:94

gem5::ThreadContext
ThreadContext is the external interface to all thread state for anything outside of the CPU.
Definition thread_context.hh:89

gem5::statistics::Distribution
A simple distribution stat.
Definition statistics.hh:2084

gem5::statistics::Group
Statistics container.
Definition group.hh:93

gem5::statistics::Scalar
This is a simple scalar statistic, like a counter.
Definition statistics.hh:1930

gem5::statistics::Vector
A vector of scalar stats.
Definition statistics.hh:2006

std::vector
STL vector class.
Definition stl.hh:37

compute_unit.hh

atomic.hh

timing.hh

thread_context.hh

gpu_dyn_inst.hh

group.hh

panic_if
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
Definition logging.hh:214

hsa_queue_entry.hh
HSAQueueEntry is the simulator's internal representation of an AQL queue entry (task).

lds_state.hh

port.hh
Port Object Declaration.

gem5::ArmISA::mode
Bitfield< 4, 0 > mode
Definition misc_types.hh:74

gem5::ArmISA::offset
Bitfield< 23, 0 > offset
Definition types.hh:144

gem5::MipsISA::p
Bitfield< 0 > p
Definition pra_constants.hh:326

gem5::RiscvISA::x
Bitfield< 3 > x
Definition pagetable.hh:74

gem5::X86ISA::base
Bitfield< 51, 12 > base
Definition pagetable.hh:141

gem5::X86ISA::val
Bitfield< 63 > val
Definition misc.hh:804

gem5::X86ISA::limit
BitfieldType< SegDescriptorLimit > limit
Definition misc.hh:959

gem5::X86ISA::addr
Bitfield< 3 > addr
Definition types.hh:84

gem5
Copyright (c) 2024 Arm Limited All rights reserved.
Definition binary32.hh:36

gem5::RequestPtr
std::shared_ptr< Request > RequestPtr
Definition request.hh:94

gem5::GPUDynInstPtr
std::shared_ptr< GPUDynInst > GPUDynInstPtr
Definition misc.hh:49

gem5::Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition types.hh:147

gem5::Tick
uint64_t Tick
Tick count type.
Definition types.hh:58

gem5::RequestorID
uint16_t RequestorID
Definition request.hh:95

gem5::LDS_SIZE
static const int LDS_SIZE
Definition shader.hh:67

page_table.hh
Declarations of a non-full system Page Table.

request.hh
Declaration of a request, the overall memory request consisting of the parts of the request that are ...

faults.hh

process.hh

sim_object.hh

simple_thread.hh

statistics.hh
Declaration of Statistics objects.

gem5::ApertureRegister
Definition shader.hh:75

gem5::ApertureRegister::base
Addr base
Definition shader.hh:76

gem5::ApertureRegister::limit
Addr limit
Definition shader.hh:77

gem5::Shader::ShaderStats
Definition shader.hh:347

gem5::Shader::ShaderStats::vectorInstSrcOperand
statistics::Vector vectorInstSrcOperand
Definition shader.hh:375

gem5::Shader::ShaderStats::storeLatencyDist
statistics::Distribution storeLatencyDist
Definition shader.hh:353

gem5::Shader::ShaderStats::initToCoalesceLatency
statistics::Distribution initToCoalesceLatency
Definition shader.hh:356

gem5::Shader::ShaderStats::shaderActiveTicks
statistics::Scalar shaderActiveTicks
Definition shader.hh:374

gem5::Shader::ShaderStats::loadLatencyDist
statistics::Distribution loadLatencyDist
Definition shader.hh:352

gem5::Shader::ShaderStats::allLatencyDist
statistics::Distribution allLatencyDist
Definition shader.hh:351

gem5::Shader::ShaderStats::gmToCompleteLatency
statistics::Distribution gmToCompleteLatency
Definition shader.hh:365

gem5::Shader::ShaderStats::coalsrLineAddresses
statistics::Distribution coalsrLineAddresses
Definition shader.hh:368

gem5::Shader::ShaderStats::vectorInstDstOperand
statistics::Vector vectorInstDstOperand
Definition shader.hh:376

gem5::Shader::ShaderStats::rubyNetworkLatency
statistics::Distribution rubyNetworkLatency
Definition shader.hh:359

gem5::Shader::ShaderStats::cacheBlockRoundTrip
statistics::Distribution * cacheBlockRoundTrip
Definition shader.hh:372

gem5::Shader::ShaderStats::gmEnqueueLatency
statistics::Distribution gmEnqueueLatency
Definition shader.hh:362

system_hub.hh

thread_state.hh