release/current/fetch__unit_8hh_source.html

/*

 * Copyright (c) 2014-2017 Advanced Micro Devices, Inc.

 * All rights reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions are met:

 *

 * 1. Redistributions of source code must retain the above copyright notice,

 * this list of conditions and the following disclaimer.

 *

 * 2. Redistributions in binary form must reproduce the above copyright notice,

 * this list of conditions and the following disclaimer in the documentation

 * and/or other materials provided with the distribution.

 *

 * 3. Neither the name of the copyright holder nor the names of its

 * contributors may be used to endorse or promote products derived from this

 * software without specific prior written permission.

 *

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"

 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE

 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE

 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR

 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF

 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS

 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN

 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)

 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE

 * POSSIBILITY OF SUCH DAMAGE.

 */


#ifndef __FETCH_UNIT_HH__

#define __FETCH_UNIT_HH__


#include <cassert>

#include <cstdint>

#include <deque>

#include <map>

#include <utility>

#include <vector>


#include "arch/gpu_decoder.hh"

#include "base/types.hh"

#include "config/the_gpu_isa.hh"

#include "gpu-compute/scheduler.hh"

#include "mem/packet.hh"

#include "sim/eventq.hh"


namespace gem5

{


class ComputeUnit;

class Wavefront;


class FetchUnit

{

  public:

    FetchUnit(const ComputeUnitParams &p, ComputeUnit &cu);

    ~FetchUnit();

    void init();

    void exec();

    void bindWaveList(std::vector<Wavefront*> *list);

    void initiateFetch(Wavefront *wavefront);

    void fetch(PacketPtr pkt, Wavefront *wavefront);

    void processFetchReturn(PacketPtr pkt);

    void flushBuf(int wfSlotId);

    static uint32_t globalFetchUnitID;


  private:


    class FetchBufDesc

    {

      public:


        FetchBufDesc() : bufStart(nullptr), bufEnd(nullptr),

            readPtr(nullptr), fetchDepth(0), maxIbSize(0), maxFbSize(0),

            cacheLineSize(0), restartFromBranch(false), wavefront(nullptr),

            _decoder(nullptr)

        {

        }


        ~FetchBufDesc()

        {

            delete[] bufStart;

        }


        void allocateBuf(int fetch_depth, int cache_line_size, Wavefront *wf);


        int


        bufferedAndReservedLines() const

        {

            return bufferedLines() + reservedLines();

        }


        int bufferedLines() const { return bufferedPCs.size(); }

        int bufferedBytes() const { return bufferedLines() * cacheLineSize; }

        int reservedLines() const { return reservedPCs.size(); }

        bool hasFreeSpace() const { return !freeList.empty(); }

        void flushBuf();

        Addr nextFetchAddr();


        void reserveBuf(Addr vaddr);


        uint8_t*


        reservedBuf(Addr vaddr) const

        {

            auto reserved_pc = reservedPCs.find(vaddr);

            assert(reserved_pc != reservedPCs.end());

            assert(reserved_pc == reservedPCs.begin());


            return reserved_pc->second;

        }


        bool


        isReserved(Addr vaddr) const

        {

            auto reserved_pc = reservedPCs.find(vaddr);

            bool is_reserved = (reserved_pc != reservedPCs.end());

            return is_reserved;

        }


        void fetchDone(PacketPtr ptr);


        bool hasFetchDataToProcess() const;


        void decodeInsts();


        void checkWaveReleaseBuf();


        void


        decoder(TheGpuISA::Decoder *dec)

        {

            _decoder = dec;

        }


        bool


        pcBuffered(Addr pc) const

        {

            bool buffered = bufferedPCs.find(pc) != bufferedPCs.end()

                            && reservedPCs.find(pc) != reservedPCs.end();


            return buffered;

        }


        int fetchBytesRemaining() const;


      private:

        void decodeSplitInst();


        bool splitDecode() const;


        std::map<Addr, uint8_t*> bufferedPCs;

        std::map<Addr, uint8_t*> reservedPCs;


        std::deque<uint8_t*> freeList;


        uint8_t *bufStart;

        uint8_t *bufEnd;

        uint8_t *readPtr;

        // how many lines the fetch unit may buffer

        int fetchDepth;

        // maximum size (in number of insts) of the WF's IB

        int maxIbSize;

        // maximum size (in bytes) of this fetch buffer

        int maxFbSize;

        int cacheLineSize;

        int cacheLineBits;

        bool restartFromBranch;

        // wavefront whose IB is serviced by this fetch buffer

        Wavefront *wavefront;

        TheGpuISA::Decoder *_decoder;

    };


    class SystemHubEvent : public Event

    {

      FetchUnit *fetchUnit;

      PacketPtr reqPkt;


      public:


        SystemHubEvent(PacketPtr pkt, FetchUnit *fetch_unit)

            : fetchUnit(fetch_unit), reqPkt(pkt)

        {

            setFlags(Event::AutoDelete);

        }


        void process();

    };


    bool timingSim;

    ComputeUnit &computeUnit;

    TheGpuISA::Decoder decoder;


    // Fetch scheduler; Selects one wave from

    // the fetch queue for instruction fetching.

    // The selection is made according to

    // a scheduling policy

    Scheduler fetchScheduler;


    // Stores the list of waves that are

    // ready to be fetched this cycle

    std::vector<Wavefront*> fetchQueue;


    // Stores the fetch status of all waves dispatched to this SIMD.

    // TRUE implies the wave is ready to fetch and is already

    // moved to fetchQueue

    std::vector<std::pair<Wavefront*, bool>> fetchStatusQueue;


    // Pointer to list of waves dispatched on to this SIMD unit

    std::vector<Wavefront*> *waveList;

    // holds the fetch buffers. each wave has 1 entry.

    std::vector<FetchBufDesc> fetchBuf;

    int fetchDepth;

};


} // namespace gem5


#endif // __FETCH_UNIT_HH__

types.hh
Defines global host-dependent types: Counter, Tick, and (indirectly) {int,uint}{8,16,32,64}_t.

gem5::ComputeUnit
Definition compute_unit.hh:203

gem5::EventBase::AutoDelete
static const FlagsType AutoDelete
Definition eventq.hh:110

gem5::Event
Definition eventq.hh:255

gem5::Event::setFlags
void setFlags(Flags _flags)
Definition eventq.hh:331

gem5::FetchUnit::FetchBufDesc
fetch buffer descriptor.
Definition fetch_unit.hh:75

gem5::FetchUnit::FetchBufDesc::nextFetchAddr
Addr nextFetchAddr()
Definition fetch_unit.cc:392

gem5::FetchUnit::FetchBufDesc::FetchBufDesc
FetchBufDesc()
Definition fetch_unit.hh:77

gem5::FetchUnit::FetchBufDesc::reservedLines
int reservedLines() const
Definition fetch_unit.hh:104

gem5::FetchUnit::FetchBufDesc::reservedPCs
std::map< Addr, uint8_t * > reservedPCs
Definition fetch_unit.hh:205

gem5::FetchUnit::FetchBufDesc::decodeSplitInst
void decodeSplitInst()
Definition fetch_unit.cc:613

gem5::FetchUnit::FetchBufDesc::reserveBuf
void reserveBuf(Addr vaddr)
reserve an entry in the fetch buffer for PC = vaddr,
Definition fetch_unit.cc:447

gem5::FetchUnit::FetchBufDesc::decoder
void decoder(TheGpuISA::Decoder *dec)
Definition fetch_unit.hh:168

gem5::FetchUnit::FetchBufDesc::flushBuf
void flushBuf()
Definition fetch_unit.cc:370

gem5::FetchUnit::FetchBufDesc::readPtr
uint8_t * readPtr
pointer that points to the next chunk of inst data to be decoded.
Definition fetch_unit.hh:227

gem5::FetchUnit::FetchBufDesc::fetchBytesRemaining
int fetchBytesRemaining() const
calculates the number of fetched bytes that have yet to be decoded.
Definition fetch_unit.cc:663

gem5::FetchUnit::FetchBufDesc::checkWaveReleaseBuf
void checkWaveReleaseBuf()
checks if the wavefront can release any of its fetch buffer entries.
Definition fetch_unit.cc:518

gem5::FetchUnit::FetchBufDesc::hasFetchDataToProcess
bool hasFetchDataToProcess() const
checks if the buffer contains valid data.
Definition fetch_unit.cc:512

gem5::FetchUnit::FetchBufDesc::bufEnd
uint8_t * bufEnd
Definition fetch_unit.hh:222

gem5::FetchUnit::FetchBufDesc::bufferedPCs
std::map< Addr, uint8_t * > bufferedPCs
the set of PCs (fetch addresses) that are currently buffered.
Definition fetch_unit.hh:204

gem5::FetchUnit::FetchBufDesc::bufferedAndReservedLines
int bufferedAndReservedLines() const
Definition fetch_unit.hh:97

gem5::FetchUnit::FetchBufDesc::fetchDepth
int fetchDepth
Definition fetch_unit.hh:229

gem5::FetchUnit::FetchBufDesc::isReserved
bool isReserved(Addr vaddr) const
returns true if there is an entry reserved for this address, and false otherwise
Definition fetch_unit.hh:134

gem5::FetchUnit::FetchBufDesc::allocateBuf
void allocateBuf(int fetch_depth, int cache_line_size, Wavefront *wf)
allocate the fetch buffer space, and set the fetch depth (number of lines that may be buffered), fetch size (cache line size) and parent WF for this fetch buffer.
Definition fetch_unit.cc:346

gem5::FetchUnit::FetchBufDesc::wavefront
Wavefront * wavefront
Definition fetch_unit.hh:238

gem5::FetchUnit::FetchBufDesc::bufferedLines
int bufferedLines() const
Definition fetch_unit.hh:102

gem5::FetchUnit::FetchBufDesc::restartFromBranch
bool restartFromBranch
Definition fetch_unit.hh:236

gem5::FetchUnit::FetchBufDesc::maxIbSize
int maxIbSize
Definition fetch_unit.hh:231

gem5::FetchUnit::FetchBufDesc::~FetchBufDesc
~FetchBufDesc()
Definition fetch_unit.hh:84

gem5::FetchUnit::FetchBufDesc::maxFbSize
int maxFbSize
Definition fetch_unit.hh:233

gem5::FetchUnit::FetchBufDesc::hasFreeSpace
bool hasFreeSpace() const
Definition fetch_unit.hh:105

gem5::FetchUnit::FetchBufDesc::fetchDone
void fetchDone(PacketPtr ptr)
Definition fetch_unit.cc:472

gem5::FetchUnit::FetchBufDesc::reservedBuf
uint8_t * reservedBuf(Addr vaddr) const
return a pointer to the raw fetch buffer data.
Definition fetch_unit.hh:120

gem5::FetchUnit::FetchBufDesc::pcBuffered
bool pcBuffered(Addr pc) const
Definition fetch_unit.hh:174

gem5::FetchUnit::FetchBufDesc::cacheLineSize
int cacheLineSize
Definition fetch_unit.hh:234

gem5::FetchUnit::FetchBufDesc::splitDecode
bool splitDecode() const
check if the next instruction to be processed out of the fetch buffer is split across the end/beginning of the fetch buffer.
Definition fetch_unit.cc:651

gem5::FetchUnit::FetchBufDesc::decodeInsts
void decodeInsts()
each time the fetch stage is ticked, we check if there are any data in the fetch buffer that may be decoded and sent to the IB.
Definition fetch_unit.cc:575

gem5::FetchUnit::FetchBufDesc::bufStart
uint8_t * bufStart
raw instruction buffer.
Definition fetch_unit.hh:221

gem5::FetchUnit::FetchBufDesc::cacheLineBits
int cacheLineBits
Definition fetch_unit.hh:235

gem5::FetchUnit::FetchBufDesc::_decoder
TheGpuISA::Decoder * _decoder
Definition fetch_unit.hh:239

gem5::FetchUnit::FetchBufDesc::bufferedBytes
int bufferedBytes() const
Definition fetch_unit.hh:103

gem5::FetchUnit::FetchBufDesc::freeList
std::deque< uint8_t * > freeList
represents the fetch buffer free list.
Definition fetch_unit.hh:215

gem5::FetchUnit::SystemHubEvent
Definition fetch_unit.hh:243

gem5::FetchUnit::SystemHubEvent::process
void process()
Definition fetch_unit.cc:684

gem5::FetchUnit::SystemHubEvent::SystemHubEvent
SystemHubEvent(PacketPtr pkt, FetchUnit *fetch_unit)
Definition fetch_unit.hh:248

gem5::FetchUnit::SystemHubEvent::reqPkt
PacketPtr reqPkt
Definition fetch_unit.hh:245

gem5::FetchUnit::SystemHubEvent::fetchUnit
FetchUnit * fetchUnit
Definition fetch_unit.hh:244

gem5::FetchUnit
Definition fetch_unit.hh:56

gem5::FetchUnit::init
void init()
Definition fetch_unit.cc:65

gem5::FetchUnit::globalFetchUnitID
static uint32_t globalFetchUnitID
Definition fetch_unit.hh:67

gem5::FetchUnit::~FetchUnit
~FetchUnit()
Definition fetch_unit.cc:58

gem5::FetchUnit::fetchScheduler
Scheduler fetchScheduler
Definition fetch_unit.hh:265

gem5::FetchUnit::waveList
std::vector< Wavefront * > * waveList
Definition fetch_unit.hh:277

gem5::FetchUnit::bindWaveList
void bindWaveList(std::vector< Wavefront * > *list)
Definition fetch_unit.cc:339

gem5::FetchUnit::FetchUnit
FetchUnit(const ComputeUnitParams &p, ComputeUnit &cu)
Definition fetch_unit.cc:52

gem5::FetchUnit::fetch
void fetch(PacketPtr pkt, Wavefront *wavefront)
Definition fetch_unit.cc:230

gem5::FetchUnit::fetchQueue
std::vector< Wavefront * > fetchQueue
Definition fetch_unit.hh:269

gem5::FetchUnit::timingSim
bool timingSim
Definition fetch_unit.hh:257

gem5::FetchUnit::initiateFetch
void initiateFetch(Wavefront *wavefront)
Definition fetch_unit.cc:136

gem5::FetchUnit::exec
void exec()
Definition fetch_unit.cc:84

gem5::FetchUnit::fetchDepth
int fetchDepth
number of cache lines we can fetch and buffer.
Definition fetch_unit.hh:286

gem5::FetchUnit::decoder
TheGpuISA::Decoder decoder
Definition fetch_unit.hh:259

gem5::FetchUnit::computeUnit
ComputeUnit & computeUnit
Definition fetch_unit.hh:258

gem5::FetchUnit::processFetchReturn
void processFetchReturn(PacketPtr pkt)
Definition fetch_unit.cc:307

gem5::FetchUnit::fetchBuf
std::vector< FetchBufDesc > fetchBuf
Definition fetch_unit.hh:279

gem5::FetchUnit::flushBuf
void flushBuf(int wfSlotId)
Definition fetch_unit.cc:333

gem5::FetchUnit::fetchStatusQueue
std::vector< std::pair< Wavefront *, bool > > fetchStatusQueue
Definition fetch_unit.hh:274

gem5::Packet
A Packet is used to encapsulate a transfer between two objects in the memory system (e.g., the L1 and L2 cache).
Definition packet.hh:295

gem5::Scheduler
Definition scheduler.hh:45

gem5::Wavefront
Definition wavefront.hh:61

std::deque
STL deque class.
Definition stl.hh:44

std::vector
STL vector class.
Definition stl.hh:37

eventq.hh

scheduler.hh

gem5::MipsISA::pc
Bitfield< 4 > pc
Definition pra_constants.hh:243

gem5::MipsISA::vaddr
vaddr
Definition pra_constants.hh:278

gem5::MipsISA::p
Bitfield< 0 > p
Definition pra_constants.hh:326

gem5
Copyright (c) 2024 - Pranith Kumar Copyright (c) 2020 Inria All rights reserved.
Definition binary32.hh:36

gem5::Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition types.hh:147

packet.hh
Declaration of the Packet class.