gem5  v21.0.0.0
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
hsa_driver.cc
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2015-2018 Advanced Micro Devices, Inc.
3  * All rights reserved.
4  *
5  * For use for simulation and test purposes only
6  *
7  * Redistribution and use in source and binary forms, with or without
8  * modification, are permitted provided that the following conditions are met:
9  *
10  * 1. Redistributions of source code must retain the above copyright notice,
11  * this list of conditions and the following disclaimer.
12  *
13  * 2. Redistributions in binary form must reproduce the above copyright notice,
14  * this list of conditions and the following disclaimer in the documentation
15  * and/or other materials provided with the distribution.
16  *
17  * 3. Neither the name of the copyright holder nor the names of its
18  * contributors may be used to endorse or promote products derived from this
19  * software without specific prior written permission.
20  *
21  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31  * POSSIBILITY OF SUCH DAMAGE.
32  */
33 
34 #include "dev/hsa/hsa_driver.hh"
35 
36 #include "cpu/thread_context.hh"
37 #include "debug/HSADriver.hh"
38 #include "dev/hsa/hsa_device.hh"
41 #include "dev/hsa/kfd_ioctl.h"
42 #include "params/HSADriver.hh"
43 #include "sim/process.hh"
44 #include "sim/proxy_ptr.hh"
45 #include "sim/syscall_emul_buf.hh"
46 
47 HSADriver::HSADriver(const HSADriverParams &p)
48  : EmulatedDriver(p), device(p.device), queueId(0)
49 {
50 }
51 
55 int
56 HSADriver::open(ThreadContext *tc, int mode, int flags)
57 {
58  DPRINTF(HSADriver, "Opened %s\n", filename);
59  auto process = tc->getProcessPtr();
60  auto device_fd_entry = std::make_shared<DeviceFDEntry>(this, filename);
61  int tgt_fd = process->fds->allocFD(device_fd_entry);
62  return tgt_fd;
63 }
64 
69 Addr
70 HSADriver::mmap(ThreadContext *tc, Addr start, uint64_t length, int prot,
71  int tgt_flags, int tgt_fd, off_t offset)
72 {
73  // Is this a signal event mmap
74  bool is_event_mmap = false;
75  // If addr == 0, then we may need to do mmap.
76  bool should_mmap = (start == 0);
77  auto process = tc->getProcessPtr();
78  auto mem_state = process->memState;
79  // Check if mmap is for signal events first
80  if (((offset >> PAGE_SHIFT) & KFD_MMAP_TYPE_MASK) ==
82  is_event_mmap = true;
83  DPRINTF(HSADriver, "amdkfd mmap for events(start: %p, length: 0x%x,"
84  "offset: 0x%x, )\n", start, length, offset);
85  panic_if(start != 0,
86  "Start address should be provided by KFD\n");
87  panic_if(length != 8 * KFD_SIGNAL_EVENT_LIMIT,
88  "Requested length %d, expected length %d; length mismatch\n",
89  length, 8 * KFD_SIGNAL_EVENT_LIMIT);
90  // For signal event, do mmap only is eventPage is uninitialized
91  should_mmap = (!eventPage);
92  } else {
93  DPRINTF(HSADriver, "amdkfd doorbell mmap (start: %p, length: 0x%x,"
94  "offset: 0x%x)\n", start, length, offset);
95  }
96 
97  // Extend global mmap region if necessary.
98  if (should_mmap) {
99  // Assume mmap grows down, as in x86 Linux
100  start = mem_state->getMmapEnd() - length;
101  mem_state->setMmapEnd(start);
102  }
103 
104  if (is_event_mmap) {
105  if (should_mmap) {
106  eventPage = start;
107  }
108  } else {
109  // Now map this virtual address to our PIO doorbell interface
110  // in the page tables (non-cacheable)
111  process->pTable->map(start, device->hsaPacketProc().pioAddr,
112  length, false);
113 
114  DPRINTF(HSADriver, "amdkfd doorbell mapped to %xp\n", start);
115  }
116 
117  return start;
118 }
119 
127 void
129 {
130  VPtr<kfd_ioctl_create_queue_args> args(ioc_buf, tc);
131 
132  if (queueId >= 0x1000) {
133  fatal("%s: Exceeded maximum number of HSA queues allowed\n", name());
134  }
135 
136  args->queue_id = queueId++;
137  auto &hsa_pp = device->hsaPacketProc();
139  args->ring_base_address, args->queue_id,
140  args->ring_size);
141 }
142 
143 const char*
145 {
146  return "DriverWakeupEvent";
147 }
148 
149 void
151 {
152  assert(driver);
153  driver->schedule(this, curTick() + wakeup_delay);
154 }
155 
156 void
158 {
159  panic_if(event_id >= eventSlotIndex,
160  "Trying wakeup on an event that is not yet created\n");
161  if (ETable[event_id].threadWaiting) {
162  panic_if(!ETable[event_id].tc,
163  "No thread context to wake up\n");
164  ThreadContext *tc = ETable[event_id].tc;
166  "Signal event: Waking up CPU %d\n", tc->cpuId());
167  // Wake up this thread
168  tc->activate();
169  // Remove events that can wake up this thread
170  TCEvents[tc].clearEvents();
171  } else {
172  // This may be a race condition between an ioctl call asking to wait on
173  // this event and this signalWakeupEvent. Taking care of this race
174  // condition here by setting the event here. The ioctl call should take
175  // the necessary action when waiting on an already set event. However,
176  // this may be a genuine instance in which the runtime has decided not
177  // to wait on this event. But since we cannot distinguish this case with
178  // the race condition, we are any way setting the event.
179  ETable[event_id].setEvent = true;
180  }
181 }
182 
183 void
185 {
187  "Timer event: Waking up CPU %d\n", tc->cpuId());
188  // Wake up this thread
189  tc->activate();
190  // Remove events that can wake up this thread
191  driver->TCEvents[tc].clearEvents();
192 }
fatal
#define fatal(...)
This implements a cprintf based fatal() function.
Definition: logging.hh:183
KFD_SIGNAL_EVENT_LIMIT
#define KFD_SIGNAL_EVENT_LIMIT
Definition: kfd_ioctl.h:210
kfd_ioctl_create_queue_args::read_pointer_address
uint64_t read_pointer_address
Definition: kfd_ioctl.h:48
ThreadContext::activate
virtual void activate()=0
Set the status to Active.
HSADriver::DriverWakeupEvent::process
void process() override
Definition: hsa_driver.cc:184
hsa_packet_processor.hh
hsa_driver.hh
EmulatedDriver::filename
const std::string & filename
filename for opening this driver (under /dev)
Definition: emul_driver.hh:58
ProxyPtr
Definition: proxy_ptr.hh:235
Tick
uint64_t Tick
Tick count type.
Definition: types.hh:59
HSADriver::DriverWakeupEvent::scheduleWakeup
void scheduleWakeup(Tick wakeup_delay)
Definition: hsa_driver.cc:150
proxy_ptr.hh
ThreadContext::getProcessPtr
virtual Process * getProcessPtr()=0
syscall_emul_buf.hh
HSADriver::HSADriver
HSADriver(const HSADriverParams &p)
Definition: hsa_driver.cc:47
HSAPacketProcessor::pioAddr
Addr pioAddr
Definition: hsa_packet_processor.hh:313
HSAPacketProcessor::setDeviceQueueDesc
void setDeviceQueueDesc(uint64_t hostReadIndexPointer, uint64_t basePointer, uint64_t queue_id, uint32_t size)
Definition: hsa_packet_processor.cc:100
KFD_MMAP_TYPE_MASK
#define KFD_MMAP_TYPE_MASK
Definition: kfd_event_defines.h:40
HSADriver::TCEvents
std::unordered_map< ThreadContext *, EventList > TCEvents
Definition: hsa_driver.hh:147
EmulatedDriver
EmulatedDriver is an abstract base class for fake SE-mode device drivers.
Definition: emul_driver.hh:52
ThreadContext
ThreadContext is the external interface to all thread state for anything outside of the CPU.
Definition: thread_context.hh:88
HSADriver::queueId
uint32_t queueId
Definition: hsa_driver.hh:153
kfd_ioctl_create_queue_args::ring_base_address
uint64_t ring_base_address
Definition: kfd_ioctl.h:46
DPRINTF
#define DPRINTF(x,...)
Definition: trace.hh:237
kfd_ioctl_create_queue_args::queue_id
uint32_t queue_id
Definition: kfd_ioctl.h:56
process.hh
PAGE_SHIFT
#define PAGE_SHIFT
Definition: kfd_event_defines.h:38
ArmISA::mode
Bitfield< 4, 0 > mode
Definition: miscregs_types.hh:70
kfd_event_defines.h
HSADriver::DriverWakeupEvent::description
const char * description() const override
Return a C string describing the event.
Definition: hsa_driver.cc:144
ThreadContext::cpuId
virtual int cpuId() const =0
X86ISA::prot
Bitfield< 7 > prot
Definition: misc.hh:582
Addr
uint64_t Addr
Address type This will probably be moved somewhere else in the near future.
Definition: types.hh:148
KFD_MMAP_TYPE_EVENTS
#define KFD_MMAP_TYPE_EVENTS
Definition: kfd_event_defines.h:42
SimObject::name
virtual const std::string name() const
Definition: sim_object.hh:182
panic_if
#define panic_if(cond,...)
Conditional panic macro that checks the supplied condition and only panics if the condition is true a...
Definition: logging.hh:197
HSADevice::hsaPacketProc
HSAPacketProcessor & hsaPacketProc()
Definition: hsa_device.cc:40
HSADriver::eventSlotIndex
uint32_t eventSlotIndex
Definition: hsa_driver.hh:112
kfd_ioctl_create_queue_args::ring_size
uint32_t ring_size
Definition: kfd_ioctl.h:51
HSADriver::signalWakeupEvent
virtual void signalWakeupEvent(uint32_t event_id)
Definition: hsa_driver.cc:157
curTick
Tick curTick()
The universal simulation clock.
Definition: cur_tick.hh:43
HSADriver
Definition: hsa_driver.hh:61
MipsISA::p
Bitfield< 0 > p
Definition: pra_constants.hh:323
HSADriver::ETable
std::unordered_map< uint32_t, ETEntry > ETable
Definition: hsa_driver.hh:114
HSADriver::device
HSADevice * device
HSA agent (device) that is controled by this driver.
Definition: hsa_driver.hh:152
hsa_device.hh
HSADriver::eventPage
Addr eventPage
Definition: hsa_driver.hh:111
HSADriver::allocateQueue
void allocateQueue(ThreadContext *tc, Addr ioc_buf)
Forward relevant parameters to packet processor; queueID is used to link doorbell.
Definition: hsa_driver.cc:128
kfd_ioctl.h
thread_context.hh
HSADriver::mmap
Addr mmap(ThreadContext *tc, Addr start, uint64_t length, int prot, int tgt_flags, int tgt_fd, off_t offset)
Currently, mmap() will simply setup a mapping for the associated device's packet processor's doorbell...
Definition: hsa_driver.cc:70
Process::memState
std::shared_ptr< MemState > memState
Definition: process.hh:274
HSADriver::open
int open(ThreadContext *tc, int mode, int flags)
Create an FD entry for the KFD inside of the owning process.
Definition: hsa_driver.cc:56
ArmISA::offset
Bitfield< 23, 0 > offset
Definition: types.hh:153

Generated on Tue Mar 23 2021 19:41:26 for gem5 by doxygen 1.8.17