gem5 v23.0.0.1
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros Modules Pages
scoreboard.cc
Go to the documentation of this file.
1/*
2 * Copyright (c) 2013-2014, 2016-2017 ARM Limited
3 * All rights reserved
4 *
5 * The license below extends only to copyright in the software and shall
6 * not be construed as granting a license to any other intellectual
7 * property including but not limited to intellectual property relating
8 * to a hardware implementation of the functionality of the software
9 * licensed hereunder. You may use the software subject to the license
10 * terms below provided that you ensure that this notice is replicated
11 * unmodified and in its entirety in all distributions of the software,
12 * modified or unmodified, in source code or in binary form.
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions are
16 * met: redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer;
18 * redistributions in binary form must reproduce the above copyright
19 * notice, this list of conditions and the following disclaimer in the
20 * documentation and/or other materials provided with the distribution;
21 * neither the name of the copyright holders nor the names of its
22 * contributors may be used to endorse or promote products derived from
23 * this software without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
26 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
27 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
28 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
29 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
30 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
31 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
32 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
33 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
34 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
35 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 */
37
39
40#include "cpu/reg_class.hh"
41#include "debug/MinorScoreboard.hh"
42#include "debug/MinorTiming.hh"
43
44namespace gem5
45{
46
47namespace minor
48{
49
50bool
51Scoreboard::findIndex(const RegId& reg, Index &scoreboard_index)
52{
53 bool ret = false;
54
55 switch (reg.classValue()) {
56 case IntRegClass:
57 scoreboard_index = reg.index();
58 ret = true;
59 break;
60 case FloatRegClass:
61 scoreboard_index = floatRegOffset + reg.index();
62 ret = true;
63 break;
64 case VecRegClass:
65 case VecElemClass:
66 scoreboard_index = vecRegOffset + reg.index();
67 ret = true;
68 break;
69 case VecPredRegClass:
70 scoreboard_index = vecPredRegOffset + reg.index();
71 ret = true;
72 break;
73 case MatRegClass:
74 scoreboard_index = matRegOffset + reg.index();
75 ret = true;
76 break;
77 case CCRegClass:
78 scoreboard_index = ccRegOffset + reg.index();
79 ret = true;
80 break;
81 case MiscRegClass:
82 /* Don't bother with Misc registers */
83 ret = false;
84 break;
85 case InvalidRegClass:
86 ret = false;
87 break;
88 default:
89 panic("Unknown register class: %d", reg.classValue());
90 }
91
92 return ret;
93}
94
95void
97 ThreadContext *thread_context, bool mark_unpredictable)
98{
99 if (inst->isFault())
100 return;
101
102 StaticInstPtr staticInst = inst->staticInst;
103 unsigned int num_dests = staticInst->numDestRegs();
104
105 auto *isa = thread_context->getIsaPtr();
106
108 for (unsigned int dest_index = 0; dest_index < num_dests;
109 dest_index++)
110 {
111 RegId reg = staticInst->destRegIdx(dest_index).flatten(*isa);
112 Index index;
113
114 if (findIndex(reg, index)) {
115 if (mark_unpredictable)
117
118 inst->flatDestRegIdx[dest_index] = reg;
119
120 numResults[index]++;
121 returnCycle[index] = retire_time;
122 /* We should be able to rely on only being given accending
123 * execSeqNums, but sanity check */
124 if (inst->id.execSeqNum > writingInst[index]) {
125 writingInst[index] = inst->id.execSeqNum;
126 fuIndices[index] = inst->fuIndex;
127 }
128
129 DPRINTF(MinorScoreboard, "Marking up inst: %s"
130 " regIndex: %d final numResults: %d returnCycle: %d\n",
132 } else {
133 /* Use an invalid ID to mark invalid/untracked dests */
134 inst->flatDestRegIdx[dest_index] = RegId();
135 }
136 }
137}
138
141 ThreadContext *thread_context)
142{
143 InstSeqNum ret = 0;
144
145 if (inst->isFault())
146 return ret;
147
148 StaticInstPtr staticInst = inst->staticInst;
149 unsigned int num_srcs = staticInst->numSrcRegs();
150
151 auto *isa = thread_context->getIsaPtr();
152
153 for (unsigned int src_index = 0; src_index < num_srcs; src_index++) {
154 RegId reg = staticInst->srcRegIdx(src_index).flatten(*isa);
155 unsigned short int index;
156
157 if (findIndex(reg, index)) {
158 if (writingInst[index] > ret)
159 ret = writingInst[index];
160 }
161 }
162
163 DPRINTF(MinorScoreboard, "Inst: %s depends on execSeqNum: %d\n",
164 *inst, ret);
165
166 return ret;
167}
168
169void
170Scoreboard::clearInstDests(MinorDynInstPtr inst, bool clear_unpredictable)
171{
172 if (inst->isFault())
173 return;
174
175 StaticInstPtr staticInst = inst->staticInst;
176 unsigned int num_dests = staticInst->numDestRegs();
177
179 for (unsigned int dest_index = 0; dest_index < num_dests;
180 dest_index++)
181 {
182 const RegId& reg = inst->flatDestRegIdx[dest_index];
183 Index index;
184
185 if (findIndex(reg, index)) {
186 if (clear_unpredictable && numUnpredictableResults[index] != 0)
188
189 numResults[index] --;
190
191 if (numResults[index] == 0) {
193 writingInst[index] = 0;
195 }
196
197 DPRINTF(MinorScoreboard, "Clearing inst: %s"
198 " regIndex: %d final numResults: %d\n",
199 *inst, index, numResults[index]);
200 }
201 }
202}
203
204bool
206 const std::vector<Cycles> *src_reg_relative_latencies,
207 const std::vector<bool> *cant_forward_from_fu_indices,
208 Cycles now, ThreadContext *thread_context)
209{
210 /* Always allow fault to be issued */
211 if (inst->isFault())
212 return true;
213
214 StaticInstPtr staticInst = inst->staticInst;
215 unsigned int num_srcs = staticInst->numSrcRegs();
216
217 /* Default to saying you can issue */
218 bool ret = true;
219
220 unsigned int num_relative_latencies = 0;
221 Cycles default_relative_latency = Cycles(0);
222
223 /* Where relative latencies are given, the default is the last
224 * one as that allows the rel. lat. list to be shorted than the
225 * number of src. regs */
226 if (src_reg_relative_latencies &&
227 src_reg_relative_latencies->size() != 0)
228 {
229 num_relative_latencies = src_reg_relative_latencies->size();
230 default_relative_latency = (*src_reg_relative_latencies)
231 [num_relative_latencies-1];
232 }
233
234 auto *isa = thread_context->getIsaPtr();
235
236 /* For each source register, find the latest result */
237 unsigned int src_index = 0;
238 while (src_index < num_srcs && /* More registers */
239 ret /* Still possible */)
240 {
241 RegId reg = staticInst->srcRegIdx(src_index).flatten(*isa);
242 unsigned short int index;
243
244 if (findIndex(reg, index)) {
245 int src_reg_fu = fuIndices[index];
246 bool cant_forward = src_reg_fu != invalidFUIndex &&
247 cant_forward_from_fu_indices &&
248 src_reg_fu < cant_forward_from_fu_indices->size() &&
249 (*cant_forward_from_fu_indices)[src_reg_fu];
250
251 Cycles relative_latency = (cant_forward ? Cycles(0) :
252 (src_index >= num_relative_latencies ?
253 default_relative_latency :
254 (*src_reg_relative_latencies)[src_index]));
255
256 if (returnCycle[index] > (now + relative_latency) ||
258 {
259 ret = false;
260 }
261 }
262 src_index++;
263 }
264
265 if (debug::MinorTiming) {
266 if (ret && num_srcs > num_relative_latencies &&
267 num_relative_latencies != 0)
268 {
269 DPRINTF(MinorTiming, "Warning, inst: %s timing extra decode has"
270 " more src. regs: %d than relative latencies: %d\n",
271 staticInst->disassemble(0), num_srcs, num_relative_latencies);
272 }
273 }
274
275 return ret;
276}
277
278void
280{
281 std::ostringstream result_stream;
282
283 bool printed_element = false;
284
285 unsigned int i = 0;
286 while (i < numRegs) {
287 unsigned short int num_results = numResults[i];
288 unsigned short int num_unpredictable_results =
290
291 if (!(num_results == 0 && num_unpredictable_results == Cycles(0))) {
292 if (printed_element)
293 result_stream << ',';
294
295 result_stream << '(' << i << ','
296 << num_results << '/'
297 << num_unpredictable_results << '/'
298 << returnCycle[i] << '/'
299 << writingInst[i] << ')';
300
301 printed_element = true;
302 }
303
304 i++;
305 }
306
307 minor::minorTrace("busy=%s\n", result_stream.str());
308}
309
310} // namespace minor
311} // namespace gem5
#define DPRINTF(x,...)
Definition trace.hh:210
Cycles is a wrapper class for representing cycle counts, i.e.
Definition types.hh:79
Register ID: describe an architectural register with its class and index.
Definition reg_class.hh:93
RegId flatten(const BaseISA &isa) const
Definition reg_class.hh:279
virtual const std::string & disassemble(Addr pc, const loader::SymbolTable *symtab=nullptr) const
Return string representation of disassembled instruction.
uint8_t numSrcRegs() const
Number of source registers.
uint8_t numDestRegs() const
Number of destination registers.
const RegId & destRegIdx(int i) const
Return logical index (architectural reg num) of i'th destination reg.
const RegId & srcRegIdx(int i) const
Return logical index (architectural reg num) of i'th source reg.
ThreadContext is the external interface to all thread state for anything outside of the CPU.
virtual BaseISA * getIsaPtr() const =0
std::vector< Index > numUnpredictableResults
Count of the number of results which can't be predicted.
Definition scoreboard.hh:93
void clearInstDests(MinorDynInstPtr inst, bool clear_unpredictable)
Clear down the dependencies for this instruction.
std::vector< Cycles > returnCycle
The estimated cycle number that the result will be presented.
static constexpr int invalidFUIndex
Definition scoreboard.hh:97
const unsigned floatRegOffset
Definition scoreboard.hh:71
bool canInstIssue(MinorDynInstPtr inst, const std::vector< Cycles > *src_reg_relative_latencies, const std::vector< bool > *cant_forward_from_fu_indices, Cycles now, ThreadContext *thread_context)
Can this instruction be issued.
InstSeqNum execSeqNumToWaitFor(MinorDynInstPtr inst, ThreadContext *thread_context)
Returns the exec sequence number of the most recent inst on which the given inst depends.
const unsigned matRegOffset
Definition scoreboard.hh:75
const unsigned vecRegOffset
Definition scoreboard.hh:73
unsigned short int Index
Type to use when indexing numResults.
Definition scoreboard.hh:86
const unsigned ccRegOffset
Definition scoreboard.hh:72
std::vector< Index > numResults
Count of the number of in-flight instructions that have results for each register.
Definition scoreboard.hh:90
std::vector< int > fuIndices
Index of the FU generating this result.
Definition scoreboard.hh:96
const unsigned vecPredRegOffset
Definition scoreboard.hh:74
bool findIndex(const RegId &reg, Index &scoreboard_index)
Sets scoreboard_index to the index into numResults of the given register index.
Definition scoreboard.cc:51
void markupInstDests(MinorDynInstPtr inst, Cycles retire_time, ThreadContext *thread_context, bool mark_unpredictable)
Mark up an instruction's effects by incrementing numResults counts.
Definition scoreboard.cc:96
std::vector< InstSeqNum > writingInst
The execute sequence number of the most recent inst to generate this register value.
void minorTrace() const
MinorTraceIF interface.
const unsigned numRegs
The number of registers in the Scoreboard.
Definition scoreboard.hh:83
STL vector class.
Definition stl.hh:37
#define panic(...)
This implements a cprintf based panic() function.
Definition logging.hh:188
A simple instruction scoreboard for tracking dependencies in Execute.
Bitfield< 7 > i
Definition misc_types.hh:67
Bitfield< 30, 0 > index
Bitfield< 5, 3 > reg
Definition types.hh:92
void minorTrace(const char *fmt, Args ...args)
DPRINTFN for MinorTrace reporting.
Definition trace.hh:66
Reference material can be found at the JEDEC website: UFS standard http://www.jedec....
uint64_t InstSeqNum
Definition inst_seq.hh:40
@ VecPredRegClass
Definition reg_class.hh:66
@ MatRegClass
Matrix Register.
Definition reg_class.hh:67
@ FloatRegClass
Floating-point register.
Definition reg_class.hh:61
@ CCRegClass
Condition-code register.
Definition reg_class.hh:68
@ VecRegClass
Vector Register.
Definition reg_class.hh:63
@ IntRegClass
Integer register.
Definition reg_class.hh:60
@ InvalidRegClass
Definition reg_class.hh:70
@ MiscRegClass
Control (misc) register.
Definition reg_class.hh:69
@ VecElemClass
Vector Register Native Elem lane.
Definition reg_class.hh:65
Minor contains all the definitions within the MinorCPU apart from the CPU class itself.

Generated on Mon Jul 10 2023 15:32:01 for gem5 by doxygen 1.9.7