gem5  v22.0.0.2
FaultModel.cc
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2011 Massachusetts Institute of Technology
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions are
7  * met: redistributions of source code must retain the above copyright
8  * notice, this list of conditions and the following disclaimer;
9  * redistributions in binary form must reproduce the above copyright
10  * notice, this list of conditions and the following disclaimer in the
11  * documentation and/or other materials provided with the distribution;
12  * neither the name of the copyright holders nor the names of its
13  * contributors may be used to endorse or promote products derived from
14  * this software without specific prior written permission.
15  *
16  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
17  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
18  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
19  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
20  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
21  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
22  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
23  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
24  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
25  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
26  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27  */
28 
29 /*
30  * Official Tool Website: www.mit.edu/~kaisopos/FaultModel
31  *
32  * If you use our tool for academic research, we request that you cite:
33  * Konstantinos Aisopos, Chia-Hsin Owen Chen, and Li-Shiuan Peh. Enabling
34  * System-Level Modeling of Variation-Induced Faults in Networks-on-Chip.
35  * Proceedings of the 48th Design Automation Conference (DAC'11)
36  */
37 
38 // C++ includes
39 #include <cassert>
40 #include <fstream>
41 #include <iostream>
42 #include <vector>
43 
44 // GEM5 includes
45 #include "FaultModel.hh"
46 #include "base/logging.hh"
47 
// Larger of two values. Both arguments are fully parenthesized so that
// operator precedence inside an argument expression cannot change the
// comparison. As with any function-like macro, the selected argument is
// evaluated twice, so do not pass expressions with side effects.
#define MAX(a,b) (((a) > (b)) ? (a) : (b))
49 
50 namespace gem5
51 {
52 
53 namespace ruby
54 {
55 
57 {
58  // read configurations into "configurations" vector
59  // format: <buff/vc> <vcs> <10 fault types>
60  bool more_records = true;
61  for (int i = 0; more_records; i += (fields_per_conf_record)){
62  system_conf configuration;
63  configuration.buff_per_vc =
64  p.baseline_fault_vector_database[i + conf_record_buff_per_vc];
65  configuration.vcs =
66  p.baseline_fault_vector_database[i + conf_record_vcs];
67  for (int fault_index = 0; fault_index < number_of_fault_types;
68  fault_index++){
69  configuration.fault_type[fault_index] =
70  p.baseline_fault_vector_database[i +
71  conf_record_first_fault_type + fault_index] / 100;
72  }
73  configurations.push_back(configuration);
74  if (p.baseline_fault_vector_database[i+fields_per_conf_record] < 0){
75  more_records = false;
76  }
77  }
78 
79  // read temperature weights into "temperature_weights" vector
80  // format: <temperature> <weight>
81  more_records = true;
82  for (int i = 0; more_records; i += (fields_per_temperature_record)){
83  int record_temperature =
84  p.temperature_weights_database[i + temperature_record_temp];
85  int record_weight =
86  p.temperature_weights_database[i + temperature_record_weight];
87  static int first_record = true;
88  if (first_record){
89  for (int temperature = 0; temperature < record_temperature;
90  temperature++){
91  temperature_weights.push_back(0);
92  }
93  first_record = false;
94  }
95  assert(record_temperature == temperature_weights.size());
96  temperature_weights.push_back(record_weight);
97  if (p.temperature_weights_database[i +
99  more_records = false;
100  }
101  }
102 }
103 
104 std::string
106 {
107  if (ft == data_corruption__few_bits){
108  return "data_corruption__few_bits";
109  } else if (ft == data_corruption__all_bits){
110  return "data_corruption__all_bits";
111  } else if (ft == flit_conservation__flit_duplication){
112  return "flit_conservation__flit_duplication";
113  } else if (ft == flit_conservation__flit_loss_or_split){
114  return "flit_conservation__flit_loss_or_split";
115  } else if (ft == misrouting){
116  return "misrouting";
117  } else if (ft == credit_conservation__credit_generation){
118  return "credit_conservation__credit_generation";
119  } else if (ft == credit_conservation__credit_loss){
120  return "credit_conservation__credit_loss";
121  } else if (ft == erroneous_allocation__VC){
122  return "erroneous_allocation__VC";
123  } else if (ft == erroneous_allocation__switch){
124  return "erroneous_allocation__switch";
125  } else if (ft == unfair_arbitration){
126  return "unfair_arbitration";
127  } else if (ft == number_of_fault_types){
128  return "none";
129  } else {
130  return "none";
131  }
132 }
133 
134 
135 int
136 FaultModel::declare_router(int number_of_inputs,
137  int number_of_outputs,
138  int number_of_vcs_per_input,
139  int number_of_buff_per_data_vc,
140  int number_of_buff_per_ctrl_vc)
141 {
142  // check inputs (are they legal?)
143  if (number_of_inputs <= 0 || number_of_outputs <= 0 ||
144  number_of_vcs_per_input <= 0 || number_of_buff_per_data_vc <= 0 ||
145  number_of_buff_per_ctrl_vc <= 0){
146  fatal("Fault Model: ERROR in argument of FaultModel_declare_router!");
147  }
148  int number_of_buffers_per_vc = MAX(number_of_buff_per_data_vc,
149  number_of_buff_per_ctrl_vc);
150  int total_vcs = number_of_inputs * number_of_vcs_per_input;
151  if (total_vcs > MAX_VCs){
152  fatal("Fault Model: ERROR! Number inputs*VCs (MAX_VCs) unsupported");
153  }
154  if (number_of_buffers_per_vc > MAX_BUFFERS_per_VC){
155  fatal("Fault Model: ERROR! buffers/VC (MAX_BUFFERS_per_VC) too high");
156  }
157 
158  // link the router to a DB record
159  int record_hit = -1;
160  for (int record = 0; record < configurations.size(); record++){
161  if ((configurations[record].buff_per_vc == number_of_buffers_per_vc)&&
162  (configurations[record].vcs == total_vcs)){
163  record_hit = record;
164  }
165  }
166  if (record_hit == -1){
167  panic("Fault Model: ERROR! configuration not found in DB. BUG?");
168  }
169 
170  // remember the router and return its ID
171  routers.push_back(configurations[record_hit]);
172  static int router_index = 0;
173  return router_index++;
174 }
175 
176 bool
178  int temperature_input,
179  float fault_vector[])
180 {
181  bool ok = true;
182 
183  // is the routerID recorded?
184  if (routerID < 0 || routerID >= ((int) routers.size())){
185  warn("Fault Model: ERROR! unknown router ID argument.");
186  fatal("Fault Model: Did you enable the fault model flag)?");
187  }
188 
189  // is the temperature too high/too low?
190  int temperature = temperature_input;
191  if (temperature_input >= ((int) temperature_weights.size())){
192  ok = false;
193  warn_once("Fault Model: Temperature exceeded simulated upper bound.");
194  warn_once("Fault Model: The fault model is not accurate any more.");
195  temperature = (temperature_weights.size() - 1);
196  } else if (temperature_input < 0){
197  ok = false;
198  warn_once("Fault Model: Temperature exceeded simulated lower bound.");
199  warn_once("Fault Model: The fault model is not accurate any more.");
200  temperature = 0;
201  }
202 
203  // recover the router record and return its fault vector
204  for (int i = 0; i < number_of_fault_types; i++){
205  fault_vector[i] = routers[routerID].fault_type[i] *
206  ((float)temperature_weights[temperature]);
207  }
208  return ok;
209 }
210 
211 bool
213  int temperature_input,
214  float *aggregate_fault_prob)
215 {
216  *aggregate_fault_prob = 1.0;
217  bool ok = true;
218 
219  // is the routerID recorded?
220  if (routerID < 0 || routerID >= ((int) routers.size())){
221  warn("Fault Model: ERROR! unknown router ID argument.");
222  fatal("Fault Model: Did you enable the fault model flag)?");
223  }
224 
225  // is the temperature too high/too low?
226  int temperature = temperature_input;
227  if (temperature_input >= ((int) temperature_weights.size()) ){
228  ok = false;
229  warn_once("Fault Model: Temperature exceeded simulated upper bound.");
230  warn_once("Fault Model: The fault model is not accurate any more.");
231  temperature = (temperature_weights.size()-1);
232  } else if (temperature_input < 0){
233  ok = false;
234  warn_once("Fault Model: Temperature exceeded simulated lower bound.");
235  warn_once("Fault Model: The fault model is not accurate any more.");
236  temperature = 0;
237  }
238 
239  // recover the router record and return its aggregate fault probability
240  for (int i = 0; i < number_of_fault_types; i++){
241  *aggregate_fault_prob= *aggregate_fault_prob *
242  ( 1.0 - (routers[routerID].fault_type[i] *
243  ((float)temperature_weights[temperature])) );
244  }
245  *aggregate_fault_prob = 1.0 - *aggregate_fault_prob;
246  return ok;
247 }
248 
249 // this function is used only for debugging purposes
250 void
252 {
253  std::cout << "--- PRINTING configurations ---\n";
254  for (int record = 0; record < configurations.size(); record++){
255  std::cout << "(" << record << ") ";
256  std::cout << "VCs=" << configurations[record].vcs << " ";
257  std::cout << "Buff/VC=" << configurations[record].buff_per_vc << " [";
258  for (int fault_type_num = 0;
259  fault_type_num < number_of_fault_types;
260  fault_type_num++){
261  std::cout <<
262  (100 * configurations[record].fault_type[fault_type_num]);
263  std::cout << "% ";
264  }
265  std::cout << "]\n";
266  }
267  std::cout << "--- PRINTING temperature weights ---\n";
268  for (int record = 0; record < temperature_weights.size(); record++){
269  std::cout << "temperature=" << record << " => ";
270  std::cout << "weight=" << temperature_weights[record];
271  std::cout << "\n";
272  }
273 }
274 
275 } // namespace ruby
276 } // namespace gem5
fatal
#define fatal(...)
This implements a cprintf based fatal() function.
Definition: logging.hh:190
gem5::ruby::FaultModel::temperature_record_temp
@ temperature_record_temp
Definition: FaultModel.hh:99
warn
#define warn(...)
Definition: logging.hh:246
gem5::ruby::FaultModel::fault_vector
bool fault_vector(int routerID, int temperature, float fault_vector[])
Definition: FaultModel.cc:177
warn_once
#define warn_once(...)
Definition: logging.hh:250
gem5::ruby::FaultModel::fault_type_to_string
std::string fault_type_to_string(int fault_type_index)
Definition: FaultModel.cc:105
gem5::ruby::FaultModel::credit_conservation__credit_generation
@ credit_conservation__credit_generation
Definition: FaultModel.hh:76
gem5::ruby::FaultModel::fields_per_conf_record
@ fields_per_conf_record
Definition: FaultModel.hh:94
gem5::ruby::FaultModel::FaultModel
FaultModel(const Params &p)
Definition: FaultModel.cc:56
gem5::ruby::FaultModel::system_conf::fault_type
float fault_type[number_of_fault_types]
Definition: FaultModel.hh:108
MAX_VCs
#define MAX_VCs
Definition: FaultModel.hh:42
gem5::ruby::FaultModel::conf_record_first_fault_type
@ conf_record_first_fault_type
Definition: FaultModel.hh:92
gem5::ArmISA::i
Bitfield< 7 > i
Definition: misc_types.hh:67
gem5::ruby::FaultModel::data_corruption__all_bits
@ data_corruption__all_bits
Definition: FaultModel.hh:72
gem5::ruby::FaultModel::data_corruption__few_bits
@ data_corruption__few_bits
Definition: FaultModel.hh:71
gem5::ruby::FaultModel::system_conf
Definition: FaultModel.hh:104
gem5::ruby::FaultModel::flit_conservation__flit_duplication
@ flit_conservation__flit_duplication
Definition: FaultModel.hh:73
gem5::ruby::FaultModel::conf_record_vcs
@ conf_record_vcs
Definition: FaultModel.hh:91
gem5::ruby::FaultModel::fault_prob
bool fault_prob(int routerID, int temperature, float *aggregate_fault_prob)
Definition: FaultModel.cc:212
gem5::ruby::FaultModel::erroneous_allocation__VC
@ erroneous_allocation__VC
Definition: FaultModel.hh:78
gem5::VegaISA::p
Bitfield< 54 > p
Definition: pagetable.hh:70
gem5::ruby::FaultModel::temperature_record_weight
@ temperature_record_weight
Definition: FaultModel.hh:100
gem5::ruby::FaultModel::unfair_arbitration
@ unfair_arbitration
Definition: FaultModel.hh:80
gem5::ruby::FaultModel::declare_router
int declare_router(int number_of_inputs, int number_of_outputs, int number_of_vcs_per_vnet, int number_of_buff_per_data_vc, int number_of_buff_per_ctrl_vc)
Definition: FaultModel.cc:136
gem5::ruby::FaultModel::routers
std::vector< system_conf > routers
Definition: FaultModel.hh:140
gem5::ruby::FaultModel::conf_record_buff_per_vc
@ conf_record_buff_per_vc
Definition: FaultModel.hh:90
gem5::ruby::FaultModel::erroneous_allocation__switch
@ erroneous_allocation__switch
Definition: FaultModel.hh:79
gem5::ruby::FaultModel::print
void print(void)
Definition: FaultModel.cc:251
gem5::ruby::FaultModel::temperature_weights
std::vector< int > temperature_weights
Definition: FaultModel.hh:141
gem5::ruby::FaultModel::system_conf::vcs
int vcs
Definition: FaultModel.hh:106
gem5::SimObject
Abstract superclass for simulation objects.
Definition: sim_object.hh:146
gem5::ruby::FaultModel::number_of_fault_types
@ number_of_fault_types
Definition: FaultModel.hh:81
gem5::ruby::FaultModel::fields_per_temperature_record
@ fields_per_temperature_record
Definition: FaultModel.hh:101
gem5::ruby::FaultModel::credit_conservation__credit_loss
@ credit_conservation__credit_loss
Definition: FaultModel.hh:77
MAX
#define MAX(a, b)
Definition: FaultModel.cc:48
FaultModel.hh
gem5::ruby::FaultModel::flit_conservation__flit_loss_or_split
@ flit_conservation__flit_loss_or_split
Definition: FaultModel.hh:74
logging.hh
gem5::ruby::FaultModel::configurations
std::vector< system_conf > configurations
Definition: FaultModel.hh:139
gem5::ruby::FaultModel::system_conf::buff_per_vc
int buff_per_vc
Definition: FaultModel.hh:107
gem5::ruby::FaultModel::misrouting
@ misrouting
Definition: FaultModel.hh:75
gem5
Reference material can be found at the JEDEC website: UFS standard http://www.jedec....
Definition: gpu_translation_state.hh:37
MAX_BUFFERS_per_VC
#define MAX_BUFFERS_per_VC
Definition: FaultModel.hh:43
panic
#define panic(...)
This implements a cprintf based panic() function.
Definition: logging.hh:178
gem5::ruby::FaultModel::Params
FaultModelParams Params
Definition: FaultModel.hh:62

Generated on Thu Jul 28 2022 13:32:35 for gem5 by doxygen 1.8.17