gem5
v20.1.0.0
|
#include <kernel_code.hh>
Definition at line 83 of file kernel_code.hh.
uint32_t AMDKernelCode::amd_kernel_code_version_major |
Definition at line 85 of file kernel_code.hh.
uint32_t AMDKernelCode::amd_kernel_code_version_minor |
Definition at line 86 of file kernel_code.hh.
uint16_t AMDKernelCode::amd_machine_kind |
Definition at line 87 of file kernel_code.hh.
uint16_t AMDKernelCode::amd_machine_version_major |
Definition at line 88 of file kernel_code.hh.
uint16_t AMDKernelCode::amd_machine_version_minor |
Definition at line 89 of file kernel_code.hh.
uint16_t AMDKernelCode::amd_machine_version_stepping |
Definition at line 90 of file kernel_code.hh.
uint32_t AMDKernelCode::bulky |
Definition at line 119 of file kernel_code.hh.
int32_t AMDKernelCode::call_convention |
Definition at line 186 of file kernel_code.hh.
uint32_t AMDKernelCode::cdbg_user |
Definition at line 120 of file kernel_code.hh.
uint32_t AMDKernelCode::compute_pgm_rsrc1_reserved |
Definition at line 121 of file kernel_code.hh.
uint32_t AMDKernelCode::compute_pgm_rsrc2_reserved |
Definition at line 144 of file kernel_code.hh.
uint64_t AMDKernelCode::control_directives[16] |
Definition at line 189 of file kernel_code.hh.
uint32_t AMDKernelCode::debug_mode |
Definition at line 117 of file kernel_code.hh.
uint16_t AMDKernelCode::debug_private_segment_buffer_sgpr |
Definition at line 181 of file kernel_code.hh.
uint16_t AMDKernelCode::debug_wavefront_private_segment_offset_sgpr |
Definition at line 180 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_dx10_clamp |
Definition at line 116 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_address_watch |
Definition at line 134 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_fp_denormal_source |
Definition at line 138 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_ieee_754_fp_division_by_zero |
Definition at line 139 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_ieee_754_fp_inexact |
Definition at line 142 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_ieee_754_fp_invalid_operation |
Definition at line 137 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_ieee_754_fp_overflow |
Definition at line 140 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_ieee_754_fp_underflow |
Definition at line 141 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_int_divide_by_zero |
Definition at line 143 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_exception_memory_violation |
Definition at line 135 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_ieee_mode |
Definition at line 118 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_ordered_append_gds |
Definition at line 160 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_sgpr_dispatch_id |
Definition at line 153 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_dispatch_ptr |
Definition at line 150 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_flat_scratch_init |
Definition at line 154 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_grid_workgroup_count_x |
Definition at line 156 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_grid_workgroup_count_y |
Definition at line 157 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_grid_workgroup_count_z |
Definition at line 158 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_kernarg_segment_ptr |
Definition at line 152 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_private_segment_buffer |
Definition at line 149 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_private_segment_size |
Definition at line 155 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_private_segment_wave_byte_offset |
Definition at line 126 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_queue_ptr |
Definition at line 151 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_workgroup_id_x |
Definition at line 129 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_workgroup_id_y |
Definition at line 130 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_workgroup_id_z |
Definition at line 131 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_sgpr_workgroup_info |
Definition at line 132 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::enable_trap_handler |
Definition at line 128 of file kernel_code.hh.
uint32_t AMDKernelCode::enable_vgpr_workitem_id |
Definition at line 133 of file kernel_code.hh.
Referenced by HSAQueueEntry::parseKernelCode().
uint32_t AMDKernelCode::float_mode_denorm_16_64 |
Definition at line 114 of file kernel_code.hh.
uint32_t AMDKernelCode::float_mode_denorm_32 |
Definition at line 113 of file kernel_code.hh.
uint32_t AMDKernelCode::float_mode_round_16_64 |
Definition at line 112 of file kernel_code.hh.
uint32_t AMDKernelCode::float_mode_round_32 |
Definition at line 111 of file kernel_code.hh.
uint32_t AMDKernelCode::gds_segment_byte_size |
Definition at line 171 of file kernel_code.hh.
uint32_t AMDKernelCode::granulated_lds_size |
Definition at line 136 of file kernel_code.hh.
uint32_t AMDKernelCode::granulated_wavefront_sgpr_count |
Definition at line 109 of file kernel_code.hh.
uint32_t AMDKernelCode::granulated_workitem_vgpr_count |
The fields below are used to set program settings for compute shaders.
Here they are primarily used to set up initial register state. See the following for full details about kernel launch, state initialization, and the AMD kernel code object: https://github.com/RadeonOpenCompute/ROCm_Documentation/blob/master/ROCm_Compiler_SDK/ROCm-Codeobj-format.rst#initial-kernel-register-state
Definition at line 108 of file kernel_code.hh.
uint8_t AMDKernelCode::group_segment_alignment |
Definition at line 183 of file kernel_code.hh.
uint32_t AMDKernelCode::is_debug_enabled |
Definition at line 164 of file kernel_code.hh.
uint32_t AMDKernelCode::is_dynamic_callstack |
Definition at line 163 of file kernel_code.hh.
uint32_t AMDKernelCode::is_ptr64 |
Definition at line 162 of file kernel_code.hh.
uint32_t AMDKernelCode::is_xnack_enabled |
Definition at line 165 of file kernel_code.hh.
uint8_t AMDKernelCode::kernarg_segment_alignment |
Definition at line 182 of file kernel_code.hh.
uint64_t AMDKernelCode::kernarg_segment_byte_size |
Definition at line 172 of file kernel_code.hh.
int64_t AMDKernelCode::kernel_code_entry_byte_offset |
Definition at line 91 of file kernel_code.hh.
Referenced by GPUCommandProcessor::submitDispatchPkt().
int64_t AMDKernelCode::kernel_code_prefetch_byte_offset |
Definition at line 92 of file kernel_code.hh.
uint64_t AMDKernelCode::kernel_code_prefetch_byte_size |
Definition at line 93 of file kernel_code.hh.
uint32_t AMDKernelCode::kernel_code_properties_reserved1 |
Definition at line 159 of file kernel_code.hh.
uint32_t AMDKernelCode::kernel_code_properties_reserved2 |
Definition at line 166 of file kernel_code.hh.
uint64_t AMDKernelCode::max_scratch_backing_memory_byte_size |
Definition at line 94 of file kernel_code.hh.
uint32_t AMDKernelCode::priority |
Definition at line 110 of file kernel_code.hh.
uint32_t AMDKernelCode::priv |
Definition at line 115 of file kernel_code.hh.
uint32_t AMDKernelCode::private_element_size |
Definition at line 161 of file kernel_code.hh.
uint8_t AMDKernelCode::private_segment_alignment |
Definition at line 184 of file kernel_code.hh.
uint8_t AMDKernelCode::reserved[12] |
Definition at line 187 of file kernel_code.hh.
uint16_t AMDKernelCode::reserved_sgpr_count |
Definition at line 179 of file kernel_code.hh.
uint16_t AMDKernelCode::reserved_sgpr_first |
Definition at line 178 of file kernel_code.hh.
uint16_t AMDKernelCode::reserved_vgpr_count |
Definition at line 177 of file kernel_code.hh.
uint16_t AMDKernelCode::reserved_vgpr_first |
Definition at line 176 of file kernel_code.hh.
uint64_t AMDKernelCode::runtime_loader_kernel_symbol |
Definition at line 188 of file kernel_code.hh.
Referenced by GPUCommandProcessor::submitDispatchPkt().
uint32_t AMDKernelCode::user_sgpr_count |
Definition at line 127 of file kernel_code.hh.
uint16_t AMDKernelCode::wavefront_sgpr_count |
Definition at line 174 of file kernel_code.hh.
uint8_t AMDKernelCode::wavefront_size |
Definition at line 185 of file kernel_code.hh.
uint32_t AMDKernelCode::workgroup_fbarrier_count |
Definition at line 173 of file kernel_code.hh.
uint32_t AMDKernelCode::workgroup_group_segment_byte_size |
Definition at line 170 of file kernel_code.hh.
uint32_t AMDKernelCode::workitem_private_segment_byte_size |
Definition at line 169 of file kernel_code.hh.
uint16_t AMDKernelCode::workitem_vgpr_count |
Definition at line 175 of file kernel_code.hh.