43 #ifndef HSA_RUNTIME_INC_HSA_H_ 44 #define HSA_RUNTIME_INC_HSA_H_ 58 #ifndef HSA_EXPORT_DECORATOR 60 #define HSA_EXPORT_DECORATOR __attribute__ ((visibility ("default"))) 62 #define HSA_EXPORT_DECORATOR 65 #define HSA_API_EXPORT HSA_EXPORT_DECORATOR HSA_CALL 66 #define HSA_API_IMPORT HSA_CALL 68 #if !defined(HSA_API) && defined(HSA_EXPORT) 69 #define HSA_API HSA_API_EXPORT 71 #define HSA_API HSA_API_IMPORT 75 #undef HSA_LARGE_MODEL 76 #if defined(__LP64__) || defined(_M_X64) 77 #define HSA_LARGE_MODEL 81 #if !defined(LITTLEENDIAN_CPU) && !defined(BIGENDIAN_CPU) 82 #if defined(__i386__) || defined(__x86_64__) || defined(_M_IX86) || \ 84 #define LITTLEENDIAN_CPU 88 #undef HSA_LITTLE_ENDIAN 89 #if defined(LITTLEENDIAN_CPU) 90 #define HSA_LITTLE_ENDIAN 91 #elif defined(BIGENDIAN_CPU) 93 #error "BIGENDIAN_CPU or LITTLEENDIAN_CPU must be defined" 96 #ifndef HSA_DEPRECATED 97 #define HSA_DEPRECATED 105 #define HSA_VERSION_1_0 1 281 const char ** status_string);
592 uint16_t version_major,
593 uint16_t version_minor,
621 uint16_t version_major,
622 uint16_t *version_minor,
661 uint16_t version_major,
662 uint16_t version_minor,
701 uint16_t version_major,
1237 uint16_t version_major,
1238 uint16_t version_minor,
1272 uint16_t version_major,
1273 uint16_t *version_minor,
1299 #ifdef HSA_LARGE_MODEL 1336 hsa_signal_value_t initial_value,
1337 uint32_t num_consumers,
1394 hsa_signal_value_t value);
1401 hsa_signal_value_t value);
1410 hsa_signal_value_t value);
1427 hsa_signal_value_t value);
1434 hsa_signal_value_t value);
1452 hsa_signal_value_t value);
1461 hsa_signal_value_t value);
1468 hsa_signal_value_t value);
1477 hsa_signal_value_t value);
1484 hsa_signal_value_t value);
1490 hsa_signal_value_t value);
1499 hsa_signal_value_t value);
1522 hsa_signal_value_t value);
1533 hsa_signal_value_t value);
1541 hsa_signal_value_t value);
1551 hsa_signal_value_t value);
1559 hsa_signal_value_t value);
1567 hsa_signal_value_t value);
1577 hsa_signal_value_t value);
1593 hsa_signal_value_t value);
1602 hsa_signal_value_t value);
1609 hsa_signal_value_t value);
1618 hsa_signal_value_t value);
1625 hsa_signal_value_t value);
1632 hsa_signal_value_t value);
1642 hsa_signal_value_t value);
1658 hsa_signal_value_t value);
1668 hsa_signal_value_t value);
1675 hsa_signal_value_t value);
1684 hsa_signal_value_t value);
1691 hsa_signal_value_t value);
1698 hsa_signal_value_t value);
1708 hsa_signal_value_t value);
1725 hsa_signal_value_t value);
1734 hsa_signal_value_t value);
1741 hsa_signal_value_t value);
1750 hsa_signal_value_t value);
1757 hsa_signal_value_t value);
1764 hsa_signal_value_t value);
1774 hsa_signal_value_t value);
1790 hsa_signal_value_t value);
1800 hsa_signal_value_t value);
1807 hsa_signal_value_t value);
1816 hsa_signal_value_t value);
1823 hsa_signal_value_t value);
1830 hsa_signal_value_t value);
1839 hsa_signal_value_t value);
1856 hsa_signal_value_t value);
1866 hsa_signal_value_t value);
1873 hsa_signal_value_t value);
1882 hsa_signal_value_t value);
1889 hsa_signal_value_t value);
1896 hsa_signal_value_t value);
1905 hsa_signal_value_t value);
1986 hsa_signal_value_t compare_value,
1987 uint64_t timeout_hint,
1996 hsa_signal_value_t compare_value,
1997 uint64_t timeout_hint,
2008 hsa_signal_value_t compare_value,
2009 uint64_t timeout_hint,
2056 uint32_t num_signals,
2058 uint32_t num_consumers,
2127 const hsa_signal_value_t *compare_values,
2130 hsa_signal_value_t *value);
2138 const hsa_signal_value_t *compare_values,
2141 hsa_signal_value_t *value);
2228 #ifdef HSA_LARGE_MODEL 2230 #elif defined HSA_LITTLE_ENDIAN 2346 hsa_queue_type32_t
type,
2349 uint32_t private_segment_size,
2350 uint32_t group_segment_size,
2410 hsa_queue_type32_t type,
2942 #ifdef HSA_LARGE_MODEL 2943 void* kernarg_address;
2944 #elif defined HSA_LITTLE_ENDIAN 2952 void* kernarg_address;
2995 #ifdef HSA_LARGE_MODEL 2996 void* return_address;
2997 #elif defined HSA_LITTLE_ENDIAN 3001 void* return_address;
4030 const void *code_object,
4123 const char *options,
4159 const char *options,
4244 const char *options,
4311 const char *options,
4345 const char *options);
4433 const char *variable_name,
4481 const char *variable_name,
4533 const char *variable_name,
4591 const char *options,
4646 const char *module_name,
4647 const char *symbol_name,
4649 int32_t call_convention,
4683 const char *symbol_name,
5151 const char *options,
5152 void **serialized_code_object,
5153 size_t *serialized_code_object_size);
5186 void *serialized_code_object,
5187 size_t serialized_code_object_size,
5188 const char *options,
5350 const char *options);
5396 const char *symbol_name,
5429 const char *module_name,
5430 const char *symbol_name,
5636 #endif // header guard hsa_status_t HSA_API hsa_agent_iterate_caches(hsa_agent_t agent, hsa_status_t(*callback)(hsa_cache_t cache, void *data), void *data)
Iterate over the memory caches of a given agent, and invoke an application-defined callback on every ...
uint32_t group_segment_size
Size in bytes of group memory allocation request (per work-group).
struct hsa_kernel_dispatch_packet_s hsa_kernel_dispatch_packet_t
AQL kernel dispatch packet.
Packet used by agents to delay processing of subsequent packets, and to express complex dependencies ...
hsa_variable_segment_t
Memory segment associated with a variable.
hsa_signal_value_t HSA_API hsa_signal_cas_screlease(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
struct hsa_barrier_and_packet_s hsa_barrier_and_packet_t
Barrier-AND packet.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_cas_acq_rel(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
hsa_status_t HSA_API hsa_executable_get_symbol_by_name(hsa_executable_t executable, const char *symbol_name, const hsa_agent_t *agent, hsa_executable_symbol_t *symbol)
Retrieve the symbol handle corresponding to a given a symbol name.
uint16_t workgroup_size_y
Y dimension of work-group, in work-items.
hsa_fp_type_t
Floating-point types.
The memory region is invalid.
uint64_t HSA_API HSA_DEPRECATED hsa_queue_load_read_index_acquire(const hsa_queue_t *queue)
Atomically load the read index of a queue.
uint16_t type
Application-defined function to be performed by the destination agent.
hsa_status_t HSA_API hsa_soft_queue_create(hsa_region_t region, uint32_t size, hsa_queue_type32_t type, uint32_t features, hsa_signal_t doorbell_signal, hsa_queue_t **queue)
Create a queue for which the application or a kernel is responsible for processing the AQL packets...
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_exchange_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
Queue supports multiple producers.
void HSA_API HSA_DEPRECATED hsa_signal_and_acq_rel(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
struct hsa_wavefront_s hsa_wavefront_t
Wavefront handle.
void HSA_API hsa_signal_or_scacq_screl(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
struct hsa_callback_data_s hsa_callback_data_t
Application data handle that is passed to the serialization and deserialization functions.
void HSA_API HSA_DEPRECATED hsa_signal_or_acq_rel(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
hsa_status_t HSA_API hsa_signal_group_create(uint32_t num_signals, const hsa_signal_t *signals, uint32_t num_consumers, const hsa_agent_t *consumers, hsa_signal_group_t *signal_group)
Create a signal group.
hsa_signal_value_t HSA_API hsa_signal_wait_scacquire(hsa_signal_t signal, hsa_signal_condition_t condition, hsa_signal_value_t compare_value, uint64_t timeout_hint, hsa_wait_state_t wait_state_hint)
Wait until a signal value satisfies a specified condition, or a certain amount of time has elapsed...
uint32_t grid_size_z
Z dimension of grid, in work-items.
void HSA_API hsa_queue_store_read_index_relaxed(const hsa_queue_t *queue, uint64_t value)
Atomically set the read index of a queue.
void HSA_API hsa_signal_add_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
Human-readable description.
hsa_region_segment_t
Memory segments associated with a region.
hsa_status_t HSA_API hsa_region_get_info(hsa_region_t region, hsa_region_info_t attribute, void *value)
Get the current value of an attribute of a region.
void HSA_API hsa_signal_store_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal.
hsa_symbol_kind_t
Symbol type.
hsa_status_t HSA_API hsa_isa_get_exception_policies(hsa_isa_t isa, hsa_profile_t profile, uint16_t *mask)
Retrieve the exception policy support for a given combination of instruction set architecture and pro...
Number of work-items in the wavefront.
Machine model this code object is produced for.
uint64_t handle
Opaque handle.
The wavefront is invalid.
hsa_signal_value_t HSA_API hsa_signal_load_relaxed(hsa_signal_t signal)
Atomically read the current value of a signal.
uint64_t HSA_API hsa_queue_load_write_index_relaxed(const hsa_queue_t *queue)
Atomically load the write index of a queue.
hsa_signal_t completion_signal
Signal used to indicate completion of the job.
hsa_region_global_flag_t
Global region flags.
const std::string & name()
void HSA_API hsa_signal_and_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
void HSA_API hsa_signal_xor_scacquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
hsa_status_t HSA_API hsa_system_get_major_extension_table(uint16_t extension, uint16_t version_major, size_t table_length, void *table)
Retrieve the function pointers corresponding to a given major version of an extension.
The executable symbol is invalid.
An error has been detected while releasing a resource.
Maximum number of fbarriers per work-group.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_load_acquire(hsa_signal_t signal)
Atomically read the current value of a signal.
hsa_wait_state_t
State of the application thread during a signal wait.
hsa_code_symbol_info_t
Code object symbol attributes.
struct hsa_queue_s hsa_queue_t
User mode queue.
A generic error has occurred.
Three-dimensional coordinate.
hsa_status_t HSA_API HSA_DEPRECATED hsa_agent_extension_supported(uint16_t extension, hsa_agent_t agent, uint16_t version_major, uint16_t version_minor, bool *result)
Query if a given version of an extension is supported by an agent.
void HSA_API hsa_signal_silent_store_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal without necessarily notifying the the agents waiting on it...
The variable is already defined.
void HSA_API hsa_signal_add_scacquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
hsa_status_t HSA_API hsa_executable_validate(hsa_executable_t executable, uint32_t *result)
Validate an executable.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_exchange_acquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
hsa_signal_value_t HSA_API hsa_signal_wait_relaxed(hsa_signal_t signal, hsa_signal_condition_t condition, hsa_signal_value_t compare_value, uint64_t timeout_hint, hsa_wait_state_t wait_state_hint)
Wait until a signal value satisfies a specified condition, or a certain amount of time has elapsed...
uint64_t handle
Opaque handle.
Application data handle that is passed to the serialization and deserialization functions.
Timestamp value increase rate, in Hz.
The signal group is invalid.
Packet used by agents for dispatching jobs to kernel agents.
void HSA_API HSA_DEPRECATED hsa_signal_add_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
uint64_t HSA_API HSA_DEPRECATED hsa_queue_add_write_index_acq_rel(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
Struct containing an opaque handle to a code object, which contains ISA for finalized kernels and ind...
uint16_t reserved0
Reserved.
Minor version of the HSA runtime specification supported by the agent.
Maximum allocation size in this region, in bytes.
hsa_extension_t
HSA extensions.
uint32_t reserved0
Reserved.
void HSA_API hsa_signal_subtract_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
No scope (no fence is applied).
Machine model supported by the HSA runtime.
hsa_status_t HSA_API hsa_executable_iterate_agent_symbols(hsa_executable_t executable, hsa_agent_t agent, hsa_status_t(*callback)(hsa_executable_t exec, hsa_agent_t agent, hsa_executable_symbol_t symbol, void *data), void *data)
Iterate over the kernels, indirect functions, and agent allocation variables in an executable for a g...
The file descriptor is invalid.
Type of a queue created in the agent.
The code object is invalid.
The application thread may be rescheduled while waiting on the signal.
The instruction set architecture is invalid.
uint64_t HSA_API HSA_DEPRECATED hsa_queue_load_write_index_acquire(const hsa_queue_t *queue)
Atomically load the write index of a queue.
16-bit floating-point type.
hsa_status_t HSA_API hsa_code_object_reader_create_from_memory(const void *code_object, size_t size, hsa_code_object_reader_t *code_object_reader)
Create a code object reader to operate on memory.
The code object reader is invalid.
uint16_t setup
Dispatch setup parameters.
hsa_round_method_t
Round methods.
uint32_t features
Queue features mask.
uint32_t reserved1
Reserved.
There is no symbol with the given name.
uint64_t kernel_object
Opaque handle to a code object that includes an implementation-defined executable code for the kernel...
The first operand is less than the second operand.
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_destroy(hsa_code_object_t code_object)
Destroy a code object.
hsa_status_t HSA_API HSA_DEPRECATED hsa_system_extension_supported(uint16_t extension, uint16_t version_major, uint16_t version_minor, bool *result)
Query if a given version of an extension is supported by the HSA implementation.
Minor version of the HSA runtime specification supported by the implementation.
Performance counter extension.
Maximum number of packets that a queue created in the agent can hold.
uint32_t reserved1
Reserved.
hsa_queue_type_t
Queue type.
Size of static private, spill, and arg segment memory required by this kernel (per work-item)...
uint64_t HSA_API hsa_queue_cas_write_index_scacquire(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
void HSA_API HSA_DEPRECATED hsa_signal_store_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal.
Alignment of buffers allocated by hsa_memory_allocate in this region.
The allocation kind of the variable.
uint64_t HSA_API hsa_queue_load_read_index_relaxed(const hsa_queue_t *queue)
Atomically load the read index of a queue.
uint32_t size
Maximum number of packets the queue can hold.
Struct containing an opaque handle to an executable, which contains ISA for finalized kernels and ind...
uint16_t header
Packet header.
hsa_packet_header_width_t
Width (in bits) of the sub-fields in hsa_packet_header_t.
Indicates whether the symbol corresponds to a definition.
uint64_t reserved2
Reserved.
void HSA_API HSA_DEPRECATED hsa_signal_xor_acquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
void HSA_API HSA_DEPRECATED hsa_signal_or_acquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
hsa_signal_value_t HSA_API hsa_signal_exchange_scacq_screl(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
hsa_status_t HSA_API hsa_wavefront_get_info(hsa_wavefront_t wavefront, hsa_wavefront_info_t attribute, void *value)
Get the current value of a wavefront attribute.
If a hardware exception is detected, a hardware status bit is set.
The application can use memory in the region to store kernel arguments, and provide the values for th...
Indicates whether the variable is constant.
hsa_status_t
Status codes.
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_serialize(hsa_code_object_t code_object, hsa_status_t(*alloc_callback)(size_t size, hsa_callback_data_t data, void **address), hsa_callback_data_t callback_data, const char *options, void **serialized_code_object, size_t *serialized_code_object_size)
Serialize a code object.
Default floating-point rounding modes supported by the instruction set architecture.
hsa_status_t HSA_API hsa_code_object_reader_create_from_file(hsa_file_t file, hsa_code_object_reader_t *code_object_reader)
Create a code object reader to operate on a file.
One of the actual arguments does not meet a precondition stated in the documentation of the correspon...
hsa_signal_value_t HSA_API hsa_signal_cas_scacq_screl(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
uint32_t grid_size_x
X dimension of grid, in work-items.
uint32_t private_segment_size
Size in bytes of private memory allocation request (per work-item).
struct hsa_loaded_code_object_s hsa_loaded_code_object_t
Loaded code object handle.
uint64_t handle
Opaque handle.
hsa_status_t HSA_API hsa_queue_create(hsa_agent_t agent, uint32_t size, hsa_queue_type32_t type, void(*callback)(hsa_status_t status, hsa_queue_t *source, void *data), void *data, uint32_t private_segment_size, uint32_t group_segment_size, hsa_queue_t **queue)
Create a user mode queue.
The fence is applied with agent scope for the global segment.
Indicates whether memory in this region can be allocated using hsa_memory_allocate.
struct hsa_isa_s hsa_isa_t
Instruction set architecture.
64-bit floating-point type.
The least significant byte is stored in the smallest address.
hsa_signal_condition_t
Wait condition operator.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_exchange_acq_rel(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
If a hardware exception is detected, a work-item signals an exception.
The agent supports AQL packets of kernel dispatch type.
struct hsa_code_object_s hsa_code_object_t
Struct containing an opaque handle to a code object, which contains ISA for finalized kernels and ind...
An HSAIL operation resulted in a hardware exception.
hsa_executable_state_t
Executable state.
Call convention of the kernel.
hsa_status_t HSA_API hsa_queue_inactivate(hsa_queue_t *queue)
Inactivate a queue.
Maximum number of work-items of each dimension of a work-group.
hsa_queue_type32_t type
Queue type.
hsa_signal_value_t HSA_API hsa_signal_exchange_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
hsa_status_t HSA_API hsa_agent_iterate_regions(hsa_agent_t agent, hsa_status_t(*callback)(hsa_region_t region, void *data), void *data)
Iterate over the memory regions associated with a given agent, and invoke an application-defined call...
The address of the variable.
uint16_t header
Packet header.
hsa_status_t HSA_API hsa_signal_group_wait_any_relaxed(hsa_signal_group_t signal_group, const hsa_signal_condition_t *conditions, const hsa_signal_value_t *compare_values, hsa_wait_state_t wait_state_hint, hsa_signal_t *signal, hsa_signal_value_t *value)
Wait until the value of at least one of the signals in a signal group satisfies its associated condit...
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_symbol_get_info(hsa_code_symbol_t code_symbol, hsa_code_symbol_info_t attribute, void *value)
Get the current value of an attribute for a given code symbol.
hsa_status_t HSA_API hsa_isa_get_info_alt(hsa_isa_t isa, hsa_isa_info_t attribute, void *value)
Get the current value of an attribute for a given instruction set architecture (ISA).
Flag indicating that the f16 HSAIL operation is at least as fast as the f32 operation in the instruct...
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_deserialize(void *serialized_code_object, size_t serialized_code_object_size, const char *options, hsa_code_object_t *code_object)
Deserialize a code object.
hsa_code_object_type_t
Code object type.
Updates to memory in this region are immediately visible to all the agents under the terms of the HSA...
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_get_info(hsa_code_object_t code_object, hsa_code_object_info_t attribute, void *value)
Get the current value of an attribute for a given code object.
Machine models supported by the instruction set architecture.
uint64_t handle
Opaque handle.
uint64_t HSA_API hsa_queue_load_read_index_scacquire(const hsa_queue_t *queue)
Atomically load the read index of a queue.
hsa_packet_header_t
Sub-fields of the header field that is present in any AQL packet.
Use a default floating-point rounding mode specified elsewhere.
The HSA runtime is not in the configuration state.
uint64_t handle
Opaque handle.
hsa_status_t HSA_API hsa_memory_assign_agent(void *ptr, hsa_agent_t agent, hsa_access_permission_t access)
Change the ownership of a global, coarse-grained buffer.
int32_t hsa_signal_value_t
Signal value.
hsa_kernel_dispatch_packet_setup_width_t
Width (in bits) of the sub-fields in hsa_kernel_dispatch_packet_setup_t.
The requested allocation is not valid.
Maximum total number of work-items in a grid.
uint64_t HSA_API hsa_queue_cas_write_index_relaxed(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
The length of the symbol name in bytes, not including the NUL terminator.
struct hsa_region_s hsa_region_t
A memory region represents a block of virtual memory with certain properties.
Profile this executable is created for.
void HSA_API hsa_signal_and_scacquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
The version of the code object.
void HSA_API HSA_DEPRECATED hsa_signal_add_acquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
The length of the cache name in bytes, not including the NUL terminator.
void HSA_API HSA_DEPRECATED hsa_queue_store_write_index_release(const hsa_queue_t *queue, uint64_t value)
Atomically set the write index of a queue.
32-bit floating-point type.
hsa_status_t HSA_API hsa_init()
Initialize the HSA runtime.
Number of dimensions of the grid.
First AMD extension number.
The length of the ISA name in bytes, not including the NUL terminator.
hsa_status_t HSA_API hsa_status_string(hsa_status_t status, const char **status_string)
Query additional information about a status code.
The HSA runtime failed to allocate the necessary resources.
void HSA_API HSA_DEPRECATED hsa_signal_or_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
hsa_signal_t doorbell_signal
Signal object used by the application to indicate the ID of a packet that is ready to be processed...
uint16_t reserved0
Reserved.
struct hsa_code_symbol_s hsa_code_symbol_t
Code object symbol handle.
hsa_status_t HSA_API hsa_system_major_extension_supported(uint16_t extension, uint16_t version_major, uint16_t *version_minor, bool *result)
Query if a given version of an extension is supported by the HSA implementation.
Code object reader handle.
uint64_t HSA_API hsa_queue_load_write_index_scacquire(const hsa_queue_t *queue)
Atomically load the write index of a queue.
hsa_status_t HSA_API hsa_cache_get_info(hsa_cache_t cache, hsa_cache_info_t attribute, void *value)
Get the current value of an attribute for a given cache object.
The agent supports AQL packets of agent dispatch type.
hsa_signal_value_t HSA_API hsa_signal_cas_scacquire(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
hsa_queue_feature_t
Queue features.
uint64_t reserved2
Reserved.
Size of static group segment memory required by the kernel (per work-group), in bytes.
void HSA_API HSA_DEPRECATED hsa_signal_add_acq_rel(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
hsa_status_t HSA_API hsa_iterate_agents(hsa_status_t(*callback)(hsa_agent_t agent, void *data), void *data)
Iterate over the available agents, and invoke an application-defined callback on every iteration...
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_get_symbol_from_name(hsa_code_object_t code_object, const char *module_name, const char *symbol_name, hsa_code_symbol_t *symbol)
Get the symbol handle within a code object for a given a symbol name.
std::vector< SwitchingFiber * > expected({ &a, &b, &a, &a, &a, &b, &c, &a, &c, &c, &c })
Size of static group segment memory required by the kernel (per work-group), in bytes.
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_load_code_object(hsa_executable_t executable, hsa_agent_t agent, hsa_code_object_t code_object, const char *options)
Load code object into the executable.
The module name to which this symbol belongs if this symbol has module linkage, otherwise an empty st...
hsa_status_t HSA_API hsa_queue_destroy(hsa_queue_t *queue)
Destroy a user mode queue.
struct hsa_barrier_or_packet_s hsa_barrier_or_packet_t
Barrier-OR packet.
uint64_t id
Queue identifier, which is unique over the lifetime of the application.
void HSA_API hsa_queue_store_write_index_relaxed(const hsa_queue_t *queue, uint64_t value)
Atomically set the write index of a queue.
hsa_endianness_t
Endianness.
hsa_status_t HSA_API hsa_signal_group_wait_any_scacquire(hsa_signal_group_t signal_group, const hsa_signal_condition_t *conditions, const hsa_signal_value_t *compare_values, hsa_wait_state_t wait_state_hint, hsa_signal_t *signal, hsa_signal_value_t *value)
Wait until the value of at least one of the signals in a signal group satisfies its associated condit...
uint16_t header
Packet header.
Maximum total number of work-items in a work-group.
hsa_status_t HSA_API HSA_DEPRECATED hsa_isa_compatible(hsa_isa_t code_object_isa, hsa_isa_t agent_isa, bool *result)
Check if the instruction set architecture of a code object can be executed on an agent associated wit...
uint64_t handle
Opaque handle.
uint64_t handle
Opaque handle.
hsa_status_t HSA_API hsa_executable_agent_global_variable_define(hsa_executable_t executable, hsa_agent_t agent, const char *variable_name, void *address)
Define an external global variable with agent allocation.
Major version of the HSA runtime specification supported by the implementation.
void HSA_API hsa_signal_xor_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_create(hsa_profile_t profile, hsa_executable_state_t executable_state, const char *options, hsa_executable_t *executable)
Create an empty executable.
Struct containing an opaque handle to an agent, a device that participates in the HSA memory model...
The requested queue creation is not valid.
struct hsa_dim3_s hsa_dim3_t
Three-dimensional coordinate.
void HSA_API hsa_signal_or_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
The packet has been processed in the past, but has not been reassigned to the packet processor...
The function has been executed successfully.
hsa_signal_t completion_signal
Signal used to indicate completion of the job.
int hsa_file_t
POSIX file descriptor.
uint64_t handle
Opaque handle.
hsa_status_t HSA_API HSA_DEPRECATED hsa_system_get_extension_table(uint16_t extension, uint16_t version_major, uint16_t version_minor, void *table)
Retrieve the function pointers corresponding to a given version of an extension.
void HSA_API hsa_signal_or_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
hsa_exception_policy_t
Exception policies applied in the presence of hardware exceptions.
hsa_flush_mode_t
Flush to zero modes.
hsa_status_t HSA_API hsa_memory_register(void *ptr, size_t size)
Register a global, fine-grained buffer.
void HSA_API HSA_DEPRECATED hsa_queue_store_read_index_release(const hsa_queue_t *queue, uint64_t value)
Atomically set the read index of a queue.
Default floating-point rounding mode specified when executable was created.
Executable state, which allows the user to load code objects and define external variables.
Endianness of the system.
The arguments passed to a functions are not compatible.
Alignment (in bytes) of the buffer used to pass arguments to the kernel, which is the maximum of 16 a...
hsa_signal_t completion_signal
Signal used to indicate completion of the job.
uint64_t handle
Opaque handle.
Profile this code object is produced for.
hsa_status_t HSA_API hsa_signal_group_destroy(hsa_signal_group_t signal_group)
Destroy a signal group previous created by hsa_signal_group_create.
uint64_t HSA_API HSA_DEPRECATED hsa_queue_add_write_index_release(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
Default floating-point rounding mode used when the code object is produced.
hsa_cache_info_t
Cache attributes.
Code object symbol handle.
uint64_t HSA_API hsa_queue_add_write_index_scacq_screl(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
hsa_packet_type_t
Packet type.
void HSA_API hsa_signal_add_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
The instruction set architecture name is invalid.
Executable state, which allows the user to query variable addresses, kernel code handles, and indirect function code handles using query operations.
hsa_symbol_linkage_t
Linkage type of a symbol.
Profiling events extension.
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_get_symbol(hsa_code_object_t code_object, const char *symbol_name, hsa_code_symbol_t *symbol)
Get the symbol handle within a code object for a given a symbol name.
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_get_symbol(hsa_executable_t executable, const char *module_name, const char *symbol_name, hsa_agent_t agent, int32_t call_convention, hsa_executable_symbol_t *symbol)
Get the symbol handle for a given a symbol name.
Indirect function object handle.
hsa_status_t HSA_API hsa_system_get_info(hsa_system_info_t attribute, void *value)
Get the current value of a system attribute.
uint64_t HSA_API hsa_queue_add_write_index_relaxed(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
uint64_t reserved2
Reserved.
uint64_t HSA_API HSA_DEPRECATED hsa_queue_cas_write_index_acquire(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
Maximum size (per work-group) of private memory that can be requested for a specific kernel dispatch...
struct hsa_code_object_reader_s hsa_code_object_reader_t
Code object reader handle.
hsa_status_t HSA_API hsa_executable_destroy(hsa_executable_t executable)
Destroy an executable.
hsa_status_t HSA_API hsa_memory_deregister(void *ptr, size_t size)
Deregister memory previously registered using hsa_memory_register.
The segment kind of the variable.
uint64_t handle
Opaque handle.
The executable is frozen.
void HSA_API hsa_queue_store_read_index_screlease(const hsa_queue_t *queue, uint64_t value)
Atomically set the read index of a queue.
hsa_signal_value_t HSA_API hsa_signal_load_scacquire(hsa_signal_t signal)
Atomically read the current value of a signal.
struct hsa_agent_s hsa_agent_t
Struct containing an opaque handle to an agent, a device that participates in the HSA memory model...
Kernel object handle, used in the kernel dispatch packet.
uint16_t header
Packet header.
The length of the symbol name in bytes, not including the NUL terminator.
void HSA_API hsa_signal_xor_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
uint64_t HSA_API HSA_DEPRECATED hsa_queue_add_write_index_acquire(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
Operations that specify the default floating-point mode are rounded to zero by default.
uint64_t HSA_API hsa_queue_add_write_index_screlease(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
hsa_status_t HSA_API hsa_executable_global_variable_define(hsa_executable_t executable, const char *variable_name, void *address)
Define an external global variable with program allocation.
hsa_status_t HSA_API hsa_memory_copy(void *dst, const void *src, size_t size)
Copy a block of memory from the location pointed to by src to the memory block pointed to by dst...
hsa_status_t HSA_API hsa_signal_destroy(hsa_signal_t signal)
Destroy a signal previous created by hsa_signal_create.
uint32_t reserved1
Reserved.
uint16_t workgroup_size_x
X dimension of work-group, in work-items.
Type of hardware device associated with the agent.
Indicates whether the symbol corresponds to a definition.
Alignment of the symbol in memory.
void HSA_API hsa_signal_subtract_scacquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
hsa_status_t HSA_API hsa_agent_iterate_isas(hsa_agent_t agent, hsa_status_t(*callback)(hsa_isa_t isa, void *data), void *data)
Iterate over the instruction sets supported by the given agent, and invoke an application-defined cal...
A traversal over a list of elements has been interrupted by the application before completing...
hsa_status_t HSA_API hsa_executable_symbol_get_info(hsa_executable_symbol_t executable_symbol, hsa_executable_symbol_info_t attribute, void *value)
Get the current value of an attribute for a given executable symbol.
Major version of the HSA runtime specification supported by the agent.
The maximum reference count for the object has been reached.
hsa_wavefront_info_t
Wavefront attributes.
Size of static private, spill, and arg segment memory required by this kernel (per work-item)...
hsa_status_t HSA_API hsa_executable_create_alt(hsa_profile_t profile, hsa_default_float_rounding_mode_t default_float_rounding_mode, const char *options, hsa_executable_t *executable)
Create an empty executable.
hsa_signal_t completion_signal
Signal used to indicate completion of the job.
Size of kernarg segment memory that is required to hold the values of the kernel arguments, in bytes.
Bit-mask indicating which extensions are supported by the agent.
void HSA_API hsa_signal_subtract_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
hsa_fence_scope_t
Scope of the memory fence operation associated with a packet.
hsa_status_t HSA_API hsa_isa_iterate_wavefronts(hsa_isa_t isa, hsa_status_t(*callback)(hsa_wavefront_t wavefront, void *data), void *data)
Iterate over the different wavefronts supported by an instruction set architecture, and invoke an application-defined callback on every iteration.
uint64_t HSA_API hsa_queue_add_write_index_scacquire(const hsa_queue_t *queue, uint64_t value)
Atomically increment the write index of a queue by an offset.
Instruction set architecture this code object is produced for.
Queue supports agent dispatch packets.
hsa_variable_allocation_t
Allocation type of a variable.
void HSA_API hsa_signal_or_scacquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise OR operation between the value of a signal and a given value...
Call convention of the indirect function.
The first operand is greater than or equal to the second operand.
hsa_status_t HSA_API HSA_DEPRECATED hsa_isa_get_info(hsa_isa_t isa, hsa_isa_info_t attribute, uint32_t index, void *value)
Get the current value of an attribute for a given instruction set architecture (ISA).
hsa_agent_feature_t
Agent features.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_cas_acquire(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
void HSA_API hsa_signal_subtract_scacq_screl(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
hsa_status_t HSA_API hsa_executable_get_info(hsa_executable_t executable, hsa_executable_info_t attribute, void *value)
Get the current value of an attribute for a given executable.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_cas_release(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
uint16_t workgroup_size_z
Z dimension of work-group, in work-items.
Maximum number of work-items of each dimension of a grid.
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_iterate_symbols(hsa_executable_t executable, hsa_status_t(*callback)(hsa_executable_t exec, hsa_executable_symbol_t symbol, void *data), void *data)
Iterate over the symbols in a executable, and invoke an application-defined callback on every iterati...
Operations that specify the default floating-point mode are rounded to the nearest representable numb...
hsa_region_info_t
Attributes of a memory region.
hsa_status_t HSA_API hsa_isa_get_round_method(hsa_isa_t isa, hsa_fp_type_t fp_type, hsa_flush_mode_t flush_mode, hsa_round_method_t *round_method)
Retrieve the round method (single or double) used to implement the floating-point multiply add instru...
The two operands are equal.
Maximum duration of a signal wait operation.
uint64_t handle
Opaque handle.
Size of kernarg segment memory that is required to hold the values of the kernel arguments, in bytes.
uint64_t HSA_API hsa_queue_cas_write_index_scacq_screl(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
hsa_status_t HSA_API hsa_memory_allocate(hsa_region_t region, size_t size, void **ptr)
Allocate a block of memory in a given region.
Release fence scope, The value of this sub-field determines the scope and type of the memory fence op...
void HSA_API hsa_signal_silent_store_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal without necessarily notifying the the agents waiting on it...
The fence is applied across both agent and system scope for the global segment.
hsa_status_t HSA_API hsa_executable_validate_alt(hsa_executable_t executable, const char *options, uint32_t *result)
Validate an executable.
uint32_t hsa_queue_type32_t
A fixed-size type used to represent hsa_queue_type_t constants.
hsa_access_permission_t
Access permissions.
The linkage kind of the symbol.
hsa_status_t HSA_API hsa_signal_create(hsa_signal_value_t initial_value, uint32_t num_consumers, const hsa_agent_t *consumers, hsa_signal_t *signal)
Create a signal.
uint32_t grid_size_y
Y dimension of grid, in work-items.
Updates to memory in this region can be performed by a single agent at a time.
void HSA_API HSA_DEPRECATED hsa_signal_and_acquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
hsa_status_t HSA_API hsa_code_object_reader_destroy(hsa_code_object_reader_t code_object_reader)
Destroy a code object reader.
The application thread stays active while waiting on a signal.
void HSA_API hsa_queue_store_write_index_screlease(const hsa_queue_t *queue, uint64_t value)
Atomically set the write index of a queue.
hsa_status_t HSA_API hsa_executable_iterate_program_symbols(hsa_executable_t executable, hsa_status_t(*callback)(hsa_executable_t exec, hsa_executable_symbol_t symbol, void *data), void *data)
Iterate over the program allocation variables in an executable, and invoke an application-defined cal...
struct hsa_signal_s hsa_signal_t
Signal handle.
hsa_status_t HSA_API hsa_shut_down()
Shut down the HSA runtime.
void HSA_API hsa_signal_and_scacq_screl(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
uint64_t handle
Opaque handle.
struct hsa_agent_dispatch_packet_s hsa_agent_dispatch_packet_t
Agent dispatch packet.
void HSA_API HSA_DEPRECATED hsa_signal_xor_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
The code object symbol is invalid.
hsa_kernel_dispatch_packet_setup_t
Sub-fields of the kernel dispatch packet setup field.
hsa_code_object_info_t
Code object attributes.
The linkage kind of the symbol.
void HSA_API HSA_DEPRECATED hsa_signal_subtract_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_wait_acquire(hsa_signal_t signal, hsa_signal_condition_t condition, hsa_signal_value_t compare_value, uint64_t timeout_hint, hsa_wait_state_t wait_state_hint)
Wait until a signal value satisfies a specified condition, or a certain amount of time has elapsed...
hsa_system_info_t
System attributes.
Executable symbol handle.
hsa_device_type_t
Hardware device type.
hsa_agent_info_t
Agent attributes.
void HSA_API HSA_DEPRECATED hsa_signal_subtract_acq_rel(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
hsa_isa_info_t
Instruction set architecture attributes.
hsa_status_t HSA_API hsa_executable_load_program_code_object(hsa_executable_t executable, hsa_code_object_reader_t code_object_reader, const char *options, hsa_loaded_code_object_t *loaded_code_object)
Load a program code object into an executable.
hsa_signal_value_t HSA_API hsa_signal_exchange_scacquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
uint64_t HSA_API HSA_DEPRECATED hsa_queue_cas_write_index_release(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
hsa_executable_symbol_info_t
Executable symbol attributes.
hsa_machine_model_t
Machine model.
hsa_signal_value_t HSA_API hsa_signal_exchange_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal and return its previous value.
Packet used by agents for dispatching jobs to agents.
Bit-mask indicating which extensions are supported by the implementation.
Instruction set architecture.
Profiles supported by the instruction set architecture.
Size of this region, in bytes.
void HSA_API HSA_DEPRECATED hsa_signal_xor_acq_rel(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
hsa_executable_info_t
Executable attributes.
Queue supports kernel dispatch packets.
The two operands are not equal.
Default floating-point rounding modes supported by the instruction set architecture in the Base profi...
hsa_status_t HSA_API hsa_agent_get_info(hsa_agent_t agent, hsa_agent_info_t attribute, void *value)
Get the current value of an attribute for a given agent.
uint64_t reserved2
Reserved.
void HSA_API HSA_DEPRECATED hsa_signal_and_release(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
Queue only supports a single producer.
Minimum number of packets that a queue created in the agent can hold.
hsa_status_t HSA_API HSA_DEPRECATED hsa_agent_get_exception_policies(hsa_agent_t agent, hsa_profile_t profile, uint16_t *mask)
Retrieve the exception policy support for a given combination of agent and profile.
void HSA_API hsa_signal_add_scacq_screl(hsa_signal_t signal, hsa_signal_value_t value)
Atomically increment the value of a signal by a given amount.
hsa_status_t HSA_API hsa_isa_from_name(const char *name, hsa_isa_t *isa)
Retrieve a reference to an instruction set architecture handle out of a symbolic name.
void HSA_API HSA_DEPRECATED hsa_signal_subtract_acquire(hsa_signal_t signal, hsa_signal_value_t value)
Atomically decrement the value of a signal by a given amount.
struct hsa_signal_group_s hsa_signal_group_t
Group of signals.
void HSA_API hsa_signal_and_screlease(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise AND operation between the value of a signal and a given value...
The length of the module name in bytes (not including the NUL terminator) to which this symbol belong...
uint64_t handle
Opaque handle.
The executable is invalid.
Alignment (in bytes) of the buffer used to pass arguments to the kernel, which is the maximum of 16 a...
uint16_t reserved0
Reserved.
hsa_status_t HSA_API hsa_executable_readonly_variable_define(hsa_executable_t executable, hsa_agent_t agent, const char *variable_name, void *address)
Define an external readonly variable.
The AQL packet is malformed.
A memory region represents a block of virtual memory with certain properties.
hsa_status_t HSA_API hsa_executable_load_agent_code_object(hsa_executable_t executable, hsa_agent_t agent, hsa_code_object_reader_t code_object_reader, const char *options, hsa_loaded_code_object_t *loaded_code_object)
Load an agent code object into an executable.
hsa_status_t HSA_API hsa_memory_free(void *ptr)
Deallocate a block of memory previously allocated using hsa_memory_allocate.
void HSA_API hsa_signal_xor_scacq_screl(hsa_signal_t signal, hsa_signal_value_t value)
Atomically perform a bitwise XOR operation between the value of a signal and a given value...
uint64_t handle
Opaque handle.
hsa_status_t HSA_API hsa_agent_major_extension_supported(uint16_t extension, hsa_agent_t agent, uint16_t version_major, uint16_t *version_minor, bool *result)
Query if a given version of an extension is supported by an agent.
struct hsa_executable_s hsa_executable_t
Struct containing an opaque handle to an executable, which contains ISA for finalized kernels and ind...
hsa_status_t HSA_API hsa_extension_get_name(uint16_t extension, const char **name)
Query the name of a given extension.
void HSA_API hsa_signal_store_relaxed(hsa_signal_t signal, hsa_signal_value_t value)
Atomically set the value of a signal.
Packet used by agents to delay processing of subsequent packets, and to express complex dependencies ...
Allocation granularity of buffers allocated by hsa_memory_allocate in this region.
uint64_t HSA_API hsa_queue_cas_write_index_screlease(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
uint64_t HSA_API HSA_DEPRECATED hsa_queue_cas_write_index_acq_rel(const hsa_queue_t *queue, uint64_t expected, uint64_t value)
Atomically set the write index of a queue if the observed value is equal to the expected value...
struct hsa_cache_s hsa_cache_t
Cache handle.
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_iterate_symbols(hsa_code_object_t code_object, hsa_status_t(*callback)(hsa_code_object_t code_object, hsa_code_symbol_t symbol, void *data), void *data)
Iterate over the symbols in a code object, and invoke an application-defined callback on every iterat...
Produces code object that contains ISA for all kernels and indirect functions in HSA source...
struct hsa_executable_symbol_s hsa_executable_symbol_t
Executable symbol handle.
Segment where memory in the region can be used.
Human-readable description.
hsa_default_float_rounding_mode_t
Default floating-point rounding mode.
The variable is undefined.
The most significant byte is stored in the smallest address.
hsa_signal_value_t HSA_API hsa_signal_cas_relaxed(hsa_signal_t signal, hsa_signal_value_t expected, hsa_signal_value_t value)
Atomically set the value of a signal if the observed value is equal to the expected value...
Loaded code object handle.
AQL kernel dispatch packet.
hsa_status_t HSA_API hsa_executable_freeze(hsa_executable_t executable, const char *options)
Freeze the executable.
An API other than hsa_init has been invoked while the reference count of the HSA runtime is 0...