mirror of
https://github.com/gcc-mirror/gcc.git
synced 2024-11-21 13:40:47 +00:00
18f477980c
If HSA_AMD_SYSTEM_INFO_SVM_ACCESSIBLE_BY_DEFAULT is true, all GPUs on the system support unified shared memory. That's the case for APUs and MI200 devices when XNACK is enabled. XNACK can be enabled by setting HSA_XNACK=1 as env var for supported devices; otherwise, if disabled, USM code will use host fallback. gcc/ChangeLog: * config/gcn/gcn-hsa.h (gcn_local_sym_hash): Fix typo. include/ChangeLog: * hsa.h (HSA_AMD_SYSTEM_INFO_SVM_ACCESSIBLE_BY_DEFAULT): Add enum value. libgomp/ChangeLog: * libgomp.texi (gcn): Update USM handling. * plugin/plugin-gcn.c (GOMP_OFFLOAD_get_num_devices): Handle USM if HSA_AMD_SYSTEM_INFO_SVM_ACCESSIBLE_BY_DEFAULT is true.
5649 lines
183 KiB
C
5649 lines
183 KiB
C
////////////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// Copyright (C) 2014-2020 Advanced Micro Devices Inc. All rights reserved.
|
|
//
|
|
// Permission is hereby granted, free of charge, to any person or organization
|
|
// obtaining a copy of the software and accompanying documentation covered by
|
|
// this license (the "Software") to use, reproduce, display, distribute,
|
|
// execute, and transmit the Software, and to prepare derivative works of the
|
|
// Software, and to permit third-parties to whom the Software is furnished to
|
|
// do so, all subject to the following:
|
|
//
|
|
// The copyright notices in the Software and this entire statement, including
|
|
// the above license grant, this restriction and the following disclaimer,
|
|
// must be included in all copies of the Software, in whole or in part, and
|
|
// all derivative works of the Software, unless such copies or derivative
|
|
// works are solely in the form of machine-executable object code generated by
|
|
// a source language processor.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
// FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT
|
|
// SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE
|
|
// FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE,
|
|
// ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
|
|
// DEALINGS IN THE SOFTWARE.
|
|
//
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#ifndef HSA_RUNTIME_INC_HSA_H_
|
|
#define HSA_RUNTIME_INC_HSA_H_
|
|
|
|
#include <stddef.h> /* size_t */
|
|
#include <stdint.h> /* uintXX_t */
|
|
|
|
#ifndef __cplusplus
|
|
#include <stdbool.h> /* bool */
|
|
#endif /* __cplusplus */
|
|
|
|
// Placeholder for calling convention and import/export macros.
// HSA_CALL may be predefined by the build to inject a calling convention;
// by default it expands to nothing.
#ifndef HSA_CALL
#define HSA_CALL
#endif

// Decorator applied to exported symbols. GNU-compatible compilers get default
// ELF visibility; other compilers get no decoration unless the build supplies
// its own HSA_EXPORT_DECORATOR.
#ifndef HSA_EXPORT_DECORATOR
#ifdef __GNUC__
#define HSA_EXPORT_DECORATOR __attribute__ ((visibility ("default")))
#else
#define HSA_EXPORT_DECORATOR
#endif
#endif
#define HSA_API_EXPORT HSA_EXPORT_DECORATOR HSA_CALL
#define HSA_API_IMPORT HSA_CALL

// Honour a caller-supplied HSA_API. Otherwise select export linkage when
// HSA_EXPORT is defined and import linkage when it is not. (Nesting the
// HSA_EXPORT test avoids redefining a predefined HSA_API.)
#ifndef HSA_API
#ifdef HSA_EXPORT
#define HSA_API HSA_API_EXPORT
#else
#define HSA_API HSA_API_IMPORT
#endif
#endif
|
|
|
|
// Detect and set large model builds.
#undef HSA_LARGE_MODEL
#if defined(__LP64__) || defined(_M_X64)
#define HSA_LARGE_MODEL
#endif

// Try to detect CPU endianness, unless the build already selected one by
// defining LITTLEENDIAN_CPU or BIGENDIAN_CPU. x86 targets are recognised by
// their architecture macros; other targets fall back to the compiler's
// __BYTE_ORDER__ predefine when it is available.
#if !defined(LITTLEENDIAN_CPU) && !defined(BIGENDIAN_CPU)
#if defined(__i386__) || defined(__x86_64__) || defined(_M_IX86) || \
    defined(_M_X64)
#define LITTLEENDIAN_CPU
#elif defined(__BYTE_ORDER__) && defined(__ORDER_LITTLE_ENDIAN__) && \
    (__BYTE_ORDER__ == __ORDER_LITTLE_ENDIAN__)
#define LITTLEENDIAN_CPU
#elif defined(__BYTE_ORDER__) && defined(__ORDER_BIG_ENDIAN__) && \
    (__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__)
#define BIGENDIAN_CPU
#endif
#endif

// HSA_LITTLE_ENDIAN is defined only for little-endian hosts. If neither
// endianness could be determined the build is stopped.
#undef HSA_LITTLE_ENDIAN
#if defined(LITTLEENDIAN_CPU)
#define HSA_LITTLE_ENDIAN
#elif defined(BIGENDIAN_CPU)
// Big-endian host: HSA_LITTLE_ENDIAN intentionally stays undefined.
#else
#error "BIGENDIAN_CPU or LITTLEENDIAN_CPU must be defined"
#endif
|
|
|
|
// Marker placed on deprecated declarations. Unless the build predefines
// HSA_DEPRECATED it expands to nothing, so no deprecation diagnostics are
// produced. The compiler-specific forms are left disabled here:
// __attribute__((deprecated)) for GNU-compatible compilers and
// __declspec(deprecated) for the others.
#ifndef HSA_DEPRECATED
#define HSA_DEPRECATED
#endif
|
|
|
|
// Defined to 1 by this header. NOTE(review): presumably a marker that the
// HSA 1.0 API is available -- confirm how clients are expected to use it.
#define HSA_VERSION_1_0 1
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif /* __cplusplus */
|
|
|
|
/** \defgroup status Runtime Notifications
|
|
* @{
|
|
*/
|
|
|
|
/**
 * @brief Status codes.
 */
typedef enum {
  /**
   * The function has been executed successfully.
   */
  HSA_STATUS_SUCCESS = 0x0,
  /**
   * A traversal over a list of elements has been interrupted by the
   * application before completing.
   */
  HSA_STATUS_INFO_BREAK = 0x1,
  /**
   * A generic error has occurred.
   */
  HSA_STATUS_ERROR = 0x1000,
  /**
   * One of the actual arguments does not meet a precondition stated in the
   * documentation of the corresponding formal argument.
   */
  HSA_STATUS_ERROR_INVALID_ARGUMENT = 0x1001,
  /**
   * The requested queue creation is not valid.
   */
  HSA_STATUS_ERROR_INVALID_QUEUE_CREATION = 0x1002,
  /**
   * The requested allocation is not valid.
   */
  HSA_STATUS_ERROR_INVALID_ALLOCATION = 0x1003,
  /**
   * The agent is invalid.
   */
  HSA_STATUS_ERROR_INVALID_AGENT = 0x1004,
  /**
   * The memory region is invalid.
   */
  HSA_STATUS_ERROR_INVALID_REGION = 0x1005,
  /**
   * The signal is invalid.
   */
  HSA_STATUS_ERROR_INVALID_SIGNAL = 0x1006,
  /**
   * The queue is invalid.
   */
  HSA_STATUS_ERROR_INVALID_QUEUE = 0x1007,
  /**
   * The HSA runtime failed to allocate the necessary resources. This error
   * may also occur when the HSA runtime needs to spawn threads or create
   * internal OS-specific events.
   */
  HSA_STATUS_ERROR_OUT_OF_RESOURCES = 0x1008,
  /**
   * The AQL packet is malformed.
   */
  HSA_STATUS_ERROR_INVALID_PACKET_FORMAT = 0x1009,
  /**
   * An error has been detected while releasing a resource.
   */
  HSA_STATUS_ERROR_RESOURCE_FREE = 0x100A,
  /**
   * An API other than ::hsa_init has been invoked while the reference count
   * of the HSA runtime is 0.
   */
  HSA_STATUS_ERROR_NOT_INITIALIZED = 0x100B,
  /**
   * The maximum reference count for the object has been reached.
   */
  HSA_STATUS_ERROR_REFCOUNT_OVERFLOW = 0x100C,
  /**
   * The arguments passed to a function are not compatible.
   */
  HSA_STATUS_ERROR_INCOMPATIBLE_ARGUMENTS = 0x100D,
  /**
   * The index is invalid.
   */
  HSA_STATUS_ERROR_INVALID_INDEX = 0x100E,
  /**
   * The instruction set architecture is invalid.
   */
  HSA_STATUS_ERROR_INVALID_ISA = 0x100F,
  /**
   * The instruction set architecture name is invalid.
   */
  HSA_STATUS_ERROR_INVALID_ISA_NAME = 0x1017,
  /**
   * The code object is invalid.
   */
  HSA_STATUS_ERROR_INVALID_CODE_OBJECT = 0x1010,
  /**
   * The executable is invalid.
   */
  HSA_STATUS_ERROR_INVALID_EXECUTABLE = 0x1011,
  /**
   * The executable is frozen.
   */
  HSA_STATUS_ERROR_FROZEN_EXECUTABLE = 0x1012,
  /**
   * There is no symbol with the given name.
   */
  HSA_STATUS_ERROR_INVALID_SYMBOL_NAME = 0x1013,
  /**
   * The variable is already defined.
   */
  HSA_STATUS_ERROR_VARIABLE_ALREADY_DEFINED = 0x1014,
  /**
   * The variable is undefined.
   */
  HSA_STATUS_ERROR_VARIABLE_UNDEFINED = 0x1015,
  /**
   * An HSAIL operation resulted in a hardware exception.
   */
  HSA_STATUS_ERROR_EXCEPTION = 0x1016,
  /**
   * The code object symbol is invalid.
   */
  HSA_STATUS_ERROR_INVALID_CODE_SYMBOL = 0x1018,
  /**
   * The executable symbol is invalid.
   */
  HSA_STATUS_ERROR_INVALID_EXECUTABLE_SYMBOL = 0x1019,
  /**
   * The file descriptor is invalid.
   */
  HSA_STATUS_ERROR_INVALID_FILE = 0x1020,
  /**
   * The code object reader is invalid.
   */
  HSA_STATUS_ERROR_INVALID_CODE_OBJECT_READER = 0x1021,
  /**
   * The cache is invalid.
   */
  HSA_STATUS_ERROR_INVALID_CACHE = 0x1022,
  /**
   * The wavefront is invalid.
   */
  HSA_STATUS_ERROR_INVALID_WAVEFRONT = 0x1023,
  /**
   * The signal group is invalid.
   */
  HSA_STATUS_ERROR_INVALID_SIGNAL_GROUP = 0x1024,
  /**
   * The HSA runtime is not in the configuration state.
   */
  HSA_STATUS_ERROR_INVALID_RUNTIME_STATE = 0x1025,
  /**
   * The queue received an error that may require process termination.
   */
  HSA_STATUS_ERROR_FATAL = 0x1026
} hsa_status_t;
|
|
|
|
/**
|
|
* @brief Query additional information about a status code.
|
|
*
|
|
* @param[in] status Status code.
|
|
*
|
|
* @param[out] status_string A NUL-terminated string that describes the error
|
|
* status.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p status is an invalid
|
|
* status code, or @p status_string is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_status_string(
|
|
hsa_status_t status,
|
|
const char ** status_string);
|
|
|
|
/** @} */
|
|
|
|
/** \defgroup common Common Definitions
|
|
* @{
|
|
*/
|
|
|
|
/**
 * @brief Three-dimensional coordinate.
 */
typedef struct hsa_dim3_s {
  /**
   * X dimension.
   */
  uint32_t x;

  /**
   * Y dimension.
   */
  uint32_t y;

  /**
   * Z dimension.
   */
  uint32_t z;
} hsa_dim3_t;
|
|
|
|
/**
 * @brief Access permissions.
 */
typedef enum {
  /**
   * Read-only access.
   */
  HSA_ACCESS_PERMISSION_RO = 1,
  /**
   * Write-only access.
   */
  HSA_ACCESS_PERMISSION_WO = 2,
  /**
   * Read and write access.
   */
  HSA_ACCESS_PERMISSION_RW = 3
} hsa_access_permission_t;
|
|
|
|
/**
 * @brief POSIX file descriptor.
 */
typedef int hsa_file_t;
|
|
|
|
/** @} **/
|
|
|
|
|
|
/** \defgroup initshutdown Initialization and Shut Down
|
|
* @{
|
|
*/
|
|
|
|
/**
|
|
* @brief Initialize the HSA runtime.
|
|
*
|
|
* @details Initializes the HSA runtime if it is not already initialized, and
|
|
* increases the reference counter associated with the HSA runtime for the
|
|
* current process. Invocation of any HSA function other than ::hsa_init results
|
|
* in undefined behavior if the current HSA runtime reference counter is less
|
|
* than one.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_REFCOUNT_OVERFLOW The HSA runtime reference
|
|
* count reaches INT32_MAX.
|
|
*/
|
|
hsa_status_t HSA_API hsa_init();
|
|
|
|
/**
|
|
* @brief Shut down the HSA runtime.
|
|
*
|
|
* @details Decreases the reference count of the HSA runtime instance. When the
|
|
* reference count reaches 0, the HSA runtime is no longer considered valid
|
|
* but the application might call ::hsa_init to initialize the HSA runtime
|
|
* again.
|
|
*
|
|
* Once the reference count of the HSA runtime reaches 0, all the resources
|
|
* associated with it (queues, signals, agent information, etc.) are
|
|
* considered invalid and any attempt to reference them in subsequent API calls
|
|
* results in undefined behavior. When the reference count reaches 0, the HSA
|
|
* runtime may release resources associated with it.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
*/
|
|
hsa_status_t HSA_API hsa_shut_down();
|
|
|
|
/** @} **/
|
|
|
|
/** \defgroup agentinfo System and Agent Information
|
|
* @{
|
|
*/
|
|
|
|
/**
 * @brief Endianness. A convention used to interpret the bytes making up a data
 * word.
 */
typedef enum {
  /**
   * The least significant byte is stored in the smallest address.
   */
  HSA_ENDIANNESS_LITTLE = 0,
  /**
   * The most significant byte is stored in the smallest address.
   */
  HSA_ENDIANNESS_BIG = 1
} hsa_endianness_t;
|
|
|
|
/**
 * @brief Machine model. A machine model determines the size of certain data
 * types in HSA runtime and an agent.
 */
typedef enum {
  /**
   * Small machine model. Addresses use 32 bits.
   */
  HSA_MACHINE_MODEL_SMALL = 0,
  /**
   * Large machine model. Addresses use 64 bits.
   */
  HSA_MACHINE_MODEL_LARGE = 1
} hsa_machine_model_t;
|
|
|
|
/**
 * @brief Profile. A profile indicates a particular level of feature
 * support. For example, in the base profile the application must use the HSA
 * runtime allocator to reserve shared virtual memory, while in the full profile
 * any host pointer can be shared across all the agents.
 */
typedef enum {
  /**
   * Base profile.
   */
  HSA_PROFILE_BASE = 0,
  /**
   * Full profile.
   */
  HSA_PROFILE_FULL = 1
} hsa_profile_t;
|
|
|
|
/**
 * @brief System attributes.
 */
typedef enum {
  /**
   * Major version of the HSA runtime specification supported by the
   * implementation. The type of this attribute is uint16_t.
   */
  HSA_SYSTEM_INFO_VERSION_MAJOR = 0,
  /**
   * Minor version of the HSA runtime specification supported by the
   * implementation. The type of this attribute is uint16_t.
   */
  HSA_SYSTEM_INFO_VERSION_MINOR = 1,
  /**
   * Current timestamp. The value of this attribute monotonically increases at a
   * constant rate. The type of this attribute is uint64_t.
   */
  HSA_SYSTEM_INFO_TIMESTAMP = 2,
  /**
   * Timestamp value increase rate, in Hz. The timestamp (clock) frequency is
   * in the range 1-400MHz. The type of this attribute is uint64_t.
   */
  HSA_SYSTEM_INFO_TIMESTAMP_FREQUENCY = 3,
  /**
   * Maximum duration of a signal wait operation. Expressed as a count based on
   * the timestamp frequency. The type of this attribute is uint64_t.
   */
  HSA_SYSTEM_INFO_SIGNAL_MAX_WAIT = 4,
  /**
   * Endianness of the system. The type of this attribute is ::hsa_endianness_t.
   */
  HSA_SYSTEM_INFO_ENDIANNESS = 5,
  /**
   * Machine model supported by the HSA runtime. The type of this attribute is
   * ::hsa_machine_model_t.
   */
  HSA_SYSTEM_INFO_MACHINE_MODEL = 6,
  /**
   * Bit-mask indicating which extensions are supported by the
   * implementation. An extension with an ID of @p i is supported if the bit at
   * position @p i is set. The type of this attribute is uint8_t[128].
   */
  HSA_SYSTEM_INFO_EXTENSIONS = 7,
  /**
   * String containing the ROCr build identifier.
   */
  HSA_AMD_SYSTEM_INFO_BUILD_VERSION = 0x200,

  /**
   * Whether shared virtual memory is accessible by default. When this
   * attribute is true, all GPUs on the system support unified shared memory.
   * NOTE(review): the attribute type is presumably bool -- confirm against
   * the ROCr AMD extension header.
   */
  HSA_AMD_SYSTEM_INFO_SVM_ACCESSIBLE_BY_DEFAULT = 0x202
} hsa_system_info_t;
|
|
|
|
/**
|
|
* @brief Get the current value of a system attribute.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* system attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_system_get_info(
|
|
hsa_system_info_t attribute,
|
|
void* value);
|
|
|
|
/**
 * @brief HSA extensions.
 */
typedef enum {
  /**
   * Finalizer extension.
   */
  HSA_EXTENSION_FINALIZER = 0,
  /**
   * Images extension.
   */
  HSA_EXTENSION_IMAGES = 1,

  /**
   * Performance counter extension.
   */
  HSA_EXTENSION_PERFORMANCE_COUNTERS = 2,

  /**
   * Profiling events extension.
   */
  HSA_EXTENSION_PROFILING_EVENTS = 3,
  /**
   * Identifier of the last standard extension (same value as
   * ::HSA_EXTENSION_PROFILING_EVENTS). This is the highest standard
   * identifier, not the number of standard extensions.
   */
  HSA_EXTENSION_STD_LAST = 3,
  /**
   * First AMD extension number.
   */
  HSA_AMD_FIRST_EXTENSION = 0x200,
  /**
   * Profiler extension.
   */
  HSA_EXTENSION_AMD_PROFILER = 0x200,
  /**
   * Loader extension.
   */
  HSA_EXTENSION_AMD_LOADER = 0x201,
  /**
   * AqlProfile extension.
   */
  HSA_EXTENSION_AMD_AQLPROFILE = 0x202,
  /**
   * Last AMD extension.
   */
  HSA_AMD_LAST_EXTENSION = 0x202
} hsa_extension_t;
|
|
|
|
/**
|
|
* @brief Query the name of a given extension.
|
|
*
|
|
* @param[in] extension Extension identifier. If the extension is not supported
|
|
* by the implementation (see ::HSA_SYSTEM_INFO_EXTENSIONS), the behavior
|
|
* is undefined.
|
|
*
|
|
* @param[out] name Pointer to a memory location where the HSA runtime stores
|
|
* the extension name. The extension name is a NUL-terminated string.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p name is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_extension_get_name(
|
|
uint16_t extension,
|
|
const char **name);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Query if a given version of an extension is supported by the HSA
|
|
* implementation.
|
|
*
|
|
* @param[in] extension Extension identifier.
|
|
*
|
|
* @param[in] version_major Major version number.
|
|
*
|
|
* @param[in] version_minor Minor version number.
|
|
*
|
|
* @param[out] result Pointer to a memory location where the HSA runtime stores
|
|
* the result of the check. The result is true if the specified version of the
|
|
* extension is supported, and false otherwise.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_system_extension_supported(
|
|
uint16_t extension,
|
|
uint16_t version_major,
|
|
uint16_t version_minor,
|
|
bool* result);
|
|
|
|
/**
|
|
* @brief Query if a given version of an extension is supported by the HSA
|
|
* implementation. All minor versions from 0 up to the returned @p version_minor
|
|
* must be supported by the implementation.
|
|
*
|
|
* @param[in] extension Extension identifier.
|
|
*
|
|
* @param[in] version_major Major version number.
|
|
*
|
|
* @param[out] version_minor Minor version number.
|
|
*
|
|
* @param[out] result Pointer to a memory location where the HSA runtime stores
|
|
* the result of the check. The result is true if the specified version of the
|
|
* extension is supported, and false otherwise.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p version_minor is NULL, or @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_system_major_extension_supported(
|
|
uint16_t extension,
|
|
uint16_t version_major,
|
|
uint16_t *version_minor,
|
|
bool* result);
|
|
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Retrieve the function pointers corresponding to a given version of an
|
|
* extension. Portable applications are expected to invoke the extension API
|
|
* using the returned function pointers
|
|
*
|
|
* @details The application is responsible for verifying that the given version
|
|
* of the extension is supported by the HSA implementation (see
|
|
* ::hsa_system_extension_supported). If the given combination of extension,
|
|
* major version, and minor version is not supported by the implementation, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] extension Extension identifier.
|
|
*
|
|
* @param[in] version_major Major version number for which to retrieve the
|
|
* function pointer table.
|
|
*
|
|
* @param[in] version_minor Minor version number for which to retrieve the
|
|
* function pointer table.
|
|
*
|
|
* @param[out] table Pointer to an application-allocated function pointer table
|
|
* that is populated by the HSA runtime. Must not be NULL. The memory associated
|
|
* with table can be reused or freed after the function returns.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p table is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_system_get_extension_table(
|
|
uint16_t extension,
|
|
uint16_t version_major,
|
|
uint16_t version_minor,
|
|
void *table);
|
|
|
|
/**
|
|
* @brief Retrieve the function pointers corresponding to a given major version
|
|
* of an extension. Portable applications are expected to invoke the extension
|
|
* API using the returned function pointers.
|
|
*
|
|
* @details The application is responsible for verifying that the given major
|
|
* version of the extension is supported by the HSA implementation (see
|
|
* ::hsa_system_major_extension_supported). If the given combination of extension
|
|
* and major version is not supported by the implementation, the behavior is
|
|
* undefined. Additionally if the length doesn't allow space for a full minor
|
|
* version, it is implementation defined if only some of the function pointers for
|
|
* that minor version get written.
|
|
*
|
|
* @param[in] extension Extension identifier.
|
|
*
|
|
* @param[in] version_major Major version number for which to retrieve the
|
|
* function pointer table.
|
|
*
|
|
* @param[in] table_length Size in bytes of the function pointer table to be
|
|
* populated. The implementation will not write more than this many bytes to the
|
|
* table.
|
|
*
|
|
* @param[out] table Pointer to an application-allocated function pointer table
|
|
* that is populated by the HSA runtime. Must not be NULL. The memory associated
|
|
* with table can be reused or freed after the function returns.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p table is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_system_get_major_extension_table(
|
|
uint16_t extension,
|
|
uint16_t version_major,
|
|
size_t table_length,
|
|
void *table);
|
|
|
|
/**
 * @brief Struct containing an opaque handle to an agent, a device that
 * participates in the HSA memory model. An agent can submit AQL packets for
 * execution, and may also accept AQL packets for execution (agent dispatch
 * packets or kernel dispatch packets launching HSAIL-derived binaries).
 */
typedef struct hsa_agent_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_agent_t;
|
|
|
|
/**
 * @brief Agent features.
 */
typedef enum {
  /**
   * The agent supports AQL packets of kernel dispatch type. If this
   * feature is enabled, the agent is also a kernel agent.
   */
  HSA_AGENT_FEATURE_KERNEL_DISPATCH = 1,
  /**
   * The agent supports AQL packets of agent dispatch type.
   */
  HSA_AGENT_FEATURE_AGENT_DISPATCH = 2
} hsa_agent_feature_t;
|
|
|
|
/**
 * @brief Hardware device type.
 */
typedef enum {
  /**
   * CPU device.
   */
  HSA_DEVICE_TYPE_CPU = 0,
  /**
   * GPU device.
   */
  HSA_DEVICE_TYPE_GPU = 1,
  /**
   * DSP device.
   */
  HSA_DEVICE_TYPE_DSP = 2
} hsa_device_type_t;
|
|
|
|
/**
 * @brief Default floating-point rounding mode.
 */
typedef enum {
  /**
   * Use a default floating-point rounding mode specified elsewhere.
   */
  HSA_DEFAULT_FLOAT_ROUNDING_MODE_DEFAULT = 0,
  /**
   * Operations that specify the default floating-point mode are rounded to zero
   * by default.
   */
  HSA_DEFAULT_FLOAT_ROUNDING_MODE_ZERO = 1,
  /**
   * Operations that specify the default floating-point mode are rounded to the
   * nearest representable number, with ties broken by selecting the value
   * with an even least significant bit.
   */
  HSA_DEFAULT_FLOAT_ROUNDING_MODE_NEAR = 2
} hsa_default_float_rounding_mode_t;
|
|
|
|
/**
|
|
* @brief Agent attributes.
|
|
*/
|
|
typedef enum {
|
|
/**
|
|
* Agent name. The type of this attribute is a NUL-terminated char[64]. The
|
|
* name must be at most 63 characters long (not including the NUL terminator)
|
|
* and all array elements not used for the name must be NUL.
|
|
*/
|
|
HSA_AGENT_INFO_NAME = 0,
|
|
/**
|
|
* Name of vendor. The type of this attribute is a NUL-terminated char[64].
|
|
* The name must be at most 63 characters long (not including the NUL
|
|
* terminator) and all array elements not used for the name must be NUL.
|
|
*/
|
|
HSA_AGENT_INFO_VENDOR_NAME = 1,
|
|
/**
|
|
* Agent capability. The type of this attribute is ::hsa_agent_feature_t.
|
|
*/
|
|
HSA_AGENT_INFO_FEATURE = 2,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_MACHINE_MODELS for a given intruction set
|
|
* architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Machine model supported by the agent. The type of this attribute is
|
|
* ::hsa_machine_model_t.
|
|
*/
|
|
HSA_AGENT_INFO_MACHINE_MODEL = 3,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_PROFILES for a given intruction set
|
|
* architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Profile supported by the agent. The type of this attribute is
|
|
* ::hsa_profile_t.
|
|
*/
|
|
HSA_AGENT_INFO_PROFILE = 4,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_DEFAULT_FLOAT_ROUNDING_MODES for a given
|
|
* intruction set architecture supported by the agent instead. If more than
|
|
* one ISA is supported by the agent, the returned value corresponds to the
|
|
* first ISA enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Default floating-point rounding mode. The type of this attribute is
|
|
* ::hsa_default_float_rounding_mode_t, but the value
|
|
* ::HSA_DEFAULT_FLOAT_ROUNDING_MODE_DEFAULT is not allowed.
|
|
*/
|
|
HSA_AGENT_INFO_DEFAULT_FLOAT_ROUNDING_MODE = 5,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_BASE_PROFILE_DEFAULT_FLOAT_ROUNDING_MODES
|
|
* for a given intruction set architecture supported by the agent instead. If
|
|
* more than one ISA is supported by the agent, the returned value corresponds
|
|
* to the first ISA enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* A bit-mask of ::hsa_default_float_rounding_mode_t values, representing the
|
|
* default floating-point rounding modes supported by the agent in the Base
|
|
* profile. The type of this attribute is uint32_t. The default floating-point
|
|
* rounding mode (::HSA_AGENT_INFO_DEFAULT_FLOAT_ROUNDING_MODE) bit must not
|
|
* be set.
|
|
*/
|
|
HSA_AGENT_INFO_BASE_PROFILE_DEFAULT_FLOAT_ROUNDING_MODES = 23,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_FAST_F16_OPERATION for a given intruction
|
|
* set architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Flag indicating that the f16 HSAIL operation is at least as fast as the
|
|
* f32 operation in the current agent. The value of this attribute is
|
|
* undefined if the agent is not a kernel agent. The type of this
|
|
* attribute is bool.
|
|
*/
|
|
HSA_AGENT_INFO_FAST_F16_OPERATION = 24,
|
|
/**
|
|
* @deprecated Query ::HSA_WAVEFRONT_INFO_SIZE for a given wavefront and
|
|
* intruction set architecture supported by the agent instead. If more than
|
|
* one ISA is supported by the agent, the returned value corresponds to the
|
|
* first ISA enumerated by ::hsa_agent_iterate_isas and the first wavefront
|
|
* enumerated by ::hsa_isa_iterate_wavefronts for that ISA.
|
|
*
|
|
* Number of work-items in a wavefront. Must be a power of 2 in the range
|
|
* [1,256]. The value of this attribute is undefined if the agent is not
|
|
* a kernel agent. The type of this attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_WAVEFRONT_SIZE = 6,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_WORKGROUP_MAX_DIM for a given intruction
|
|
* set architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Maximum number of work-items of each dimension of a work-group. Each
|
|
* maximum must be greater than 0. No maximum can exceed the value of
|
|
* ::HSA_AGENT_INFO_WORKGROUP_MAX_SIZE. The value of this attribute is
|
|
* undefined if the agent is not a kernel agent. The type of this
|
|
* attribute is uint16_t[3].
|
|
*/
|
|
HSA_AGENT_INFO_WORKGROUP_MAX_DIM = 7,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_WORKGROUP_MAX_SIZE for a given intruction
|
|
* set architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Maximum total number of work-items in a work-group. The value of this
|
|
* attribute is undefined if the agent is not a kernel agent. The type
|
|
* of this attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_WORKGROUP_MAX_SIZE = 8,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_GRID_MAX_DIM for a given intruction set
|
|
* architecture supported by the agent instead.
|
|
*
|
|
* Maximum number of work-items of each dimension of a grid. Each maximum must
|
|
* be greater than 0, and must not be smaller than the corresponding value in
|
|
* ::HSA_AGENT_INFO_WORKGROUP_MAX_DIM. No maximum can exceed the value of
|
|
* ::HSA_AGENT_INFO_GRID_MAX_SIZE. The value of this attribute is undefined
|
|
* if the agent is not a kernel agent. The type of this attribute is
|
|
* ::hsa_dim3_t.
|
|
*/
|
|
HSA_AGENT_INFO_GRID_MAX_DIM = 9,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_GRID_MAX_SIZE for a given intruction set
|
|
* architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Maximum total number of work-items in a grid. The value of this attribute
|
|
* is undefined if the agent is not a kernel agent. The type of this
|
|
* attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_GRID_MAX_SIZE = 10,
|
|
/**
|
|
* @deprecated Query ::HSA_ISA_INFO_FBARRIER_MAX_SIZE for a given intruction
|
|
* set architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Maximum number of fbarriers per work-group. Must be at least 32. The value
|
|
* of this attribute is undefined if the agent is not a kernel agent. The
|
|
* type of this attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_FBARRIER_MAX_SIZE = 11,
|
|
/**
|
|
* @deprecated The maximum number of queues is not statically determined.
|
|
*
|
|
* Maximum number of queues that can be active (created but not destroyed) at
|
|
* one time in the agent. The type of this attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_QUEUES_MAX = 12,
|
|
/**
|
|
* Minimum number of packets that a queue created in the agent
|
|
* can hold. Must be a power of 2 greater than 0. Must not exceed
|
|
* the value of ::HSA_AGENT_INFO_QUEUE_MAX_SIZE. The type of this
|
|
* attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_QUEUE_MIN_SIZE = 13,
|
|
/**
|
|
* Maximum number of packets that a queue created in the agent can
|
|
* hold. Must be a power of 2 greater than 0. The type of this attribute
|
|
* is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_QUEUE_MAX_SIZE = 14,
|
|
/**
|
|
* Type of a queue created in the agent. The type of this attribute is
|
|
* ::hsa_queue_type32_t.
|
|
*/
|
|
HSA_AGENT_INFO_QUEUE_TYPE = 15,
|
|
/**
|
|
* @deprecated NUMA information is not exposed anywhere else in the API.
|
|
*
|
|
* Identifier of the NUMA node associated with the agent. The type of this
|
|
* attribute is uint32_t.
|
|
*/
|
|
HSA_AGENT_INFO_NODE = 16,
|
|
/**
|
|
* Type of hardware device associated with the agent. The type of this
|
|
* attribute is ::hsa_device_type_t.
|
|
*/
|
|
HSA_AGENT_INFO_DEVICE = 17,
|
|
/**
|
|
* @deprecated Query ::hsa_agent_iterate_caches to retrieve information about
|
|
* the caches present in a given agent.
|
|
*
|
|
* Array of data cache sizes (L1..L4). Each size is expressed in bytes. A size
|
|
* of 0 for a particular level indicates that there is no cache information
|
|
* for that level. The type of this attribute is uint32_t[4].
|
|
*/
|
|
HSA_AGENT_INFO_CACHE_SIZE = 18,
|
|
/**
|
|
* @deprecated An agent may support multiple instruction set
|
|
* architectures. See ::hsa_agent_iterate_isas. If more than one ISA is
|
|
* supported by the agent, the returned value corresponds to the first ISA
|
|
* enumerated by ::hsa_agent_iterate_isas.
|
|
*
|
|
* Instruction set architecture of the agent. The type of this attribute
|
|
* is ::hsa_isa_t.
|
|
*/
|
|
HSA_AGENT_INFO_ISA = 19,
|
|
/**
|
|
* Bit-mask indicating which extensions are supported by the agent. An
|
|
* extension with an ID of @p i is supported if the bit at position @p i is
|
|
* set. The type of this attribute is uint8_t[128].
|
|
*/
|
|
HSA_AGENT_INFO_EXTENSIONS = 20,
|
|
/**
|
|
* Major version of the HSA runtime specification supported by the
|
|
* agent. The type of this attribute is uint16_t.
|
|
*/
|
|
HSA_AGENT_INFO_VERSION_MAJOR = 21,
|
|
/**
|
|
* Minor version of the HSA runtime specification supported by the
|
|
* agent. The type of this attribute is uint16_t.
|
|
*/
|
|
HSA_AGENT_INFO_VERSION_MINOR = 22
|
|
|
|
} hsa_agent_info_t;
|
|
|
|
/**
|
|
* @brief Get the current value of an attribute for a given agent.
|
|
*
|
|
* @param[in] agent A valid agent.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* agent attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_agent_get_info(
|
|
hsa_agent_t agent,
|
|
hsa_agent_info_t attribute,
|
|
void* value);
|
|
|
|
/**
|
|
* @brief Iterate over the available agents, and invoke an
|
|
* application-defined callback on every iteration.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per agent. The HSA
|
|
* runtime passes two arguments to the callback: the agent and the
|
|
* application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* ::hsa_iterate_agents returns that status value.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_iterate_agents(
|
|
hsa_status_t (*callback)(hsa_agent_t agent, void* data),
|
|
void* data);
|
|
|
|
/*

// If we do not know the size of an attribute, we need to query it first
// Note: this API will not be in the spec unless needed
hsa_status_t HSA_API hsa_agent_get_info_size(
    hsa_agent_t agent,
    hsa_agent_info_t attribute,
    size_t* size);

// Set the value of an agent's attribute
// Note: this API will not be in the spec unless needed
hsa_status_t HSA_API hsa_agent_set_info(
    hsa_agent_t agent,
    hsa_agent_info_t attribute,
    void* value);

*/

/**
 * @brief Exception policies applied in the presence of hardware exceptions.
 */
typedef enum {
  /**
   * If a hardware exception is detected, a work-item signals an exception.
   */
  HSA_EXCEPTION_POLICY_BREAK = 1,
  /**
   * If a hardware exception is detected, a hardware status bit is set.
   */
  HSA_EXCEPTION_POLICY_DETECT = 2
} hsa_exception_policy_t;

/**
|
|
* @deprecated Use ::hsa_isa_get_exception_policies for a given intruction set
|
|
* architecture supported by the agent instead. If more than one ISA is
|
|
* supported by the agent, this function uses the first value returned by
|
|
* ::hsa_agent_iterate_isas.
|
|
*
|
|
* @brief Retrieve the exception policy support for a given combination of
|
|
* agent and profile
|
|
*
|
|
* @param[in] agent Agent.
|
|
*
|
|
* @param[in] profile Profile.
|
|
*
|
|
* @param[out] mask Pointer to a memory location where the HSA runtime stores a
|
|
* mask of ::hsa_exception_policy_t values. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p profile is not a valid
|
|
* profile, or @p mask is NULL.
|
|
*
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_agent_get_exception_policies(
|
|
hsa_agent_t agent,
|
|
hsa_profile_t profile,
|
|
uint16_t *mask);
|
|
|
|
/**
 * @brief Cache handle.
 */
typedef struct hsa_cache_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_cache_t;

/**
 * @brief Cache attributes.
 */
typedef enum {
  /**
   * The length of the cache name in bytes, not including the NUL terminator.
   * The type of this attribute is uint32_t.
   */
  HSA_CACHE_INFO_NAME_LENGTH = 0,
  /**
   * Human-readable description.  The type of this attribute is a NUL-terminated
   * character array with the length equal to the value of
   * ::HSA_CACHE_INFO_NAME_LENGTH attribute.
   */
  HSA_CACHE_INFO_NAME = 1,
  /**
   * Cache level. A L1 cache must return a value of 1, a L2 must return a value
   * of 2, and so on.  The type of this attribute is uint8_t.
   */
  HSA_CACHE_INFO_LEVEL = 2,
  /**
   * Cache size, in bytes. A value of 0 indicates that there is no size
   * information available. The type of this attribute is uint32_t.
   */
  HSA_CACHE_INFO_SIZE = 3
} hsa_cache_info_t;

/**
|
|
* @brief Get the current value of an attribute for a given cache object.
|
|
*
|
|
* @param[in] cache Cache.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CACHE The cache is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* instruction set architecture attribute, or @p value is
|
|
* NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_cache_get_info(
|
|
hsa_cache_t cache,
|
|
hsa_cache_info_t attribute,
|
|
void* value);
|
|
|
|
/**
|
|
* @brief Iterate over the memory caches of a given agent, and
|
|
* invoke an application-defined callback on every iteration.
|
|
*
|
|
* @details Caches are visited in ascending order according to the value of the
|
|
* ::HSA_CACHE_INFO_LEVEL attribute.
|
|
*
|
|
* @param[in] agent A valid agent.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per cache that is present in
|
|
* the agent. The HSA runtime passes two arguments to the callback: the cache
|
|
* and the application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* that value is returned.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_agent_iterate_caches(
|
|
hsa_agent_t agent,
|
|
hsa_status_t (*callback)(hsa_cache_t cache, void* data),
|
|
void* data);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Query if a given version of an extension is supported by an agent
|
|
*
|
|
* @param[in] extension Extension identifier.
|
|
*
|
|
* @param[in] agent Agent.
|
|
*
|
|
* @param[in] version_major Major version number.
|
|
*
|
|
* @param[in] version_minor Minor version number.
|
|
*
|
|
* @param[out] result Pointer to a memory location where the HSA runtime stores
|
|
* the result of the check. The result is true if the specified version of the
|
|
* extension is supported, and false otherwise. The result must be false if
|
|
* ::hsa_system_extension_supported returns false for the same extension
|
|
* version.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_agent_extension_supported(
|
|
uint16_t extension,
|
|
hsa_agent_t agent,
|
|
uint16_t version_major,
|
|
uint16_t version_minor,
|
|
bool* result);
|
|
|
|
/**
|
|
* @brief Query if a given version of an extension is supported by an agent. All
|
|
* minor versions from 0 up to the returned @p version_minor must be supported.
|
|
*
|
|
* @param[in] extension Extension identifier.
|
|
*
|
|
* @param[in] agent Agent.
|
|
*
|
|
* @param[in] version_major Major version number.
|
|
*
|
|
* @param[out] version_minor Minor version number.
|
|
*
|
|
* @param[out] result Pointer to a memory location where the HSA runtime stores
|
|
* the result of the check. The result is true if the specified version of the
|
|
* extension is supported, and false otherwise. The result must be false if
|
|
* ::hsa_system_extension_supported returns false for the same extension
|
|
* version.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p extension is not a valid
|
|
* extension, or @p version_minor is NULL, or @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_agent_major_extension_supported(
|
|
uint16_t extension,
|
|
hsa_agent_t agent,
|
|
uint16_t version_major,
|
|
uint16_t *version_minor,
|
|
bool* result);
|
|
|
|
|
|
/** @} */

/** \defgroup signals Signals
 *  @{
 */

/**
 * @brief Signal handle.
 */
typedef struct hsa_signal_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal. The value 0 is reserved.
   */
  uint64_t handle;
} hsa_signal_t;

/**
 * @brief Signal value. The value occupies 32 bits in small machine mode, and 64
 * bits in large machine mode.
 */
#ifdef HSA_LARGE_MODEL
  typedef int64_t hsa_signal_value_t;
#else
  typedef int32_t hsa_signal_value_t;
#endif

/**
|
|
* @brief Create a signal.
|
|
*
|
|
* @param[in] initial_value Initial value of the signal.
|
|
*
|
|
* @param[in] num_consumers Size of @p consumers. A value of 0 indicates that
|
|
* any agent might wait on the signal.
|
|
*
|
|
* @param[in] consumers List of agents that might consume (wait on) the
|
|
* signal. If @p num_consumers is 0, this argument is ignored; otherwise, the
|
|
* HSA runtime might use the list to optimize the handling of the signal
|
|
* object. If an agent not listed in @p consumers waits on the returned
|
|
* signal, the behavior is undefined. The memory associated with @p consumers
|
|
* can be reused or freed after the function returns.
|
|
*
|
|
* @param[out] signal Pointer to a memory location where the HSA runtime will
|
|
* store the newly created signal handle. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p signal is NULL, @p
|
|
* num_consumers is greater than 0 but @p consumers is NULL, or @p consumers
|
|
* contains duplicates.
|
|
*/
|
|
hsa_status_t HSA_API hsa_signal_create(
|
|
hsa_signal_value_t initial_value,
|
|
uint32_t num_consumers,
|
|
const hsa_agent_t *consumers,
|
|
hsa_signal_t *signal);
|
|
|
|
/**
|
|
* @brief Destroy a signal previous created by ::hsa_signal_create.
|
|
*
|
|
* @param[in] signal Signal.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL @p signal is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT The handle in @p signal is 0.
|
|
*/
|
|
hsa_status_t HSA_API hsa_signal_destroy(
|
|
hsa_signal_t signal);
|
|
|
|
/**
|
|
* @brief Atomically read the current value of a signal.
|
|
*
|
|
* @param[in] signal Signal.
|
|
*
|
|
* @return Value of the signal.
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_load_scacquire(
|
|
hsa_signal_t signal);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_load_scacquire
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_load_relaxed(
|
|
hsa_signal_t signal);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_load_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_load_scacquire
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_load_acquire(
|
|
hsa_signal_t signal);
|
|
|
|
/**
|
|
* @brief Atomically set the value of a signal.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting
|
|
* on @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal.
|
|
*
|
|
* @param[in] value New signal value.
|
|
*/
|
|
void HSA_API hsa_signal_store_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_store_relaxed
|
|
*/
|
|
void HSA_API hsa_signal_store_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_store_screlease.
|
|
*
|
|
* @copydoc hsa_signal_store_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_store_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically set the value of a signal without necessarily notifying the
|
|
* the agents waiting on it.
|
|
*
|
|
* @details The agents waiting on @p signal may not wake up even when the new
|
|
* value satisfies their wait condition. If the application wants to update the
|
|
* signal and there is no need to notify any agent, invoking this function can
|
|
* be more efficient than calling the non-silent counterpart.
|
|
*
|
|
* @param[in] signal Signal.
|
|
*
|
|
* @param[in] value New signal value.
|
|
*/
|
|
void HSA_API hsa_signal_silent_store_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_silent_store_relaxed
|
|
*/
|
|
void HSA_API hsa_signal_silent_store_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically set the value of a signal and return its previous value.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting
|
|
* on @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue doorbell signal, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] value New value.
|
|
*
|
|
* @return Value of the signal prior to the exchange.
|
|
*
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_exchange_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_exchange_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_exchange_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_exchange_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_exchange_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_exchange_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_exchange_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_exchange_scacquire
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_exchange_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_exchange_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_exchange_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
/**
|
|
* @copydoc hsa_signal_exchange_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_exchange_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_exchange_screlease.
|
|
*
|
|
* @copydoc hsa_signal_exchange_screlease
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_exchange_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically set the value of a signal if the observed value is equal to
|
|
* the expected value. The observed value is returned regardless of whether the
|
|
* replacement was done.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting
|
|
* on @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue
|
|
* doorbell signal, the behavior is undefined.
|
|
*
|
|
* @param[in] expected Value to compare with.
|
|
*
|
|
* @param[in] value New value.
|
|
*
|
|
* @return Observed value of the signal.
|
|
*
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_cas_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_cas_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_cas_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_cas_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_cas_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_cas_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_cas_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_cas_scacquire
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_cas_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_cas_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_cas_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_cas_scacq_screl
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_cas_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_cas_screlease.
|
|
*
|
|
* @copydoc hsa_signal_cas_screlease
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_cas_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t expected,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically increment the value of a signal by a given amount.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting on
|
|
* @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue doorbell signal, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] value Value to add to the value of the signal.
|
|
*
|
|
*/
|
|
void HSA_API hsa_signal_add_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_add_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_add_scacq_screl
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_add_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_add_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_add_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_add_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_add_scacquire
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_add_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_add_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_add_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_add_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_add_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_add_screlease.
|
|
*
|
|
* @copydoc hsa_signal_add_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_add_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically decrement the value of a signal by a given amount.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting on
|
|
* @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue doorbell signal, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] value Value to subtract from the value of the signal.
|
|
*
|
|
*/
|
|
void HSA_API hsa_signal_subtract_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_subtract_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_subtract_scacq_screl
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_subtract_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_subtract_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_subtract_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_subtract_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_subtract_scacquire
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_subtract_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_subtract_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_subtract_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_subtract_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_subtract_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_subtract_screlease.
|
|
*
|
|
* @copydoc hsa_signal_subtract_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_subtract_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically perform a bitwise AND operation between the value of a
|
|
* signal and a given value.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting on
|
|
* @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue doorbell signal, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] value Value to AND with the value of the signal.
|
|
*
|
|
*/
|
|
void HSA_API hsa_signal_and_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_and_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_and_scacq_screl
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_and_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_and_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_and_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_and_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_and_scacquire
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_and_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_and_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_and_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_and_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_and_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_and_screlease.
|
|
*
|
|
* @copydoc hsa_signal_and_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_and_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically perform a bitwise OR operation between the value of a
|
|
* signal and a given value.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting on
|
|
* @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue doorbell signal, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] value Value to OR with the value of the signal.
|
|
*/
|
|
void HSA_API hsa_signal_or_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_or_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_or_scacq_screl
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_or_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_or_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_or_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_or_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_or_scacquire
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_or_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_or_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_or_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_or_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_or_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_or_screlease.
|
|
*
|
|
* @copydoc hsa_signal_or_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_or_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @brief Atomically perform a bitwise XOR operation between the value of a
|
|
* signal and a given value.
|
|
*
|
|
* @details If the value of the signal is changed, all the agents waiting on
|
|
* @p signal for which @p value satisfies their wait condition are awakened.
|
|
*
|
|
* @param[in] signal Signal. If @p signal is a queue doorbell signal, the
|
|
* behavior is undefined.
|
|
*
|
|
* @param[in] value Value to XOR with the value of the signal.
|
|
*
|
|
*/
|
|
void HSA_API hsa_signal_xor_scacq_screl(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_xor_scacq_screl.
|
|
*
|
|
* @copydoc hsa_signal_xor_scacq_screl
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_xor_acq_rel(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_xor_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_xor_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_xor_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_xor_scacquire
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_xor_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_xor_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_xor_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_xor_scacq_screl
|
|
*/
|
|
void HSA_API hsa_signal_xor_screlease(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_xor_screlease.
|
|
*
|
|
* @copydoc hsa_signal_xor_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_signal_xor_release(
|
|
hsa_signal_t signal,
|
|
hsa_signal_value_t value);
|
|
|
|
/**
 * @brief Wait condition operator.
 */
typedef enum {
  /**
   * The two operands are equal.
   */
  HSA_SIGNAL_CONDITION_EQ = 0,
  /**
   * The two operands are not equal.
   */
  HSA_SIGNAL_CONDITION_NE = 1,
  /**
   * The first operand is less than the second operand.
   */
  HSA_SIGNAL_CONDITION_LT = 2,
  /**
   * The first operand is greater than or equal to the second operand.
   */
  HSA_SIGNAL_CONDITION_GTE = 3
} hsa_signal_condition_t;
|
|
|
|
/**
 * @brief State of the application thread during a signal wait.
 */
typedef enum {
  /**
   * The application thread may be rescheduled while waiting on the signal.
   */
  HSA_WAIT_STATE_BLOCKED = 0,
  /**
   * The application thread stays active while waiting on a signal.
   */
  HSA_WAIT_STATE_ACTIVE = 1
} hsa_wait_state_t;
|
|
|
|
|
|
/**
|
|
* @brief Wait until a signal value satisfies a specified condition, or a
|
|
* certain amount of time has elapsed.
|
|
*
|
|
* @details A wait operation can spuriously resume at any time sooner than the
|
|
* timeout (for example, due to system or other external factors) even when the
|
|
* condition has not been met.
|
|
*
|
|
* The function is guaranteed to return if the signal value satisfies the
|
|
* condition at some point in time during the wait, but the value returned to
|
|
* the application might not satisfy the condition. The application must ensure
|
|
* that signals are used in such way that wait wakeup conditions are not
|
|
* invalidated before dependent threads have woken up.
|
|
*
|
|
* When the wait operation internally loads the value of the passed signal, it
|
|
* uses the memory order indicated in the function name.
|
|
*
|
|
* @param[in] signal Signal.
|
|
*
|
|
* @param[in] condition Condition used to compare the signal value with @p
|
|
* compare_value.
|
|
*
|
|
* @param[in] compare_value Value to compare with.
|
|
*
|
|
* @param[in] timeout_hint Maximum duration of the wait. Specified in the same
|
|
* unit as the system timestamp. The operation might block for a shorter or
|
|
* longer time even if the condition is not met. A value of UINT64_MAX indicates
|
|
* no maximum.
|
|
*
|
|
* @param[in] wait_state_hint Hint used by the application to indicate the
|
|
* preferred waiting state. The actual waiting state is ultimately decided by
|
|
* HSA runtime and may not match the provided hint. A value of
|
|
* ::HSA_WAIT_STATE_ACTIVE may improve the latency of response to a signal
|
|
* update by avoiding rescheduling overhead.
|
|
*
|
|
* @return Observed value of the signal, which might not satisfy the specified
|
|
* condition.
|
|
*
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_wait_scacquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_condition_t condition,
|
|
hsa_signal_value_t compare_value,
|
|
uint64_t timeout_hint,
|
|
hsa_wait_state_t wait_state_hint);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_wait_scacquire
|
|
*/
|
|
hsa_signal_value_t HSA_API hsa_signal_wait_relaxed(
|
|
hsa_signal_t signal,
|
|
hsa_signal_condition_t condition,
|
|
hsa_signal_value_t compare_value,
|
|
uint64_t timeout_hint,
|
|
hsa_wait_state_t wait_state_hint);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_signal_wait_scacquire.
|
|
*
|
|
* @copydoc hsa_signal_wait_scacquire
|
|
*/
|
|
hsa_signal_value_t HSA_API HSA_DEPRECATED hsa_signal_wait_acquire(
|
|
hsa_signal_t signal,
|
|
hsa_signal_condition_t condition,
|
|
hsa_signal_value_t compare_value,
|
|
uint64_t timeout_hint,
|
|
hsa_wait_state_t wait_state_hint);
|
|
|
|
/**
 * @brief Group of signals.
 */
typedef struct hsa_signal_group_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_signal_group_t;
|
|
|
|
/**
|
|
* @brief Create a signal group.
|
|
*
|
|
* @param[in] num_signals Number of elements in @p signals. Must not be 0.
|
|
*
|
|
* @param[in] signals List of signals in the group. The list must not contain
|
|
* any repeated elements. Must not be NULL.
|
|
*
|
|
* @param[in] num_consumers Number of elements in @p consumers. Must not be 0.
|
|
*
|
|
* @param[in] consumers List of agents that might consume (wait on) the signal
|
|
* group. The list must not contain repeated elements, and must be a subset of
|
|
* the set of agents that are allowed to wait on all the signals in the
|
|
* group. If an agent not listed in @p consumers waits on the returned group,
|
|
* the behavior is undefined. The memory associated with @p consumers can be
|
|
* reused or freed after the function returns. Must not be NULL.
|
|
*
|
|
* @param[out] signal_group Pointer to newly created signal group. Must not be
|
|
* NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p num_signals is 0, @p signals
|
|
* is NULL, @p num_consumers is 0, @p consumers is NULL, or @p signal_group is
|
|
* NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_signal_group_create(
|
|
uint32_t num_signals,
|
|
const hsa_signal_t *signals,
|
|
uint32_t num_consumers,
|
|
const hsa_agent_t *consumers,
|
|
hsa_signal_group_t *signal_group);
|
|
|
|
/**
|
|
* @brief Destroy a signal group previous created by ::hsa_signal_group_create.
|
|
*
|
|
* @param[in] signal_group Signal group.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL_GROUP @p signal_group is invalid.
|
|
*/
|
|
hsa_status_t HSA_API hsa_signal_group_destroy(
|
|
hsa_signal_group_t signal_group);
|
|
|
|
/**
|
|
* @brief Wait until the value of at least one of the signals in a signal group
|
|
* satisfies its associated condition.
|
|
*
|
|
* @details The function is guaranteed to return if the value of at least one of
|
|
* the signals in the group satisfies its associated condition at some point in
|
|
* time during the wait, but the signal value returned to the application may no
|
|
* longer satisfy the condition. The application must ensure that signals in the
|
|
* group are used in such way that wait wakeup conditions are not invalidated
|
|
* before dependent threads have woken up.
|
|
*
|
|
* When this operation internally loads the value of the passed signal, it uses
|
|
* the memory order indicated in the function name.
|
|
*
|
|
* @param[in] signal_group Signal group.
|
|
*
|
|
* @param[in] conditions List of conditions. Each condition, and the value at
|
|
* the same index in @p compare_values, is used to compare the value of the
|
|
* signal at that index in @p signal_group (the signal passed by the application
|
|
* to ::hsa_signal_group_create at that particular index). The size of @p
|
|
* conditions must not be smaller than the number of signals in @p signal_group;
|
|
* any extra elements are ignored. Must not be NULL.
|
|
*
|
|
* @param[in] compare_values List of comparison values. The size of @p
|
|
* compare_values must not be smaller than the number of signals in @p
|
|
* signal_group; any extra elements are ignored. Must not be NULL.
|
|
*
|
|
* @param[in] wait_state_hint Hint used by the application to indicate the
|
|
* preferred waiting state. The actual waiting state is decided by the HSA runtime
|
|
* and may not match the provided hint. A value of ::HSA_WAIT_STATE_ACTIVE may
|
|
* improve the latency of response to a signal update by avoiding rescheduling
|
|
* overhead.
|
|
*
|
|
* @param[out] signal Signal in the group that satisfied the associated
|
|
* condition. If several signals satisfied their condition, the function can
|
|
* return any of those signals. Must not be NULL.
|
|
*
|
|
* @param[out] value Observed value for @p signal, which might no longer satisfy
|
|
* the specified condition. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL_GROUP @p signal_group is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p conditions is NULL, @p
|
|
* compare_values is NULL, @p signal is NULL, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_signal_group_wait_any_scacquire(
|
|
hsa_signal_group_t signal_group,
|
|
const hsa_signal_condition_t *conditions,
|
|
const hsa_signal_value_t *compare_values,
|
|
hsa_wait_state_t wait_state_hint,
|
|
hsa_signal_t *signal,
|
|
hsa_signal_value_t *value);
|
|
|
|
/**
|
|
* @copydoc hsa_signal_group_wait_any_scacquire
|
|
*/
|
|
hsa_status_t HSA_API hsa_signal_group_wait_any_relaxed(
|
|
hsa_signal_group_t signal_group,
|
|
const hsa_signal_condition_t *conditions,
|
|
const hsa_signal_value_t *compare_values,
|
|
hsa_wait_state_t wait_state_hint,
|
|
hsa_signal_t *signal,
|
|
hsa_signal_value_t *value);
|
|
|
|
/** @} */
|
|
|
|
/** \defgroup memory Memory
|
|
* @{
|
|
*/
|
|
|
|
/**
 * @brief A memory region represents a block of virtual memory with certain
 * properties. For example, the HSA runtime represents fine-grained memory in
 * the global segment using a region. A region might be associated with more
 * than one agent.
 */
typedef struct hsa_region_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_region_t;
|
|
|
|
/** @} */
|
|
|
|
|
|
/** \defgroup queue Queues
|
|
* @{
|
|
*/
|
|
|
|
/**
 * @brief Queue type. Intended to be used for dynamic queue protocol
 * determination.
 */
typedef enum {
  /**
   * Queue supports multiple producers. Use of multiproducer queue mechanics is
   * required.
   */
  HSA_QUEUE_TYPE_MULTI = 0,
  /**
   * Queue only supports a single producer. In some scenarios, the application
   * may want to limit the submission of AQL packets to a single agent. Queues
   * that support a single producer may be more efficient than queues supporting
   * multiple producers. Use of multiproducer queue mechanics is not supported.
   */
  HSA_QUEUE_TYPE_SINGLE = 1,
  /**
   * Queue supports multiple producers and cooperative dispatches. Cooperative
   * dispatches are able to use GWS synchronization. Queues of this type may be
   * limited in number. The runtime may return the same queue to serve multiple
   * ::hsa_queue_create calls when this type is given. Callers must inspect the
   * returned queue to discover queue size. Queues of this type are reference
   * counted and require a matching number of ::hsa_queue_destroy calls to
   * release. Use of multiproducer queue mechanics is required. See
   * ::HSA_AMD_AGENT_INFO_COOPERATIVE_QUEUES to query agent support for this
   * type.
   */
  HSA_QUEUE_TYPE_COOPERATIVE = 2
} hsa_queue_type_t;
|
|
|
|
/**
 * @brief A fixed-size type used to represent ::hsa_queue_type_t constants.
 */
typedef uint32_t hsa_queue_type32_t;
|
|
|
|
/**
 * @brief Queue features.
 */
typedef enum {
  /**
   * Queue supports kernel dispatch packets.
   */
  HSA_QUEUE_FEATURE_KERNEL_DISPATCH = 1,

  /**
   * Queue supports agent dispatch packets.
   */
  HSA_QUEUE_FEATURE_AGENT_DISPATCH = 2
} hsa_queue_feature_t;
|
|
|
|
/**
|
|
* @brief User mode queue.
|
|
*
|
|
* @details The queue structure is read-only and allocated by the HSA runtime,
|
|
* but agents can directly modify the contents of the buffer pointed by @a
|
|
* base_address, or use HSA runtime APIs to access the doorbell signal.
|
|
*
|
|
*/
|
|
typedef struct hsa_queue_s {
|
|
/**
|
|
* Queue type.
|
|
*/
|
|
hsa_queue_type32_t type;
|
|
|
|
/**
|
|
* Queue features mask. This is a bit-field of ::hsa_queue_feature_t
|
|
* values. Applications should ignore any unknown set bits.
|
|
*/
|
|
uint32_t features;
|
|
|
|
#ifdef HSA_LARGE_MODEL
|
|
void* base_address;
|
|
#elif defined HSA_LITTLE_ENDIAN
|
|
/**
|
|
* Starting address of the HSA runtime-allocated buffer used to store the AQL
|
|
* packets. Must be aligned to the size of an AQL packet.
|
|
*/
|
|
void* base_address;
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved0;
|
|
#else
|
|
uint32_t reserved0;
|
|
void* base_address;
|
|
#endif
|
|
|
|
/**
|
|
* Signal object used by the application to indicate the ID of a packet that
|
|
* is ready to be processed. The HSA runtime manages the doorbell signal. If
|
|
* the application tries to replace or destroy this signal, the behavior is
|
|
* undefined.
|
|
*
|
|
* If @a type is ::HSA_QUEUE_TYPE_SINGLE, the doorbell signal value must be
|
|
* updated in a monotonically increasing fashion. If @a type is
|
|
* ::HSA_QUEUE_TYPE_MULTI, the doorbell signal value can be updated with any
|
|
* value.
|
|
*/
|
|
hsa_signal_t doorbell_signal;
|
|
|
|
/**
|
|
* Maximum number of packets the queue can hold. Must be a power of 2.
|
|
*/
|
|
uint32_t size;
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved1;
|
|
/**
|
|
* Queue identifier, which is unique over the lifetime of the application.
|
|
*/
|
|
uint64_t id;
|
|
|
|
} hsa_queue_t;
|
|
|
|
/**
|
|
* @brief Create a user mode queue.
|
|
*
|
|
* @details The HSA runtime creates the queue structure, the underlying packet
|
|
* buffer, the completion signal, and the write and read indexes. The initial
|
|
* value of the write and read indexes is 0. The type of every packet in the
|
|
* buffer is initialized to ::HSA_PACKET_TYPE_INVALID.
|
|
*
|
|
* The application should only rely on the error code returned to determine if
|
|
* the queue is valid.
|
|
*
|
|
* @param[in] agent Agent where to create the queue.
|
|
*
|
|
* @param[in] size Number of packets the queue is expected to
|
|
* hold. Must be a power of 2 between 1 and the value of
|
|
* ::HSA_AGENT_INFO_QUEUE_MAX_SIZE in @p agent. The size of the newly
|
|
* created queue is the maximum of @p size and the value of
|
|
* ::HSA_AGENT_INFO_QUEUE_MIN_SIZE in @p agent.
|
|
*
|
|
* @param[in] type Type of the queue, a bitwise OR of hsa_queue_type_t values.
|
|
* If the value of ::HSA_AGENT_INFO_QUEUE_TYPE in @p agent is ::HSA_QUEUE_TYPE_SINGLE,
|
|
* then @p type must also be ::HSA_QUEUE_TYPE_SINGLE.
|
|
*
|
|
* @param[in] callback Callback invoked by the HSA runtime for every
|
|
* asynchronous event related to the newly created queue. May be NULL. The HSA
|
|
* runtime passes three arguments to the callback: a code identifying the event
|
|
* that triggered the invocation, a pointer to the queue where the event
|
|
* originated, and the application data.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @param[in] private_segment_size Hint indicating the maximum
|
|
* expected private segment usage per work-item, in bytes. There may
|
|
* be performance degradation if the application places a kernel
|
|
* dispatch packet in the queue and the corresponding private segment
|
|
* usage exceeds @p private_segment_size. If the application does not
|
|
* want to specify any particular value for this argument, @p
|
|
* private_segment_size must be UINT32_MAX. If the queue does not
|
|
* support kernel dispatch packets, this argument is ignored.
|
|
*
|
|
* @param[in] group_segment_size Hint indicating the maximum expected
|
|
* group segment usage per work-group, in bytes. There may be
|
|
* performance degradation if the application places a kernel dispatch
|
|
* packet in the queue and the corresponding group segment usage
|
|
* exceeds @p group_segment_size. If the application does not want to
|
|
* specify any particular value for this argument, @p
|
|
* group_segment_size must be UINT32_MAX. If the queue does not
|
|
* support kernel dispatch packets, this argument is ignored.
|
|
*
|
|
* @param[out] queue Memory location where the HSA runtime stores a pointer to
|
|
* the newly created queue.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_QUEUE_CREATION @p agent does not
|
|
* support queues of the given type.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is not a power of two,
|
|
* @p size is 0, @p type is an invalid queue type, or @p queue is NULL.
|
|
*
|
|
*/
|
|
hsa_status_t HSA_API hsa_queue_create(
|
|
hsa_agent_t agent,
|
|
uint32_t size,
|
|
hsa_queue_type32_t type,
|
|
void (*callback)(hsa_status_t status, hsa_queue_t *source, void *data),
|
|
void *data,
|
|
uint32_t private_segment_size,
|
|
uint32_t group_segment_size,
|
|
hsa_queue_t **queue);
|
|
|
|
/**
|
|
* @brief Create a queue for which the application or a kernel is responsible
|
|
* for processing the AQL packets.
|
|
*
|
|
* @details The application can use this function to create queues where AQL
|
|
* packets are not parsed by the packet processor associated with an agent,
|
|
* but rather by a unit of execution running on that agent (for example, a
|
|
* thread in the host application).
|
|
*
|
|
* The application is responsible for ensuring that all the producers and
|
|
* consumers of the resulting queue can access the provided doorbell signal
|
|
* and memory region. The application is also responsible for ensuring that the
|
|
* unit of execution processing the queue packets supports the indicated
|
|
* features (AQL packet types).
|
|
*
|
|
* When the queue is created, the HSA runtime allocates the packet buffer using
|
|
* @p region, and the write and read indexes. The initial value of the write and
|
|
* read indexes is 0, and the type of every packet in the buffer is initialized
|
|
* to ::HSA_PACKET_TYPE_INVALID. The value of the @e size, @e type, @e features,
|
|
* and @e doorbell_signal fields in the returned queue match the values passed
|
|
* by the application.
|
|
*
|
|
* @param[in] region Memory region that the HSA runtime should use to allocate
|
|
* the AQL packet buffer and any other queue metadata.
|
|
*
|
|
* @param[in] size Number of packets the queue is expected to hold. Must be a
|
|
* power of 2 greater than 0.
|
|
*
|
|
* @param[in] type Queue type.
|
|
*
|
|
* @param[in] features Supported queue features. This is a bit-field of
|
|
* ::hsa_queue_feature_t values.
|
|
*
|
|
* @param[in] doorbell_signal Doorbell signal that the HSA runtime must
|
|
* associate with the returned queue. The signal handle must not be 0.
|
|
*
|
|
* @param[out] queue Memory location where the HSA runtime stores a pointer to
|
|
* the newly created queue. The application should not rely on the value
|
|
* returned for this argument but only in the status code to determine if the
|
|
* queue is valid. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is not a power of two, @p
|
|
* size is 0, @p type is an invalid queue type, the doorbell signal handle is
|
|
* 0, or @p queue is NULL.
|
|
*
|
|
*/
|
|
hsa_status_t HSA_API hsa_soft_queue_create(
|
|
hsa_region_t region,
|
|
uint32_t size,
|
|
hsa_queue_type32_t type,
|
|
uint32_t features,
|
|
hsa_signal_t doorbell_signal,
|
|
hsa_queue_t **queue);
|
|
|
|
/**
|
|
* @brief Destroy a user mode queue.
|
|
*
|
|
* @details When a queue is destroyed, the state of the AQL packets that have
|
|
* not been yet fully processed (their completion phase has not finished)
|
|
* becomes undefined. It is the responsibility of the application to ensure that
|
|
* all pending queue operations are finished if their results are required.
|
|
*
|
|
* The resources allocated by the HSA runtime during queue creation (queue
|
|
* structure, ring buffer, doorbell signal) are released. The queue should not
|
|
* be accessed after being destroyed.
|
|
*
|
|
* @param[in] queue Pointer to a queue created using ::hsa_queue_create.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_QUEUE The queue is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p queue is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_queue_destroy(
|
|
hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @brief Inactivate a queue.
|
|
*
|
|
* @details Inactivating the queue aborts any pending executions and prevent any
|
|
* new packets from being processed. Any more packets written to the queue once
|
|
* it is inactivated will be ignored by the packet processor.
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_QUEUE The queue is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p queue is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_queue_inactivate(
|
|
hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_load_read_index_scacquire.
|
|
*
|
|
* @copydoc hsa_queue_load_read_index_scacquire
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_load_read_index_acquire(
|
|
const hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @brief Atomically load the read index of a queue.
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @return Read index of the queue pointed by @p queue.
|
|
*/
|
|
uint64_t HSA_API hsa_queue_load_read_index_scacquire(
|
|
const hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_load_read_index_scacquire
|
|
*/
|
|
uint64_t HSA_API hsa_queue_load_read_index_relaxed(
|
|
const hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_load_write_index_scacquire.
|
|
*
|
|
* @copydoc hsa_queue_load_write_index_scacquire
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_load_write_index_acquire(
|
|
const hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @brief Atomically load the write index of a queue.
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @return Write index of the queue pointed by @p queue.
|
|
*/
|
|
uint64_t HSA_API hsa_queue_load_write_index_scacquire(
|
|
const hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_load_write_index_scacquire
|
|
*/
|
|
uint64_t HSA_API hsa_queue_load_write_index_relaxed(
|
|
const hsa_queue_t *queue);
|
|
|
|
/**
|
|
* @brief Atomically set the write index of a queue.
|
|
*
|
|
* @details It is recommended that the application uses this function to update
|
|
* the write index when there is a single agent submitting work to the queue
|
|
* (the queue type is ::HSA_QUEUE_TYPE_SINGLE).
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @param[in] value Value to assign to the write index.
|
|
*
|
|
*/
|
|
void HSA_API hsa_queue_store_write_index_relaxed(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_store_write_index_screlease.
|
|
*
|
|
* @copydoc hsa_queue_store_write_index_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_queue_store_write_index_release(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_store_write_index_relaxed
|
|
*/
|
|
void HSA_API hsa_queue_store_write_index_screlease(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_cas_write_index_scacq_screl.
|
|
*
|
|
* @copydoc hsa_queue_cas_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_cas_write_index_acq_rel(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @brief Atomically set the write index of a queue if the observed value is
|
|
* equal to the expected value. The application can inspect the returned value
|
|
* to determine if the replacement was done.
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @param[in] expected Expected value.
|
|
*
|
|
* @param[in] value Value to assign to the write index if @p expected matches
|
|
* the observed write index. Must be greater than @p expected.
|
|
*
|
|
* @return Previous value of the write index.
|
|
*/
|
|
uint64_t HSA_API hsa_queue_cas_write_index_scacq_screl(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_cas_write_index_scacquire.
|
|
*
|
|
* @copydoc hsa_queue_cas_write_index_scacquire
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_cas_write_index_acquire(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_cas_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API hsa_queue_cas_write_index_scacquire(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_cas_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API hsa_queue_cas_write_index_relaxed(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_cas_write_index_screlease.
|
|
*
|
|
* @copydoc hsa_queue_cas_write_index_screlease
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_cas_write_index_release(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_cas_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API hsa_queue_cas_write_index_screlease(
|
|
const hsa_queue_t *queue,
|
|
uint64_t expected,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_add_write_index_scacq_screl.
|
|
*
|
|
* @copydoc hsa_queue_add_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_add_write_index_acq_rel(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @brief Atomically increment the write index of a queue by an offset.
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @param[in] value Value to add to the write index.
|
|
*
|
|
* @return Previous value of the write index.
|
|
*/
|
|
uint64_t HSA_API hsa_queue_add_write_index_scacq_screl(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_add_write_index_scacquire.
|
|
*
|
|
* @copydoc hsa_queue_add_write_index_scacquire
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_add_write_index_acquire(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_add_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API hsa_queue_add_write_index_scacquire(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_add_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API hsa_queue_add_write_index_relaxed(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_add_write_index_screlease.
|
|
*
|
|
* @copydoc hsa_queue_add_write_index_screlease
|
|
*/
|
|
uint64_t HSA_API HSA_DEPRECATED hsa_queue_add_write_index_release(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_add_write_index_scacq_screl
|
|
*/
|
|
uint64_t HSA_API hsa_queue_add_write_index_screlease(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @brief Atomically set the read index of a queue.
|
|
*
|
|
* @details Modifications of the read index are not allowed and result in
|
|
* undefined behavior if the queue is associated with an agent for which
|
|
* only the corresponding packet processor is permitted to update the read
|
|
* index.
|
|
*
|
|
* @param[in] queue Pointer to a queue.
|
|
*
|
|
* @param[in] value Value to assign to the read index.
|
|
*
|
|
*/
|
|
void HSA_API hsa_queue_store_read_index_relaxed(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @deprecated Renamed as ::hsa_queue_store_read_index_screlease.
|
|
*
|
|
* @copydoc hsa_queue_store_read_index_screlease
|
|
*/
|
|
void HSA_API HSA_DEPRECATED hsa_queue_store_read_index_release(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
|
|
/**
|
|
* @copydoc hsa_queue_store_read_index_relaxed
|
|
*/
|
|
void HSA_API hsa_queue_store_read_index_screlease(
|
|
const hsa_queue_t *queue,
|
|
uint64_t value);
|
|
/** @} */


/** \defgroup aql Architected Queuing Language
 *  @{
 */

/**
 * @brief Packet type.
 */
typedef enum {
  /**
   * Vendor-specific packet.
   */
  HSA_PACKET_TYPE_VENDOR_SPECIFIC = 0,
  /**
   * The packet has been processed in the past, but has not been reassigned to
   * the packet processor. A packet processor must not process a packet of this
   * type. All queues support this packet type.
   */
  HSA_PACKET_TYPE_INVALID = 1,
  /**
   * Packet used by agents for dispatching jobs to kernel agents. Not all
   * queues support packets of this type (see ::hsa_queue_feature_t).
   */
  HSA_PACKET_TYPE_KERNEL_DISPATCH = 2,
  /**
   * Packet used by agents to delay processing of subsequent packets, and to
   * express complex dependencies between multiple packets. All queues support
   * this packet type.
   */
  HSA_PACKET_TYPE_BARRIER_AND = 3,
  /**
   * Packet used by agents for dispatching jobs to agents. Not all
   * queues support packets of this type (see ::hsa_queue_feature_t).
   */
  HSA_PACKET_TYPE_AGENT_DISPATCH = 4,
  /**
   * Packet used by agents to delay processing of subsequent packets, and to
   * express complex dependencies between multiple packets. All queues support
   * this packet type.
   */
  HSA_PACKET_TYPE_BARRIER_OR = 5
} hsa_packet_type_t;

/**
 * @brief Scope of the memory fence operation associated with a packet.
 */
typedef enum {
  /**
   * No scope (no fence is applied). The packet relies on external fences to
   * ensure visibility of memory updates.
   */
  HSA_FENCE_SCOPE_NONE = 0,
  /**
   * The fence is applied with agent scope for the global segment.
   */
  HSA_FENCE_SCOPE_AGENT = 1,
  /**
   * The fence is applied across both agent and system scope for the global
   * segment.
   */
  HSA_FENCE_SCOPE_SYSTEM = 2
} hsa_fence_scope_t;

/**
 * @brief Sub-fields of the @a header field that is present in any AQL
 * packet. The offset (with respect to the address of @a header) of a sub-field
 * is identical to its enumeration constant. The width of each sub-field is
 * determined by the corresponding value in ::hsa_packet_header_width_t. The
 * offset and the width are expressed in bits.
 */
typedef enum {
  /**
   * Packet type. The value of this sub-field must be one of
   * ::hsa_packet_type_t. If the type is ::HSA_PACKET_TYPE_VENDOR_SPECIFIC, the
   * packet layout is vendor-specific.
   */
  HSA_PACKET_HEADER_TYPE = 0,
  /**
   * Barrier bit. If the barrier bit is set, the processing of the current
   * packet only launches when all preceding packets (within the same queue) are
   * complete.
   */
  HSA_PACKET_HEADER_BARRIER = 8,
  /**
   * Acquire fence scope. The value of this sub-field determines the scope and
   * type of the memory fence operation applied before the packet enters the
   * active phase. An acquire fence ensures that any subsequent global segment
   * or image loads by any unit of execution that belongs to a dispatch that has
   * not yet entered the active phase on any queue of the same kernel agent,
   * sees any data previously released at the scopes specified by the acquire
   * fence. The value of this sub-field must be one of ::hsa_fence_scope_t.
   */
  HSA_PACKET_HEADER_SCACQUIRE_FENCE_SCOPE = 9,
  /**
   * @deprecated Renamed as ::HSA_PACKET_HEADER_SCACQUIRE_FENCE_SCOPE.
   */
  HSA_PACKET_HEADER_ACQUIRE_FENCE_SCOPE = 9,
  /**
   * Release fence scope. The value of this sub-field determines the scope and
   * type of the memory fence operation applied after kernel completion but
   * before the packet is completed. A release fence makes any global segment or
   * image data that was stored by any unit of execution that belonged to a
   * dispatch that has completed the active phase on any queue of the same
   * kernel agent visible in all the scopes specified by the release fence. The
   * value of this sub-field must be one of ::hsa_fence_scope_t.
   */
  HSA_PACKET_HEADER_SCRELEASE_FENCE_SCOPE = 11,
  /**
   * @deprecated Renamed as ::HSA_PACKET_HEADER_SCRELEASE_FENCE_SCOPE.
   */
  HSA_PACKET_HEADER_RELEASE_FENCE_SCOPE = 11
} hsa_packet_header_t;

/**
 * @brief Width (in bits) of the sub-fields in ::hsa_packet_header_t.
 */
typedef enum {
  HSA_PACKET_HEADER_WIDTH_TYPE = 8,
  HSA_PACKET_HEADER_WIDTH_BARRIER = 1,
  HSA_PACKET_HEADER_WIDTH_SCACQUIRE_FENCE_SCOPE = 2,
  /**
   * @deprecated Use ::HSA_PACKET_HEADER_WIDTH_SCACQUIRE_FENCE_SCOPE.
   */
  HSA_PACKET_HEADER_WIDTH_ACQUIRE_FENCE_SCOPE = 2,
  HSA_PACKET_HEADER_WIDTH_SCRELEASE_FENCE_SCOPE = 2,
  /**
   * @deprecated Use ::HSA_PACKET_HEADER_WIDTH_SCRELEASE_FENCE_SCOPE.
   */
  HSA_PACKET_HEADER_WIDTH_RELEASE_FENCE_SCOPE = 2
} hsa_packet_header_width_t;

/**
 * @brief Sub-fields of the kernel dispatch packet @a setup field. The offset
 * (with respect to the address of @a setup) of a sub-field is identical to its
 * enumeration constant. The width of each sub-field is determined by the
 * corresponding value in ::hsa_kernel_dispatch_packet_setup_width_t. The
 * offset and the width are expressed in bits.
 */
typedef enum {
  /**
   * Number of dimensions of the grid. Valid values are 1, 2, or 3.
   */
  HSA_KERNEL_DISPATCH_PACKET_SETUP_DIMENSIONS = 0
} hsa_kernel_dispatch_packet_setup_t;

/**
 * @brief Width (in bits) of the sub-fields in
 * ::hsa_kernel_dispatch_packet_setup_t.
 */
typedef enum {
  HSA_KERNEL_DISPATCH_PACKET_SETUP_WIDTH_DIMENSIONS = 2
} hsa_kernel_dispatch_packet_setup_width_t;

/**
|
|
* @brief AQL kernel dispatch packet
|
|
*/
|
|
typedef struct hsa_kernel_dispatch_packet_s {
|
|
/**
|
|
* Packet header. Used to configure multiple packet parameters such as the
|
|
* packet type. The parameters are described by ::hsa_packet_header_t.
|
|
*/
|
|
uint16_t header;
|
|
|
|
/**
|
|
* Dispatch setup parameters. Used to configure kernel dispatch parameters
|
|
* such as the number of dimensions in the grid. The parameters are described
|
|
* by ::hsa_kernel_dispatch_packet_setup_t.
|
|
*/
|
|
uint16_t setup;
|
|
|
|
/**
|
|
* X dimension of work-group, in work-items. Must be greater than 0.
|
|
*/
|
|
uint16_t workgroup_size_x;
|
|
|
|
/**
|
|
* Y dimension of work-group, in work-items. Must be greater than
|
|
* 0. If the grid has 1 dimension, the only valid value is 1.
|
|
*/
|
|
uint16_t workgroup_size_y;
|
|
|
|
/**
|
|
* Z dimension of work-group, in work-items. Must be greater than
|
|
* 0. If the grid has 1 or 2 dimensions, the only valid value is 1.
|
|
*/
|
|
uint16_t workgroup_size_z;
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint16_t reserved0;
|
|
|
|
/**
|
|
* X dimension of grid, in work-items. Must be greater than 0. Must
|
|
* not be smaller than @a workgroup_size_x.
|
|
*/
|
|
uint32_t grid_size_x;
|
|
|
|
/**
|
|
* Y dimension of grid, in work-items. Must be greater than 0. If the grid has
|
|
* 1 dimension, the only valid value is 1. Must not be smaller than @a
|
|
* workgroup_size_y.
|
|
*/
|
|
uint32_t grid_size_y;
|
|
|
|
/**
|
|
* Z dimension of grid, in work-items. Must be greater than 0. If the grid has
|
|
* 1 or 2 dimensions, the only valid value is 1. Must not be smaller than @a
|
|
* workgroup_size_z.
|
|
*/
|
|
uint32_t grid_size_z;
|
|
|
|
/**
|
|
* Size in bytes of private memory allocation request (per work-item).
|
|
*/
|
|
uint32_t private_segment_size;
|
|
|
|
/**
|
|
* Size in bytes of group memory allocation request (per work-group). Must not
|
|
* be less than the sum of the group memory used by the kernel (and the
|
|
* functions it calls directly or indirectly) and the dynamically allocated
|
|
* group segment variables.
|
|
*/
|
|
uint32_t group_segment_size;
|
|
|
|
/**
|
|
* Opaque handle to a code object that includes an implementation-defined
|
|
* executable code for the kernel.
|
|
*/
|
|
uint64_t kernel_object;
|
|
|
|
#ifdef HSA_LARGE_MODEL
|
|
void* kernarg_address;
|
|
#elif defined HSA_LITTLE_ENDIAN
|
|
/**
|
|
* Pointer to a buffer containing the kernel arguments. May be NULL.
|
|
*
|
|
* The buffer must be allocated using ::hsa_memory_allocate, and must not be
|
|
* modified once the kernel dispatch packet is enqueued until the dispatch has
|
|
* completed execution.
|
|
*/
|
|
void* kernarg_address;
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved1;
|
|
#else
|
|
uint32_t reserved1;
|
|
void* kernarg_address;
|
|
#endif
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint64_t reserved2;
|
|
|
|
/**
|
|
* Signal used to indicate completion of the job. The application can use the
|
|
* special signal handle 0 to indicate that no signal is used.
|
|
*/
|
|
hsa_signal_t completion_signal;
|
|
|
|
} hsa_kernel_dispatch_packet_t;
|
|
|
|
/**
|
|
* @brief Agent dispatch packet.
|
|
*/
|
|
typedef struct hsa_agent_dispatch_packet_s {
|
|
/**
|
|
* Packet header. Used to configure multiple packet parameters such as the
|
|
* packet type. The parameters are described by ::hsa_packet_header_t.
|
|
*/
|
|
uint16_t header;
|
|
|
|
/**
|
|
* Application-defined function to be performed by the destination agent.
|
|
*/
|
|
uint16_t type;
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved0;
|
|
|
|
#ifdef HSA_LARGE_MODEL
|
|
void* return_address;
|
|
#elif defined HSA_LITTLE_ENDIAN
|
|
/**
|
|
* Address where to store the function return values, if any.
|
|
*/
|
|
void* return_address;
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved1;
|
|
#else
|
|
uint32_t reserved1;
|
|
void* return_address;
|
|
#endif
|
|
|
|
/**
|
|
* Function arguments.
|
|
*/
|
|
uint64_t arg[4];
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint64_t reserved2;
|
|
|
|
/**
|
|
* Signal used to indicate completion of the job. The application can use the
|
|
* special signal handle 0 to indicate that no signal is used.
|
|
*/
|
|
hsa_signal_t completion_signal;
|
|
|
|
} hsa_agent_dispatch_packet_t;
|
|
|
|
/**
|
|
* @brief Barrier-AND packet.
|
|
*/
|
|
typedef struct hsa_barrier_and_packet_s {
|
|
/**
|
|
* Packet header. Used to configure multiple packet parameters such as the
|
|
* packet type. The parameters are described by ::hsa_packet_header_t.
|
|
*/
|
|
uint16_t header;
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint16_t reserved0;
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved1;
|
|
|
|
/**
|
|
* Array of dependent signal objects. Signals with a handle value of 0 are
|
|
* allowed and are interpreted by the packet processor as satisfied
|
|
* dependencies.
|
|
*/
|
|
hsa_signal_t dep_signal[5];
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint64_t reserved2;
|
|
|
|
/**
|
|
* Signal used to indicate completion of the job. The application can use the
|
|
* special signal handle 0 to indicate that no signal is used.
|
|
*/
|
|
hsa_signal_t completion_signal;
|
|
|
|
} hsa_barrier_and_packet_t;
|
|
|
|
/**
|
|
* @brief Barrier-OR packet.
|
|
*/
|
|
typedef struct hsa_barrier_or_packet_s {
|
|
/**
|
|
* Packet header. Used to configure multiple packet parameters such as the
|
|
* packet type. The parameters are described by ::hsa_packet_header_t.
|
|
*/
|
|
uint16_t header;
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint16_t reserved0;
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint32_t reserved1;
|
|
|
|
/**
|
|
* Array of dependent signal objects. Signals with a handle value of 0 are
|
|
* allowed and are interpreted by the packet processor as dependencies not
|
|
* satisfied.
|
|
*/
|
|
hsa_signal_t dep_signal[5];
|
|
|
|
/**
|
|
* Reserved. Must be 0.
|
|
*/
|
|
uint64_t reserved2;
|
|
|
|
/**
|
|
* Signal used to indicate completion of the job. The application can use the
|
|
* special signal handle 0 to indicate that no signal is used.
|
|
*/
|
|
hsa_signal_t completion_signal;
|
|
|
|
} hsa_barrier_or_packet_t;
|
|
|
|
/** @} */

/** \addtogroup memory Memory
 *  @{
 */

/**
 * @brief Memory segments associated with a region.
 */
typedef enum {
  /**
   * Global segment. Used to hold data that is shared by all agents.
   */
  HSA_REGION_SEGMENT_GLOBAL = 0,
  /**
   * Read-only segment. Used to hold data that remains constant during the
   * execution of a kernel.
   */
  HSA_REGION_SEGMENT_READONLY = 1,
  /**
   * Private segment. Used to hold data that is local to a single work-item.
   */
  HSA_REGION_SEGMENT_PRIVATE = 2,
  /**
   * Group segment. Used to hold data that is shared by the work-items of a
   * work-group.
   */
  HSA_REGION_SEGMENT_GROUP = 3,
  /**
   * Kernarg segment. Used to store kernel arguments.
   */
  HSA_REGION_SEGMENT_KERNARG = 4
} hsa_region_segment_t;

/**
 * @brief Global region flags.
 */
typedef enum {
  /**
   * The application can use memory in the region to store kernel arguments, and
   * provide the values for the kernarg segment of a kernel dispatch. If this
   * flag is set, then ::HSA_REGION_GLOBAL_FLAG_FINE_GRAINED must be set.
   */
  HSA_REGION_GLOBAL_FLAG_KERNARG = 1,
  /**
   * Updates to memory in this region are immediately visible to all the
   * agents under the terms of the HSA memory model. If this
   * flag is set, then ::HSA_REGION_GLOBAL_FLAG_COARSE_GRAINED must not be set.
   */
  HSA_REGION_GLOBAL_FLAG_FINE_GRAINED = 2,
  /**
   * Updates to memory in this region can be performed by a single agent at
   * a time. If a different agent in the system is allowed to access the
   * region, the application must explicitly invoke ::hsa_memory_assign_agent
   * in order to transfer ownership to that agent for a particular buffer.
   */
  HSA_REGION_GLOBAL_FLAG_COARSE_GRAINED = 4
} hsa_region_global_flag_t;

/**
 * @brief Attributes of a memory region.
 */
typedef enum {
  /**
   * Segment where memory in the region can be used. The type of this
   * attribute is ::hsa_region_segment_t.
   */
  HSA_REGION_INFO_SEGMENT = 0,
  /**
   * Flag mask. The value of this attribute is undefined if the value of
   * ::HSA_REGION_INFO_SEGMENT is not ::HSA_REGION_SEGMENT_GLOBAL. The type of
   * this attribute is uint32_t, a bit-field of ::hsa_region_global_flag_t
   * values.
   */
  HSA_REGION_INFO_GLOBAL_FLAGS = 1,
  /**
   * Size of this region, in bytes. The type of this attribute is size_t.
   */
  HSA_REGION_INFO_SIZE = 2,
  /**
   * Maximum allocation size in this region, in bytes. Must not exceed the value
   * of ::HSA_REGION_INFO_SIZE. The type of this attribute is size_t.
   *
   * If the region is in the global or readonly segments, this is the maximum
   * size that the application can pass to ::hsa_memory_allocate.
   *
   * If the region is in the group segment, this is the maximum size (per
   * work-group) that can be requested for a given kernel dispatch. If the
   * region is in the private segment, this is the maximum size (per work-item)
   * that can be requested for a specific kernel dispatch, and must be at least
   * 256 bytes.
   */
  HSA_REGION_INFO_ALLOC_MAX_SIZE = 4,
  /**
   * Maximum size (per work-group) of private memory that can be requested for a
   * specific kernel dispatch. Must be at least 65536 bytes. The type of this
   * attribute is uint32_t. The value of this attribute is undefined if the
   * region is not in the private segment.
   */
  HSA_REGION_INFO_ALLOC_MAX_PRIVATE_WORKGROUP_SIZE = 8,
  /**
   * Indicates whether memory in this region can be allocated using
   * ::hsa_memory_allocate. The type of this attribute is bool.
   *
   * The value of this flag is always false for regions in the group and private
   * segments.
   */
  HSA_REGION_INFO_RUNTIME_ALLOC_ALLOWED = 5,
  /**
   * Allocation granularity of buffers allocated by ::hsa_memory_allocate in
   * this region. The size of a buffer allocated in this region is a multiple of
   * the value of this attribute. The value of this attribute is only defined if
   * ::HSA_REGION_INFO_RUNTIME_ALLOC_ALLOWED is true for this region. The type
   * of this attribute is size_t.
   */
  HSA_REGION_INFO_RUNTIME_ALLOC_GRANULE = 6,
  /**
   * Alignment of buffers allocated by ::hsa_memory_allocate in this region. The
   * value of this attribute is only defined if
   * ::HSA_REGION_INFO_RUNTIME_ALLOC_ALLOWED is true for this region, and must be
   * a power of 2. The type of this attribute is size_t.
   */
  HSA_REGION_INFO_RUNTIME_ALLOC_ALIGNMENT = 7
} hsa_region_info_t;

/**
|
|
* @brief Get the current value of an attribute of a region.
|
|
*
|
|
* @param[in] region A valid region.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to a application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_REGION The region is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* region attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_region_get_info(
|
|
hsa_region_t region,
|
|
hsa_region_info_t attribute,
|
|
void* value);
|
|
|
|
/**
|
|
* @brief Iterate over the memory regions associated with a given agent, and
|
|
* invoke an application-defined callback on every iteration.
|
|
*
|
|
* @param[in] agent A valid agent.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per region that is
|
|
* accessible from the agent. The HSA runtime passes two arguments to the
|
|
* callback, the region and the application data. If @p callback returns a
|
|
* status other than ::HSA_STATUS_SUCCESS for a particular iteration, the
|
|
* traversal stops and ::hsa_agent_iterate_regions returns that status value.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_agent_iterate_regions(
|
|
hsa_agent_t agent,
|
|
hsa_status_t (*callback)(hsa_region_t region, void* data),
|
|
void* data);
|
|
|
|
/**
|
|
* @brief Allocate a block of memory in a given region.
|
|
*
|
|
* @param[in] region Region where to allocate memory from. The region must have
|
|
* the ::HSA_REGION_INFO_RUNTIME_ALLOC_ALLOWED flag set.
|
|
*
|
|
* @param[in] size Allocation size, in bytes. Must not be zero. This value is
|
|
* rounded up to the nearest multiple of ::HSA_REGION_INFO_RUNTIME_ALLOC_GRANULE
|
|
* in @p region.
|
|
*
|
|
* @param[out] ptr Pointer to the location where to store the base address of
|
|
* the allocated block. The returned base address is aligned to the value of
|
|
* ::HSA_REGION_INFO_RUNTIME_ALLOC_ALIGNMENT in @p region. If the allocation
|
|
* fails, the returned value is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_REGION The region is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ALLOCATION The host is not allowed to
|
|
* allocate memory in @p region, or @p size is greater than the value of
|
|
* HSA_REGION_INFO_ALLOC_MAX_SIZE in @p region.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is NULL, or @p size is 0.
|
|
*/
|
|
hsa_status_t HSA_API hsa_memory_allocate(hsa_region_t region,
|
|
size_t size,
|
|
void** ptr);
|
|
|
|
/**
|
|
* @brief Deallocate a block of memory previously allocated using
|
|
* ::hsa_memory_allocate.
|
|
*
|
|
* @param[in] ptr Pointer to a memory block. If @p ptr does not match a value
|
|
* previously returned by ::hsa_memory_allocate, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*/
|
|
hsa_status_t HSA_API hsa_memory_free(void* ptr);
|
|
|
|
/**
|
|
* @brief Copy a block of memory from the location pointed to by @p src to the
|
|
* memory block pointed to by @p dst.
|
|
*
|
|
* @param[out] dst Buffer where the content is to be copied. If @p dst is in
|
|
* coarse-grained memory, the copied data is only visible to the agent currently
|
|
* assigned (::hsa_memory_assign_agent) to @p dst.
|
|
*
|
|
* @param[in] src A valid pointer to the source of data to be copied. The source
|
|
* buffer must not overlap with the destination buffer. If the source buffer is
|
|
* in coarse-grained memory then it must be assigned to an agent, from which the
|
|
* data will be retrieved.
|
|
*
|
|
* @param[in] size Number of bytes to copy. If @p size is 0, no copy is
|
|
* performed and the function returns success. Copying a number of bytes larger
|
|
* than the size of the buffers pointed by @p dst or @p src results in undefined
|
|
* behavior.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT The source or destination
|
|
* pointers are NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_memory_copy(
|
|
void *dst,
|
|
const void *src,
|
|
size_t size);
|
|
|
|
/**
|
|
* @brief Change the ownership of a global, coarse-grained buffer.
|
|
*
|
|
* @details The contents of a coarse-grained buffer are visible to an agent
|
|
* only after ownership has been explicitely transferred to that agent. Once the
|
|
* operation completes, the previous owner cannot longer access the data in the
|
|
* buffer.
|
|
*
|
|
* An implementation of the HSA runtime is allowed, but not required, to change
|
|
* the physical location of the buffer when ownership is transferred to a
|
|
* different agent. In general the application must not assume this
|
|
* behavior. The virtual location (address) of the passed buffer is never
|
|
* modified.
|
|
*
|
|
* @param[in] ptr Base address of a global buffer. The pointer must match an
|
|
* address previously returned by ::hsa_memory_allocate. The size of the buffer
|
|
* affected by the ownership change is identical to the size of that previous
|
|
* allocation. If @p ptr points to a fine-grained global buffer, no operation is
|
|
* performed and the function returns success. If @p ptr does not point to
|
|
* global memory, the behavior is undefined.
|
|
*
|
|
* @param[in] agent Agent that becomes the owner of the buffer. The
|
|
* application is responsible for ensuring that @p agent has access to the
|
|
* region that contains the buffer. It is allowed to change ownership to an
|
|
* agent that is already the owner of the buffer, with the same or different
|
|
* access permissions.
|
|
*
|
|
* @param[in] access Access permissions requested for the new owner.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is NULL, or @p access is
|
|
* not a valid access value.
|
|
*/
|
|
hsa_status_t HSA_API hsa_memory_assign_agent(
|
|
void *ptr,
|
|
hsa_agent_t agent,
|
|
hsa_access_permission_t access);
|
|
|
|
/**
|
|
*
|
|
* @brief Register a global, fine-grained buffer.
|
|
*
|
|
* @details Registering a buffer serves as an indication to the HSA runtime that
|
|
* the memory might be accessed from a kernel agent other than the
|
|
* host. Registration is a performance hint that allows the HSA runtime
|
|
* implementation to know which buffers will be accessed by some of the kernel
|
|
* agents ahead of time.
|
|
*
|
|
* Registration is only recommended for buffers in the global segment that have
|
|
* not been allocated using the HSA allocator (::hsa_memory_allocate), but an OS
|
|
* allocator instead. Registering an OS-allocated buffer in the base profile is
|
|
* equivalent to a no-op.
|
|
*
|
|
* Registrations should not overlap.
|
|
*
|
|
* @param[in] ptr A buffer in global, fine-grained memory. If a NULL pointer is
|
|
* passed, no operation is performed. If the buffer has been allocated using
|
|
* ::hsa_memory_allocate, or has already been registered, no operation is
|
|
* performed.
|
|
*
|
|
* @param[in] size Requested registration size in bytes. A size of 0 is
|
|
* only allowed if @p ptr is NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate
|
|
* the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is 0 but @p ptr
|
|
* is not NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_memory_register(
|
|
void *ptr,
|
|
size_t size);
|
|
|
|
/**
|
|
*
|
|
* @brief Deregister memory previously registered using ::hsa_memory_register.
|
|
*
|
|
* @details If the memory interval being deregistered does not match a previous
|
|
* registration (start and end addresses), the behavior is undefined.
|
|
*
|
|
* @param[in] ptr A pointer to the base of the buffer to be deregistered. If
|
|
* a NULL pointer is passed, no operation is performed.
|
|
*
|
|
* @param[in] size Size of the buffer to be deregistered.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
*/
|
|
hsa_status_t HSA_API hsa_memory_deregister(
|
|
void *ptr,
|
|
size_t size);
|
|
|
|
/** @} */


/** \defgroup instruction-set-architecture Instruction Set Architecture.
 *  @{
 */

/**
 * @brief Instruction set architecture.
 */
typedef struct hsa_isa_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_isa_t;

/**
|
|
* @brief Retrieve a reference to an instruction set architecture handle out of
|
|
* a symbolic name.
|
|
*
|
|
* @param[in] name Vendor-specific name associated with a a particular
|
|
* instruction set architecture. @p name must start with the vendor name and a
|
|
* colon (for example, "AMD:"). The rest of the name is vendor-specific. Must be
|
|
* a NUL-terminated string.
|
|
*
|
|
* @param[out] isa Memory location where the HSA runtime stores the ISA handle
|
|
* corresponding to the given name. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA_NAME The given name does not
|
|
* correspond to any instruction set architecture.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p name is NULL, or @p isa is
|
|
* NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_isa_from_name(
|
|
const char *name,
|
|
hsa_isa_t *isa);
|
|
|
|
/**
|
|
* @brief Iterate over the instruction sets supported by the given agent, and
|
|
* invoke an application-defined callback on every iteration. The iterator is
|
|
* deterministic: if an agent supports several instruction set architectures,
|
|
* they are traversed in the same order in every invocation of this function.
|
|
*
|
|
* @param[in] agent A valid agent.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per instruction set
|
|
* architecture. The HSA runtime passes two arguments to the callback: the
|
|
* ISA and the application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* that status value is returned.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_agent_iterate_isas(
|
|
hsa_agent_t agent,
|
|
hsa_status_t (*callback)(hsa_isa_t isa, void *data),
|
|
void *data);
|
|
|
|
/**
 * @brief Instruction set architecture attributes.
 */
typedef enum {
  /**
   * The length of the ISA name in bytes, not including the NUL terminator. The
   * type of this attribute is uint32_t.
   */
  HSA_ISA_INFO_NAME_LENGTH = 0,
  /**
   * Human-readable description. The type of this attribute is a character
   * array with the length equal to the value of the
   * ::HSA_ISA_INFO_NAME_LENGTH attribute.
   */
  HSA_ISA_INFO_NAME = 1,
  /**
   * @deprecated
   *
   * Number of call conventions supported by the instruction set architecture.
   * Must be greater than zero. The type of this attribute is uint32_t.
   */
  HSA_ISA_INFO_CALL_CONVENTION_COUNT = 2,
  /**
   * @deprecated
   *
   * Number of work-items in a wavefront for a given call convention. Must be a
   * power of 2 in the range [1,256]. The type of this attribute is uint32_t.
   */
  HSA_ISA_INFO_CALL_CONVENTION_INFO_WAVEFRONT_SIZE = 3,
  /**
   * @deprecated
   *
   * Number of wavefronts per compute unit for a given call convention. In
   * practice, other factors (for example, the amount of group memory used by a
   * work-group) may further limit the number of wavefronts per compute
   * unit. The type of this attribute is uint32_t.
   */
  HSA_ISA_INFO_CALL_CONVENTION_INFO_WAVEFRONTS_PER_COMPUTE_UNIT = 4,
  /**
   * Machine models supported by the instruction set architecture. The type of
   * this attribute is a bool[2]. If the ISA supports the small machine model,
   * the element at index ::HSA_MACHINE_MODEL_SMALL is true. If the ISA supports
   * the large model, the element at index ::HSA_MACHINE_MODEL_LARGE is true.
   */
  HSA_ISA_INFO_MACHINE_MODELS = 5,
  /**
   * Profiles supported by the instruction set architecture. The type of this
   * attribute is a bool[2]. If the ISA supports the base profile, the element
   * at index ::HSA_PROFILE_BASE is true. If the ISA supports the full profile,
   * the element at index ::HSA_PROFILE_FULL is true.
   */
  HSA_ISA_INFO_PROFILES = 6,
  /**
   * Default floating-point rounding modes supported by the instruction set
   * architecture. The type of this attribute is a bool[3]. The value at a given
   * index is true if the corresponding rounding mode in
   * ::hsa_default_float_rounding_mode_t is supported. At least one default mode
   * has to be supported.
   *
   * If the default mode is supported, then
   * ::HSA_ISA_INFO_BASE_PROFILE_DEFAULT_FLOAT_ROUNDING_MODES must report that
   * both the zero and the near rounding modes are supported.
   */
  HSA_ISA_INFO_DEFAULT_FLOAT_ROUNDING_MODES = 7,
  /**
   * Default floating-point rounding modes supported by the instruction set
   * architecture in the Base profile. The type of this attribute is a
   * bool[3]. The value at a given index is true if the corresponding rounding
   * mode in ::hsa_default_float_rounding_mode_t is supported. The value at
   * index ::HSA_DEFAULT_FLOAT_ROUNDING_MODE_DEFAULT must be false. At least one
   * of the values at indexes ::HSA_DEFAULT_FLOAT_ROUNDING_MODE_ZERO or
   * ::HSA_DEFAULT_FLOAT_ROUNDING_MODE_NEAR must be true.
   */
  HSA_ISA_INFO_BASE_PROFILE_DEFAULT_FLOAT_ROUNDING_MODES = 8,
  /**
   * Flag indicating that the f16 HSAIL operation is at least as fast as the
   * f32 operation in the instruction set architecture. The type of this
   * attribute is bool.
   */
  HSA_ISA_INFO_FAST_F16_OPERATION = 9,
  /**
   * Maximum number of work-items of each dimension of a work-group. Each
   * maximum must be greater than 0. No maximum can exceed the value of
   * ::HSA_ISA_INFO_WORKGROUP_MAX_SIZE. The type of this attribute is
   * uint16_t[3].
   */
  HSA_ISA_INFO_WORKGROUP_MAX_DIM = 12,
  /**
   * Maximum total number of work-items in a work-group. The type
   * of this attribute is uint32_t.
   */
  HSA_ISA_INFO_WORKGROUP_MAX_SIZE = 13,
  /**
   * Maximum number of work-items of each dimension of a grid. Each maximum must
   * be greater than 0, and must not be smaller than the corresponding value in
   * ::HSA_ISA_INFO_WORKGROUP_MAX_DIM. No maximum can exceed the value of
   * ::HSA_ISA_INFO_GRID_MAX_SIZE. The type of this attribute is
   * ::hsa_dim3_t.
   */
  HSA_ISA_INFO_GRID_MAX_DIM = 14,
  /**
   * Maximum total number of work-items in a grid. The type of this
   * attribute is uint64_t.
   */
  HSA_ISA_INFO_GRID_MAX_SIZE = 16,
  /**
   * Maximum number of fbarriers per work-group. Must be at least 32. The
   * type of this attribute is uint32_t.
   */
  HSA_ISA_INFO_FBARRIER_MAX_SIZE = 17
} hsa_isa_info_t;
|
|
|
|
/**
|
|
* @deprecated The concept of call convention has been deprecated. If the
|
|
* application wants to query the value of an attribute for a given instruction
|
|
* set architecture, use ::hsa_isa_get_info_alt instead. If the application
|
|
* wants to query an attribute that is specific to a given combination of ISA
|
|
* and wavefront, use ::hsa_wavefront_get_info.
|
|
*
|
|
* @brief Get the current value of an attribute for a given instruction set
|
|
* architecture (ISA).
|
|
*
|
|
* @param[in] isa A valid instruction set architecture.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[in] index Call convention index. Used only for call convention
|
|
* attributes, otherwise ignored. Must have a value between 0 (inclusive) and
|
|
* the value of the attribute ::HSA_ISA_INFO_CALL_CONVENTION_COUNT (not
|
|
* inclusive) in @p isa.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA The instruction set architecture is
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_INDEX The index is out of range.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* instruction set architecture attribute, or @p value is
|
|
* NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_isa_get_info(
|
|
hsa_isa_t isa,
|
|
hsa_isa_info_t attribute,
|
|
uint32_t index,
|
|
void *value);
|
|
|
|
/**
|
|
* @brief Get the current value of an attribute for a given instruction set
|
|
* architecture (ISA).
|
|
*
|
|
* @param[in] isa A valid instruction set architecture.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA The instruction set architecture is
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* instruction set architecture attribute, or @p value is
|
|
* NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_isa_get_info_alt(
|
|
hsa_isa_t isa,
|
|
hsa_isa_info_t attribute,
|
|
void *value);
|
|
|
|
/**
|
|
* @brief Retrieve the exception policy support for a given combination of
|
|
* instruction set architecture and profile.
|
|
*
|
|
* @param[in] isa A valid instruction set architecture.
|
|
*
|
|
* @param[in] profile Profile.
|
|
*
|
|
* @param[out] mask Pointer to a memory location where the HSA runtime stores a
|
|
* mask of ::hsa_exception_policy_t values. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA The instruction set architecture is
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p profile is not a valid
|
|
* profile, or @p mask is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_isa_get_exception_policies(
|
|
hsa_isa_t isa,
|
|
hsa_profile_t profile,
|
|
uint16_t *mask);
|
|
|
|
/**
 * @brief Floating-point types.
 */
typedef enum {
  /**
   * 16-bit floating-point type.
   */
  HSA_FP_TYPE_16 = 1,
  /**
   * 32-bit floating-point type.
   */
  HSA_FP_TYPE_32 = 2,
  /**
   * 64-bit floating-point type.
   */
  HSA_FP_TYPE_64 = 4
} hsa_fp_type_t;
|
|
|
|
/**
 * @brief Flush to zero modes.
 */
typedef enum {
  /**
   * Flush to zero.
   */
  HSA_FLUSH_MODE_FTZ = 1,
  /**
   * Do not flush to zero.
   */
  HSA_FLUSH_MODE_NON_FTZ = 2
} hsa_flush_mode_t;
|
|
|
|
/**
 * @brief Round methods.
 */
typedef enum {
  /**
   * Single round method.
   */
  HSA_ROUND_METHOD_SINGLE = 1,
  /**
   * Double round method.
   */
  HSA_ROUND_METHOD_DOUBLE = 2
} hsa_round_method_t;
|
|
|
|
/**
|
|
* @brief Retrieve the round method (single or double) used to implement the
|
|
* floating-point multiply add instruction (mad) for a given combination of
|
|
* instruction set architecture, floating-point type, and flush to zero
|
|
* modifier.
|
|
*
|
|
* @param[in] isa Instruction set architecture.
|
|
*
|
|
* @param[in] fp_type Floating-point type.
|
|
*
|
|
* @param[in] flush_mode Flush to zero modifier.
|
|
*
|
|
* @param[out] round_method Pointer to a memory location where the HSA
|
|
* runtime stores the round method used by the implementation. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA The instruction set architecture is
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p fp_type is not a valid
|
|
* floating-point type, or @p flush_mode is not a valid flush to zero modifier,
|
|
* or @p round_method is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_isa_get_round_method(
|
|
hsa_isa_t isa,
|
|
hsa_fp_type_t fp_type,
|
|
hsa_flush_mode_t flush_mode,
|
|
hsa_round_method_t *round_method);
|
|
|
|
/**
 * @brief Wavefront handle
 */
typedef struct hsa_wavefront_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_wavefront_t;
|
|
|
|
/**
 * @brief Wavefront attributes.
 */
typedef enum {
  /**
   * Number of work-items in the wavefront. Must be a power of 2 in the range
   * [1,256]. The type of this attribute is uint32_t.
   */
  HSA_WAVEFRONT_INFO_SIZE = 0
} hsa_wavefront_info_t;
|
|
|
|
/**
|
|
* @brief Get the current value of a wavefront attribute.
|
|
*
|
|
* @param[in] wavefront A wavefront.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_WAVEFRONT The wavefront is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* wavefront attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_wavefront_get_info(
|
|
hsa_wavefront_t wavefront,
|
|
hsa_wavefront_info_t attribute,
|
|
void *value);
|
|
|
|
/**
|
|
* @brief Iterate over the different wavefronts supported by an instruction set
|
|
* architecture, and invoke an application-defined callback on every iteration.
|
|
*
|
|
* @param[in] isa Instruction set architecture.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per wavefront that is
|
|
* supported by the agent. The HSA runtime passes two arguments to the callback:
|
|
* the wavefront handle and the application data. If @p callback returns a
|
|
* status other than ::HSA_STATUS_SUCCESS for a particular iteration, the
|
|
* traversal stops and that value is returned.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA The instruction set architecture is
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_isa_iterate_wavefronts(
|
|
hsa_isa_t isa,
|
|
hsa_status_t (*callback)(hsa_wavefront_t wavefront, void *data),
|
|
void *data);
|
|
|
|
/**
|
|
* @deprecated Use ::hsa_agent_iterate_isas to query which instructions set
|
|
* architectures are supported by a given agent.
|
|
*
|
|
* @brief Check if the instruction set architecture of a code object can be
|
|
* executed on an agent associated with another architecture.
|
|
*
|
|
* @param[in] code_object_isa Instruction set architecture associated with a
|
|
* code object.
|
|
*
|
|
* @param[in] agent_isa Instruction set architecture associated with an agent.
|
|
*
|
|
* @param[out] result Pointer to a memory location where the HSA runtime stores
|
|
* the result of the check. If the two architectures are compatible, the result
|
|
* is true; if they are incompatible, the result is false.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ISA @p code_object_isa or @p agent_isa are
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_isa_compatible(
|
|
hsa_isa_t code_object_isa,
|
|
hsa_isa_t agent_isa,
|
|
bool *result);
|
|
|
|
/** @} */
|
|
|
|
|
|
/** \defgroup executable Executable
|
|
* @{
|
|
*/
|
|
|
|
/**
 * @brief Code object reader handle. A code object reader is used to
 * load a code object from file (when created using
 * ::hsa_code_object_reader_create_from_file), or from memory (if created using
 * ::hsa_code_object_reader_create_from_memory).
 */
typedef struct hsa_code_object_reader_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_code_object_reader_t;
|
|
|
|
/**
|
|
* @brief Create a code object reader to operate on a file.
|
|
*
|
|
* @param[in] file File descriptor. The file must have been opened by
|
|
* application with at least read permissions prior calling this function. The
|
|
* file must contain a vendor-specific code object.
|
|
*
|
|
* The file is owned and managed by the application; the lifetime of the file
|
|
* descriptor must exceed that of any associated code object reader.
|
|
*
|
|
* @param[out] code_object_reader Memory location to store the newly created
|
|
* code object reader handle. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_FILE @p file is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p code_object_reader is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_code_object_reader_create_from_file(
|
|
hsa_file_t file,
|
|
hsa_code_object_reader_t *code_object_reader);
|
|
|
|
/**
|
|
* @brief Create a code object reader to operate on memory.
|
|
*
|
|
* @param[in] code_object Memory buffer that contains a vendor-specific code
|
|
* object. The buffer is owned and managed by the application; the lifetime of
|
|
* the buffer must exceed that of any associated code object reader.
|
|
*
|
|
* @param[in] size Size of the buffer pointed to by @p code_object. Must not be
|
|
* 0.
|
|
*
|
|
* @param[out] code_object_reader Memory location to store newly created code
|
|
* object reader handle. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p code_object is NULL, @p size
|
|
* is zero, or @p code_object_reader is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_code_object_reader_create_from_memory(
|
|
const void *code_object,
|
|
size_t size,
|
|
hsa_code_object_reader_t *code_object_reader);
|
|
|
|
/**
|
|
* @brief Destroy a code object reader.
|
|
*
|
|
* @details The code object reader handle becomes invalid after completion of
|
|
* this function. Any file or memory used to create the code object read is not
|
|
* closed, removed, or deallocated by this function.
|
|
*
|
|
* @param[in] code_object_reader Code object reader to destroy.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT_READER @p code_object_reader
|
|
* is invalid.
|
|
*/
|
|
hsa_status_t HSA_API hsa_code_object_reader_destroy(
|
|
hsa_code_object_reader_t code_object_reader);
|
|
|
|
/**
 * @brief Struct containing an opaque handle to an executable, which contains
 * ISA for finalized kernels and indirect functions together with the allocated
 * global or readonly segment variables they reference.
 */
typedef struct hsa_executable_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_executable_t;
|
|
|
|
/**
 * @brief Executable state.
 */
typedef enum {
  /**
   * Executable state, which allows the user to load code objects and define
   * external variables. Variable addresses, kernel code handles, and
   * indirect function code handles are not available in query operations until
   * the executable is frozen (zero always returned).
   */
  HSA_EXECUTABLE_STATE_UNFROZEN = 0,
  /**
   * Executable state, which allows the user to query variable addresses,
   * kernel code handles, and indirect function code handles using query
   * operations. Loading new code objects, as well as defining external
   * variables, is not allowed in this state.
   */
  HSA_EXECUTABLE_STATE_FROZEN = 1
} hsa_executable_state_t;
|
|
|
|
/**
|
|
* @deprecated Use ::hsa_executable_create_alt instead, which allows the
|
|
* application to specify the default floating-point rounding mode of the
|
|
* executable and assumes an unfrozen initial state.
|
|
*
|
|
* @brief Create an empty executable.
|
|
*
|
|
* @param[in] profile Profile used in the executable.
|
|
*
|
|
* @param[in] executable_state Executable state. If the state is
|
|
* ::HSA_EXECUTABLE_STATE_FROZEN, the resulting executable is useless because no
|
|
* code objects can be loaded, and no variables can be defined.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] executable Memory location where the HSA runtime stores the newly
|
|
* created executable handle.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p profile is invalid, or
|
|
* @p executable is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_create(
|
|
hsa_profile_t profile,
|
|
hsa_executable_state_t executable_state,
|
|
const char *options,
|
|
hsa_executable_t *executable);
|
|
|
|
/**
|
|
* @brief Create an empty executable.
|
|
*
|
|
* @param[in] profile Profile used in the executable.
|
|
*
|
|
* @param[in] default_float_rounding_mode Default floating-point rounding mode
|
|
* used in the executable. Allowed rounding modes are near and zero (default is
|
|
* not allowed).
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] executable Memory location where the HSA runtime stores newly
|
|
* created executable handle. The initial state of the executable is
|
|
* ::HSA_EXECUTABLE_STATE_UNFROZEN.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p profile is invalid, or
|
|
* @p executable is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_create_alt(
|
|
hsa_profile_t profile,
|
|
hsa_default_float_rounding_mode_t default_float_rounding_mode,
|
|
const char *options,
|
|
hsa_executable_t *executable);
|
|
|
|
/**
|
|
* @brief Destroy an executable.
|
|
*
|
|
* @details An executable handle becomes invalid after the executable has been
|
|
* destroyed. Code object handles that were loaded into this executable are
|
|
* still valid after the executable has been destroyed, and can be used as
|
|
* intended. Resources allocated outside and associated with this executable
|
|
* (such as external global or readonly variables) can be released after the
|
|
* executable has been destroyed.
|
|
*
|
|
* Executable should not be destroyed while kernels are in flight.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_destroy(
|
|
hsa_executable_t executable);
|
|
|
|
/**
 * @brief Loaded code object handle.
 */
typedef struct hsa_loaded_code_object_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_loaded_code_object_t;
|
|
|
|
/**
|
|
* @brief Load a program code object into an executable.
|
|
*
|
|
* @details A program code object contains information about resources that are
|
|
* accessible by all kernel agents that run the executable, and can be loaded
|
|
* at most once into an executable.
|
|
*
|
|
* If the program code object uses extensions, the implementation must support
|
|
* them for this operation to return successfully.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] code_object_reader A code object reader that holds the program
|
|
* code object to load. If a code object reader is destroyed before all the
|
|
* associated executables are destroyed, the behavior is undefined.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] loaded_code_object Pointer to a memory location where the HSA
|
|
* runtime stores the loaded code object handle. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE The executable is frozen.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT_READER @p code_object_reader
|
|
* is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INCOMPATIBLE_ARGUMENTS The program code object is
|
|
* not compatible with the executable or the implementation (for example, the
|
|
* code object uses an extension that is not supported by the implementation).
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_load_program_code_object(
|
|
hsa_executable_t executable,
|
|
hsa_code_object_reader_t code_object_reader,
|
|
const char *options,
|
|
hsa_loaded_code_object_t *loaded_code_object);
|
|
|
|
/**
|
|
* @brief Load an agent code object into an executable.
|
|
*
|
|
* @details The agent code object contains all defined agent
|
|
* allocation variables, functions, indirect functions, and kernels in a given
|
|
* program for a given instruction set architecture.
|
|
*
|
|
* Any module linkage declaration must have been defined either by a define
|
|
* variable or by loading a code object that has a symbol with module linkage
|
|
* definition.
|
|
*
|
|
* The default floating-point rounding mode of the code object associated with
|
|
* @p code_object_reader must match that of the executable
|
|
* (::HSA_EXECUTABLE_INFO_DEFAULT_FLOAT_ROUNDING_MODE), or be default (in which
|
|
* case the value of ::HSA_EXECUTABLE_INFO_DEFAULT_FLOAT_ROUNDING_MODE is used).
|
|
* If the agent code object uses extensions, the implementation and the agent
|
|
* must support them for this operation to return successfully.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] agent Agent to load code object for. A code object can be loaded
|
|
* into an executable at most once for a given agent. The instruction set
|
|
* architecture of the code object must be supported by the agent.
|
|
*
|
|
* @param[in] code_object_reader A code object reader that holds the code object
|
|
* to load. If a code object reader is destroyed before all the associated
|
|
* executables are destroyed, the behavior is undefined.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] loaded_code_object Pointer to a memory location where the HSA
|
|
* runtime stores the loaded code object handle. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE The executable is frozen.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT_READER @p code_object_reader
|
|
* is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INCOMPATIBLE_ARGUMENTS The code object read by @p
|
|
* code_object_reader is not compatible with the agent (for example, the agent
|
|
* does not support the instruction set architecture of the code object), the
|
|
* executable (for example, there is a default floating-point mode mismatch
|
|
* between the two), or the implementation.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_load_agent_code_object(
|
|
hsa_executable_t executable,
|
|
hsa_agent_t agent,
|
|
hsa_code_object_reader_t code_object_reader,
|
|
const char *options,
|
|
hsa_loaded_code_object_t *loaded_code_object);
|
|
|
|
/**
|
|
* @brief Freeze the executable.
|
|
*
|
|
* @details No modifications to executable can be made after freezing: no code
|
|
* objects can be loaded to the executable, and no external variables can be
|
|
* defined. Freezing the executable does not prevent querying the executable's
|
|
* attributes. The application must define all the external variables in an
|
|
* executable before freezing it.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_VARIABLE_UNDEFINED One or more variables are
|
|
* undefined in the executable.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE @p executable is already frozen.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_freeze(
|
|
hsa_executable_t executable,
|
|
const char *options);
|
|
|
|
/**
 * @brief Executable attributes.
 */
typedef enum {
  /**
   * Profile this executable is created for. The type of this attribute is
   * ::hsa_profile_t.
   */
  HSA_EXECUTABLE_INFO_PROFILE = 1,
  /**
   * Executable state. The type of this attribute is ::hsa_executable_state_t.
   */
  HSA_EXECUTABLE_INFO_STATE = 2,
  /**
   * Default floating-point rounding mode specified when executable was created.
   * The type of this attribute is ::hsa_default_float_rounding_mode_t.
   */
  HSA_EXECUTABLE_INFO_DEFAULT_FLOAT_ROUNDING_MODE = 3
} hsa_executable_info_t;
|
|
|
|
/**
|
|
* @brief Get the current value of an attribute for a given executable.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* executable attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_get_info(
|
|
hsa_executable_t executable,
|
|
hsa_executable_info_t attribute,
|
|
void *value);
|
|
|
|
/**
|
|
* @brief Define an external global variable with program allocation.
|
|
*
|
|
* @details This function allows the application to provide the definition
|
|
* of a variable in the global segment memory with program allocation. The
|
|
* variable must be defined before loading a code object into an executable.
|
|
* In addition, code objects loaded must not define the variable.
|
|
*
|
|
* @param[in] executable Executable. Must not be in frozen state.
|
|
*
|
|
* @param[in] variable_name Name of the variable. The Programmer's Reference
|
|
* Manual describes the standard name mangling scheme.
|
|
*
|
|
* @param[in] address Address where the variable is defined. This address must
|
|
* be in global memory and can be read and written by any agent in the
|
|
* system. The application cannot deallocate the buffer pointed by @p address
|
|
* before @p executable is destroyed.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_VARIABLE_ALREADY_DEFINED The variable is
|
|
* already defined.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no variable with the
|
|
* @p variable_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE @p executable is frozen.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p variable_name is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_global_variable_define(
|
|
hsa_executable_t executable,
|
|
const char *variable_name,
|
|
void *address);
|
|
|
|
/**
|
|
* @brief Define an external global variable with agent allocation.
|
|
*
|
|
* @details This function allows the application to provide the definition
|
|
* of a variable in the global segment memory with agent allocation. The
|
|
* variable must be defined before loading a code object into an executable.
|
|
* In addition, code objects loaded must not define the variable.
|
|
*
|
|
* @param[in] executable Executable. Must not be in frozen state.
|
|
*
|
|
* @param[in] agent Agent for which the variable is being defined.
|
|
*
|
|
* @param[in] variable_name Name of the variable. The Programmer's Reference
|
|
* Manual describes the standard name mangling scheme.
|
|
*
|
|
* @param[in] address Address where the variable is defined. This address must
|
|
* have been previously allocated using ::hsa_memory_allocate in a global region
|
|
* that is only visible to @p agent. The application cannot deallocate the
|
|
* buffer pointed by @p address before @p executable is destroyed.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT @p agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_VARIABLE_ALREADY_DEFINED The variable is
|
|
* already defined.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no variable with the
|
|
* @p variable_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE @p executable is frozen.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p variable_name is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_agent_global_variable_define(
|
|
hsa_executable_t executable,
|
|
hsa_agent_t agent,
|
|
const char *variable_name,
|
|
void *address);
|
|
|
|
/**
|
|
* @brief Define an external readonly variable.
|
|
*
|
|
* @details This function allows the application to provide the definition
|
|
* of a variable in the readonly segment memory. The variable must be defined
|
|
* before loading a code object into an executable. In addition, code objects
|
|
* loaded must not define the variable.
|
|
*
|
|
* @param[in] executable Executable. Must not be in frozen state.
|
|
*
|
|
* @param[in] agent Agent for which the variable is being defined.
|
|
*
|
|
* @param[in] variable_name Name of the variable. The Programmer's Reference
|
|
* Manual describes the standard name mangling scheme.
|
|
*
|
|
* @param[in] address Address where the variable is defined. This address must
|
|
* have been previously allocated using ::hsa_memory_allocate in a readonly
|
|
* region associated with @p agent. The application cannot deallocate the buffer
|
|
* pointed by @p address before @p executable is destroyed.
|
|
*
|
|
* @param[in] address Address where the variable is defined. The buffer pointed
|
|
* by @p address is owned by the application, and cannot be deallocated before
|
|
* @p executable is destroyed.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE Executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT @p agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_VARIABLE_ALREADY_DEFINED The variable is
|
|
* already defined.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no variable with the
|
|
* @p variable_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE @p executable is frozen.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p variable_name is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_readonly_variable_define(
|
|
hsa_executable_t executable,
|
|
hsa_agent_t agent,
|
|
const char *variable_name,
|
|
void *address);
|
|
|
|
/**
|
|
* @brief Validate an executable. Checks that all code objects have matching
|
|
* machine model, profile, and default floating-point rounding mode. Checks that
|
|
* all declarations have definitions. Checks declaration-definition
|
|
* compatibility (see the HSA Programming Reference Manual for compatibility
|
|
* rules). Invoking this function is equivalent to invoking
|
|
* ::hsa_executable_validate_alt with no options.
|
|
*
|
|
* @param[in] executable Executable. Must be in frozen state.
|
|
*
|
|
* @param[out] result Memory location where the HSA runtime stores the
|
|
* validation result. If the executable passes validation, the result is 0.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE @p executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_validate(
|
|
hsa_executable_t executable,
|
|
uint32_t *result);
|
|
|
|
/**
|
|
* @brief Validate an executable. Checks that all code objects have matching
|
|
* machine model, profile, and default floating-point rounding mode. Checks that
|
|
* all declarations have definitions. Checks declaration-definition
|
|
* compatibility (see the HSA Programming Reference Manual for compatibility
|
|
* rules).
|
|
*
|
|
* @param[in] executable Executable. Must be in frozen state.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] result Memory location where the HSA runtime stores the
|
|
* validation result. If the executable passes validation, the result is 0.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE @p executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p result is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_validate_alt(
|
|
hsa_executable_t executable,
|
|
const char *options,
|
|
uint32_t *result);
|
|
|
|
/**
 * @brief Executable symbol handle.
 *
 * The lifetime of an executable object symbol matches that of the executable
 * associated with it. An operation on a symbol whose associated executable has
 * been destroyed results in undefined behavior.
 */
typedef struct hsa_executable_symbol_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_executable_symbol_t;

/**
|
|
* @deprecated Use ::hsa_executable_get_symbol_by_name instead.
|
|
*
|
|
* @brief Get the symbol handle for a given a symbol name.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] module_name Module name. Must be NULL if the symbol has
|
|
* program linkage.
|
|
*
|
|
* @param[in] symbol_name Symbol name.
|
|
*
|
|
* @param[in] agent Agent associated with the symbol. If the symbol is
|
|
* independent of any agent (for example, a variable with program
|
|
* allocation), this argument is ignored.
|
|
*
|
|
* @param[in] call_convention Call convention associated with the symbol. If the
|
|
* symbol does not correspond to an indirect function, this argument is ignored.
|
|
*
|
|
* @param[out] symbol Memory location where the HSA runtime stores the symbol
|
|
* handle.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no symbol with a name
|
|
* that matches @p symbol_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p symbol_name is NULL, or
|
|
* @p symbol is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_get_symbol(
|
|
hsa_executable_t executable,
|
|
const char *module_name,
|
|
const char *symbol_name,
|
|
hsa_agent_t agent,
|
|
int32_t call_convention,
|
|
hsa_executable_symbol_t *symbol);
|
|
|
|
/**
|
|
* @brief Retrieve the symbol handle corresponding to a given a symbol name.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] symbol_name Symbol name. Must be a NUL-terminated character
|
|
* array. The Programmer's Reference Manual describes the standard name mangling
|
|
* scheme.
|
|
*
|
|
* @param[in] agent Pointer to the agent for which the symbol with the given
|
|
* name is defined. If the symbol corresponding to the given name has program
|
|
* allocation, @p agent must be NULL.
|
|
*
|
|
* @param[out] symbol Memory location where the HSA runtime stores the symbol
|
|
* handle. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no symbol with a name
|
|
* that matches @p symbol_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p symbol_name is NULL, or @p
|
|
* symbol is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_get_symbol_by_name(
|
|
hsa_executable_t executable,
|
|
const char *symbol_name,
|
|
const hsa_agent_t *agent,
|
|
hsa_executable_symbol_t *symbol);
|
|
|
|
/**
 * @brief Symbol type.
 */
typedef enum {
  /**
   * Variable.
   */
  HSA_SYMBOL_KIND_VARIABLE = 0,
  /**
   * Kernel.
   */
  HSA_SYMBOL_KIND_KERNEL = 1,
  /**
   * Indirect function.
   */
  HSA_SYMBOL_KIND_INDIRECT_FUNCTION = 2
} hsa_symbol_kind_t;

/**
 * @brief Linkage type of a symbol.
 */
typedef enum {
  /**
   * Module linkage.
   */
  HSA_SYMBOL_LINKAGE_MODULE = 0,
  /**
   * Program linkage.
   */
  HSA_SYMBOL_LINKAGE_PROGRAM = 1
} hsa_symbol_linkage_t;

/**
 * @brief Allocation type of a variable.
 */
typedef enum {
  /**
   * Agent allocation.
   */
  HSA_VARIABLE_ALLOCATION_AGENT = 0,
  /**
   * Program allocation.
   */
  HSA_VARIABLE_ALLOCATION_PROGRAM = 1
} hsa_variable_allocation_t;

/**
 * @brief Memory segment associated with a variable.
 */
typedef enum {
  /**
   * Global memory segment.
   */
  HSA_VARIABLE_SEGMENT_GLOBAL = 0,
  /**
   * Readonly memory segment.
   */
  HSA_VARIABLE_SEGMENT_READONLY = 1
} hsa_variable_segment_t;

/**
 * @brief Executable symbol attributes.
 */
typedef enum {
  /**
   * The kind of the symbol. The type of this attribute is ::hsa_symbol_kind_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_TYPE = 0,
  /**
   * The length of the symbol name in bytes, not including the NUL terminator.
   * The type of this attribute is uint32_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_NAME_LENGTH = 1,
  /**
   * The name of the symbol. The type of this attribute is character array with
   * the length equal to the value of ::HSA_EXECUTABLE_SYMBOL_INFO_NAME_LENGTH
   * attribute.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_NAME = 2,
  /**
   * @deprecated
   *
   * The length of the module name in bytes (not including the NUL terminator)
   * to which this symbol belongs if this symbol has module linkage, otherwise 0
   * is returned. The type of this attribute is uint32_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_MODULE_NAME_LENGTH = 3,
  /**
   * @deprecated
   *
   * The module name to which this symbol belongs if this symbol has module
   * linkage, otherwise an empty string is returned. The type of this attribute
   * is character array with the length equal to the value of
   * ::HSA_EXECUTABLE_SYMBOL_INFO_MODULE_NAME_LENGTH attribute.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_MODULE_NAME = 4,
  /**
   * @deprecated
   *
   * Agent associated with this symbol. If the symbol is a variable, the
   * value of this attribute is only defined if
   * ::HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_ALLOCATION is
   * ::HSA_VARIABLE_ALLOCATION_AGENT. The type of this attribute is hsa_agent_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_AGENT = 20,
  /**
   * The address of the variable. The value of this attribute is undefined if
   * the symbol is not a variable. The type of this attribute is uint64_t.
   *
   * If executable's state is ::HSA_EXECUTABLE_STATE_UNFROZEN, then 0 is
   * returned.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_ADDRESS = 21,
  /**
   * The linkage kind of the symbol. The type of this attribute is
   * ::hsa_symbol_linkage_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_LINKAGE = 5,
  /**
   * Indicates whether the symbol corresponds to a definition. The type of this
   * attribute is bool.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_IS_DEFINITION = 17,
  /**
   * @deprecated
   *
   * The allocation kind of the variable. The value of this attribute is
   * undefined if the symbol is not a variable. The type of this attribute is
   * ::hsa_variable_allocation_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_ALLOCATION = 6,
  /**
   * @deprecated
   *
   * The segment kind of the variable. The value of this attribute is undefined
   * if the symbol is not a variable. The type of this attribute is
   * ::hsa_variable_segment_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_SEGMENT = 7,
  /**
   * @deprecated
   *
   * Alignment of the symbol in memory. The value of this attribute is undefined
   * if the symbol is not a variable. The type of this attribute is uint32_t.
   *
   * The current alignment of the variable in memory may be greater than the
   * value specified in the source program variable declaration.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_ALIGNMENT = 8,
  /**
   * @deprecated
   *
   * Size of the variable. The value of this attribute is undefined if
   * the symbol is not a variable. The type of this attribute is uint32_t.
   *
   * A value of 0 is returned if the variable is an external variable and has an
   * unknown dimension.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_SIZE = 9,
  /**
   * @deprecated
   *
   * Indicates whether the variable is constant. The value of this attribute is
   * undefined if the symbol is not a variable. The type of this attribute is
   * bool.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_VARIABLE_IS_CONST = 10,
  /**
   * Kernel object handle, used in the kernel dispatch packet. The value of this
   * attribute is undefined if the symbol is not a kernel. The type of this
   * attribute is uint64_t.
   *
   * If the state of the executable is ::HSA_EXECUTABLE_STATE_UNFROZEN, then 0
   * is returned.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_OBJECT = 22,
  /**
   * Size of kernarg segment memory that is required to hold the values of the
   * kernel arguments, in bytes. Must be a multiple of 16. The value of this
   * attribute is undefined if the symbol is not a kernel. The type of this
   * attribute is uint32_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_SIZE = 11,
  /**
   * Alignment (in bytes) of the buffer used to pass arguments to the kernel,
   * which is the maximum of 16 and the maximum alignment of any of the kernel
   * arguments. The value of this attribute is undefined if the symbol is not a
   * kernel. The type of this attribute is uint32_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_ALIGNMENT = 12,
  /**
   * Size of static group segment memory required by the kernel (per
   * work-group), in bytes. The value of this attribute is undefined
   * if the symbol is not a kernel. The type of this attribute is uint32_t.
   *
   * The reported amount does not include any dynamically allocated group
   * segment memory that may be requested by the application when a kernel is
   * dispatched.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_GROUP_SEGMENT_SIZE = 13,
  /**
   * Size of static private, spill, and arg segment memory required by
   * this kernel (per work-item), in bytes. The value of this attribute is
   * undefined if the symbol is not a kernel. The type of this attribute is
   * uint32_t.
   *
   * If the value of ::HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_DYNAMIC_CALLSTACK is
   * true, the kernel may use more private memory than the reported value, and
   * the application must add the dynamic call stack usage to @a
   * private_segment_size when populating a kernel dispatch packet.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_PRIVATE_SEGMENT_SIZE = 14,
  /**
   * Dynamic callstack flag. The value of this attribute is undefined if the
   * symbol is not a kernel. The type of this attribute is bool.
   *
   * If this flag is set (the value is true), the kernel uses a dynamically
   * sized call stack. This can happen if recursive calls, calls to indirect
   * functions, or the HSAIL alloca instruction are present in the kernel.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_DYNAMIC_CALLSTACK = 15,
  /**
   * @deprecated
   *
   * Call convention of the kernel. The value of this attribute is undefined if
   * the symbol is not a kernel. The type of this attribute is uint32_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_KERNEL_CALL_CONVENTION = 18,
  /**
   * Indirect function object handle. The value of this attribute is undefined
   * if the symbol is not an indirect function, or the associated agent does
   * not support the Full Profile. The type of this attribute depends on the
   * machine model: the type is uint32_t for small machine model, and uint64_t
   * for large model.
   *
   * If the state of the executable is ::HSA_EXECUTABLE_STATE_UNFROZEN, then 0
   * is returned.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_INDIRECT_FUNCTION_OBJECT = 23,
  /**
   * @deprecated
   *
   * Call convention of the indirect function. The value of this attribute is
   * undefined if the symbol is not an indirect function, or the associated
   * agent does not support the Full Profile. The type of this attribute is
   * uint32_t.
   */
  HSA_EXECUTABLE_SYMBOL_INFO_INDIRECT_FUNCTION_CALL_CONVENTION = 16
} hsa_executable_symbol_info_t;

/**
|
|
* @brief Get the current value of an attribute for a given executable symbol.
|
|
*
|
|
* @param[in] executable_symbol Executable symbol.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE_SYMBOL The executable symbol is
|
|
* invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* executable symbol attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_symbol_get_info(
|
|
hsa_executable_symbol_t executable_symbol,
|
|
hsa_executable_symbol_info_t attribute,
|
|
void *value);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Iterate over the symbols in a executable, and invoke an
|
|
* application-defined callback on every iteration.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per executable symbol. The
|
|
* HSA runtime passes three arguments to the callback: the executable, a symbol,
|
|
* and the application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* ::hsa_executable_iterate_symbols returns that status value.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_iterate_symbols(
|
|
hsa_executable_t executable,
|
|
hsa_status_t (*callback)(hsa_executable_t exec,
|
|
hsa_executable_symbol_t symbol,
|
|
void *data),
|
|
void *data);
|
|
|
|
/**
|
|
* @brief Iterate over the kernels, indirect functions, and agent allocation
|
|
* variables in an executable for a given agent, and invoke an application-
|
|
* defined callback on every iteration.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] agent Agent.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per executable symbol. The
|
|
* HSA runtime passes three arguments to the callback: the executable, a symbol,
|
|
* and the application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* ::hsa_executable_iterate_symbols returns that status value.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_iterate_agent_symbols(
|
|
hsa_executable_t executable,
|
|
hsa_agent_t agent,
|
|
hsa_status_t (*callback)(hsa_executable_t exec,
|
|
hsa_agent_t agent,
|
|
hsa_executable_symbol_t symbol,
|
|
void *data),
|
|
void *data);
|
|
|
|
/**
|
|
* @brief Iterate over the program allocation variables in an executable, and
|
|
* invoke an application-defined callback on every iteration.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per executable symbol. The
|
|
* HSA runtime passes three arguments to the callback: the executable, a symbol,
|
|
* and the application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* ::hsa_executable_iterate_symbols returns that status value.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API hsa_executable_iterate_program_symbols(
|
|
hsa_executable_t executable,
|
|
hsa_status_t (*callback)(hsa_executable_t exec,
|
|
hsa_executable_symbol_t symbol,
|
|
void *data),
|
|
void *data);
|
|
|
|
/** @} */


/** \defgroup code-object Code Objects (deprecated).
 *  @{
 */

/**
 * @deprecated
 *
 * @brief Struct containing an opaque handle to a code object, which contains
 * ISA for finalized kernels and indirect functions together with information
 * about the global or readonly segment variables they reference.
 */
typedef struct hsa_code_object_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_code_object_t;

/**
 * @deprecated
 *
 * @brief Application data handle that is passed to the serialization
 * and deserialization functions.
 */
typedef struct hsa_callback_data_s {
  /**
   * Opaque handle.
   */
  uint64_t handle;
} hsa_callback_data_t;

/**
|
|
* @deprecated
|
|
*
|
|
* @brief Serialize a code object. Can be used for offline finalization,
|
|
* install-time finalization, disk code caching, etc.
|
|
*
|
|
* @param[in] code_object Code object.
|
|
*
|
|
* @param[in] alloc_callback Callback function for memory allocation. Must not
|
|
* be NULL. The HSA runtime passes three arguments to the callback: the
|
|
* allocation size, the application data, and a pointer to a memory location
|
|
* where the application stores the allocation result. The HSA runtime invokes
|
|
* @p alloc_callback once to allocate a buffer that contains the serialized
|
|
* version of @p code_object. If the callback returns a status code other than
|
|
* ::HSA_STATUS_SUCCESS, this function returns the same code.
|
|
*
|
|
* @param[in] callback_data Application data that is passed to @p
|
|
* alloc_callback. May be NULL.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] serialized_code_object Memory location where the HSA runtime
|
|
* stores a pointer to the serialized code object. Must not be NULL.
|
|
*
|
|
* @param[out] serialized_code_object_size Memory location where the HSA runtime
|
|
* stores the size (in bytes) of @p serialized_code_object. The returned value
|
|
* matches the allocation size passed by the HSA runtime to @p
|
|
* alloc_callback. Must not be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p alloc_callback, @p
|
|
* serialized_code_object, or @p serialized_code_object_size are NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_serialize(
|
|
hsa_code_object_t code_object,
|
|
hsa_status_t (*alloc_callback)(size_t size,
|
|
hsa_callback_data_t data,
|
|
void **address),
|
|
hsa_callback_data_t callback_data,
|
|
const char *options,
|
|
void **serialized_code_object,
|
|
size_t *serialized_code_object_size);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Deserialize a code object.
|
|
*
|
|
* @param[in] serialized_code_object A serialized code object. Must not be NULL.
|
|
*
|
|
* @param[in] serialized_code_object_size The size (in bytes) of @p
|
|
* serialized_code_object. Must not be 0.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @param[out] code_object Memory location where the HSA runtime stores the
|
|
* deserialized code object.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p serialized_code_object, or @p
|
|
* code_object are NULL, or @p serialized_code_object_size is 0.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_deserialize(
|
|
void *serialized_code_object,
|
|
size_t serialized_code_object_size,
|
|
const char *options,
|
|
hsa_code_object_t *code_object);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Destroy a code object.
|
|
*
|
|
* @details The lifetime of a code object must exceed that of any executable
|
|
* where it has been loaded. If an executable that loaded @p code_object has not
|
|
* been destroyed, the behavior is undefined.
|
|
*
|
|
* @param[in] code_object Code object. The handle becomes invalid after it has
|
|
* been destroyed.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_destroy(
|
|
hsa_code_object_t code_object);
|
|
|
|
/**
 * @deprecated
 *
 * @brief Code object type.
 */
typedef enum {
  /**
   * Produces code object that contains ISA for all kernels and indirect
   * functions in HSA source.
   */
  HSA_CODE_OBJECT_TYPE_PROGRAM = 0
} hsa_code_object_type_t;
|
|
|
|
/**
 * @deprecated
 *
 * @brief Code object attributes.
 */
typedef enum {
  /**
   * The version of the code object. The type of this attribute is a
   * NUL-terminated char[64]. The version string must be at most 63 characters
   * long (not including the NUL terminator) and all array elements not used
   * for the version string must be NUL.
   */
  HSA_CODE_OBJECT_INFO_VERSION = 0,
  /**
   * Type of code object. The type of this attribute is
   * ::hsa_code_object_type_t.
   */
  HSA_CODE_OBJECT_INFO_TYPE = 1,
  /**
   * Instruction set architecture this code object is produced for. The type of
   * this attribute is ::hsa_isa_t.
   */
  HSA_CODE_OBJECT_INFO_ISA = 2,
  /**
   * Machine model this code object is produced for. The type of this attribute
   * is ::hsa_machine_model_t.
   */
  HSA_CODE_OBJECT_INFO_MACHINE_MODEL = 3,
  /**
   * Profile this code object is produced for. The type of this attribute is
   * ::hsa_profile_t.
   */
  HSA_CODE_OBJECT_INFO_PROFILE = 4,
  /**
   * Default floating-point rounding mode used when the code object is
   * produced. The type of this attribute is
   * ::hsa_default_float_rounding_mode_t.
   */
  HSA_CODE_OBJECT_INFO_DEFAULT_FLOAT_ROUNDING_MODE = 5
} hsa_code_object_info_t;
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Get the current value of an attribute for a given code object.
|
|
*
|
|
* @param[in] code_object Code object.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* code object attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_get_info(
|
|
hsa_code_object_t code_object,
|
|
hsa_code_object_info_t attribute,
|
|
void *value);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Load code object into the executable.
|
|
*
|
|
* @details Every global or readonly variable that is external must be defined
|
|
* before loading the code object. An internal global or readonly variable is
|
|
* allocated once the code object, that is being loaded, references this
|
|
* variable and this variable is not allocated.
|
|
*
|
|
* Any module linkage declaration must have been defined either by a define
|
|
* variable or by loading a code object that has a symbol with module linkage
|
|
* definition.
|
|
*
|
|
* @param[in] executable Executable.
|
|
*
|
|
* @param[in] agent Agent to load code object for. The agent must support the
|
|
* default floating-point rounding mode used by @p code_object.
|
|
*
|
|
* @param[in] code_object Code object to load. The lifetime of the code object
|
|
* must exceed that of the executable: if @p code_object is destroyed before @p
|
|
* executable, the behavior is undefined.
|
|
*
|
|
* @param[in] options Standard and vendor-specific options. Unknown options are
|
|
* ignored. A standard option begins with the "-hsa_" prefix. Options beginning
|
|
* with the "-hsa_ext_<extension_name>_" prefix are reserved for extensions. A
|
|
* vendor-specific option begins with the "-<vendor_name>_" prefix. Must be a
|
|
* NUL-terminated string. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to
|
|
* allocate the required resources.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_EXECUTABLE The executable is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INCOMPATIBLE_ARGUMENTS @p agent is not compatible
|
|
* with @p code_object (for example, @p agent does not support the default
|
|
* floating-point rounding mode specified by @p code_object), or @p code_object
|
|
* is not compatible with @p executable (for example, @p code_object and @p
|
|
* executable have different machine models or profiles).
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_FROZEN_EXECUTABLE @p executable is frozen.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_executable_load_code_object(
|
|
hsa_executable_t executable,
|
|
hsa_agent_t agent,
|
|
hsa_code_object_t code_object,
|
|
const char *options);
|
|
|
|
/**
 * @deprecated
 *
 * @brief Code object symbol handle.
 *
 * The lifetime of a code object symbol matches that of the code object
 * associated with it. An operation on a symbol whose associated code object has
 * been destroyed results in undefined behavior.
 */
typedef struct hsa_code_symbol_s {
  /**
   * Opaque handle. Two handles reference the same object of the enclosing type
   * if and only if they are equal.
   */
  uint64_t handle;
} hsa_code_symbol_t;
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Get the symbol handle within a code object for a given a symbol name.
|
|
*
|
|
* @param[in] code_object Code object.
|
|
*
|
|
* @param[in] symbol_name Symbol name.
|
|
*
|
|
* @param[out] symbol Memory location where the HSA runtime stores the symbol
|
|
* handle.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no symbol with a name
|
|
* that matches @p symbol_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p symbol_name is NULL, or
|
|
* @p symbol is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_get_symbol(
|
|
hsa_code_object_t code_object,
|
|
const char *symbol_name,
|
|
hsa_code_symbol_t *symbol);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Get the symbol handle within a code object for a given a symbol name.
|
|
*
|
|
* @param[in] code_object Code object.
|
|
*
|
|
* @param[in] module_name Module name. Must be NULL if the symbol has
|
|
* program linkage.
|
|
*
|
|
* @param[in] symbol_name Symbol name.
|
|
*
|
|
* @param[out] symbol Memory location where the HSA runtime stores the symbol
|
|
* handle.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_SYMBOL_NAME There is no symbol with a name
|
|
* that matches @p symbol_name.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p symbol_name is NULL, or
|
|
* @p symbol is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_get_symbol_from_name(
|
|
hsa_code_object_t code_object,
|
|
const char *module_name,
|
|
const char *symbol_name,
|
|
hsa_code_symbol_t *symbol);
|
|
|
|
/**
 * @deprecated
 *
 * @brief Code object symbol attributes.
 *
 * @note The enumerator values are assigned explicitly and do not follow
 * declaration order (for example, ::HSA_CODE_SYMBOL_INFO_IS_DEFINITION is 17
 * while the enumerator declared after it is 6). Do not renumber or reorder
 * them by value.
 */
typedef enum {
  /**
   * The type of the symbol. The type of this attribute is ::hsa_symbol_kind_t.
   */
  HSA_CODE_SYMBOL_INFO_TYPE = 0,
  /**
   * The length of the symbol name in bytes, not including the NUL terminator.
   * The type of this attribute is uint32_t.
   */
  HSA_CODE_SYMBOL_INFO_NAME_LENGTH = 1,
  /**
   * The name of the symbol. The type of this attribute is a character array
   * with the length equal to the value of ::HSA_CODE_SYMBOL_INFO_NAME_LENGTH
   * attribute.
   */
  HSA_CODE_SYMBOL_INFO_NAME = 2,
  /**
   * The length of the module name in bytes (not including the NUL terminator)
   * to which this symbol belongs if this symbol has module linkage, otherwise 0
   * is returned. The type of this attribute is uint32_t.
   */
  HSA_CODE_SYMBOL_INFO_MODULE_NAME_LENGTH = 3,
  /**
   * The module name to which this symbol belongs if this symbol has module
   * linkage, otherwise an empty string is returned. The type of this attribute
   * is a character array with the length equal to the value of
   * ::HSA_CODE_SYMBOL_INFO_MODULE_NAME_LENGTH attribute.
   */
  HSA_CODE_SYMBOL_INFO_MODULE_NAME = 4,
  /**
   * The linkage kind of the symbol. The type of this attribute is
   * ::hsa_symbol_linkage_t.
   */
  HSA_CODE_SYMBOL_INFO_LINKAGE = 5,
  /**
   * Indicates whether the symbol corresponds to a definition. The type of this
   * attribute is bool.
   */
  HSA_CODE_SYMBOL_INFO_IS_DEFINITION = 17,
  /**
   * The allocation kind of the variable. The value of this attribute is
   * undefined if the symbol is not a variable. The type of this attribute is
   * ::hsa_variable_allocation_t.
   */
  HSA_CODE_SYMBOL_INFO_VARIABLE_ALLOCATION = 6,
  /**
   * The segment kind of the variable. The value of this attribute is
   * undefined if the symbol is not a variable. The type of this attribute is
   * ::hsa_variable_segment_t.
   */
  HSA_CODE_SYMBOL_INFO_VARIABLE_SEGMENT = 7,
  /**
   * Alignment of the symbol in memory. The value of this attribute is undefined
   * if the symbol is not a variable. The type of this attribute is uint32_t.
   *
   * The current alignment of the variable in memory may be greater than the
   * value specified in the source program variable declaration.
   */
  HSA_CODE_SYMBOL_INFO_VARIABLE_ALIGNMENT = 8,
  /**
   * Size of the variable. The value of this attribute is undefined if the
   * symbol is not a variable. The type of this attribute is uint32_t.
   *
   * A size of 0 is returned if the variable is an external variable and has an
   * unknown dimension.
   */
  HSA_CODE_SYMBOL_INFO_VARIABLE_SIZE = 9,
  /**
   * Indicates whether the variable is constant. The value of this attribute is
   * undefined if the symbol is not a variable. The type of this attribute is
   * bool.
   */
  HSA_CODE_SYMBOL_INFO_VARIABLE_IS_CONST = 10,
  /**
   * Size of kernarg segment memory that is required to hold the values of the
   * kernel arguments, in bytes. Must be a multiple of 16. The value of this
   * attribute is undefined if the symbol is not a kernel. The type of this
   * attribute is uint32_t.
   */
  HSA_CODE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_SIZE = 11,
  /**
   * Alignment (in bytes) of the buffer used to pass arguments to the kernel,
   * which is the maximum of 16 and the maximum alignment of any of the kernel
   * arguments. The value of this attribute is undefined if the symbol is not a
   * kernel. The type of this attribute is uint32_t.
   */
  HSA_CODE_SYMBOL_INFO_KERNEL_KERNARG_SEGMENT_ALIGNMENT = 12,
  /**
   * Size of static group segment memory required by the kernel (per
   * work-group), in bytes. The value of this attribute is undefined
   * if the symbol is not a kernel. The type of this attribute is uint32_t.
   *
   * The reported amount does not include any dynamically allocated group
   * segment memory that may be requested by the application when a kernel is
   * dispatched.
   */
  HSA_CODE_SYMBOL_INFO_KERNEL_GROUP_SEGMENT_SIZE = 13,
  /**
   * Size of static private, spill, and arg segment memory required by
   * this kernel (per work-item), in bytes. The value of this attribute is
   * undefined if the symbol is not a kernel. The type of this attribute is
   * uint32_t.
   *
   * If the value of ::HSA_CODE_SYMBOL_INFO_KERNEL_DYNAMIC_CALLSTACK is true,
   * the kernel may use more private memory than the reported value, and the
   * application must add the dynamic call stack usage to @a
   * private_segment_size when populating a kernel dispatch packet.
   */
  HSA_CODE_SYMBOL_INFO_KERNEL_PRIVATE_SEGMENT_SIZE = 14,
  /**
   * Dynamic callstack flag. The value of this attribute is undefined if the
   * symbol is not a kernel. The type of this attribute is bool.
   *
   * If this flag is set (the value is true), the kernel uses a dynamically
   * sized call stack. This can happen if recursive calls, calls to indirect
   * functions, or the HSAIL alloca instruction are present in the kernel.
   */
  HSA_CODE_SYMBOL_INFO_KERNEL_DYNAMIC_CALLSTACK = 15,
  /**
   * Call convention of the kernel. The value of this attribute is undefined if
   * the symbol is not a kernel. The type of this attribute is uint32_t.
   */
  HSA_CODE_SYMBOL_INFO_KERNEL_CALL_CONVENTION = 18,
  /**
   * Call convention of the indirect function. The value of this attribute is
   * undefined if the symbol is not an indirect function. The type of this
   * attribute is uint32_t.
   */
  HSA_CODE_SYMBOL_INFO_INDIRECT_FUNCTION_CALL_CONVENTION = 16
} hsa_code_symbol_info_t;
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Get the current value of an attribute for a given code symbol.
|
|
*
|
|
* @param[in] code_symbol Code symbol.
|
|
*
|
|
* @param[in] attribute Attribute to query.
|
|
*
|
|
* @param[out] value Pointer to an application-allocated buffer where to store
|
|
* the value of the attribute. If the buffer passed by the application is not
|
|
* large enough to hold the value of @p attribute, the behavior is undefined.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_SYMBOL The code symbol is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p attribute is an invalid
|
|
* code symbol attribute, or @p value is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_symbol_get_info(
|
|
hsa_code_symbol_t code_symbol,
|
|
hsa_code_symbol_info_t attribute,
|
|
void *value);
|
|
|
|
/**
|
|
* @deprecated
|
|
*
|
|
* @brief Iterate over the symbols in a code object, and invoke an
|
|
* application-defined callback on every iteration.
|
|
*
|
|
* @param[in] code_object Code object.
|
|
*
|
|
* @param[in] callback Callback to be invoked once per code object symbol. The
|
|
* HSA runtime passes three arguments to the callback: the code object, a
|
|
* symbol, and the application data. If @p callback returns a status other than
|
|
* ::HSA_STATUS_SUCCESS for a particular iteration, the traversal stops and
|
|
* ::hsa_code_object_iterate_symbols returns that status value.
|
|
*
|
|
* @param[in] data Application data that is passed to @p callback on every
|
|
* iteration. May be NULL.
|
|
*
|
|
* @retval ::HSA_STATUS_SUCCESS The function has been executed successfully.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been
|
|
* initialized.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_CODE_OBJECT @p code_object is invalid.
|
|
*
|
|
* @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL.
|
|
*/
|
|
hsa_status_t HSA_API HSA_DEPRECATED hsa_code_object_iterate_symbols(
|
|
hsa_code_object_t code_object,
|
|
hsa_status_t (*callback)(hsa_code_object_t code_object,
|
|
hsa_code_symbol_t symbol,
|
|
void *data),
|
|
void *data);
|
|
|
|
/** @} */
|
|
|
|
#ifdef __cplusplus
|
|
} // end extern "C" block
|
|
#endif
|
|
|
|
#endif // header guard
|