| //////////////////////////////////////////////////////////////////////////////// |
| // |
| // Copyright (C) 2014-2020 Advanced Micro Devices Inc. All rights reserved. |
| // |
| // Permission is hereby granted, free of charge, to any person or organization |
| // obtaining a copy of the software and accompanying documentation covered by |
| // this license (the "Software") to use, reproduce, display, distribute, |
| // execute, and transmit the Software, and to prepare derivative works of the |
| // Software, and to permit third-parties to whom the Software is furnished to |
| // do so, all subject to the following: |
| // |
| // The copyright notices in the Software and this entire statement, including |
| // the above license grant, this restriction and the following disclaimer, |
| // must be included in all copies of the Software, in whole or in part, and |
| // all derivative works of the Software, unless such copies or derivative |
| // works are solely in the form of machine-executable object code generated by |
| // a source language processor. |
| // |
| // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| // FITNESS FOR A PARTICULAR PURPOSE, TITLE AND NON-INFRINGEMENT. IN NO EVENT |
| // SHALL THE COPYRIGHT HOLDERS OR ANYONE DISTRIBUTING THE SOFTWARE BE LIABLE |
| // FOR ANY DAMAGES OR OTHER LIABILITY, WHETHER IN CONTRACT, TORT OR OTHERWISE, |
| // ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER |
| // DEALINGS IN THE SOFTWARE. |
| // |
| //////////////////////////////////////////////////////////////////////////////// |
| |
| // HSA AMD extension. |
| |
| #ifndef HSA_RUNTIME_EXT_AMD_H_ |
| #define HSA_RUNTIME_EXT_AMD_H_ |
| |
| #include "hsa.h" |
| #include "hsa_ext_image.h" |
| |
| #define HSA_AMD_INTERFACE_VERSION_MAJOR 1 |
| #define HSA_AMD_INTERFACE_VERSION_MINOR 0 |
| |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
| |
| /** |
| * @brief Enumeration constants added to ::hsa_status_t. |
| * |
| * @remark Additions to hsa_status_t |
| */ |
| enum { |
| /** |
| * The memory pool is invalid. |
| */ |
| HSA_STATUS_ERROR_INVALID_MEMORY_POOL = 40, |
| |
| /** |
| * Agent accessed memory beyond the maximum legal address. |
| */ |
| HSA_STATUS_ERROR_MEMORY_APERTURE_VIOLATION = 41, |
| |
| /** |
| * Agent executed an invalid shader instruction. |
| */ |
| HSA_STATUS_ERROR_ILLEGAL_INSTRUCTION = 42, |
| }; |
| |
| /** |
| * @brief Agent attributes. |
| */ |
| typedef enum hsa_amd_agent_info_s { |
| /** |
| * Chip identifier. The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_CHIP_ID = 0xA000, |
| /** |
| * Size of a cacheline in bytes. The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_CACHELINE_SIZE = 0xA001, |
| /** |
| * The number of compute unit available in the agent. The type of this |
| * attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_COMPUTE_UNIT_COUNT = 0xA002, |
| /** |
| * The maximum clock frequency of the agent in MHz. The type of this |
| * attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_MAX_CLOCK_FREQUENCY = 0xA003, |
| /** |
| * Internal driver node identifier. The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_DRIVER_NODE_ID = 0xA004, |
| /** |
| * Max number of watch points on memory address ranges to generate exception |
| * events when the watched addresses are accessed. The type of this |
| * attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_MAX_ADDRESS_WATCH_POINTS = 0xA005, |
| /** |
| * Agent BDF_ID, named LocationID in thunk. The type of this attribute is |
| * uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_BDFID = 0xA006, |
| /** |
| * Memory Interface width, the return value type is uint32_t. |
| * This attribute is deprecated. |
| */ |
| HSA_AMD_AGENT_INFO_MEMORY_WIDTH = 0xA007, |
| /** |
| * Max Memory Clock, the return value type is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_MEMORY_MAX_FREQUENCY = 0xA008, |
| /** |
| * Board name of Agent - populated from MarketingName of Kfd Node |
| * The value is an Ascii string of 64 chars. |
| */ |
| HSA_AMD_AGENT_INFO_PRODUCT_NAME = 0xA009, |
| /** |
| * Maximum number of waves possible in a Compute Unit. |
| * The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_MAX_WAVES_PER_CU = 0xA00A, |
| /** |
| * Number of SIMD's per compute unit CU |
| * The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_NUM_SIMDS_PER_CU = 0xA00B, |
| /** |
| * Number of Shader Engines (SE) in Gpu |
| * The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_NUM_SHADER_ENGINES = 0xA00C, |
| /** |
| * Number of Shader Arrays Per Shader Engines in Gpu |
| * The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_NUM_SHADER_ARRAYS_PER_SE = 0xA00D, |
| /** |
| * Address of the HDP flush registers. Use of these registers does not conform to the HSA memory |
| * model and should be treated with caution. |
| * The type of this attribute is hsa_amd_hdp_flush_t. |
| */ |
| HSA_AMD_AGENT_INFO_HDP_FLUSH = 0xA00E, |
| /** |
| * PCIe domain for the agent. Pairs with HSA_AMD_AGENT_INFO_BDFID |
| * to give the full physical location of the Agent. |
| * The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_DOMAIN = 0xA00F, |
| /** |
| * Queries for support of cooperative queues. See ::HSA_QUEUE_TYPE_COOPERATIVE. |
| * The type of this attribute is bool. |
| */ |
| HSA_AMD_AGENT_INFO_COOPERATIVE_QUEUES = 0xA010, |
| /** |
| * Queries UUID of an agent. The value is an Ascii string with a maximum |
| * of 21 chars including NUL. The string value consists of two parts: header |
| * and body. The header identifies device type (GPU, CPU, DSP) while body |
| * encodes UUID as a 16 digit hex string |
| * |
| * Agents that do not support UUID will return the string "GPU-XX" or |
| * "CPU-XX" or "DSP-XX" depending upon their device type ::hsa_device_type_t |
| */ |
| HSA_AMD_AGENT_INFO_UUID = 0xA011, |
| /** |
| * Queries for the ASIC revision of an agent. The value is an integer that |
| * increments for each revision. This can be used by user-level software to |
| * change how it operates, depending on the hardware version. This allows |
| * selective workarounds for hardware errata. |
| * The type of this attribute is uint32_t. |
| */ |
| HSA_AMD_AGENT_INFO_ASIC_REVISION = 0xA012 |
| } hsa_amd_agent_info_t; |
| |
| typedef struct hsa_amd_hdp_flush_s { |
| uint32_t* HDP_MEM_FLUSH_CNTL; |
| uint32_t* HDP_REG_FLUSH_CNTL; |
| } hsa_amd_hdp_flush_t; |
| |
| /** |
| * @brief Region attributes. |
| */ |
| typedef enum hsa_amd_region_info_s { |
| /** |
| * Determine if host can access the region. The type of this attribute |
| * is bool. |
| */ |
| HSA_AMD_REGION_INFO_HOST_ACCESSIBLE = 0xA000, |
| /** |
| * Base address of the region in flat address space. |
| */ |
| HSA_AMD_REGION_INFO_BASE = 0xA001, |
| /** |
| * Memory Interface width, the return value type is uint32_t. |
| * This attribute is deprecated. Use HSA_AMD_AGENT_INFO_MEMORY_WIDTH. |
| */ |
| HSA_AMD_REGION_INFO_BUS_WIDTH = 0xA002, |
| /** |
| * Max Memory Clock, the return value type is uint32_t. |
| * This attribute is deprecated. Use HSA_AMD_AGENT_INFO_MEMORY_MAX_FREQUENCY. |
| */ |
| HSA_AMD_REGION_INFO_MAX_CLOCK_FREQUENCY = 0xA003 |
| } hsa_amd_region_info_t; |
| |
| /** |
| * @brief Coherency attributes of fine grain region. |
| */ |
| typedef enum hsa_amd_coherency_type_s { |
| /** |
| * Coherent region. |
| */ |
| HSA_AMD_COHERENCY_TYPE_COHERENT = 0, |
| /** |
| * Non coherent region. |
| */ |
| HSA_AMD_COHERENCY_TYPE_NONCOHERENT = 1 |
| } hsa_amd_coherency_type_t; |
| |
| /** |
| * @brief Get the coherency type of the fine grain region of an agent. |
| * |
| * @param[in] agent A valid agent. |
| * |
| * @param[out] type Pointer to a memory location where the HSA runtime will |
| * store the coherency type of the fine grain region. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p type is NULL. |
| */ |
| hsa_status_t HSA_API hsa_amd_coherency_get_type(hsa_agent_t agent, |
| hsa_amd_coherency_type_t* type); |
| |
| /** |
| * @brief Set the coherency type of the fine grain region of an agent. |
| * Deprecated. This is supported on KV platforms. For backward compatibility |
| * other platforms will spuriously succeed. |
| * |
| * @param[in] agent A valid agent. |
| * |
| * @param[in] type The coherency type to be set. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p type is invalid. |
| */ |
| hsa_status_t HSA_API hsa_amd_coherency_set_type(hsa_agent_t agent, |
| hsa_amd_coherency_type_t type); |
| |
| /** |
| * @brief Structure containing profiling dispatch time information. |
| * |
| * Times are reported as ticks in the domain of the HSA system clock. |
| * The HSA system clock tick and frequency is obtained via hsa_system_get_info. |
| */ |
| typedef struct hsa_amd_profiling_dispatch_time_s { |
| /** |
| * Dispatch packet processing start time. |
| */ |
| uint64_t start; |
| /** |
| * Dispatch packet completion time. |
| */ |
| uint64_t end; |
| } hsa_amd_profiling_dispatch_time_t; |
| |
| /** |
| * @brief Structure containing profiling async copy time information. |
| * |
| * Times are reported as ticks in the domain of the HSA system clock. |
| * The HSA system clock tick and frequency is obtained via hsa_system_get_info. |
| */ |
| typedef struct hsa_amd_profiling_async_copy_time_s { |
| /** |
| * Async copy processing start time. |
| */ |
| uint64_t start; |
| /** |
| * Async copy completion time. |
| */ |
| uint64_t end; |
| } hsa_amd_profiling_async_copy_time_t; |
| |
| /** |
| * @brief Enable or disable profiling capability of a queue. |
| * |
| * @param[in] queue A valid queue. |
| * |
| * @param[in] enable 1 to enable profiling. 0 to disable profiling. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_QUEUE The queue is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p queue is NULL. |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_profiling_set_profiler_enabled(hsa_queue_t* queue, int enable); |
| |
| /** |
| * @brief Enable or disable asynchronous memory copy profiling. |
| * |
| * @details The runtime will provide the copy processing start timestamp and |
| * completion timestamp of each call to hsa_amd_memory_async_copy if the |
| * async copy profiling is enabled prior to the call to |
| * hsa_amd_memory_async_copy. The completion signal object is used to |
| * hold the last async copy start and end timestamp. The client can retrieve |
| * these timestamps via call to hsa_amd_profiling_get_async_copy_time. |
| * |
| * @param[in] enable True to enable profiling. False to disable profiling. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES Failed on allocating resources |
| * needed to profile the asynchronous copy. |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_profiling_async_copy_enable(bool enable); |
| |
| /** |
| * @brief Retrieve packet processing time stamps. |
| * |
| * @param[in] agent The agent with which the signal was last used. For |
| * instance, if the profiled dispatch packet is dispatched onto queue Q, |
| * which was created on agent A, then this parameter must be A. |
| * |
| * @param[in] signal A signal used as the completion signal of the dispatch |
| * packet to retrieve time stamps from. This dispatch packet must have been |
| * issued to a queue with profiling enabled and have already completed. Also |
| * the signal must not have yet been used in any other packet following the |
| * completion of the profiled dispatch packet. |
| * |
| * @param[out] time Packet processing timestamps in the HSA system clock |
| * domain. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL The signal is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p time is NULL. |
| */ |
| hsa_status_t HSA_API hsa_amd_profiling_get_dispatch_time( |
| hsa_agent_t agent, hsa_signal_t signal, |
| hsa_amd_profiling_dispatch_time_t* time); |
| |
| /** |
| * @brief Retrieve asynchronous copy timestamps. |
| * |
| * @details Async copy profiling is enabled via call to |
| * hsa_amd_profiling_async_copy_enable. |
| * |
| * @param[in] signal A signal used as the completion signal of the call to |
| * hsa_amd_memory_async_copy. |
| * |
| * @param[out] time Async copy processing timestamps in the HSA system clock |
| * domain. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL The signal is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p time is NULL. |
| */ |
| hsa_status_t HSA_API hsa_amd_profiling_get_async_copy_time( |
| hsa_signal_t signal, hsa_amd_profiling_async_copy_time_t* time); |
| |
| /** |
| * @brief Computes the frequency ratio and offset between the agent clock and |
| * HSA system clock and converts the agent's tick to HSA system domain tick. |
| * |
| * @param[in] agent The agent used to retrieve the agent_tick. It is user's |
| * responsibility to make sure the tick number is from this agent, otherwise, |
| * the behavior is undefined. |
| * |
| * @param[in] agent_tick The tick count retrieved from the specified @p agent. |
| * |
| * @param[out] system_tick The translated HSA system domain clock counter tick. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p system_tick is NULL; |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_profiling_convert_tick_to_system_domain(hsa_agent_t agent, |
| uint64_t agent_tick, |
| uint64_t* system_tick); |
| |
| /** |
| * @brief Signal attribute flags. |
| */ |
| typedef enum { |
| /** |
| * Signal will only be consumed by AMD GPUs. Limits signal consumption to |
| * AMD GPU agents only. Ignored if @p num_consumers is not zero (all agents). |
| */ |
| HSA_AMD_SIGNAL_AMD_GPU_ONLY = 1, |
| /** |
| * Signal may be used for interprocess communication. |
| * IPC signals can be read, written, and waited on from any process. |
| * Profiling using an IPC enabled signal is only supported in a single process |
| * at a time. Producing profiling data in one process and consuming it in |
| * another process is undefined. |
| */ |
| HSA_AMD_SIGNAL_IPC = 2, |
| } hsa_amd_signal_attribute_t; |
| |
| /** |
| * @brief Create a signal with specific attributes. |
| * |
| * @param[in] initial_value Initial value of the signal. |
| * |
| * @param[in] num_consumers Size of @p consumers. A value of 0 indicates that |
| * any agent might wait on the signal. |
| * |
| * @param[in] consumers List of agents that might consume (wait on) the |
| * signal. If @p num_consumers is 0, this argument is ignored; otherwise, the |
| * HSA runtime might use the list to optimize the handling of the signal |
| * object. If an agent not listed in @p consumers waits on the returned |
| * signal, the behavior is undefined. The memory associated with @p consumers |
| * can be reused or freed after the function returns. |
| * |
| * @param[in] attributes Requested signal attributes. Multiple signal attributes |
| * may be requested by combining them with bitwise OR. Requesting no attributes |
| * (@p attributes == 0) results in the same signal as would have been obtained |
| * via hsa_signal_create. |
| * |
| * @param[out] signal Pointer to a memory location where the HSA runtime will |
| * store the newly created signal handle. Must not be NULL. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime failed to allocate |
| * the required resources. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p signal is NULL, @p |
| * num_consumers is greater than 0 but @p consumers is NULL, or @p consumers |
| * contains duplicates. |
| */ |
| hsa_status_t HSA_API hsa_amd_signal_create(hsa_signal_value_t initial_value, uint32_t num_consumers, |
| const hsa_agent_t* consumers, uint64_t attributes, |
| hsa_signal_t* signal); |
| |
| /** |
| * @brief Asyncronous signal handler function type. |
| * |
| * @details Type definition of callback function to be used with |
| * hsa_amd_signal_async_handler. This callback is invoked if the associated |
| * signal and condition are met. The callback receives the value of the signal |
| * which satisfied the associated wait condition and a user provided value. If |
| * the callback returns true then the callback will be called again if the |
| * associated signal and condition are satisfied again. If the callback returns |
| * false then it will not be called again. |
| * |
| * @param[in] value Contains the value of the signal observed by |
| * hsa_amd_signal_async_handler which caused the signal handler to be invoked. |
| * |
| * @param[in] arg Contains the user provided value given when the signal handler |
| * was registered with hsa_amd_signal_async_handler |
| * |
| * @retval true resumes monitoring the signal with this handler (as if calling |
| * hsa_amd_signal_async_handler again with identical parameters) |
| * |
| * @retval false stops monitoring the signal with this handler (handler will |
| * not be called again for this signal) |
| * |
| */ |
| typedef bool (*hsa_amd_signal_handler)(hsa_signal_value_t value, void* arg); |
| |
| /** |
| * @brief Register asynchronous signal handler function. |
| * |
| * @details Allows registering a callback function and user provided value with |
| * a signal and wait condition. The callback will be invoked if the associated |
| * signal and wait condition are satisfied. Callbacks will be invoked serially |
| * but in an arbitrary order so callbacks should be independent of each other. |
| * After being invoked a callback may continue to wait for its associated signal |
| * and condition and, possibly, be invoked again. Or the callback may stop |
| * waiting. If the callback returns true then it will continue waiting and may |
| * be called again. If false then the callback will not wait again and will not |
| * be called again for the associated signal and condition. It is possible to |
| * register the same callback multiple times with the same or different signals |
| * and/or conditions. Each registration of the callback will be treated entirely |
| * independently. |
| * |
| * @param[in] signal hsa signal to be asynchronously monitored |
| * |
| * @param[in] cond condition value to monitor for |
| * |
| * @param[in] value signal value used in condition expression |
| * |
| * @param[in] handler asynchronous signal handler invoked when signal's |
| * condition is met |
| * |
| * @param[in] arg user provided value which is provided to handler when handler |
| * is invoked |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL signal is not a valid hsa_signal_t |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT handler is invalid (NULL) |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime is out of |
| * resources or blocking signals are not supported by the HSA driver component. |
| * |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_signal_async_handler(hsa_signal_t signal, |
| hsa_signal_condition_t cond, |
| hsa_signal_value_t value, |
| hsa_amd_signal_handler handler, void* arg); |
| |
| /** |
| * @brief Call a function asynchronously |
| * |
| * @details Provides access to the runtime's asynchronous event handling thread |
| * for general asynchronous functions. Functions queued this way are executed |
| * in the same manner as if they were a signal handler who's signal is |
| * satisfied. |
| * |
| * @param[in] callback asynchronous function to be invoked |
| * |
| * @param[in] arg user provided value which is provided to handler when handler |
| * is invoked |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT handler is invalid (NULL) |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES The HSA runtime is out of |
| * resources or blocking signals are not supported by the HSA driver component. |
| * |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_async_function(void (*callback)(void* arg), void* arg); |
| |
| /** |
| * @brief Wait for any signal-condition pair to be satisfied. |
| * |
| * @details Allows waiting for any of several signal and conditions pairs to be |
| * satisfied. The function returns the index into the list of signals of the |
| * first satisfying signal-condition pair. The value of the satisfying signal's |
| * value is returned in satisfying_value unless satisfying_value is NULL. This |
| * function provides only relaxed memory semantics. |
| */ |
| uint32_t HSA_API |
| hsa_amd_signal_wait_any(uint32_t signal_count, hsa_signal_t* signals, |
| hsa_signal_condition_t* conds, |
| hsa_signal_value_t* values, uint64_t timeout_hint, |
| hsa_wait_state_t wait_hint, |
| hsa_signal_value_t* satisfying_value); |
| |
| /** |
| * @brief Query image limits. |
| * |
| * @param[in] agent A valid agent. |
| * |
| * @param[in] attribute HSA image info attribute to query. |
| * |
| * @param[out] value Pointer to an application-allocated buffer where to store |
| * the value of the attribute. If the buffer passed by the application is not |
| * large enough to hold the value of @p attribute, the behavior is undefined. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_QUEUE @p value is NULL or @p attribute < |
| * HSA_EXT_AGENT_INFO_IMAGE_1D_MAX_ELEMENTS or @p attribute > |
| * HSA_EXT_AGENT_INFO_IMAGE_ARRAY_MAX_LAYERS. |
| * |
| */ |
| hsa_status_t HSA_API hsa_amd_image_get_info_max_dim(hsa_agent_t agent, |
| hsa_agent_info_t attribute, |
| void* value); |
| |
| /** |
| * @brief Set a CU affinity to specific queues within the process, this function |
| * call is "atomic". |
| * |
| * @param[in] queue A pointer to HSA queue. |
| * |
| * @param[in] num_cu_mask_count Size of CUMask bit array passed in. |
| * |
| * @param[in] cu_mask Bit-vector representing the CU mask. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_QUEUE @p queue is NULL or invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p num_cu_mask_count is not |
| * multiple of 32 or @p cu_mask is NULL. |
| * |
| * @retval ::HSA_STATUS_ERROR failed to call thunk api |
| * |
| */ |
| hsa_status_t HSA_API hsa_amd_queue_cu_set_mask(const hsa_queue_t* queue, |
| uint32_t num_cu_mask_count, |
| const uint32_t* cu_mask); |
| |
| /** |
| * @brief Memory segments associated with a memory pool. |
| */ |
| typedef enum { |
| /** |
| * Global segment. Used to hold data that is shared by all agents. |
| */ |
| HSA_AMD_SEGMENT_GLOBAL = 0, |
| /** |
| * Read-only segment. Used to hold data that remains constant during the |
| * execution of a kernel. |
| */ |
| HSA_AMD_SEGMENT_READONLY = 1, |
| /** |
| * Private segment. Used to hold data that is local to a single work-item. |
| */ |
| HSA_AMD_SEGMENT_PRIVATE = 2, |
| /** |
| * Group segment. Used to hold data that is shared by the work-items of a |
| * work-group. |
| */ |
| HSA_AMD_SEGMENT_GROUP = 3, |
| } hsa_amd_segment_t; |
| |
| /** |
| * @brief A memory pool encapsulates physical storage on an agent |
| * along with a memory access model. |
| * |
| * @details A memory pool encapsulates a physical partition of an agent's |
| * memory system along with a memory access model. Division of a single |
| * memory system into separate pools allows querying each partition's access |
| * path properties (see ::hsa_amd_agent_memory_pool_get_info). Allocations |
| * from a pool are preferentially bound to that pool's physical partition. |
| * Binding to the pool's preferential physical partition may not be |
| * possible or persistent depending on the system's memory policy |
| * and/or state which is beyond the scope of HSA APIs. |
| * |
| * For example, a multi-node NUMA memory system may be represented by multiple |
| * pool's with each pool providing size and access path information for the |
| * partition it represents. Allocations from a pool are preferentially bound |
| * to the pool's partition (which in this example is a NUMA node) while |
| * following its memory access model. The actual placement may vary or migrate |
| * due to the system's NUMA policy and state, which is beyond the scope of |
| * HSA APIs. |
| */ |
| typedef struct hsa_amd_memory_pool_s { |
| /** |
| * Opaque handle. |
| */ |
| uint64_t handle; |
| } hsa_amd_memory_pool_t; |
| |
| typedef enum hsa_amd_memory_pool_global_flag_s { |
| /** |
| * The application can use allocations in the memory pool to store kernel |
| * arguments, and provide the values for the kernarg segment of |
| * a kernel dispatch. |
| */ |
| HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_KERNARG_INIT = 1, |
| /** |
| * Updates to memory in this pool conform to HSA memory consistency model. |
| * If this flag is set, then ::HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_COARSE_GRAINED |
| * must not be set. |
| */ |
| HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_FINE_GRAINED = 2, |
| /** |
| * Writes to memory in this pool can be performed by a single agent at a time. |
| */ |
| HSA_AMD_MEMORY_POOL_GLOBAL_FLAG_COARSE_GRAINED = 4 |
| } hsa_amd_memory_pool_global_flag_t; |
| |
| /** |
| * @brief Memory pool features. |
| */ |
| typedef enum { |
| /** |
| * Segment where the memory pool resides. The type of this attribute is |
| * ::hsa_amd_segment_t. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_SEGMENT = 0, |
| /** |
| * Flag mask. The value of this attribute is undefined if the value of |
| * ::HSA_AMD_MEMORY_POOL_INFO_SEGMENT is not ::HSA_AMD_SEGMENT_GLOBAL. The type |
| * of |
| * this attribute is uint32_t, a bit-field of |
| * ::hsa_amd_memory_pool_global_flag_t |
| * values. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_GLOBAL_FLAGS = 1, |
| /** |
| * Size of this pool, in bytes. The type of this attribute is size_t. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_SIZE = 2, |
| /** |
| * Indicates whether memory in this pool can be allocated using |
| * ::hsa_amd_memory_pool_allocate. The type of this attribute is bool. |
| * |
| * The value of this flag is always false for memory pools in the group and |
| * private segments. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED = 5, |
| /** |
| * Allocation granularity of buffers allocated by |
| * ::hsa_amd_memory_pool_allocate |
| * in this memory pool. The size of a buffer allocated in this pool is a |
| * multiple of the value of this attribute. The value of this attribute is |
| * only defined if ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED is true for |
| * this pool. The type of this attribute is size_t. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_GRANULE = 6, |
| /** |
| * Alignment of buffers allocated by ::hsa_amd_memory_pool_allocate in this |
| * pool. The value of this attribute is only defined if |
| * ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED is true for this pool, and |
| * must be a power of 2. The type of this attribute is size_t. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALIGNMENT = 7, |
| /** |
| * This memory_pool can be made directly accessible by all the agents in the |
| * system (::hsa_amd_agent_memory_pool_get_info does not return |
| * ::HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED for any agent). The type of this |
| * attribute is bool. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_ACCESSIBLE_BY_ALL = 15, |
| /** |
| * Maximum aggregate allocation size in bytes. The type of this attribute |
| * is size_t. |
| */ |
| HSA_AMD_MEMORY_POOL_INFO_ALLOC_MAX_SIZE = 16, |
| } hsa_amd_memory_pool_info_t; |
| |
| /** |
| * @brief Get the current value of an attribute of a memory pool. |
| * |
| * @param[in] memory_pool A valid memory pool. |
| * |
| * @param[in] attribute Attribute to query. |
| * |
| * @param[out] value Pointer to a application-allocated buffer where to store |
| * the value of the attribute. If the buffer passed by the application is not |
| * large enough to hold the value of @p attribute, the behavior is undefined. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_memory_pool_get_info(hsa_amd_memory_pool_t memory_pool, |
| hsa_amd_memory_pool_info_t attribute, |
| void* value); |
| |
| /** |
| * @brief Iterate over the memory pools associated with a given agent, and |
| * invoke an application-defined callback on every iteration. |
| * |
| * @details An agent can directly access buffers located in some memory pool, or |
| * be enabled to access them by the application (see ::hsa_amd_agents_allow_access), |
| * yet that memory pool may not be returned by this function for that given |
| * agent. |
| * |
| * A memory pool of fine-grained type must be associated only with the host. |
| * |
| * @param[in] agent A valid agent. |
| * |
| * @param[in] callback Callback to be invoked on the same thread that called |
| * ::hsa_amd_agent_iterate_memory_pools, serially, once per memory pool that is |
| * associated with the agent. The HSA runtime passes two arguments to the |
| * callback: the memory pool, and the application data. If @p callback |
| * returns a status other than ::HSA_STATUS_SUCCESS for a particular iteration, |
| * the traversal stops and ::hsa_amd_agent_iterate_memory_pools returns that status |
| * value. |
| * |
| * @param[in] data Application data that is passed to @p callback on every |
| * iteration. May be NULL. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL. |
| */ |
| hsa_status_t HSA_API hsa_amd_agent_iterate_memory_pools( |
| hsa_agent_t agent, |
| hsa_status_t (*callback)(hsa_amd_memory_pool_t memory_pool, void* data), |
| void* data); |
| |
| /** |
| * @brief Allocate a block of memory (or buffer) in the specified pool. |
| * |
| * @param[in] memory_pool Memory pool where to allocate memory from. The memory |
| * pool must have the ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALLOWED flag set. |
| * |
| * @param[in] size Allocation size, in bytes. Must not be zero. This value is |
| * rounded up to the nearest multiple of |
| * ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_GRANULE in @p memory_pool. |
| * |
| * @param[in] flags A bit-field that is used to specify allocation |
| * directives. Reserved parameter, must be 0. |
| * |
| * @param[out] ptr Pointer to the location where to store the base virtual |
| * address of |
| * the allocated block. The returned base address is aligned to the value of |
| * ::HSA_AMD_MEMORY_POOL_INFO_RUNTIME_ALLOC_ALIGNMENT in @p memory_pool. If the |
| * allocation fails, the returned value is undefined. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES No memory is available. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL The memory pool is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ALLOCATION The host is not allowed to |
| * allocate memory in @p memory_pool, or @p size is greater than |
| * the value of HSA_AMD_MEMORY_POOL_INFO_ALLOC_MAX_SIZE in @p memory_pool. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is NULL, or @p size is 0, |
| * or flags is not 0. |
| * |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_memory_pool_allocate(hsa_amd_memory_pool_t memory_pool, size_t size, |
| uint32_t flags, void** ptr); |
| |
| /** |
| * @brief Deallocate a block of memory previously allocated using |
| * ::hsa_amd_memory_pool_allocate. |
| * |
| * @param[in] ptr Pointer to a memory block. If @p ptr does not match a value |
| * previously returned by ::hsa_amd_memory_pool_allocate, the behavior is undefined. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| */ |
| hsa_status_t HSA_API hsa_amd_memory_pool_free(void* ptr); |
| |
| /** |
| * @brief Asynchronously copy a block of memory from the location pointed to by |
| * @p src on the @p src_agent to the memory block pointed to by @p dst on the @p |
| * dst_agent. |
| * Because the DMA engines used may not be in the same coherency domain, the caller must ensure |
| * that buffers are system-level coherent. In general this requires the sending device to have |
| * released the buffer to system scope prior to executing the copy API and the receiving device |
| * must execute a system scope acquire fence prior to use of the destination buffer. |
| * |
| * @param[out] dst Buffer where the content is to be copied. |
| * |
| * @param[in] dst_agent Agent associated with the @p dst. The agent must be able to directly |
| * access both the source and destination buffers in their current locations. |
| * |
| * @param[in] src A valid pointer to the source of data to be copied. The source |
| * buffer must not overlap with the destination buffer, otherwise the copy will succeed |
| * but contents of @p dst is undefined. |
| * |
| * @param[in] src_agent Agent associated with the @p src. The agent must be able to directly |
| * access both the source and destination buffers in their current locations. |
| * |
| * @param[in] size Number of bytes to copy. If @p size is 0, no copy is |
| * performed and the function returns success. Copying a number of bytes larger |
| * than the size of the buffers pointed by @p dst or @p src results in undefined |
| * behavior. |
| * |
| * @param[in] num_dep_signals Number of dependent signals. Can be 0. |
| * |
| * @param[in] dep_signals List of signals that must be waited on before the copy |
| * operation starts. The copy will start after every signal has been observed with |
| * the value 0. The dependent signal should not include completion signal from hsa_amd_memory_async_copy |
| * operation to be issued in future as that can result in a deadlock. If @p num_dep_signals is 0, this |
| * argument is ignored. |
| * |
| * @param[in] completion_signal Signal used to indicate completion of the copy |
| * operation. When the copy operation is finished, the value of the signal is |
| * decremented. The runtime indicates that an error has occurred during the copy |
| * operation by setting the value of the completion signal to a negative |
| * number. The signal handle must not be 0. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. The |
| * application is responsible for checking for asynchronous error conditions |
| * (see the description of @p completion_signal). |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT The agent is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_SIGNAL @p completion_signal is invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT The source or destination |
| * pointers are NULL, or the completion signal is 0. |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_memory_async_copy(void* dst, hsa_agent_t dst_agent, const void* src, |
| hsa_agent_t src_agent, size_t size, |
| uint32_t num_dep_signals, |
| const hsa_signal_t* dep_signals, |
| hsa_signal_t completion_signal); |
| |
| /* |
| [Provisional API] |
| Pitched memory descriptor. |
| All elements must be 4 byte aligned. Pitch and slice are in bytes. |
| */ |
| typedef struct hsa_pitched_ptr_s { |
| void* base; |
| size_t pitch; |
| size_t slice; |
| } hsa_pitched_ptr_t; |
| |
| /* |
| [Provisional API] |
| Copy direction flag. |
| */ |
| typedef enum { |
| hsaHostToHost = 0, |
| hsaHostToDevice = 1, |
| hsaDeviceToHost = 2, |
| hsaDeviceToDevice = 3 |
| } hsa_amd_copy_direction_t; |
| |
| /* |
| [Provisional API] |
| SDMA 3D memory copy API. The same requirements must be met by src and dst as in |
| hsa_amd_memory_async_copy. |
| Both src and dst must be directly accessible to the copy_agent during the copy, src and dst rects |
| must not overlap. |
| CPU agents are not supported. API requires SDMA and will return an error if SDMA is not available. |
| Offsets and range carry x in bytes, y and z in rows and layers. |
| */ |
| hsa_status_t HSA_API hsa_amd_memory_async_copy_rect( |
| const hsa_pitched_ptr_t* dst, const hsa_dim3_t* dst_offset, const hsa_pitched_ptr_t* src, |
| const hsa_dim3_t* src_offset, const hsa_dim3_t* range, hsa_agent_t copy_agent, |
| hsa_amd_copy_direction_t dir, uint32_t num_dep_signals, const hsa_signal_t* dep_signals, |
| hsa_signal_t completion_signal); |
| |
| /** |
| * @brief Type of accesses to a memory pool from a given agent. |
| */ |
| typedef enum { |
| /** |
| * The agent cannot directly access any buffer in the memory pool. |
| */ |
| HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED = 0, |
| /** |
| * The agent can directly access a buffer located in the pool; the application |
| * does not need to invoke ::hsa_amd_agents_allow_access. |
| */ |
| HSA_AMD_MEMORY_POOL_ACCESS_ALLOWED_BY_DEFAULT = 1, |
| /** |
| * The agent can directly access a buffer located in the pool, but only if the |
| * application has previously requested access to that buffer using |
| * ::hsa_amd_agents_allow_access. |
| */ |
| HSA_AMD_MEMORY_POOL_ACCESS_DISALLOWED_BY_DEFAULT = 2 |
| } hsa_amd_memory_pool_access_t; |
| |
| /** |
| * @brief Properties of the relationship between an agent a memory pool. |
| */ |
| typedef enum { |
| /** |
| * Hyper-transport bus type. |
| */ |
| HSA_AMD_LINK_INFO_TYPE_HYPERTRANSPORT = 0, |
| |
| /** |
| * QPI bus type. |
| */ |
| HSA_AMD_LINK_INFO_TYPE_QPI = 1, |
| |
| /** |
| * PCIe bus type. |
| */ |
| HSA_AMD_LINK_INFO_TYPE_PCIE = 2, |
| |
| /** |
| * Infiniband bus type. |
| */ |
| HSA_AMD_LINK_INFO_TYPE_INFINBAND = 3, |
| |
| /** |
| * xGMI link type. |
| */ |
| HSA_AMD_LINK_INFO_TYPE_XGMI = 4 |
| |
| } hsa_amd_link_info_type_t; |
| |
| /** |
| * @brief Link properties when accessing the memory pool from the specified |
| * agent. |
| */ |
| typedef struct hsa_amd_memory_pool_link_info_s { |
| /** |
| * Minimum transfer latency (rounded to ns). |
| */ |
| uint32_t min_latency; |
| |
| /** |
| * Maximum transfer latency (rounded to ns). |
| */ |
| uint32_t max_latency; |
| |
| /** |
| * Minimum link interface bandwidth in MB/s. |
| */ |
| uint32_t min_bandwidth; |
| |
| /** |
| * Maximum link interface bandwidth in MB/s. |
| */ |
| uint32_t max_bandwidth; |
| |
| /** |
| * Support for 32-bit atomic transactions. |
| */ |
| bool atomic_support_32bit; |
| |
| /** |
| * Support for 64-bit atomic transactions. |
| */ |
| bool atomic_support_64bit; |
| |
| /** |
| * Support for cache coherent transactions. |
| */ |
| bool coherent_support; |
| |
| /** |
| * The type of bus/link. |
| */ |
| hsa_amd_link_info_type_t link_type; |
| |
| /** |
| * NUMA distance of memory pool relative to querying agent |
| */ |
| uint32_t numa_distance; |
| } hsa_amd_memory_pool_link_info_t; |
| |
| /** |
| * @brief Properties of the relationship between an agent a memory pool. |
| */ |
| typedef enum { |
| /** |
| * Access to buffers located in the memory pool. The type of this attribute |
| * is ::hsa_amd_memory_pool_access_t. |
| * |
| * An agent can always directly access buffers currently located in a memory |
| * pool that is associated (the memory_pool is one of the values returned by |
| * ::hsa_amd_agent_iterate_memory_pools on the agent) with that agent. If the |
| * buffer is currently located in a memory pool that is not associated with |
| * the agent, and the value returned by this function for the given |
| * combination of agent and memory pool is not |
| * HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED, the application still needs to invoke |
| * ::hsa_amd_agents_allow_access in order to gain direct access to the buffer. |
| * |
| * If the given agent can directly access buffers the pool, the result is not |
| * HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. If the memory pool is associated with |
| * the agent, or it is of fined-grained type, the result must not be |
| * HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. If the memory pool is not associated |
| * with the agent, and does not reside in the global segment, the result must |
| * be HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. |
| */ |
| HSA_AMD_AGENT_MEMORY_POOL_INFO_ACCESS = 0, |
| |
| /** |
| * Number of links to hop when accessing the memory pool from the specified |
| * agent. The value of this attribute is zero if the memory pool is associated |
| * with the agent, or if the access type is |
| * HSA_AMD_MEMORY_POOL_ACCESS_NEVER_ALLOWED. The type of this attribute is |
| * uint32_t. |
| */ |
| HSA_AMD_AGENT_MEMORY_POOL_INFO_NUM_LINK_HOPS = 1, |
| |
| /** |
| * Details of each link hop when accessing the memory pool starting from the |
| * specified agent. The type of this attribute is an array size of |
| * HSA_AMD_AGENT_MEMORY_POOL_INFO_NUM_LINK_HOPS with each element containing |
| * ::hsa_amd_memory_pool_link_info_t. |
| */ |
| HSA_AMD_AGENT_MEMORY_POOL_INFO_LINK_INFO = 2 |
| |
| } hsa_amd_agent_memory_pool_info_t; |
| |
| /** |
| * @brief Get the current value of an attribute of the relationship between an |
| * agent and a memory pool. |
| * |
| * @param[in] agent Agent. |
| * |
| * @param[in] memory_pool Memory pool. |
| * |
| * @param[in] attribute Attribute to query. |
| * |
| * @param[out] value Pointer to a application-allocated buffer where to store |
| * the value of the attribute. If the buffer passed by the application is not |
| * large enough to hold the value of @p attribute, the behavior is undefined. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| */ |
| hsa_status_t HSA_API hsa_amd_agent_memory_pool_get_info( |
| hsa_agent_t agent, hsa_amd_memory_pool_t memory_pool, |
| hsa_amd_agent_memory_pool_info_t attribute, void* value); |
| |
| /** |
| * @brief Enable direct access to a buffer from a given set of agents. |
| * |
| * @details |
| * |
| * Upon return, only the listed agents and the agent associated with the |
| * buffer's memory pool have direct access to the @p ptr. |
| * |
| * Any agent that has access to the buffer before and after the call to |
| * ::hsa_amd_agents_allow_access will also have access while |
| * ::hsa_amd_agents_allow_access is in progress. |
| * |
| * The caller is responsible for ensuring that each agent in the list |
| * must be able to access the memory pool containing @p ptr |
| * (using ::hsa_amd_agent_memory_pool_get_info with ::HSA_AMD_AGENT_MEMORY_POOL_INFO_ACCESS attribute), |
| * otherwise error code is returned. |
| * |
| * @param[in] num_agents Size of @p agents. |
| * |
| * @param[in] agents List of agents. If @p num_agents is 0, this argument is |
| * ignored. |
| * |
| * @param[in] flags A list of bit-field that is used to specify access |
| * information in a per-agent basis. This is currently reserved and must be NULL. |
| * |
| * @param[in] ptr A buffer previously allocated using ::hsa_amd_memory_pool_allocate. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p num_agents is 0, or @p agents |
| * is NULL, @p flags is not NULL, or attempting to enable access to agent(s) |
| * because @p ptr is allocated from an inaccessible pool. |
| * |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_agents_allow_access(uint32_t num_agents, const hsa_agent_t* agents, |
| const uint32_t* flags, const void* ptr); |
| |
| /** |
| * @brief Query if buffers currently located in some memory pool can be |
| * relocated to a destination memory pool. |
| * |
| * @details If the returned value is non-zero, a migration of a buffer to @p |
| * dst_memory_pool using ::hsa_amd_memory_migrate may nevertheless fail due to |
| * resource limitations. |
| * |
| * @param[in] src_memory_pool Source memory pool. |
| * |
| * @param[in] dst_memory_pool Destination memory pool. |
| * |
| * @param[out] result Pointer to a memory location where the result of the query |
| * is stored. Must not be NULL. If buffers currently located in @p |
| * src_memory_pool can be relocated to @p dst_memory_pool, the result is |
| * true. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL One of the memory pools is |
| * invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p result is NULL. |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_memory_pool_can_migrate(hsa_amd_memory_pool_t src_memory_pool, |
| hsa_amd_memory_pool_t dst_memory_pool, |
| bool* result); |
| |
| /** |
| * @brief Relocate a buffer to a new memory pool. |
| * |
| * @details When a buffer is migrated, its virtual address remains the same but |
| * its physical contents are moved to the indicated memory pool. |
| * |
| * After migration, only the agent associated with the destination pool will have access. |
| * |
| * The caller is also responsible for ensuring that the allocation in the |
| * source memory pool where the buffer is currently located can be migrated to the |
| * specified destination memory pool (using ::hsa_amd_memory_pool_can_migrate returns a value of true |
| * for the source and destination memory pools), otherwise behavior is undefined. |
| * |
| * The caller must ensure that the buffer is not accessed while it is migrated. |
| * |
| * @param[in] ptr Buffer to be relocated. The buffer must have been released to system |
| * prior to call this API. The buffer will be released to system upon completion. |
| * |
| * @param[in] memory_pool Memory pool where to place the buffer. |
| * |
| * @param[in] flags A bit-field that is used to specify migration |
| * information. Must be zero. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL The destination memory pool is |
| * invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES There is a failure in |
| * allocating the necessary resources. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p flags is not 0. |
| */ |
| hsa_status_t HSA_API hsa_amd_memory_migrate(const void* ptr, |
| hsa_amd_memory_pool_t memory_pool, |
| uint32_t flags); |
| |
| /** |
| * |
| * @brief Pin a host pointer allocated by C/C++ or OS allocator (i.e. ordinary system DRAM) and |
| * return a new pointer accessible by the @p agents. If the @p host_ptr overlaps with previously |
| * locked memory, then the overlap area is kept locked (i.e multiple mappings are permitted). In |
| * this case, the same input @p host_ptr may give different locked @p agent_ptr and when it does, |
| * they are not necessarily coherent (i.e. accessing either @p agent_ptr is not equivalent). |
| * Accesses to @p agent_ptr are coarse grained. |
| * |
| * @param[in] host_ptr A buffer allocated by C/C++ or OS allocator. |
| * |
| * @param[in] size The size to be locked. |
| * |
| * @param[in] agents Array of agent handle to gain access to the @p host_ptr. |
| * If this parameter is NULL and the @p num_agent is 0, all agents |
| * in the platform will gain access to the @p host_ptr. |
| * |
| * @param[out] agent_ptr Pointer to the location where to store the new address. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES There is a failure in |
| * allocating the necessary resources. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT One or more agent in @p agents is |
| * invalid. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is 0 or @p host_ptr or |
| * @p agent_ptr is NULL or @p agents not NULL but @p num_agent is 0 or @p agents |
| * is NULL but @p num_agent is not 0. |
| */ |
| hsa_status_t HSA_API hsa_amd_memory_lock(void* host_ptr, size_t size, |
| hsa_agent_t* agents, int num_agent, |
| void** agent_ptr); |
| |
| /** |
| * |
| * @brief Pin a host pointer allocated by C/C++ or OS allocator (i.e. ordinary system DRAM) and |
| * return a new pointer accessible by the @p agents. If the @p host_ptr overlaps with previously |
| * locked memory, then the overlap area is kept locked (i.e. multiple mappings are permitted). |
| * In this case, the same input @p host_ptr may give different locked @p agent_ptr and when it |
| * does, they are not necessarily coherent (i.e. accessing either @p agent_ptr is not equivalent). |
| * Acesses to the memory via @p agent_ptr have the same access properties as memory allocated from |
| * @p pool as determined by ::hsa_amd_memory_pool_get_info and ::hsa_amd_agent_memory_pool_get_info |
| * (ex. coarse/fine grain, platform atomic support, link info). Physical composition and placement |
| * of the memory (ex. page size, NUMA binding) is not changed. |
| * |
| * @param[in] host_ptr A buffer allocated by C/C++ or OS allocator. |
| * |
| * @param[in] size The size to be locked. |
| * |
| * @param[in] agents Array of agent handle to gain access to the @p host_ptr. |
| * If this parameter is NULL and the @p num_agent is 0, all agents |
| * in the platform will gain access to the @p host_ptr. |
| * |
| * @param[in] pool Global memory pool owned by a CPU agent. |
| * |
| * @param[in] flags A bit-field that is used to specify allocation |
| * directives. Reserved parameter, must be 0. |
| * |
| * @param[out] agent_ptr Pointer to the location where to store the new address. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES There is a failure in |
| * allocating the necessary resources. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_AGENT One or more agent in @p agents is |
| * invalid or can not access @p pool. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_MEMORY_POOL @p pool is invalid or not owned |
| * by a CPU agent. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p size is 0 or @p host_ptr or |
| * @p agent_ptr is NULL or @p agents not NULL but @p num_agent is 0 or @p agents |
| * is NULL but @p num_agent is not 0 or flags is not 0. |
| */ |
| hsa_status_t HSA_API hsa_amd_memory_lock_to_pool(void* host_ptr, size_t size, hsa_agent_t* agents, |
| int num_agent, hsa_amd_memory_pool_t pool, |
| uint32_t flags, void** agent_ptr); |
| |
| /** |
| * |
| * @brief Unpin the host pointer previously pinned via ::hsa_amd_memory_lock or |
| * ::hsa_amd_memory_lock_to_pool. |
| * |
| * @details The behavior is undefined if the host pointer being unpinned does not |
| * match previous pinned address or if the host pointer was already deallocated. |
| * |
| * @param[in] host_ptr A buffer allocated by C/C++ or OS allocator that was |
| * pinned previously via ::hsa_amd_memory_lock or ::hsa_amd_memory_lock_to_pool. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| */ |
| hsa_status_t HSA_API hsa_amd_memory_unlock(void* host_ptr); |
| |
| /** |
| * @brief Sets the first @p count of uint32_t of the block of memory pointed by |
| * @p ptr to the specified @p value. |
| * |
| * @param[in] ptr Pointer to the block of memory to fill. |
| * |
| * @param[in] value Value to be set. |
| * |
| * @param[in] count Number of uint32_t element to be set to the value. |
| * |
| * @retval HSA_STATUS_SUCCESS The function has been executed successfully. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is NULL or |
| * not 4 bytes aligned |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ALLOCATION if the given memory |
| * region was not allocated with HSA runtime APIs. |
| * |
| */ |
| hsa_status_t HSA_API |
| hsa_amd_memory_fill(void* ptr, uint32_t value, size_t count); |
| |
| /** |
| * @brief Maps an interop object into the HSA flat address space and establishes |
| * memory residency. The metadata pointer is valid during the lifetime of the |
| * map (until hsa_amd_interop_unmap_buffer is called). |
| * Multiple calls to hsa_amd_interop_map_buffer with the same interop_handle |
| * result in multiple mappings with potentially different addresses and |
| * different metadata pointers. Concurrent operations on these addresses are |
| * not coherent. Memory must be fenced to system scope to ensure consistency, |
| * between mappings and with any views of this buffer in the originating |
| * software stack. |
| * |
| * @param[in] num_agents Number of agents which require access to the memory |
| * |
| * @param[in] agents List of accessing agents. |
| * |
| * @param[in] interop_handle Handle of interop buffer (dmabuf handle in Linux) |
| * |
| * @param [in] flags Reserved, must be 0 |
| * |
| * @param[out] size Size in bytes of the mapped object |
| * |
| * @param[out] ptr Base address of the mapped object |
| * |
| * @param[out] metadata_size Size of metadata in bytes, may be NULL |
| * |
| * @param[out] metadata Pointer to metadata, may be NULL |
| * |
| * @retval HSA_STATUS_SUCCESS if successfully mapped |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT all other errors |
| */ |
| hsa_status_t HSA_API hsa_amd_interop_map_buffer(uint32_t num_agents, |
| hsa_agent_t* agents, |
| int interop_handle, |
| uint32_t flags, |
| size_t* size, |
| void** ptr, |
| size_t* metadata_size, |
| const void** metadata); |
| |
| /** |
| * @brief Removes a previously mapped interop object from HSA's flat address space. |
| * Ends lifetime for the mapping's associated metadata pointer. |
| */ |
| hsa_status_t HSA_API hsa_amd_interop_unmap_buffer(void* ptr); |
| |
| /** |
| * @brief Encodes an opaque vendor specific image format. The length of data |
| * depends on the underlying format. This structure must not be copied as its |
| * true length can not be determined. |
| */ |
| typedef struct hsa_amd_image_descriptor_s { |
| /* |
| Version number of the descriptor |
| */ |
| uint32_t version; |
| |
| /* |
| Vendor and device PCI IDs for the format as VENDOR_ID<<16|DEVICE_ID. |
| */ |
| uint32_t deviceID; |
| |
| /* |
| Start of vendor specific data. |
| */ |
| uint32_t data[1]; |
| } hsa_amd_image_descriptor_t; |
| |
| /** |
| * @brief Creates an image from an opaque vendor specific image format. |
| * Does not modify data at image_data. Intended initially for |
| * accessing interop images. |
| * |
| * @param agent[in] Agent on which to create the image |
| * |
| * @param[in] image_descriptor[in] Vendor specific image format |
| * |
| * @param[in] image_data Pointer to image backing store |
| * |
| * @param[in] access_permission Access permissions for the image object |
| * |
| * @param[out] image Created image object. |
| * |
| * @retval HSA_STATUS_SUCCESS Image created successfully |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT Bad or mismatched descriptor, |
| * null image_data, or mismatched access_permission. |
| */ |
| hsa_status_t HSA_API hsa_amd_image_create( |
| hsa_agent_t agent, |
| const hsa_ext_image_descriptor_t *image_descriptor, |
| const hsa_amd_image_descriptor_t *image_layout, |
| const void *image_data, |
| hsa_access_permission_t access_permission, |
| hsa_ext_image_t *image |
| ); |
| |
| /** |
| * @brief Denotes the type of memory in a pointer info query. |
| */ |
| typedef enum { |
| /* |
| Memory is not known to the HSA driver. Unallocated or unlocked system memory. |
| */ |
| HSA_EXT_POINTER_TYPE_UNKNOWN = 0, |
| /* |
| Memory was allocated with an HSA memory allocator. |
| */ |
| HSA_EXT_POINTER_TYPE_HSA = 1, |
| /* |
| System memory which has been locked for use with an HSA agent. |
| |
| Memory of this type is normal malloc'd memory and is always accessible to |
| the CPU. Pointer info queries may not include CPU agents in the accessible |
| agents list as the CPU has implicit access. |
| */ |
| HSA_EXT_POINTER_TYPE_LOCKED = 2, |
| /* |
| Memory originated in a graphics component and is shared with ROCr. |
| */ |
| HSA_EXT_POINTER_TYPE_GRAPHICS = 3, |
| /* |
| Memory has been shared with the local process via ROCr IPC APIs. |
| */ |
| HSA_EXT_POINTER_TYPE_IPC = 4 |
| } hsa_amd_pointer_type_t; |
| |
| /** |
| * @brief Describes a memory allocation known to ROCr. |
| * Within a ROCr major version this structure can only grow. |
| */ |
| typedef struct hsa_amd_pointer_info_s { |
| /* |
| Size in bytes of this structure. Used for version control within a major ROCr |
| revision. Set to sizeof(hsa_amd_pointer_t) prior to calling |
| hsa_amd_pointer_info. If the runtime supports an older version of pointer |
| info then size will be smaller on return. Members starting after the return |
| value of size will not be updated by hsa_amd_pointer_info. |
| */ |
| uint32_t size; |
| /* |
| The type of allocation referenced. |
| */ |
| hsa_amd_pointer_type_t type; |
| /* |
| Base address at which non-host agents may access the allocation. |
| */ |
| void* agentBaseAddress; |
| /* |
| Base address at which the host agent may access the allocation. |
| */ |
| void* hostBaseAddress; |
| /* |
| Size of the allocation |
| */ |
| size_t sizeInBytes; |
| /* |
| Application provided value. |
| */ |
| void* userData; |
| /* |
| Reports an agent which "owns" (ie has preferred access to) the pool in which the allocation was |
| made. When multiple agents share equal access to a pool (ex: multiple CPU agents, or multi-die |
| GPU boards) any such agent may be returned. |
| */ |
| hsa_agent_t agentOwner; |
| } hsa_amd_pointer_info_t; |
| |
| /** |
| * @brief Retrieves information about the allocation referenced by the given |
| * pointer. Optionally returns the number and list of agents which can |
| * directly access the allocation. |
| * |
| * @param[in] ptr Pointer which references the allocation to retrieve info for. |
| * |
| * @param[in, out] info Pointer to structure to be filled with allocation info. |
| * Data member size must be set to the size of the structure prior to calling |
| * hsa_amd_pointer_info. On return size will be set to the size of the |
| * pointer info structure supported by the runtime, if smaller. Members |
| * beyond the returned value of size will not be updated by the API. |
| * Must not be NULL. |
| * |
| * @param[in] alloc Function pointer to an allocator used to allocate the |
| * @p accessible array. If NULL @p accessible will not be returned. |
| * |
| * @param[out] num_agents_accessible Recieves the count of agents in |
| * @p accessible. If NULL @p accessible will not be returned. |
| * |
| * @param[out] accessible Recieves a pointer to the array, allocated by @p alloc, |
| * holding the list of agents which may directly access the allocation. |
| * May be NULL. |
| * |
| * @retval HSA_STATUS_SUCCESS Info retrieved successfully |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT NULL in @p ptr or @p info. |
| */ |
| hsa_status_t HSA_API hsa_amd_pointer_info(void* ptr, |
| hsa_amd_pointer_info_t* info, |
| void* (*alloc)(size_t), |
| uint32_t* num_agents_accessible, |
| hsa_agent_t** accessible); |
| |
| /** |
| * @brief Associates an arbitrary pointer with an allocation known to ROCr. |
| * The pointer can be fetched by hsa_amd_pointer_info in the userData field. |
| * |
| * @param[in] ptr Pointer to the first byte of an allocation known to ROCr |
| * with which to associate @p userdata. |
| * |
| * @param[in] userdata Abitrary pointer to associate with the allocation. |
| * |
| * @retval HSA_STATUS_SUCCESS @p userdata successfully stored. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr is not known to ROCr. |
| */ |
| hsa_status_t HSA_API hsa_amd_pointer_info_set_userdata(void* ptr, |
| void* userdata); |
| |
| /** |
| * @brief 256-bit process independent identifier for a ROCr shared memory |
| * allocation. |
| */ |
| typedef struct hsa_amd_ipc_memory_s { |
| uint32_t handle[8]; |
| } hsa_amd_ipc_memory_t; |
| |
| /** |
| * @brief Prepares an allocation for interprocess sharing and creates a |
| * handle of type hsa_amd_ipc_memory_t uniquely identifying the allocation. A |
| * handle is valid while the allocation it references remains accessible in |
| * any process. In general applications should confirm that a shared memory |
| * region has been attached (via hsa_amd_ipc_memory_attach) in the remote |
| * process prior to releasing that memory in the local process. |
| * Repeated calls for the same allocation may, but are not required to, return |
| * unique handles. |
| * |
| * @param[in] ptr Pointer to memory allocated via ROCr APIs to prepare for |
| * sharing. |
| * |
| * @param[in] len Length in bytes of the allocation to share. |
| * |
| * @param[out] handle Process independent identifier referencing the shared |
| * allocation. |
| * |
| * @retval HSA_STATUS_SUCCESS allocation is prepared for interprocess sharing. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p ptr does not point to the |
| * first byte of an allocation made through ROCr, or len is not the full length |
| * of the allocation or handle is NULL. |
| */ |
| hsa_status_t HSA_API hsa_amd_ipc_memory_create(void* ptr, size_t len, |
| hsa_amd_ipc_memory_t* handle); |
| |
| /** |
| * @brief Imports shared memory into the local process and makes it accessible |
| * by the given agents. If a shared memory handle is attached multiple times |
| * in a process each attach may return a different address. Each returned |
| * address is refcounted and requires a matching number of calls to |
| * hsa_amd_ipc_memory_detach to release the shared memory mapping. |
| * |
| * @param[in] handle Pointer to the identifier for the shared memory. |
| * |
| * @param[in] len Length of the shared memory to import. |
| * Reserved. Must be the full length of the shared allocation in this version. |
| * |
| * @param[in] num_agents Count of agents in @p mapping_agents. |
| * May be zero if all agents are to be allowed access. |
| * |
| * @param[in] mapping_agents List of agents to access the shared memory. |
| * Ignored if @p num_agents is zero. |
| * |
| * @param[out] mapped_ptr Recieves a process local pointer to the shared memory. |
| * |
| * @retval HSA_STATUS_SUCCESS if memory is successfully imported. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p handle is not valid, @p len is |
| * incorrect, @p mapped_ptr is NULL, or some agent for which access was |
| * requested can not access the shared memory. |
| */ |
| hsa_status_t HSA_API hsa_amd_ipc_memory_attach( |
| const hsa_amd_ipc_memory_t* handle, size_t len, |
| uint32_t num_agents, |
| const hsa_agent_t* mapping_agents, |
| void** mapped_ptr); |
| |
| /** |
| * @brief Decrements the reference count for the shared memory mapping and |
| * releases access to shared memory imported with hsa_amd_ipc_memory_attach. |
| * |
| * @param[in] mapped_ptr Pointer to the first byte of a shared allocation |
| * imported with hsa_amd_ipc_memory_attach. |
| * |
| * @retval HSA_STATUS_SUCCESS if @p mapped_ptr was imported with |
| * hsa_amd_ipc_memory_attach. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p mapped_ptr was not imported |
| * with hsa_amd_ipc_memory_attach. |
| */ |
| hsa_status_t HSA_API hsa_amd_ipc_memory_detach(void* mapped_ptr); |
| |
| /** |
| * @brief 256-bit process independent identifier for a ROCr IPC signal. |
| */ |
| typedef hsa_amd_ipc_memory_t hsa_amd_ipc_signal_t; |
| |
| /** |
| * @brief Obtains an interprocess sharing handle for a signal. The handle is |
| * valid while the signal it references remains valid in any process. In |
| * general applications should confirm that the signal has been attached (via |
| * hsa_amd_ipc_signal_attach) in the remote process prior to destroying that |
| * signal in the local process. |
| * Repeated calls for the same signal may, but are not required to, return |
| * unique handles. |
| * |
| * @param[in] signal Signal created with attribute HSA_AMD_SIGNAL_IPC. |
| * |
| * @param[out] handle Process independent identifier referencing the shared |
| * signal. |
| * |
| * @retval HSA_STATUS_SUCCESS @p handle is ready to use for interprocess sharing. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p signal is not a valid signal |
| * created with attribute HSA_AMD_SIGNAL_IPC or handle is NULL. |
| */ |
| hsa_status_t HSA_API hsa_amd_ipc_signal_create(hsa_signal_t signal, hsa_amd_ipc_signal_t* handle); |
| |
| /** |
| * @brief Imports an IPC capable signal into the local process. If an IPC |
| * signal handle is attached multiple times in a process each attach may return |
| * a different signal handle. Each returned signal handle is refcounted and |
| * requires a matching number of calls to hsa_signal_destroy to release the |
| * shared signal. |
| * |
| * @param[in] handle Pointer to the identifier for the shared signal. |
| * |
| * @param[out] signal Recieves a process local signal handle to the shared signal. |
| * |
| * @retval HSA_STATUS_SUCCESS if the signal is successfully imported. |
| * |
| * @retval HSA_STATUS_ERROR_NOT_INITIALIZED if HSA is not initialized |
| * |
| * @retval HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p handle is not valid. |
| */ |
| hsa_status_t HSA_API hsa_amd_ipc_signal_attach(const hsa_amd_ipc_signal_t* handle, |
| hsa_signal_t* signal); |
| |
| /** |
| * @brief GPU system event type. |
| */ |
| typedef enum hsa_amd_event_type_s { |
| /* |
| AMD GPU memory fault. |
| */ |
| HSA_AMD_GPU_MEMORY_FAULT_EVENT = 0, |
| } hsa_amd_event_type_t; |
| |
| /** |
| * @brief Flags denoting the cause of a memory fault. |
| */ |
| typedef enum { |
| // Page not present or supervisor privilege. |
| HSA_AMD_MEMORY_FAULT_PAGE_NOT_PRESENT = 1 << 0, |
| // Write access to a read-only page. |
| HSA_AMD_MEMORY_FAULT_READ_ONLY = 1 << 1, |
| // Execute access to a page marked NX. |
| HSA_AMD_MEMORY_FAULT_NX = 1 << 2, |
| // GPU attempted access to a host only page. |
| HSA_AMD_MEMORY_FAULT_HOST_ONLY = 1 << 3, |
| // DRAM ECC failure. |
| HSA_AMD_MEMORY_FAULT_DRAM_ECC = 1 << 4, |
| // Can't determine the exact fault address. |
| HSA_AMD_MEMORY_FAULT_IMPRECISE = 1 << 5, |
| // SRAM ECC failure (ie registers, no fault address). |
| HSA_AMD_MEMORY_FAULT_SRAM_ECC = 1 << 6, |
| // GPU reset following unspecified hang. |
| HSA_AMD_MEMORY_FAULT_HANG = 1 << 31 |
| } hsa_amd_memory_fault_reason_t; |
| |
| /** |
| * @brief AMD GPU memory fault event data. |
| */ |
| typedef struct hsa_amd_gpu_memory_fault_info_s { |
| /* |
| The agent where the memory fault occurred. |
| */ |
| hsa_agent_t agent; |
| /* |
| Virtual address accessed. |
| */ |
| uint64_t virtual_address; |
| /* |
| Bit field encoding the memory access failure reasons. There could be multiple bits set |
| for one fault. Bits are defined in hsa_amd_memory_fault_reason_t. |
| */ |
| uint32_t fault_reason_mask; |
| } hsa_amd_gpu_memory_fault_info_t; |
| |
| /** |
| * @brief AMD GPU event data passed to event handler. |
| */ |
| typedef struct hsa_amd_event_s { |
| /* |
| The event type. |
| */ |
| hsa_amd_event_type_t event_type; |
| union { |
| /* |
| The memory fault info, only valid when @p event_type is HSA_AMD_GPU_MEMORY_FAULT_EVENT. |
| */ |
| hsa_amd_gpu_memory_fault_info_t memory_fault; |
| }; |
| } hsa_amd_event_t; |
| |
| typedef hsa_status_t (*hsa_amd_system_event_callback_t)(const hsa_amd_event_t* event, void* data); |
| |
| /** |
| * @brief Register AMD GPU event handler. |
| * |
| * @param[in] callback Callback to be invoked when an event is triggered. |
| * The HSA runtime passes two arguments to the callback: @p event |
| * is defined per event by the HSA runtime, and @p data is the user data. |
| * |
| * @param[in] data User data that is passed to @p callback. May be NULL. |
| * |
| * @retval HSA_STATUS_SUCCESS The handler has been registered successfully. |
| * |
| * @retval HSA_STATUS_ERROR An event handler has already been registered. |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT @p event is invalid. |
| */ |
| hsa_status_t HSA_API hsa_amd_register_system_event_handler(hsa_amd_system_event_callback_t callback, |
| void* data); |
| |
| /** |
| * @brief Per-queue dispatch and wavefront scheduling priority. |
| */ |
| typedef enum hsa_amd_queue_priority_s { |
| /* |
| Below normal/high priority compute and all graphics |
| */ |
| HSA_AMD_QUEUE_PRIORITY_LOW = 0, |
| /* |
| Above low priority compute, below high priority compute and all graphics |
| */ |
| HSA_AMD_QUEUE_PRIORITY_NORMAL = 1, |
| /* |
| Above low/normal priority compute and all graphics |
| */ |
| HSA_AMD_QUEUE_PRIORITY_HIGH = 2, |
| } hsa_amd_queue_priority_t; |
| |
| /** |
| * @brief Modifies the dispatch and wavefront scheduling prioirty for a |
| * given compute queue. The default is HSA_AMD_QUEUE_PRIORITY_NORMAL. |
| * |
| * @param[in] queue Compute queue to apply new priority to. |
| * |
| * @param[in] priority Priority to associate with queue. |
| * |
| * @retval HSA_STATUS_SUCCESS if priority was changed successfully. |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_QUEUE if queue is not a valid |
| * compute queue handle. |
| * |
| * @retval HSA_STATUS_ERROR_INVALID_ARGUMENT if priority is not a valid |
| * value from hsa_amd_queue_priority_t. |
| */ |
| hsa_status_t HSA_API hsa_amd_queue_set_priority(hsa_queue_t* queue, |
| hsa_amd_queue_priority_t priority); |
| |
| /** |
| * @brief Deallocation notifier function type. |
| */ |
| typedef void (*hsa_amd_deallocation_callback_t)(void* ptr, void* user_data); |
| |
| /** |
| * @brief Registers a deallocation notifier monitoring for release of agent |
| * accessible address @p ptr. If successful, @p callback will be invoked when |
| * @p ptr is removed from accessibility from all agents. |
| * |
| * Notification callbacks are automatically deregistered when they are invoked. |
| * |
| * Note: The current version supports notifications of address release |
| * originating from ::hsa_amd_memory_pool_free. Support for other address |
| * release APIs will follow. |
| * |
| * @param[in] ptr Agent accessible address to monitor for deallocation. Passed |
| * to @p callback. |
| * |
| * @param[in] callback Notifier to be invoked when @p ptr is released from |
| * agent accessibility. |
| * |
| * @param[in] user_data User provided value passed to @p callback. May be NULL. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The notifier registered successfully |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ALLOCATION @p ptr does not refer to a valid agent accessible |
| * address. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT @p callback is NULL or @p ptr is NULL. |
| * |
| * @retval ::HSA_STATUS_ERROR_OUT_OF_RESOURCES if there is a failure in allocating |
| * necessary resources |
| */ |
| hsa_status_t HSA_API hsa_amd_register_deallocation_callback(void* ptr, |
| hsa_amd_deallocation_callback_t callback, |
| void* user_data); |
| |
| /** |
| * @brief Removes a deallocation notifier previously registered with |
| * ::hsa_amd_register_deallocation_callback. Arguments must be identical to |
| * those given in ::hsa_amd_register_deallocation_callback. |
| * |
| * @param[in] ptr Agent accessible address which was monitored for deallocation. |
| * |
| * @param[in] callback Notifier to be removed. |
| * |
| * @retval ::HSA_STATUS_SUCCESS The notifier has been removed successfully. |
| * |
| * @retval ::HSA_STATUS_ERROR_NOT_INITIALIZED The HSA runtime has not been |
| * initialized. |
| * |
| * @retval ::HSA_STATUS_ERROR_INVALID_ARGUMENT The given notifier was not registered. |
| */ |
| hsa_status_t HSA_API hsa_amd_deregister_deallocation_callback(void* ptr, |
| hsa_amd_deallocation_callback_t callback); |
| |
| #ifdef __cplusplus |
| } // end extern "C" block |
| #endif |
| |
| #endif // header guard |