1184 lines
35 KiB
C
1184 lines
35 KiB
C
/*
|
||
* Copyright 2014 Advanced Micro Devices, Inc.
|
||
*
|
||
* Permission is hereby granted, free of charge, to any person obtaining a
|
||
* copy of this software and associated documentation files (the "Software"),
|
||
* to deal in the Software without restriction, including without limitation
|
||
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
||
* and/or sell copies of the Software, and to permit persons to whom the
|
||
* Software is furnished to do so, subject to the following conditions:
|
||
*
|
||
* The above copyright notice and this permission notice shall be included in
|
||
* all copies or substantial portions of the Software.
|
||
*
|
||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
||
* THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
|
||
* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
|
||
* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
|
||
* OTHER DEALINGS IN THE SOFTWARE.
|
||
*
|
||
*/
|
||
|
||
/**
|
||
* \file amdgpu.h
|
||
*
|
||
* Declare public libdrm_amdgpu API
|
||
*
|
||
* This file define API exposed by libdrm_amdgpu library.
|
||
* User wanted to use libdrm_amdgpu functionality must include
|
||
* this file.
|
||
*
|
||
*/
|
||
#ifndef _AMDGPU_H_
|
||
#define _AMDGPU_H_
|
||
|
||
#include <stdint.h>
|
||
#include <stdbool.h>
|
||
|
||
struct drm_amdgpu_info_hw_ip;
|
||
|
||
/*--------------------------------------------------------------------------*/
|
||
/* --------------------------- Defines ------------------------------------ */
|
||
/*--------------------------------------------------------------------------*/
|
||
|
||
/**
|
||
* Define max. number of Command Buffers (IB) which could be sent to the single
|
||
* hardware IP to accommodate CE/DE requirements
|
||
*
|
||
* \sa amdgpu_cs_ib_info
|
||
*/
|
||
#define AMDGPU_CS_MAX_IBS_PER_SUBMIT 4
|
||
|
||
/**
|
||
* Special timeout value meaning that the timeout is infinite.
|
||
*/
|
||
#define AMDGPU_TIMEOUT_INFINITE 0xffffffffffffffffull
|
||
|
||
/**
|
||
* Used in amdgpu_cs_query_fence_status(), meaning that the given timeout
|
||
* is absolute.
|
||
*/
|
||
#define AMDGPU_QUERY_FENCE_TIMEOUT_IS_ABSOLUTE (1 << 0)
|
||
|
||
/*--------------------------------------------------------------------------*/
|
||
/* ----------------------------- Enums ------------------------------------ */
|
||
/*--------------------------------------------------------------------------*/
|
||
|
||
/**
|
||
* Enum describing possible handle types
|
||
*
|
||
* \sa amdgpu_bo_import, amdgpu_bo_export
|
||
*
|
||
*/
|
||
enum amdgpu_bo_handle_type {
|
||
/** GEM flink name (needs DRM authentication, used by DRI2) */
|
||
amdgpu_bo_handle_type_gem_flink_name = 0,
|
||
|
||
/** KMS handle which is used by all driver ioctls */
|
||
amdgpu_bo_handle_type_kms = 1,
|
||
|
||
/** DMA-buf fd handle */
|
||
amdgpu_bo_handle_type_dma_buf_fd = 2
|
||
};
|
||
|
||
/** Define known types of GPU VM VA ranges */
|
||
enum amdgpu_gpu_va_range
|
||
{
|
||
/** Allocate from "normal"/general range */
|
||
amdgpu_gpu_va_range_general = 0
|
||
};
|
||
|
||
/*--------------------------------------------------------------------------*/
|
||
/* -------------------------- Datatypes ----------------------------------- */
|
||
/*--------------------------------------------------------------------------*/
|
||
|
||
/**
|
||
* Define opaque pointer to context associated with fd.
|
||
* This context will be returned as the result of
|
||
* "initialize" function and should be pass as the first
|
||
* parameter to any API call
|
||
*/
|
||
typedef struct amdgpu_device *amdgpu_device_handle;
|
||
|
||
/**
|
||
* Define GPU Context type as pointer to opaque structure
|
||
* Example of GPU Context is the "rendering" context associated
|
||
* with OpenGL context (glCreateContext)
|
||
*/
|
||
typedef struct amdgpu_context *amdgpu_context_handle;
|
||
|
||
/**
|
||
* Define handle for amdgpu resources: buffer, GDS, etc.
|
||
*/
|
||
typedef struct amdgpu_bo *amdgpu_bo_handle;
|
||
|
||
/**
|
||
* Define handle for list of BOs
|
||
*/
|
||
typedef struct amdgpu_bo_list *amdgpu_bo_list_handle;
|
||
|
||
/**
|
||
* Define handle to be used to work with VA allocated ranges
|
||
*/
|
||
typedef struct amdgpu_va *amdgpu_va_handle;
|
||
|
||
/*--------------------------------------------------------------------------*/
|
||
/* -------------------------- Structures ---------------------------------- */
|
||
/*--------------------------------------------------------------------------*/
|
||
|
||
/**
|
||
* Structure describing memory allocation request
|
||
*
|
||
* \sa amdgpu_bo_alloc()
|
||
*
|
||
*/
|
||
struct amdgpu_bo_alloc_request {
|
||
/** Allocation request. It must be aligned correctly. */
|
||
uint64_t alloc_size;
|
||
|
||
/**
|
||
* It may be required to have some specific alignment requirements
|
||
* for physical back-up storage (e.g. for displayable surface).
|
||
* If 0 there is no special alignment requirement
|
||
*/
|
||
uint64_t phys_alignment;
|
||
|
||
/**
|
||
* UMD should specify where to allocate memory and how it
|
||
* will be accessed by the CPU.
|
||
*/
|
||
uint32_t preferred_heap;
|
||
|
||
/** Additional flags passed on allocation */
|
||
uint64_t flags;
|
||
};
|
||
|
||
/**
|
||
* Special UMD specific information associated with buffer.
|
||
*
|
||
* It may be need to pass some buffer charactersitic as part
|
||
* of buffer sharing. Such information are defined UMD and
|
||
* opaque for libdrm_amdgpu as well for kernel driver.
|
||
*
|
||
* \sa amdgpu_bo_set_metadata(), amdgpu_bo_query_info,
|
||
* amdgpu_bo_import(), amdgpu_bo_export
|
||
*
|
||
*/
|
||
struct amdgpu_bo_metadata {
|
||
/** Special flag associated with surface */
|
||
uint64_t flags;
|
||
|
||
/**
|
||
* ASIC-specific tiling information (also used by DCE).
|
||
* The encoding is defined by the AMDGPU_TILING_* definitions.
|
||
*/
|
||
uint64_t tiling_info;
|
||
|
||
/** Size of metadata associated with the buffer, in bytes. */
|
||
uint32_t size_metadata;
|
||
|
||
/** UMD specific metadata. Opaque for kernel */
|
||
uint32_t umd_metadata[64];
|
||
};
|
||
|
||
/**
|
||
* Structure describing allocated buffer. Client may need
|
||
* to query such information as part of 'sharing' buffers mechanism
|
||
*
|
||
* \sa amdgpu_bo_set_metadata(), amdgpu_bo_query_info(),
|
||
* amdgpu_bo_import(), amdgpu_bo_export()
|
||
*/
|
||
struct amdgpu_bo_info {
|
||
/** Allocated memory size */
|
||
uint64_t alloc_size;
|
||
|
||
/**
|
||
* It may be required to have some specific alignment requirements
|
||
* for physical back-up storage.
|
||
*/
|
||
uint64_t phys_alignment;
|
||
|
||
/** Heap where to allocate memory. */
|
||
uint32_t preferred_heap;
|
||
|
||
/** Additional allocation flags. */
|
||
uint64_t alloc_flags;
|
||
|
||
/** Metadata associated with buffer if any. */
|
||
struct amdgpu_bo_metadata metadata;
|
||
};
|
||
|
||
/**
|
||
* Structure with information about "imported" buffer
|
||
*
|
||
* \sa amdgpu_bo_import()
|
||
*
|
||
*/
|
||
struct amdgpu_bo_import_result {
|
||
/** Handle of memory/buffer to use */
|
||
amdgpu_bo_handle buf_handle;
|
||
|
||
/** Buffer size */
|
||
uint64_t alloc_size;
|
||
};
|
||
|
||
/**
|
||
*
|
||
* Structure to describe GDS partitioning information.
|
||
* \note OA and GWS resources are asscoiated with GDS partition
|
||
*
|
||
* \sa amdgpu_gpu_resource_query_gds_info
|
||
*
|
||
*/
|
||
struct amdgpu_gds_resource_info {
|
||
uint32_t gds_gfx_partition_size;
|
||
uint32_t compute_partition_size;
|
||
uint32_t gds_total_size;
|
||
uint32_t gws_per_gfx_partition;
|
||
uint32_t gws_per_compute_partition;
|
||
uint32_t oa_per_gfx_partition;
|
||
uint32_t oa_per_compute_partition;
|
||
};
|
||
|
||
/**
|
||
* Structure describing CS fence
|
||
*
|
||
* \sa amdgpu_cs_query_fence_status(), amdgpu_cs_request, amdgpu_cs_submit()
|
||
*
|
||
*/
|
||
struct amdgpu_cs_fence {
|
||
|
||
/** In which context IB was sent to execution */
|
||
amdgpu_context_handle context;
|
||
|
||
/** To which HW IP type the fence belongs */
|
||
uint32_t ip_type;
|
||
|
||
/** IP instance index if there are several IPs of the same type. */
|
||
uint32_t ip_instance;
|
||
|
||
/** Ring index of the HW IP */
|
||
uint32_t ring;
|
||
|
||
/** Specify fence for which we need to check submission status.*/
|
||
uint64_t fence;
|
||
};
|
||
|
||
/**
|
||
* Structure describing IB
|
||
*
|
||
* \sa amdgpu_cs_request, amdgpu_cs_submit()
|
||
*
|
||
*/
|
||
struct amdgpu_cs_ib_info {
|
||
/** Special flags */
|
||
uint64_t flags;
|
||
|
||
/** Virtual MC address of the command buffer */
|
||
uint64_t ib_mc_address;
|
||
|
||
/**
|
||
* Size of Command Buffer to be submitted.
|
||
* - The size is in units of dwords (4 bytes).
|
||
* - Could be 0
|
||
*/
|
||
uint32_t size;
|
||
};
|
||
|
||
/**
|
||
* Structure describing fence information
|
||
*
|
||
* \sa amdgpu_cs_request, amdgpu_cs_query_fence,
|
||
* amdgpu_cs_submit(), amdgpu_cs_query_fence_status()
|
||
*/
|
||
struct amdgpu_cs_fence_info {
|
||
/** buffer object for the fence */
|
||
amdgpu_bo_handle handle;
|
||
|
||
/** fence offset in the unit of sizeof(uint64_t) */
|
||
uint64_t offset;
|
||
};
|
||
|
||
/**
|
||
* Structure describing submission request
|
||
*
|
||
* \note We could have several IBs as packet. e.g. CE, CE, DE case for gfx
|
||
*
|
||
* \sa amdgpu_cs_submit()
|
||
*/
|
||
struct amdgpu_cs_request {
|
||
/** Specify flags with additional information */
|
||
uint64_t flags;
|
||
|
||
/** Specify HW IP block type to which to send the IB. */
|
||
unsigned ip_type;
|
||
|
||
/** IP instance index if there are several IPs of the same type. */
|
||
unsigned ip_instance;
|
||
|
||
/**
|
||
* Specify ring index of the IP. We could have several rings
|
||
* in the same IP. E.g. 0 for SDMA0 and 1 for SDMA1.
|
||
*/
|
||
uint32_t ring;
|
||
|
||
/**
|
||
* List handle with resources used by this request.
|
||
*/
|
||
amdgpu_bo_list_handle resources;
|
||
|
||
/**
|
||
* Number of dependencies this Command submission needs to
|
||
* wait for before starting execution.
|
||
*/
|
||
uint32_t number_of_dependencies;
|
||
|
||
/**
|
||
* Array of dependencies which need to be met before
|
||
* execution can start.
|
||
*/
|
||
struct amdgpu_cs_fence *dependencies;
|
||
|
||
/** Number of IBs to submit in the field ibs. */
|
||
uint32_t number_of_ibs;
|
||
|
||
/**
|
||
* IBs to submit. Those IBs will be submit together as single entity
|
||
*/
|
||
struct amdgpu_cs_ib_info *ibs;
|
||
|
||
/**
|
||
* The returned sequence number for the command submission
|
||
*/
|
||
uint64_t seq_no;
|
||
|
||
/**
|
||
* The fence information
|
||
*/
|
||
struct amdgpu_cs_fence_info fence_info;
|
||
};
|
||
|
||
/**
|
||
* Structure which provide information about GPU VM MC Address space
|
||
* alignments requirements
|
||
*
|
||
* \sa amdgpu_query_buffer_size_alignment
|
||
*/
|
||
struct amdgpu_buffer_size_alignments {
|
||
/** Size alignment requirement for allocation in
|
||
* local memory */
|
||
uint64_t size_local;
|
||
|
||
/**
|
||
* Size alignment requirement for allocation in remote memory
|
||
*/
|
||
uint64_t size_remote;
|
||
};
|
||
|
||
/**
|
||
* Structure which provide information about heap
|
||
*
|
||
* \sa amdgpu_query_heap_info()
|
||
*
|
||
*/
|
||
struct amdgpu_heap_info {
|
||
/** Theoretical max. available memory in the given heap */
|
||
uint64_t heap_size;
|
||
|
||
/**
|
||
* Number of bytes allocated in the heap. This includes all processes
|
||
* and private allocations in the kernel. It changes when new buffers
|
||
* are allocated, freed, and moved. It cannot be larger than
|
||
* heap_size.
|
||
*/
|
||
uint64_t heap_usage;
|
||
|
||
/**
|
||
* Theoretical possible max. size of buffer which
|
||
* could be allocated in the given heap
|
||
*/
|
||
uint64_t max_allocation;
|
||
};
|
||
|
||
/**
|
||
* Describe GPU h/w info needed for UMD correct initialization
|
||
*
|
||
* \sa amdgpu_query_gpu_info()
|
||
*/
|
||
struct amdgpu_gpu_info {
|
||
/** Asic id */
|
||
uint32_t asic_id;
|
||
/** Chip revision */
|
||
uint32_t chip_rev;
|
||
/** Chip external revision */
|
||
uint32_t chip_external_rev;
|
||
/** Family ID */
|
||
uint32_t family_id;
|
||
/** Special flags */
|
||
uint64_t ids_flags;
|
||
/** max engine clock*/
|
||
uint64_t max_engine_clk;
|
||
/** max memory clock */
|
||
uint64_t max_memory_clk;
|
||
/** number of shader engines */
|
||
uint32_t num_shader_engines;
|
||
/** number of shader arrays per engine */
|
||
uint32_t num_shader_arrays_per_engine;
|
||
/** Number of available good shader pipes */
|
||
uint32_t avail_quad_shader_pipes;
|
||
/** Max. number of shader pipes.(including good and bad pipes */
|
||
uint32_t max_quad_shader_pipes;
|
||
/** Number of parameter cache entries per shader quad pipe */
|
||
uint32_t cache_entries_per_quad_pipe;
|
||
/** Number of available graphics context */
|
||
uint32_t num_hw_gfx_contexts;
|
||
/** Number of render backend pipes */
|
||
uint32_t rb_pipes;
|
||
/** Enabled render backend pipe mask */
|
||
uint32_t enabled_rb_pipes_mask;
|
||
/** Frequency of GPU Counter */
|
||
uint32_t gpu_counter_freq;
|
||
/** CC_RB_BACKEND_DISABLE.BACKEND_DISABLE per SE */
|
||
uint32_t backend_disable[4];
|
||
/** Value of MC_ARB_RAMCFG register*/
|
||
uint32_t mc_arb_ramcfg;
|
||
/** Value of GB_ADDR_CONFIG */
|
||
uint32_t gb_addr_cfg;
|
||
/** Values of the GB_TILE_MODE0..31 registers */
|
||
uint32_t gb_tile_mode[32];
|
||
/** Values of GB_MACROTILE_MODE0..15 registers */
|
||
uint32_t gb_macro_tile_mode[16];
|
||
/** Value of PA_SC_RASTER_CONFIG register per SE */
|
||
uint32_t pa_sc_raster_cfg[4];
|
||
/** Value of PA_SC_RASTER_CONFIG_1 register per SE */
|
||
uint32_t pa_sc_raster_cfg1[4];
|
||
/* CU info */
|
||
uint32_t cu_active_number;
|
||
uint32_t cu_ao_mask;
|
||
uint32_t cu_bitmap[4][4];
|
||
/* video memory type info*/
|
||
uint32_t vram_type;
|
||
/* video memory bit width*/
|
||
uint32_t vram_bit_width;
|
||
/** constant engine ram size*/
|
||
uint32_t ce_ram_size;
|
||
/* vce harvesting instance */
|
||
uint32_t vce_harvest_config;
|
||
/* PCI revision ID */
|
||
uint32_t pci_rev_id;
|
||
};
|
||
|
||
|
||
/*--------------------------------------------------------------------------*/
|
||
/*------------------------- Functions --------------------------------------*/
|
||
/*--------------------------------------------------------------------------*/
|
||
|
||
/*
|
||
* Initialization / Cleanup
|
||
*
|
||
*/
|
||
|
||
/**
|
||
*
|
||
* \param fd - \c [in] File descriptor for AMD GPU device
|
||
* received previously as the result of
|
||
* e.g. drmOpen() call.
|
||
* For legacy fd type, the DRI2/DRI3
|
||
* authentication should be done before
|
||
* calling this function.
|
||
* \param major_version - \c [out] Major version of library. It is assumed
|
||
* that adding new functionality will cause
|
||
* increase in major version
|
||
* \param minor_version - \c [out] Minor version of library
|
||
* \param device_handle - \c [out] Pointer to opaque context which should
|
||
* be passed as the first parameter on each
|
||
* API call
|
||
*
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*
|
||
* \sa amdgpu_device_deinitialize()
|
||
*/
|
||
int amdgpu_device_initialize(int fd,
|
||
uint32_t *major_version,
|
||
uint32_t *minor_version,
|
||
amdgpu_device_handle *device_handle);
|
||
|
||
/**
|
||
*
|
||
* When access to such library does not needed any more the special
|
||
* function must be call giving opportunity to clean up any
|
||
* resources if needed.
|
||
*
|
||
* \param device_handle - \c [in] Context associated with file
|
||
* descriptor for AMD GPU device
|
||
* received previously as the
|
||
* result e.g. of drmOpen() call.
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_device_initialize()
|
||
*
|
||
*/
|
||
int amdgpu_device_deinitialize(amdgpu_device_handle device_handle);
|
||
|
||
/*
|
||
* Memory Management
|
||
*
|
||
*/
|
||
|
||
/**
|
||
* Allocate memory to be used by UMD for GPU related operations
|
||
*
|
||
* \param dev - \c [in] Device handle.
|
||
* See #amdgpu_device_initialize()
|
||
* \param alloc_buffer - \c [in] Pointer to the structure describing an
|
||
* allocation request
|
||
* \param buf_handle - \c [out] Allocated buffer handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_free()
|
||
*/
|
||
int amdgpu_bo_alloc(amdgpu_device_handle dev,
|
||
struct amdgpu_bo_alloc_request *alloc_buffer,
|
||
amdgpu_bo_handle *buf_handle);
|
||
|
||
/**
|
||
* Associate opaque data with buffer to be queried by another UMD
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param buf_handle - \c [in] Buffer handle
|
||
* \param info - \c [in] Metadata to associated with buffer
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*/
|
||
int amdgpu_bo_set_metadata(amdgpu_bo_handle buf_handle,
|
||
struct amdgpu_bo_metadata *info);
|
||
|
||
/**
|
||
* Query buffer information including metadata previusly associated with
|
||
* buffer.
|
||
*
|
||
* \param dev - \c [in] Device handle.
|
||
* See #amdgpu_device_initialize()
|
||
* \param buf_handle - \c [in] Buffer handle
|
||
* \param info - \c [out] Structure describing buffer
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_set_metadata(), amdgpu_bo_alloc()
|
||
*/
|
||
int amdgpu_bo_query_info(amdgpu_bo_handle buf_handle,
|
||
struct amdgpu_bo_info *info);
|
||
|
||
/**
|
||
* Allow others to get access to buffer
|
||
*
|
||
* \param dev - \c [in] Device handle.
|
||
* See #amdgpu_device_initialize()
|
||
* \param buf_handle - \c [in] Buffer handle
|
||
* \param type - \c [in] Type of handle requested
|
||
* \param shared_handle - \c [out] Special "shared" handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_import()
|
||
*
|
||
*/
|
||
int amdgpu_bo_export(amdgpu_bo_handle buf_handle,
|
||
enum amdgpu_bo_handle_type type,
|
||
uint32_t *shared_handle);
|
||
|
||
/**
|
||
* Request access to "shared" buffer
|
||
*
|
||
* \param dev - \c [in] Device handle.
|
||
* See #amdgpu_device_initialize()
|
||
* \param type - \c [in] Type of handle requested
|
||
* \param shared_handle - \c [in] Shared handle received as result "import"
|
||
* operation
|
||
* \param output - \c [out] Pointer to structure with information
|
||
* about imported buffer
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \note Buffer must be "imported" only using new "fd" (different from
|
||
* one used by "exporter").
|
||
*
|
||
* \sa amdgpu_bo_export()
|
||
*
|
||
*/
|
||
int amdgpu_bo_import(amdgpu_device_handle dev,
|
||
enum amdgpu_bo_handle_type type,
|
||
uint32_t shared_handle,
|
||
struct amdgpu_bo_import_result *output);
|
||
|
||
/**
|
||
* Request GPU access to user allocated memory e.g. via "malloc"
|
||
*
|
||
* \param dev - [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param cpu - [in] CPU address of user allocated memory which we
|
||
* want to map to GPU address space (make GPU accessible)
|
||
* (This address must be correctly aligned).
|
||
* \param size - [in] Size of allocation (must be correctly aligned)
|
||
* \param buf_handle - [out] Buffer handle for the userptr memory
|
||
* resource on submission and be used in other operations.
|
||
*
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \note
|
||
* This call doesn't guarantee that such memory will be persistently
|
||
* "locked" / make non-pageable. The purpose of this call is to provide
|
||
* opportunity for GPU get access to this resource during submission.
|
||
*
|
||
* The maximum amount of memory which could be mapped in this call depends
|
||
* if overcommit is disabled or not. If overcommit is disabled than the max.
|
||
* amount of memory to be pinned will be limited by left "free" size in total
|
||
* amount of memory which could be locked simultaneously ("GART" size).
|
||
*
|
||
* Supported (theoretical) max. size of mapping is restricted only by
|
||
* "GART" size.
|
||
*
|
||
* It is responsibility of caller to correctly specify access rights
|
||
* on VA assignment.
|
||
*/
|
||
int amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
|
||
void *cpu, uint64_t size,
|
||
amdgpu_bo_handle *buf_handle);
|
||
|
||
/**
|
||
* Free previosuly allocated memory
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param buf_handle - \c [in] Buffer handle to free
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \note In the case of memory shared between different applications all
|
||
* resources will be “physically” freed only all such applications
|
||
* will be terminated
|
||
* \note If is UMD responsibility to ‘free’ buffer only when there is no
|
||
* more GPU access
|
||
*
|
||
* \sa amdgpu_bo_set_metadata(), amdgpu_bo_alloc()
|
||
*
|
||
*/
|
||
int amdgpu_bo_free(amdgpu_bo_handle buf_handle);
|
||
|
||
/**
|
||
* Request CPU access to GPU accessable memory
|
||
*
|
||
* \param buf_handle - \c [in] Buffer handle
|
||
* \param cpu - \c [out] CPU address to be used for access
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_cpu_unmap()
|
||
*
|
||
*/
|
||
int amdgpu_bo_cpu_map(amdgpu_bo_handle buf_handle, void **cpu);
|
||
|
||
/**
|
||
* Release CPU access to GPU memory
|
||
*
|
||
* \param buf_handle - \c [in] Buffer handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_cpu_map()
|
||
*
|
||
*/
|
||
int amdgpu_bo_cpu_unmap(amdgpu_bo_handle buf_handle);
|
||
|
||
/**
|
||
* Wait until a buffer is not used by the device.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param buf_handle - \c [in] Buffer handle.
|
||
* \param timeout_ns - Timeout in nanoseconds.
|
||
* \param buffer_busy - 0 if buffer is idle, all GPU access was completed
|
||
* and no GPU access is scheduled.
|
||
* 1 GPU access is in fly or scheduled
|
||
*
|
||
* \return 0 - on success
|
||
* <0 - Negative POSIX Error code
|
||
*/
|
||
int amdgpu_bo_wait_for_idle(amdgpu_bo_handle buf_handle,
|
||
uint64_t timeout_ns,
|
||
bool *buffer_busy);
|
||
|
||
/**
|
||
* Creates a BO list handle for command submission.
|
||
*
|
||
* \param dev - \c [in] Device handle.
|
||
* See #amdgpu_device_initialize()
|
||
* \param number_of_resources - \c [in] Number of BOs in the list
|
||
* \param resources - \c [in] List of BO handles
|
||
* \param resource_prios - \c [in] Optional priority for each handle
|
||
* \param result - \c [out] Created BO list handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_list_destroy()
|
||
*/
|
||
int amdgpu_bo_list_create(amdgpu_device_handle dev,
|
||
uint32_t number_of_resources,
|
||
amdgpu_bo_handle *resources,
|
||
uint8_t *resource_prios,
|
||
amdgpu_bo_list_handle *result);
|
||
|
||
/**
|
||
* Destroys a BO list handle.
|
||
*
|
||
* \param handle - \c [in] BO list handle.
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_list_create()
|
||
*/
|
||
int amdgpu_bo_list_destroy(amdgpu_bo_list_handle handle);
|
||
|
||
/**
|
||
* Update resources for existing BO list
|
||
*
|
||
* \param handle - \c [in] BO list handle
|
||
* \param number_of_resources - \c [in] Number of BOs in the list
|
||
* \param resources - \c [in] List of BO handles
|
||
* \param resource_prios - \c [in] Optional priority for each handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_bo_list_update()
|
||
*/
|
||
int amdgpu_bo_list_update(amdgpu_bo_list_handle handle,
|
||
uint32_t number_of_resources,
|
||
amdgpu_bo_handle *resources,
|
||
uint8_t *resource_prios);
|
||
|
||
/*
|
||
* GPU Execution context
|
||
*
|
||
*/
|
||
|
||
/**
|
||
* Create GPU execution Context
|
||
*
|
||
* For the purpose of GPU Scheduler and GPU Robustness extensions it is
|
||
* necessary to have information/identify rendering/compute contexts.
|
||
* It also may be needed to associate some specific requirements with such
|
||
* contexts. Kernel driver will guarantee that submission from the same
|
||
* context will always be executed in order (first come, first serve).
|
||
*
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param context - \c [out] GPU Context handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_cs_ctx_free()
|
||
*
|
||
*/
|
||
int amdgpu_cs_ctx_create(amdgpu_device_handle dev,
|
||
amdgpu_context_handle *context);
|
||
|
||
/**
|
||
*
|
||
* Destroy GPU execution context when not needed any more
|
||
*
|
||
* \param context - \c [in] GPU Context handle
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_cs_ctx_create()
|
||
*
|
||
*/
|
||
int amdgpu_cs_ctx_free(amdgpu_context_handle context);
|
||
|
||
/**
|
||
* Query reset state for the specific GPU Context
|
||
*
|
||
* \param context - \c [in] GPU Context handle
|
||
* \param state - \c [out] One of AMDGPU_CTX_*_RESET
|
||
* \param hangs - \c [out] Number of hangs caused by the context.
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \sa amdgpu_cs_ctx_create()
|
||
*
|
||
*/
|
||
int amdgpu_cs_query_reset_state(amdgpu_context_handle context,
|
||
uint32_t *state, uint32_t *hangs);
|
||
|
||
/*
|
||
* Command Buffers Management
|
||
*
|
||
*/
|
||
|
||
/**
|
||
* Send request to submit command buffers to hardware.
|
||
*
|
||
* Kernel driver could use GPU Scheduler to make decision when physically
|
||
* sent this request to the hardware. Accordingly this request could be put
|
||
* in queue and sent for execution later. The only guarantee is that request
|
||
* from the same GPU context to the same ip:ip_instance:ring will be executed in
|
||
* order.
|
||
*
|
||
* The caller can specify the user fence buffer/location with the fence_info in the
|
||
* cs_request.The sequence number is returned via the 'seq_no' paramter
|
||
* in ibs_request structure.
|
||
*
|
||
*
|
||
* \param dev - \c [in] Device handle.
|
||
* See #amdgpu_device_initialize()
|
||
* \param context - \c [in] GPU Context
|
||
* \param flags - \c [in] Global submission flags
|
||
* \param ibs_request - \c [in/out] Pointer to submission requests.
|
||
* We could submit to the several
|
||
* engines/rings simulteniously as
|
||
* 'atomic' operation
|
||
* \param number_of_requests - \c [in] Number of submission requests
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \note It is required to pass correct resource list with buffer handles
|
||
* which will be accessible by command buffers from submission
|
||
* This will allow kernel driver to correctly implement "paging".
|
||
* Failure to do so will have unpredictable results.
|
||
*
|
||
* \sa amdgpu_command_buffer_alloc(), amdgpu_command_buffer_free(),
|
||
* amdgpu_cs_query_fence_status()
|
||
*
|
||
*/
|
||
int amdgpu_cs_submit(amdgpu_context_handle context,
|
||
uint64_t flags,
|
||
struct amdgpu_cs_request *ibs_request,
|
||
uint32_t number_of_requests);
|
||
|
||
/**
|
||
* Query status of Command Buffer Submission
|
||
*
|
||
* \param fence - \c [in] Structure describing fence to query
|
||
* \param timeout_ns - \c [in] Timeout value to wait
|
||
* \param flags - \c [in] Flags for the query
|
||
* \param expired - \c [out] If fence expired or not.\n
|
||
* 0 – if fence is not expired\n
|
||
* !0 - otherwise
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \note If UMD wants only to check operation status and returned immediately
|
||
* then timeout value as 0 must be passed. In this case success will be
|
||
* returned in the case if submission was completed or timeout error
|
||
* code.
|
||
*
|
||
* \sa amdgpu_cs_submit()
|
||
*/
|
||
int amdgpu_cs_query_fence_status(struct amdgpu_cs_fence *fence,
|
||
uint64_t timeout_ns,
|
||
uint64_t flags,
|
||
uint32_t *expired);
|
||
|
||
/*
|
||
* Query / Info API
|
||
*
|
||
*/
|
||
|
||
/**
|
||
* Query allocation size alignments
|
||
*
|
||
* UMD should query information about GPU VM MC size alignments requirements
|
||
* to be able correctly choose required allocation size and implement
|
||
* internal optimization if needed.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param info - \c [out] Pointer to structure to get size alignment
|
||
* requirements
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_query_buffer_size_alignment(amdgpu_device_handle dev,
|
||
struct amdgpu_buffer_size_alignments
|
||
*info);
|
||
|
||
/**
|
||
* Query firmware versions
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param fw_type - \c [in] AMDGPU_INFO_FW_*
|
||
* \param ip_instance - \c [in] Index of the IP block of the same type.
|
||
* \param index - \c [in] Index of the engine. (for SDMA and MEC)
|
||
* \param version - \c [out] Pointer to to the "version" return value
|
||
* \param feature - \c [out] Pointer to to the "feature" return value
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_query_firmware_version(amdgpu_device_handle dev, unsigned fw_type,
|
||
unsigned ip_instance, unsigned index,
|
||
uint32_t *version, uint32_t *feature);
|
||
|
||
/**
|
||
* Query the number of HW IP instances of a certain type.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param type - \c [in] Hardware IP block type = AMDGPU_HW_IP_*
|
||
* \param count - \c [out] Pointer to structure to get information
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*/
|
||
int amdgpu_query_hw_ip_count(amdgpu_device_handle dev, unsigned type,
|
||
uint32_t *count);
|
||
|
||
/**
|
||
* Query engine information
|
||
*
|
||
* This query allows UMD to query information different engines and their
|
||
* capabilities.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param type - \c [in] Hardware IP block type = AMDGPU_HW_IP_*
|
||
* \param ip_instance - \c [in] Index of the IP block of the same type.
|
||
* \param info - \c [out] Pointer to structure to get information
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*/
|
||
int amdgpu_query_hw_ip_info(amdgpu_device_handle dev, unsigned type,
|
||
unsigned ip_instance,
|
||
struct drm_amdgpu_info_hw_ip *info);
|
||
|
||
/**
|
||
* Query heap information
|
||
*
|
||
* This query allows UMD to query potentially available memory resources and
|
||
* adjust their logic if necessary.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param heap - \c [in] Heap type
|
||
* \param info - \c [in] Pointer to structure to get needed information
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_query_heap_info(amdgpu_device_handle dev, uint32_t heap,
|
||
uint32_t flags, struct amdgpu_heap_info *info);
|
||
|
||
/**
|
||
* Get the CRTC ID from the mode object ID
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param id - \c [in] Mode object ID
|
||
* \param result - \c [in] Pointer to the CRTC ID
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_query_crtc_from_id(amdgpu_device_handle dev, unsigned id,
|
||
int32_t *result);
|
||
|
||
/**
|
||
* Query GPU H/w Info
|
||
*
|
||
* Query hardware specific information
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param heap - \c [in] Heap type
|
||
* \param info - \c [in] Pointer to structure to get needed information
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_query_gpu_info(amdgpu_device_handle dev,
|
||
struct amdgpu_gpu_info *info);
|
||
|
||
/**
|
||
* Query hardware or driver information.
|
||
*
|
||
* The return size is query-specific and depends on the "info_id" parameter.
|
||
* No more than "size" bytes is returned.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param info_id - \c [in] AMDGPU_INFO_*
|
||
* \param size - \c [in] Size of the returned value.
|
||
* \param value - \c [out] Pointer to the return value.
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX error code
|
||
*
|
||
*/
|
||
int amdgpu_query_info(amdgpu_device_handle dev, unsigned info_id,
|
||
unsigned size, void *value);
|
||
|
||
/**
|
||
* Query information about GDS
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param gds_info - \c [out] Pointer to structure to get GDS information
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_query_gds_info(amdgpu_device_handle dev,
|
||
struct amdgpu_gds_resource_info *gds_info);
|
||
|
||
/**
|
||
* Read a set of consecutive memory-mapped registers.
|
||
* Not all registers are allowed to be read by userspace.
|
||
*
|
||
* \param dev - \c [in] Device handle. See #amdgpu_device_initialize(
|
||
* \param dword_offset - \c [in] Register offset in dwords
|
||
* \param count - \c [in] The number of registers to read starting
|
||
* from the offset
|
||
* \param instance - \c [in] GRBM_GFX_INDEX selector. It may have other
|
||
* uses. Set it to 0xffffffff if unsure.
|
||
* \param flags - \c [in] Flags with additional information.
|
||
* \param values - \c [out] The pointer to return values.
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX error code
|
||
*
|
||
*/
|
||
int amdgpu_read_mm_registers(amdgpu_device_handle dev, unsigned dword_offset,
|
||
unsigned count, uint32_t instance, uint32_t flags,
|
||
uint32_t *values);
|
||
|
||
/**
|
||
* Flag to request VA address range in the 32bit address space
|
||
*/
|
||
#define AMDGPU_VA_RANGE_32_BIT 0x1
|
||
|
||
/**
|
||
* Allocate virtual address range
|
||
*
|
||
* \param dev - [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param va_range_type - \c [in] Type of MC va range from which to allocate
|
||
* \param size - \c [in] Size of range. Size must be correctly* aligned.
|
||
* It is client responsibility to correctly aligned size based on the future
|
||
* usage of allocated range.
|
||
* \param va_base_alignment - \c [in] Overwrite base address alignment
|
||
* requirement for GPU VM MC virtual
|
||
* address assignment. Must be multiple of size alignments received as
|
||
* 'amdgpu_buffer_size_alignments'.
|
||
* If 0 use the default one.
|
||
* \param va_base_required - \c [in] Specified required va base address.
|
||
* If 0 then library choose available one.
|
||
* If !0 value will be passed and those value already "in use" then
|
||
* corresponding error status will be returned.
|
||
* \param va_base_allocated - \c [out] On return: Allocated VA base to be used
|
||
* by client.
|
||
* \param va_range_handle - \c [out] On return: Handle assigned to allocation
|
||
* \param flags - \c [in] flags for special VA range
|
||
*
|
||
* \return 0 on success\n
|
||
* >0 - AMD specific error code\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
* \notes \n
|
||
* It is client responsibility to correctly handle VA assignments and usage.
|
||
* Neither kernel driver nor libdrm_amdpgu are able to prevent and
|
||
* detect wrong va assignemnt.
|
||
*
|
||
* It is client responsibility to correctly handle multi-GPU cases and to pass
|
||
* the corresponding arrays of all devices handles where corresponding VA will
|
||
* be used.
|
||
*
|
||
*/
|
||
int amdgpu_va_range_alloc(amdgpu_device_handle dev,
|
||
enum amdgpu_gpu_va_range va_range_type,
|
||
uint64_t size,
|
||
uint64_t va_base_alignment,
|
||
uint64_t va_base_required,
|
||
uint64_t *va_base_allocated,
|
||
amdgpu_va_handle *va_range_handle,
|
||
uint64_t flags);
|
||
|
||
/**
|
||
* Free previously allocated virtual address range
|
||
*
|
||
*
|
||
* \param va_range_handle - \c [in] Handle assigned to VA allocation
|
||
*
|
||
* \return 0 on success\n
|
||
* >0 - AMD specific error code\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
int amdgpu_va_range_free(amdgpu_va_handle va_range_handle);
|
||
|
||
/**
|
||
* Query virtual address range
|
||
*
|
||
* UMD can query GPU VM range supported by each device
|
||
* to initialize its own VAM accordingly.
|
||
*
|
||
* \param dev - [in] Device handle. See #amdgpu_device_initialize()
|
||
* \param type - \c [in] Type of virtual address range
|
||
* \param offset - \c [out] Start offset of virtual address range
|
||
* \param size - \c [out] Size of virtual address range
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
|
||
int amdgpu_va_range_query(amdgpu_device_handle dev,
|
||
enum amdgpu_gpu_va_range type,
|
||
uint64_t *start,
|
||
uint64_t *end);
|
||
|
||
/**
|
||
* VA mapping/unmapping for the buffer object
|
||
*
|
||
* \param bo - \c [in] BO handle
|
||
* \param offset - \c [in] Start offset to map
|
||
* \param size - \c [in] Size to map
|
||
* \param addr - \c [in] Start virtual address.
|
||
* \param flags - \c [in] Supported flags for mapping/unmapping
|
||
* \param ops - \c [in] AMDGPU_VA_OP_MAP or AMDGPU_VA_OP_UNMAP
|
||
*
|
||
* \return 0 on success\n
|
||
* <0 - Negative POSIX Error code
|
||
*
|
||
*/
|
||
|
||
int amdgpu_bo_va_op(amdgpu_bo_handle bo,
|
||
uint64_t offset,
|
||
uint64_t size,
|
||
uint64_t addr,
|
||
uint64_t flags,
|
||
uint32_t ops);
|
||
|
||
#endif /* #ifdef _AMDGPU_H_ */
|