blob: 302f1dc418446dfbab272eb6c8934697651ef425 [file] [log] [blame]
Alex Deucher09361392015-04-20 12:04:22 -04001/*
2 * Copyright 2014 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22*/
23
24/**
25 * \file amdgpu.h
26 *
27 * Declare public libdrm_amdgpu API
28 *
29 * This file define API exposed by libdrm_amdgpu library.
30 * User wanted to use libdrm_amdgpu functionality must include
31 * this file.
32 *
33 */
34#ifndef _AMDGPU_H_
35#define _AMDGPU_H_
36
37#include <stdint.h>
38#include <stdbool.h>
39
40struct drm_amdgpu_info_hw_ip;
41
42/*--------------------------------------------------------------------------*/
43/* --------------------------- Defines ------------------------------------ */
44/*--------------------------------------------------------------------------*/
45
46/**
47 * Define max. number of Command Buffers (IB) which could be sent to the single
48 * hardware IP to accommodate CE/DE requirements
49 *
50 * \sa amdgpu_cs_ib_info
51*/
52#define AMDGPU_CS_MAX_IBS_PER_SUBMIT 4
53
54/**
55 *
56 */
57#define AMDGPU_TIMEOUT_INFINITE 0xffffffffffffffffull
58
59/**
Alex Deucher09361392015-04-20 12:04:22 -040060 * The special flag to mark that this IB will re-used
61 * by client and should not be automatically return back
62 * to free pool by libdrm_amdgpu when submission is completed.
63 *
64 * \sa amdgpu_cs_ib_info
65*/
66#define AMDGPU_CS_REUSE_IB 0x2
67
Alex Deucher09361392015-04-20 12:04:22 -040068/*--------------------------------------------------------------------------*/
69/* ----------------------------- Enums ------------------------------------ */
70/*--------------------------------------------------------------------------*/
71
72/**
73 * Enum describing possible handle types
74 *
75 * \sa amdgpu_bo_import, amdgpu_bo_export
76 *
77*/
78enum amdgpu_bo_handle_type {
79 /** GEM flink name (needs DRM authentication, used by DRI2) */
80 amdgpu_bo_handle_type_gem_flink_name = 0,
81
82 /** KMS handle which is used by all driver ioctls */
83 amdgpu_bo_handle_type_kms = 1,
84
85 /** DMA-buf fd handle */
86 amdgpu_bo_handle_type_dma_buf_fd = 2
87};
88
89/**
Alex Deucher09361392015-04-20 12:04:22 -040090 * For performance reasons and to simplify logic libdrm_amdgpu will handle
91 * IBs only some pre-defined sizes.
92 *
93 * \sa amdgpu_cs_alloc_ib()
94 */
95enum amdgpu_cs_ib_size {
Jammy Zhou8a208ee2015-05-18 19:14:56 +080096 amdgpu_cs_ib_size_4K = 0,
97 amdgpu_cs_ib_size_16K = 1,
98 amdgpu_cs_ib_size_32K = 2,
99 amdgpu_cs_ib_size_64K = 3,
100 amdgpu_cs_ib_size_128K = 4
Alex Deucher09361392015-04-20 12:04:22 -0400101};
102
103/** The number of different IB sizes */
Jammy Zhou8a208ee2015-05-18 19:14:56 +0800104#define AMDGPU_CS_IB_SIZE_NUM 5
Alex Deucher09361392015-04-20 12:04:22 -0400105
106
107/*--------------------------------------------------------------------------*/
108/* -------------------------- Datatypes ----------------------------------- */
109/*--------------------------------------------------------------------------*/
110
111/**
112 * Define opaque pointer to context associated with fd.
113 * This context will be returned as the result of
114 * "initialize" function and should be pass as the first
115 * parameter to any API call
116 */
117typedef struct amdgpu_device *amdgpu_device_handle;
118
119/**
120 * Define GPU Context type as pointer to opaque structure
121 * Example of GPU Context is the "rendering" context associated
122 * with OpenGL context (glCreateContext)
123 */
124typedef struct amdgpu_context *amdgpu_context_handle;
125
126/**
127 * Define handle for amdgpu resources: buffer, GDS, etc.
128 */
129typedef struct amdgpu_bo *amdgpu_bo_handle;
130
131/**
Christian König6dc2eaf2015-04-22 14:52:34 +0200132 * Define handle for list of BOs
133 */
134typedef struct amdgpu_bo_list *amdgpu_bo_list_handle;
135
136/**
Alex Deucher09361392015-04-20 12:04:22 -0400137 * Define handle to be used when dealing with command
138 * buffers (a.k.a. ibs)
139 *
140 */
141typedef struct amdgpu_ib *amdgpu_ib_handle;
142
143
144/*--------------------------------------------------------------------------*/
145/* -------------------------- Structures ---------------------------------- */
146/*--------------------------------------------------------------------------*/
147
148/**
149 * Structure describing memory allocation request
150 *
151 * \sa amdgpu_bo_alloc()
152 *
153*/
154struct amdgpu_bo_alloc_request {
155 /** Allocation request. It must be aligned correctly. */
156 uint64_t alloc_size;
157
158 /**
159 * It may be required to have some specific alignment requirements
160 * for physical back-up storage (e.g. for displayable surface).
161 * If 0 there is no special alignment requirement
162 */
163 uint64_t phys_alignment;
164
165 /**
166 * UMD should specify where to allocate memory and how it
167 * will be accessed by the CPU.
168 */
169 uint32_t preferred_heap;
170
171 /** Additional flags passed on allocation */
172 uint64_t flags;
173};
174
175/**
176 * Structure describing memory allocation request
177 *
178 * \sa amdgpu_bo_alloc()
179*/
180struct amdgpu_bo_alloc_result {
181 /** Assigned virtual MC Base Address */
182 uint64_t virtual_mc_base_address;
183
184 /** Handle of allocated memory to be used by the given process only. */
185 amdgpu_bo_handle buf_handle;
186};
187
188/**
189 * Special UMD specific information associated with buffer.
190 *
191 * It may be need to pass some buffer charactersitic as part
192 * of buffer sharing. Such information are defined UMD and
193 * opaque for libdrm_amdgpu as well for kernel driver.
194 *
195 * \sa amdgpu_bo_set_metadata(), amdgpu_bo_query_info,
196 * amdgpu_bo_import(), amdgpu_bo_export
197 *
198*/
199struct amdgpu_bo_metadata {
200 /** Special flag associated with surface */
201 uint64_t flags;
202
203 /**
204 * ASIC-specific tiling information (also used by DCE).
205 * The encoding is defined by the AMDGPU_TILING_* definitions.
206 */
207 uint64_t tiling_info;
208
209 /** Size of metadata associated with the buffer, in bytes. */
210 uint32_t size_metadata;
211
212 /** UMD specific metadata. Opaque for kernel */
213 uint32_t umd_metadata[64];
214};
215
216/**
217 * Structure describing allocated buffer. Client may need
218 * to query such information as part of 'sharing' buffers mechanism
219 *
220 * \sa amdgpu_bo_set_metadata(), amdgpu_bo_query_info(),
221 * amdgpu_bo_import(), amdgpu_bo_export()
222*/
223struct amdgpu_bo_info {
224 /** Allocated memory size */
225 uint64_t alloc_size;
226
227 /**
228 * It may be required to have some specific alignment requirements
229 * for physical back-up storage.
230 */
231 uint64_t phys_alignment;
232
233 /**
234 * Assigned virtual MC Base Address.
235 * \note This information will be returned only if this buffer was
236 * allocated in the same process otherwise 0 will be returned.
237 */
238 uint64_t virtual_mc_base_address;
239
240 /** Heap where to allocate memory. */
241 uint32_t preferred_heap;
242
243 /** Additional allocation flags. */
244 uint64_t alloc_flags;
245
246 /** Metadata associated with buffer if any. */
247 struct amdgpu_bo_metadata metadata;
248};
249
250/**
251 * Structure with information about "imported" buffer
252 *
253 * \sa amdgpu_bo_import()
254 *
255 */
256struct amdgpu_bo_import_result {
257 /** Handle of memory/buffer to use */
258 amdgpu_bo_handle buf_handle;
259
260 /** Buffer size */
261 uint64_t alloc_size;
262
263 /** Assigned virtual MC Base Address */
264 uint64_t virtual_mc_base_address;
265};
266
267
268/**
269 *
270 * Structure to describe GDS partitioning information.
271 * \note OA and GWS resources are asscoiated with GDS partition
272 *
273 * \sa amdgpu_gpu_resource_query_gds_info
274 *
275*/
276struct amdgpu_gds_resource_info {
277 uint32_t gds_gfx_partition_size;
278 uint32_t compute_partition_size;
279 uint32_t gds_total_size;
280 uint32_t gws_per_gfx_partition;
281 uint32_t gws_per_compute_partition;
282 uint32_t oa_per_gfx_partition;
283 uint32_t oa_per_compute_partition;
284};
285
286
287
288/**
289 * Structure describing result of request to allocate GDS
290 *
291 * \sa amdgpu_gpu_resource_gds_alloc
292 *
293*/
294struct amdgpu_gds_alloc_info {
295 /** Handle assigned to gds allocation */
296 amdgpu_bo_handle resource_handle;
297
298 /** How much was really allocated */
299 uint32_t gds_memory_size;
300
301 /** Number of GWS resources allocated */
302 uint32_t gws;
303
304 /** Number of OA resources allocated */
305 uint32_t oa;
306};
307
308/**
309 * Structure to described allocated command buffer (a.k.a. IB)
310 *
311 * \sa amdgpu_cs_alloc_ib()
312 *
313*/
314struct amdgpu_cs_ib_alloc_result {
315 /** IB allocation handle */
316 amdgpu_ib_handle handle;
317
318 /** Assigned GPU VM MC Address of command buffer */
319 uint64_t mc_address;
320
321 /** Address to be used for CPU access */
322 void *cpu;
323};
324
325/**
326 * Structure describing IB
327 *
328 * \sa amdgpu_cs_request, amdgpu_cs_submit()
329 *
330*/
331struct amdgpu_cs_ib_info {
332 /** Special flags */
333 uint64_t flags;
334
335 /** Handle of command buffer */
336 amdgpu_ib_handle ib_handle;
337
338 /**
339 * Size of Command Buffer to be submitted.
340 * - The size is in units of dwords (4 bytes).
341 * - Must be less or equal to the size of allocated IB
342 * - Could be 0
343 */
344 uint32_t size;
Jammy Zhou60e221c2015-05-21 04:17:48 +0800345
346 /** Offset in the IB buffer object (in unit of dwords) */
347 uint32_t offset_dw;
Alex Deucher09361392015-04-20 12:04:22 -0400348};
349
350/**
351 * Structure describing submission request
352 *
353 * \note We could have several IBs as packet. e.g. CE, CE, DE case for gfx
354 *
355 * \sa amdgpu_cs_submit()
356*/
357struct amdgpu_cs_request {
358 /** Specify flags with additional information */
359 uint64_t flags;
360
361 /** Specify HW IP block type to which to send the IB. */
362 unsigned ip_type;
363
364 /** IP instance index if there are several IPs of the same type. */
365 unsigned ip_instance;
366
367 /**
368 * Specify ring index of the IP. We could have several rings
369 * in the same IP. E.g. 0 for SDMA0 and 1 for SDMA1.
370 */
371 uint32_t ring;
372
373 /**
Christian König6dc2eaf2015-04-22 14:52:34 +0200374 * List handle with resources used by this request.
Alex Deucher09361392015-04-20 12:04:22 -0400375 */
Christian König6dc2eaf2015-04-22 14:52:34 +0200376 amdgpu_bo_list_handle resources;
Alex Deucher09361392015-04-20 12:04:22 -0400377
378 /** Number of IBs to submit in the field ibs. */
379 uint32_t number_of_ibs;
380
381 /**
382 * IBs to submit. Those IBs will be submit together as single entity
383 */
384 struct amdgpu_cs_ib_info *ibs;
385};
386
387/**
388 * Structure describing request to check submission state using fence
389 *
390 * \sa amdgpu_cs_query_fence_status()
391 *
392*/
393struct amdgpu_cs_query_fence {
394
395 /** In which context IB was sent to execution */
396 amdgpu_context_handle context;
397
398 /** Timeout in nanoseconds. */
399 uint64_t timeout_ns;
400
401 /** To which HW IP type the fence belongs */
402 unsigned ip_type;
403
404 /** IP instance index if there are several IPs of the same type. */
405 unsigned ip_instance;
406
407 /** Ring index of the HW IP */
408 uint32_t ring;
409
410 /** Flags */
411 uint64_t flags;
412
413 /** Specify fence for which we need to check
414 * submission status.*/
415 uint64_t fence;
416};
417
418/**
419 * Structure which provide information about GPU VM MC Address space
420 * alignments requirements
421 *
422 * \sa amdgpu_query_buffer_size_alignment
423 */
424struct amdgpu_buffer_size_alignments {
425 /** Size alignment requirement for allocation in
426 * local memory */
427 uint64_t size_local;
428
429 /**
430 * Size alignment requirement for allocation in remote memory
431 */
432 uint64_t size_remote;
433};
434
435
436/**
437 * Structure which provide information about heap
438 *
439 * \sa amdgpu_query_heap_info()
440 *
441 */
442struct amdgpu_heap_info {
443 /** Theoretical max. available memory in the given heap */
444 uint64_t heap_size;
445
446 /**
447 * Number of bytes allocated in the heap. This includes all processes
448 * and private allocations in the kernel. It changes when new buffers
449 * are allocated, freed, and moved. It cannot be larger than
450 * heap_size.
451 */
452 uint64_t heap_usage;
453
454 /**
455 * Theoretical possible max. size of buffer which
456 * could be allocated in the given heap
457 */
458 uint64_t max_allocation;
459};
460
461
462
463/**
464 * Describe GPU h/w info needed for UMD correct initialization
465 *
466 * \sa amdgpu_query_gpu_info()
467*/
468struct amdgpu_gpu_info {
469 /** Asic id */
470 uint32_t asic_id;
471 /**< Chip revision */
472 uint32_t chip_rev;
473 /** Chip external revision */
474 uint32_t chip_external_rev;
475 /** Family ID */
476 uint32_t family_id;
477 /** Special flags */
478 uint64_t ids_flags;
479 /** max engine clock*/
480 uint64_t max_engine_clk;
Ken Wangfc9fc7d2015-06-03 17:07:44 +0800481 /** max memory clock */
482 uint64_t max_memory_clk;
Alex Deucher09361392015-04-20 12:04:22 -0400483 /** number of shader engines */
484 uint32_t num_shader_engines;
485 /** number of shader arrays per engine */
486 uint32_t num_shader_arrays_per_engine;
487 /** Number of available good shader pipes */
488 uint32_t avail_quad_shader_pipes;
489 /** Max. number of shader pipes.(including good and bad pipes */
490 uint32_t max_quad_shader_pipes;
491 /** Number of parameter cache entries per shader quad pipe */
492 uint32_t cache_entries_per_quad_pipe;
493 /** Number of available graphics context */
494 uint32_t num_hw_gfx_contexts;
495 /** Number of render backend pipes */
496 uint32_t rb_pipes;
Alex Deucher09361392015-04-20 12:04:22 -0400497 /** Enabled render backend pipe mask */
498 uint32_t enabled_rb_pipes_mask;
499 /** Frequency of GPU Counter */
500 uint32_t gpu_counter_freq;
501 /** CC_RB_BACKEND_DISABLE.BACKEND_DISABLE per SE */
502 uint32_t backend_disable[4];
503 /** Value of MC_ARB_RAMCFG register*/
504 uint32_t mc_arb_ramcfg;
505 /** Value of GB_ADDR_CONFIG */
506 uint32_t gb_addr_cfg;
507 /** Values of the GB_TILE_MODE0..31 registers */
508 uint32_t gb_tile_mode[32];
509 /** Values of GB_MACROTILE_MODE0..15 registers */
510 uint32_t gb_macro_tile_mode[16];
511 /** Value of PA_SC_RASTER_CONFIG register per SE */
512 uint32_t pa_sc_raster_cfg[4];
513 /** Value of PA_SC_RASTER_CONFIG_1 register per SE */
514 uint32_t pa_sc_raster_cfg1[4];
515 /* CU info */
516 uint32_t cu_active_number;
517 uint32_t cu_ao_mask;
518 uint32_t cu_bitmap[4][4];
Ken Wang4bf29412015-06-03 17:15:29 +0800519 /* video memory type info*/
520 uint32_t vram_type;
521 /* video memory bit width*/
522 uint32_t vram_bit_width;
Ken Wangcdd1edc2015-06-03 17:21:27 +0800523 /** constant engine ram size*/
524 uint32_t ce_ram_size;
Alex Deucher09361392015-04-20 12:04:22 -0400525};
526
527
528/*--------------------------------------------------------------------------*/
529/*------------------------- Functions --------------------------------------*/
530/*--------------------------------------------------------------------------*/
531
532/*
533 * Initialization / Cleanup
534 *
535*/
536
537
538/**
539 *
540 * \param fd - \c [in] File descriptor for AMD GPU device
541 * received previously as the result of
542 * e.g. drmOpen() call.
543 * For legacy fd type, the DRI2/DRI3 authentication
544 * should be done before calling this function.
545 * \param major_version - \c [out] Major version of library. It is assumed
546 * that adding new functionality will cause
547 * increase in major version
548 * \param minor_version - \c [out] Minor version of library
549 * \param device_handle - \c [out] Pointer to opaque context which should
550 * be passed as the first parameter on each
551 * API call
552 *
553 *
554 * \return 0 on success\n
555 * >0 - AMD specific error code\n
556 * <0 - Negative POSIX Error code
557 *
558 *
559 * \sa amdgpu_device_deinitialize()
560*/
561int amdgpu_device_initialize(int fd,
562 uint32_t *major_version,
563 uint32_t *minor_version,
564 amdgpu_device_handle *device_handle);
565
566
567
568/**
569 *
570 * When access to such library does not needed any more the special
571 * function must be call giving opportunity to clean up any
572 * resources if needed.
573 *
574 * \param device_handle - \c [in] Context associated with file
575 * descriptor for AMD GPU device
576 * received previously as the
577 * result e.g. of drmOpen() call.
578 *
579 * \return 0 on success\n
580 * >0 - AMD specific error code\n
581 * <0 - Negative POSIX Error code
582 *
583 * \sa amdgpu_device_initialize()
584 *
585*/
586int amdgpu_device_deinitialize(amdgpu_device_handle device_handle);
587
588
589/*
590 * Memory Management
591 *
592*/
593
594/**
595 * Allocate memory to be used by UMD for GPU related operations
596 *
597 * \param dev - \c [in] Device handle.
598 * See #amdgpu_device_initialize()
599 * \param alloc_buffer - \c [in] Pointer to the structure describing an
600 * allocation request
601 * \param info - \c [out] Pointer to structure which return
602 * information about allocated memory
603 *
604 * \return 0 on success\n
605 * >0 - AMD specific error code\n
606 * <0 - Negative POSIX Error code
607 *
608 * \sa amdgpu_bo_free()
609*/
610int amdgpu_bo_alloc(amdgpu_device_handle dev,
611 struct amdgpu_bo_alloc_request *alloc_buffer,
612 struct amdgpu_bo_alloc_result *info);
613
614/**
615 * Associate opaque data with buffer to be queried by another UMD
616 *
617 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
618 * \param buf_handle - \c [in] Buffer handle
619 * \param info - \c [in] Metadata to associated with buffer
620 *
621 * \return 0 on success\n
622 * >0 - AMD specific error code\n
623 * <0 - Negative POSIX Error code
624*/
625int amdgpu_bo_set_metadata(amdgpu_bo_handle buf_handle,
626 struct amdgpu_bo_metadata *info);
627
628/**
629 * Query buffer information including metadata previusly associated with
630 * buffer.
631 *
632 * \param dev - \c [in] Device handle.
633 * See #amdgpu_device_initialize()
634 * \param buf_handle - \c [in] Buffer handle
635 * \param info - \c [out] Structure describing buffer
636 *
637 * \return 0 on success\n
638 * >0 - AMD specific error code\n
639 * <0 - Negative POSIX Error code
640 *
641 * \sa amdgpu_bo_set_metadata(), amdgpu_bo_alloc()
642*/
643int amdgpu_bo_query_info(amdgpu_bo_handle buf_handle,
644 struct amdgpu_bo_info *info);
645
646/**
647 * Allow others to get access to buffer
648 *
649 * \param dev - \c [in] Device handle.
650 * See #amdgpu_device_initialize()
651 * \param buf_handle - \c [in] Buffer handle
652 * \param type - \c [in] Type of handle requested
653 * \param shared_handle - \c [out] Special "shared" handle
654 *
655 * \return 0 on success\n
656 * >0 - AMD specific error code\n
657 * <0 - Negative POSIX Error code
658 *
659 * \sa amdgpu_bo_import()
660 *
661*/
662int amdgpu_bo_export(amdgpu_bo_handle buf_handle,
663 enum amdgpu_bo_handle_type type,
664 uint32_t *shared_handle);
665
666/**
667 * Request access to "shared" buffer
668 *
669 * \param dev - \c [in] Device handle.
670 * See #amdgpu_device_initialize()
671 * \param type - \c [in] Type of handle requested
672 * \param shared_handle - \c [in] Shared handle received as result "import"
673 * operation
674 * \param output - \c [out] Pointer to structure with information
675 * about imported buffer
676 *
677 * \return 0 on success\n
678 * >0 - AMD specific error code\n
679 * <0 - Negative POSIX Error code
680 *
681 * \note Buffer must be "imported" only using new "fd" (different from
682 * one used by "exporter").
683 *
684 * \sa amdgpu_bo_export()
685 *
686*/
687int amdgpu_bo_import(amdgpu_device_handle dev,
688 enum amdgpu_bo_handle_type type,
689 uint32_t shared_handle,
690 struct amdgpu_bo_import_result *output);
691
692/**
693 * Free previosuly allocated memory
694 *
695 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
696 * \param buf_handle - \c [in] Buffer handle to free
697 *
698 * \return 0 on success\n
699 * >0 - AMD specific error code\n
700 * <0 - Negative POSIX Error code
701 *
702 * \note In the case of memory shared between different applications all
703 * resources will be “physically” freed only all such applications
704 * will be terminated
705 * \note If is UMD responsibility to ‘free’ buffer only when there is no
706 * more GPU access
707 *
708 * \sa amdgpu_bo_set_metadata(), amdgpu_bo_alloc()
709 *
710*/
711int amdgpu_bo_free(amdgpu_bo_handle buf_handle);
712
713/**
714 * Request CPU access to GPU accessable memory
715 *
716 * \param buf_handle - \c [in] Buffer handle
717 * \param cpu - \c [out] CPU address to be used for access
718 *
719 * \return 0 on success\n
720 * >0 - AMD specific error code\n
721 * <0 - Negative POSIX Error code
722 *
723 * \sa amdgpu_bo_cpu_unmap()
724 *
725*/
726int amdgpu_bo_cpu_map(amdgpu_bo_handle buf_handle, void **cpu);
727
728/**
729 * Release CPU access to GPU memory
730 *
731 * \param buf_handle - \c [in] Buffer handle
732 *
733 * \return 0 on success\n
734 * >0 - AMD specific error code\n
735 * <0 - Negative POSIX Error code
736 *
737 * \sa amdgpu_bo_cpu_map()
738 *
739*/
740int amdgpu_bo_cpu_unmap(amdgpu_bo_handle buf_handle);
741
742
743/**
744 * Wait until a buffer is not used by the device.
745 *
746 * \param dev - \c [in] Device handle. See #amdgpu_lib_initialize()
747 * \param buf_handle - \c [in] Buffer handle.
748 * \param timeout_ns - Timeout in nanoseconds.
749 * \param buffer_busy - 0 if buffer is idle, all GPU access was completed
750 * and no GPU access is scheduled.
751 * 1 GPU access is in fly or scheduled
752 *
753 * \return 0 - on success
754 * <0 - AMD specific error code
755 */
756int amdgpu_bo_wait_for_idle(amdgpu_bo_handle buf_handle,
757 uint64_t timeout_ns,
758 bool *buffer_busy);
759
Christian König6dc2eaf2015-04-22 14:52:34 +0200760/**
761 * Creates a BO list handle for command submission.
762 *
763 * \param dev - \c [in] Device handle.
764 * See #amdgpu_device_initialize()
765 * \param number_of_resources - \c [in] Number of BOs in the list
766 * \param resources - \c [in] List of BO handles
767 * \param resource_prios - \c [in] Optional priority for each handle
768 * \param result - \c [out] Created BO list handle
769 *
770 * \return 0 on success\n
771 * >0 - AMD specific error code\n
772 * <0 - Negative POSIX Error code
773 *
774 * \sa amdgpu_bo_list_destroy()
775*/
776int amdgpu_bo_list_create(amdgpu_device_handle dev,
777 uint32_t number_of_resources,
778 amdgpu_bo_handle *resources,
779 uint8_t *resource_prios,
780 amdgpu_bo_list_handle *result);
781
782/**
783 * Destroys a BO list handle.
784 *
785 * \param handle - \c [in] BO list handle.
786 *
787 * \return 0 on success\n
788 * >0 - AMD specific error code\n
789 * <0 - Negative POSIX Error code
790 *
791 * \sa amdgpu_bo_list_create()
792*/
793int amdgpu_bo_list_destroy(amdgpu_bo_list_handle handle);
Alex Deucher09361392015-04-20 12:04:22 -0400794
Jammy Zhou72446982015-05-18 20:27:24 +0800795/**
796 * Update resources for existing BO list
797 *
798 * \param handle - \c [in] BO list handle
799 * \param number_of_resources - \c [in] Number of BOs in the list
800 * \param resources - \c [in] List of BO handles
801 * \param resource_prios - \c [in] Optional priority for each handle
802 *
803 * \return 0 on success\n
804 * >0 - AMD specific error code\n
805 * <0 - Negative POSIX Error code
806 *
807 * \sa amdgpu_bo_list_update()
808*/
809int amdgpu_bo_list_update(amdgpu_bo_list_handle handle,
810 uint32_t number_of_resources,
811 amdgpu_bo_handle *resources,
812 uint8_t *resource_prios);
813
Alex Deucher09361392015-04-20 12:04:22 -0400814/*
815 * Special GPU Resources
816 *
817*/
818
819
820
821/**
822 * Query information about GDS
823 *
824 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
825 * \param gds_info - \c [out] Pointer to structure to get GDS information
826 *
827 * \return 0 on success\n
828 * >0 - AMD specific error code\n
829 * <0 - Negative POSIX Error code
830 *
831*/
832int amdgpu_gpu_resource_query_gds_info(amdgpu_device_handle dev,
833 struct amdgpu_gds_resource_info *
834 gds_info);
835
836
837/**
838 * Allocate GDS partitions
839 *
840 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
841 * \param gds_size - \c [in] Size of gds allocation. Must be aligned
842 * accordingly.
843 * \param alloc_info - \c [out] Pointer to structure to receive information
844 * about allocation
845 *
846 * \return 0 on success\n
847 * >0 - AMD specific error code\n
848 * <0 - Negative POSIX Error code
849 *
850 *
851*/
852int amdgpu_gpu_resource_gds_alloc(amdgpu_device_handle dev,
853 uint32_t gds_size,
854 struct amdgpu_gds_alloc_info *alloc_info);
855
856
857
858
859/**
860 * Release GDS resource. When GDS and associated resources not needed any
861 * more UMD should free them
862 *
863 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
864 * \param handle - \c [in] Handle assigned to GDS allocation
865 *
866 * \return 0 on success\n
867 * >0 - AMD specific error code\n
868 * <0 - Negative POSIX Error code
869 *
870*/
871int amdgpu_gpu_resource_gds_free(amdgpu_bo_handle handle);
872
873
874
875/*
876 * GPU Execution context
877 *
878*/
879
880/**
881 * Create GPU execution Context
882 *
883 * For the purpose of GPU Scheduler and GPU Robustness extensions it is
884 * necessary to have information/identify rendering/compute contexts.
885 * It also may be needed to associate some specific requirements with such
886 * contexts. Kernel driver will guarantee that submission from the same
887 * context will always be executed in order (first come, first serve).
888 *
889 *
890 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
891 * \param context - \c [out] GPU Context handle
892 *
893 * \return 0 on success\n
894 * >0 - AMD specific error code\n
895 * <0 - Negative POSIX Error code
896 *
897 * \sa amdgpu_cs_ctx_free()
898 *
899*/
900int amdgpu_cs_ctx_create(amdgpu_device_handle dev,
901 amdgpu_context_handle *context);
902
903/**
904 *
905 * Destroy GPU execution context when not needed any more
906 *
Alex Deucher09361392015-04-20 12:04:22 -0400907 * \param context - \c [in] GPU Context handle
908 *
909 * \return 0 on success\n
910 * >0 - AMD specific error code\n
911 * <0 - Negative POSIX Error code
912 *
913 * \sa amdgpu_cs_ctx_create()
914 *
915*/
Christian König9c2afff2015-04-22 12:21:13 +0200916int amdgpu_cs_ctx_free(amdgpu_context_handle context);
Alex Deucher09361392015-04-20 12:04:22 -0400917
918/**
919 * Query reset state for the specific GPU Context
920 *
Alex Deucher09361392015-04-20 12:04:22 -0400921 * \param context - \c [in] GPU Context handle
Marek Olšák4b39a8e2015-05-05 21:23:02 +0200922 * \param state - \c [out] One of AMDGPU_CTX_*_RESET
923 * \param hangs - \c [out] Number of hangs caused by the context.
Alex Deucher09361392015-04-20 12:04:22 -0400924 *
925 * \return 0 on success\n
926 * >0 - AMD specific error code\n
927 * <0 - Negative POSIX Error code
928 *
929 * \sa amdgpu_cs_ctx_create()
930 *
931*/
Christian König9c2afff2015-04-22 12:21:13 +0200932int amdgpu_cs_query_reset_state(amdgpu_context_handle context,
Marek Olšák4b39a8e2015-05-05 21:23:02 +0200933 uint32_t *state, uint32_t *hangs);
Alex Deucher09361392015-04-20 12:04:22 -0400934
935
936/*
937 * Command Buffers Management
938 *
939*/
940
941
942/**
943 * Allocate memory to be filled with PM4 packets and be served as the first
944 * entry point of execution (a.k.a. Indirect Buffer)
945 *
Alex Deucher09361392015-04-20 12:04:22 -0400946 * \param context - \c [in] GPU Context which will use IB
947 * \param ib_size - \c [in] Size of allocation
948 * \param output - \c [out] Pointer to structure to get information about
949 * allocated IB
950 *
951 * \return 0 on success\n
952 * >0 - AMD specific error code\n
953 * <0 - Negative POSIX Error code
954 *
955 * \sa amdgpu_cs_free_ib()
956 *
957*/
Christian König9c2afff2015-04-22 12:21:13 +0200958int amdgpu_cs_alloc_ib(amdgpu_context_handle context,
Alex Deucher09361392015-04-20 12:04:22 -0400959 enum amdgpu_cs_ib_size ib_size,
960 struct amdgpu_cs_ib_alloc_result *output);
961
962/**
963 * If UMD has allocates IBs which doesn’t need any more than those IBs must
964 * be explicitly freed
965 *
Alex Deucher09361392015-04-20 12:04:22 -0400966 * \param handle - \c [in] IB handle
967 *
968 * \return 0 on success\n
969 * >0 - AMD specific error code\n
970 * <0 - Negative POSIX Error code
971 *
972 * \note Libdrm_amdgpu will guarantee that it will correctly detect when it
973 * is safe to return IB to free pool
974 *
975 * \sa amdgpu_cs_alloc_ib()
976 *
977*/
Christian König9c2afff2015-04-22 12:21:13 +0200978int amdgpu_cs_free_ib(amdgpu_ib_handle handle);
Alex Deucher09361392015-04-20 12:04:22 -0400979
980/**
981 * Send request to submit command buffers to hardware.
982 *
983 * Kernel driver could use GPU Scheduler to make decision when physically
984 * sent this request to the hardware. Accordingly this request could be put
985 * in queue and sent for execution later. The only guarantee is that request
986 * from the same GPU context to the same ip:ip_instance:ring will be executed in
987 * order.
988 *
989 *
990 * \param dev - \c [in] Device handle.
991 * See #amdgpu_device_initialize()
992 * \param context - \c [in] GPU Context
993 * \param flags - \c [in] Global submission flags
994 * \param ibs_request - \c [in] Pointer to submission requests.
995 * We could submit to the several
996 * engines/rings simulteniously as
997 * 'atomic' operation
998 * \param number_of_requests - \c [in] Number of submission requests
999 * \param fences - \c [out] Pointer to array of data to get
1000 * fences to identify submission
1001 * requests. Timestamps are valid
1002 * in this GPU context and could be used
1003 * to identify/detect completion of
1004 * submission request
1005 *
1006 * \return 0 on success\n
1007 * >0 - AMD specific error code\n
1008 * <0 - Negative POSIX Error code
1009 *
1010 * \note It is assumed that by default IB will be returned to free pool
1011 * automatically by libdrm_amdgpu when submission will completed.
1012 * It is possible for UMD to make decision to re-use the same IB in
1013 * this case it should be explicitly freed.\n
1014 * Accordingly, by default, after submission UMD should not touch passed
1015 * IBs. If UMD needs to re-use IB then the special flag AMDGPU_CS_REUSE_IB
1016 * must be passed.
1017 *
1018 * \note It is required to pass correct resource list with buffer handles
1019 * which will be accessible by command buffers from submission
1020 * This will allow kernel driver to correctly implement "paging".
1021 * Failure to do so will have unpredictable results.
1022 *
1023 * \sa amdgpu_command_buffer_alloc(), amdgpu_command_buffer_free(),
1024 * amdgpu_cs_query_fence_status()
1025 *
1026*/
Christian König9c2afff2015-04-22 12:21:13 +02001027int amdgpu_cs_submit(amdgpu_context_handle context,
Alex Deucher09361392015-04-20 12:04:22 -04001028 uint64_t flags,
1029 struct amdgpu_cs_request *ibs_request,
1030 uint32_t number_of_requests,
1031 uint64_t *fences);
1032
1033/**
1034 * Query status of Command Buffer Submission
1035 *
1036 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1037 * \param fence - \c [in] Structure describing fence to query
1038 * \param expired - \c [out] If fence expired or not.\n
1039 * 0 – if fence is not expired\n
1040 * !0 - otherwise
1041 *
1042 * \return 0 on success\n
1043 * >0 - AMD specific error code\n
1044 * <0 - Negative POSIX Error code
1045 *
1046 * \note If UMD wants only to check operation status and returned immediately
1047 * then timeout value as 0 must be passed. In this case success will be
1048 * returned in the case if submission was completed or timeout error
1049 * code.
1050 *
1051 * \sa amdgpu_cs_submit()
1052*/
Christian König9c2afff2015-04-22 12:21:13 +02001053int amdgpu_cs_query_fence_status(struct amdgpu_cs_query_fence *fence,
Alex Deucher09361392015-04-20 12:04:22 -04001054 uint32_t *expired);
1055
1056
1057/*
1058 * Query / Info API
1059 *
1060*/
1061
1062
1063/**
1064 * Query allocation size alignments
1065 *
1066 * UMD should query information about GPU VM MC size alignments requirements
1067 * to be able correctly choose required allocation size and implement
1068 * internal optimization if needed.
1069 *
1070 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1071 * \param info - \c [out] Pointer to structure to get size alignment
1072 * requirements
1073 *
1074 * \return 0 on success\n
1075 * >0 - AMD specific error code\n
1076 * <0 - Negative POSIX Error code
1077 *
1078*/
1079int amdgpu_query_buffer_size_alignment(amdgpu_device_handle dev,
1080 struct amdgpu_buffer_size_alignments
1081 *info);
1082
1083
1084
1085/**
1086 * Query firmware versions
1087 *
1088 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1089 * \param fw_type - \c [in] AMDGPU_INFO_FW_*
1090 * \param ip_instance - \c [in] Index of the IP block of the same type.
1091 * \param index - \c [in] Index of the engine. (for SDMA and MEC)
1092 * \param version - \c [out] Pointer to to the "version" return value
1093 * \param feature - \c [out] Pointer to to the "feature" return value
1094 *
1095 * \return 0 on success\n
1096 * >0 - AMD specific error code\n
1097 * <0 - Negative POSIX Error code
1098 *
1099*/
1100int amdgpu_query_firmware_version(amdgpu_device_handle dev, unsigned fw_type,
1101 unsigned ip_instance, unsigned index,
1102 uint32_t *version, uint32_t *feature);
1103
1104
1105
1106/**
1107 * Query the number of HW IP instances of a certain type.
1108 *
1109 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1110 * \param type - \c [in] Hardware IP block type = AMDGPU_HW_IP_*
1111 * \param count - \c [out] Pointer to structure to get information
1112 *
1113 * \return 0 on success\n
1114 * >0 - AMD specific error code\n
1115 * <0 - Negative POSIX Error code
1116*/
1117int amdgpu_query_hw_ip_count(amdgpu_device_handle dev, unsigned type,
1118 uint32_t *count);
1119
1120
1121
1122/**
1123 * Query engine information
1124 *
1125 * This query allows UMD to query information different engines and their
1126 * capabilities.
1127 *
1128 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1129 * \param type - \c [in] Hardware IP block type = AMDGPU_HW_IP_*
1130 * \param ip_instance - \c [in] Index of the IP block of the same type.
1131 * \param info - \c [out] Pointer to structure to get information
1132 *
1133 * \return 0 on success\n
1134 * >0 - AMD specific error code\n
1135 * <0 - Negative POSIX Error code
1136*/
1137int amdgpu_query_hw_ip_info(amdgpu_device_handle dev, unsigned type,
1138 unsigned ip_instance,
1139 struct drm_amdgpu_info_hw_ip *info);
1140
1141
1142
1143
1144/**
1145 * Query heap information
1146 *
1147 * This query allows UMD to query potentially available memory resources and
1148 * adjust their logic if necessary.
1149 *
1150 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1151 * \param heap - \c [in] Heap type
1152 * \param info - \c [in] Pointer to structure to get needed information
1153 *
1154 * \return 0 on success\n
1155 * >0 - AMD specific error code\n
1156 * <0 - Negative POSIX Error code
1157 *
1158*/
1159int amdgpu_query_heap_info(amdgpu_device_handle dev,
1160 uint32_t heap,
1161 uint32_t flags,
1162 struct amdgpu_heap_info *info);
1163
1164
1165
1166/**
1167 * Get the CRTC ID from the mode object ID
1168 *
1169 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1170 * \param id - \c [in] Mode object ID
1171 * \param result - \c [in] Pointer to the CRTC ID
1172 *
1173 * \return 0 on success\n
1174 * >0 - AMD specific error code\n
1175 * <0 - Negative POSIX Error code
1176 *
1177*/
1178int amdgpu_query_crtc_from_id(amdgpu_device_handle dev, unsigned id,
1179 int32_t *result);
1180
1181
1182
1183/**
1184 * Query GPU H/w Info
1185 *
1186 * Query hardware specific information
1187 *
1188 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1189 * \param heap - \c [in] Heap type
1190 * \param info - \c [in] Pointer to structure to get needed information
1191 *
1192 * \return 0 on success\n
1193 * >0 - AMD specific error code\n
1194 * <0 - Negative POSIX Error code
1195 *
1196*/
1197int amdgpu_query_gpu_info(amdgpu_device_handle dev,
1198 struct amdgpu_gpu_info *info);
1199
1200
1201
1202/**
1203 * Query hardware or driver information.
1204 *
1205 * The return size is query-specific and depends on the "info_id" parameter.
1206 * No more than "size" bytes is returned.
1207 *
1208 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize()
1209 * \param info_id - \c [in] AMDGPU_INFO_*
1210 * \param size - \c [in] Size of the returned value.
1211 * \param value - \c [out] Pointer to the return value.
1212 *
1213 * \return 0 on success\n
1214 * >0 - AMD specific error code\n
1215 * <0 - Negative POSIX error code
1216 *
1217*/
1218int amdgpu_query_info(amdgpu_device_handle dev, unsigned info_id,
1219 unsigned size, void *value);
1220
1221
1222
1223/**
1224 * Read a set of consecutive memory-mapped registers.
1225 * Not all registers are allowed to be read by userspace.
1226 *
1227 * \param dev - \c [in] Device handle. See #amdgpu_device_initialize(
1228 * \param dword_offset - \c [in] Register offset in dwords
1229 * \param count - \c [in] The number of registers to read starting
1230 * from the offset
1231 * \param instance - \c [in] GRBM_GFX_INDEX selector. It may have other
1232 * uses. Set it to 0xffffffff if unsure.
1233 * \param flags - \c [in] Flags with additional information.
1234 * \param values - \c [out] The pointer to return values.
1235 *
1236 * \return 0 on success\n
1237 * >0 - AMD specific error code\n
1238 * <0 - Negative POSIX error code
1239 *
1240*/
1241int amdgpu_read_mm_registers(amdgpu_device_handle dev, unsigned dword_offset,
1242 unsigned count, uint32_t instance, uint32_t flags,
1243 uint32_t *values);
1244
1245
1246
1247/**
1248 * Request GPU access to user allocated memory e.g. via "malloc"
1249 *
1250 * \param dev - [in] Device handle. See #amdgpu_device_initialize()
1251 * \param cpu - [in] CPU address of user allocated memory which we
1252 * want to map to GPU address space (make GPU accessible)
1253 * (This address must be correctly aligned).
1254 * \param size - [in] Size of allocation (must be correctly aligned)
1255 * \param amdgpu_bo_alloc_result - [out] Handle of allocation to be passed as resource
1256 * on submission and be used in other operations.(e.g. for VA submission)
1257 * ( Temporally defined amdgpu_bo_alloc_result as parameter for return mc address. )
1258 *
1259 *
1260 * \return 0 on success
1261 * >0 - AMD specific error code
1262 * <0 - Negative POSIX Error code
1263 *
1264 *
1265 * \note
1266 * This call doesn't guarantee that such memory will be persistently
1267 * "locked" / make non-pageable. The purpose of this call is to provide
1268 * opportunity for GPU get access to this resource during submission.
1269 *
1270 * The maximum amount of memory which could be mapped in this call depends
1271 * if overcommit is disabled or not. If overcommit is disabled than the max.
1272 * amount of memory to be pinned will be limited by left "free" size in total
1273 * amount of memory which could be locked simultaneously ("GART" size).
1274 *
1275 * Supported (theoretical) max. size of mapping is restricted only by
1276 * "GART" size.
1277 *
1278 * It is responsibility of caller to correctly specify access rights
1279 * on VA assignment.
1280*/
1281int amdgpu_create_bo_from_user_mem(amdgpu_device_handle dev,
1282 void *cpu,
1283 uint64_t size,
1284 struct amdgpu_bo_alloc_result *info);
1285
1286
1287#endif /* #ifdef _AMDGPU_H_ */