blob: d7261e01ff8a2f7523c32bca8f96d612a5cf6af1 [file] [log] [blame]
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001/*
2 * Copyright 2013 Advanced Micro Devices, Inc.
3 * All Rights Reserved.
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the
7 * "Software"), to deal in the Software without restriction, including
8 * without limitation the rights to use, copy, modify, merge, publish,
9 * distribute, sub license, and/or sell copies of the Software, and to
10 * permit persons to whom the Software is furnished to do so, subject to
11 * the following conditions:
12 *
13 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
16 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
17 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
18 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
19 * USE OR OTHER DEALINGS IN THE SOFTWARE.
20 *
21 * The above copyright notice and this permission notice (including the
22 * next paragraph) shall be included in all copies or substantial portions
23 * of the Software.
24 *
25 * Authors: Christian König <christian.koenig@amd.com>
26 */
27
28#include <linux/firmware.h>
29#include <linux/module.h>
30#include <drm/drmP.h>
31#include <drm/drm.h>
32
33#include "amdgpu.h"
34#include "amdgpu_pm.h"
35#include "amdgpu_vce.h"
36#include "cikd.h"
37
38/* 1 second timeout */
Christian König182830a2016-07-01 17:43:57 +020039#define VCE_IDLE_TIMEOUT msecs_to_jiffies(1000)
Alex Deucherd38ceaf2015-04-20 16:55:21 -040040
41/* Firmware Names */
42#ifdef CONFIG_DRM_AMDGPU_CIK
43#define FIRMWARE_BONAIRE "radeon/bonaire_vce.bin"
Christian Königedf600d2016-05-03 15:54:54 +020044#define FIRMWARE_KABINI "radeon/kabini_vce.bin"
45#define FIRMWARE_KAVERI "radeon/kaveri_vce.bin"
46#define FIRMWARE_HAWAII "radeon/hawaii_vce.bin"
Alex Deucherd38ceaf2015-04-20 16:55:21 -040047#define FIRMWARE_MULLINS "radeon/mullins_vce.bin"
48#endif
Jammy Zhouc65444f2015-05-13 22:49:04 +080049#define FIRMWARE_TONGA "amdgpu/tonga_vce.bin"
50#define FIRMWARE_CARRIZO "amdgpu/carrizo_vce.bin"
Alex Deucher188a9bc2015-07-27 14:24:14 -040051#define FIRMWARE_FIJI "amdgpu/fiji_vce.bin"
Samuel Licfaba562015-10-08 16:27:55 -040052#define FIRMWARE_STONEY "amdgpu/stoney_vce.bin"
Flora Cui2cc0c0b2016-03-14 18:33:29 -040053#define FIRMWARE_POLARIS10 "amdgpu/polaris10_vce.bin"
54#define FIRMWARE_POLARIS11 "amdgpu/polaris11_vce.bin"
Junwei Zhangc4642a42016-12-14 15:32:28 -050055#define FIRMWARE_POLARIS12 "amdgpu/polaris12_vce.bin"
Alex Deucherd38ceaf2015-04-20 16:55:21 -040056
Leo Liuc1dc3562017-03-03 18:27:49 -050057#define FIRMWARE_VEGA10 "amdgpu/vega10_vce.bin"
Alex Deucher9aa52bc2017-09-01 16:37:21 -040058#define FIRMWARE_VEGA12 "amdgpu/vega12_vce.bin"
Leo Liuc1dc3562017-03-03 18:27:49 -050059
Alex Deucherd38ceaf2015-04-20 16:55:21 -040060#ifdef CONFIG_DRM_AMDGPU_CIK
61MODULE_FIRMWARE(FIRMWARE_BONAIRE);
62MODULE_FIRMWARE(FIRMWARE_KABINI);
63MODULE_FIRMWARE(FIRMWARE_KAVERI);
64MODULE_FIRMWARE(FIRMWARE_HAWAII);
65MODULE_FIRMWARE(FIRMWARE_MULLINS);
66#endif
67MODULE_FIRMWARE(FIRMWARE_TONGA);
68MODULE_FIRMWARE(FIRMWARE_CARRIZO);
Alex Deucher188a9bc2015-07-27 14:24:14 -040069MODULE_FIRMWARE(FIRMWARE_FIJI);
Samuel Licfaba562015-10-08 16:27:55 -040070MODULE_FIRMWARE(FIRMWARE_STONEY);
Flora Cui2cc0c0b2016-03-14 18:33:29 -040071MODULE_FIRMWARE(FIRMWARE_POLARIS10);
72MODULE_FIRMWARE(FIRMWARE_POLARIS11);
Junwei Zhangc4642a42016-12-14 15:32:28 -050073MODULE_FIRMWARE(FIRMWARE_POLARIS12);
Alex Deucherd38ceaf2015-04-20 16:55:21 -040074
Leo Liuc1dc3562017-03-03 18:27:49 -050075MODULE_FIRMWARE(FIRMWARE_VEGA10);
Alex Deucher9aa52bc2017-09-01 16:37:21 -040076MODULE_FIRMWARE(FIRMWARE_VEGA12);
Leo Liuc1dc3562017-03-03 18:27:49 -050077
Alex Deucherd38ceaf2015-04-20 16:55:21 -040078static void amdgpu_vce_idle_work_handler(struct work_struct *work);
79
80/**
81 * amdgpu_vce_init - allocate memory, load vce firmware
82 *
83 * @adev: amdgpu_device pointer
84 *
85 * First step to get VCE online, allocate memory and load the firmware
86 */
Leo Liue9822622015-05-06 14:31:27 -040087int amdgpu_vce_sw_init(struct amdgpu_device *adev, unsigned long size)
Alex Deucherd38ceaf2015-04-20 16:55:21 -040088{
Christian Königc5949892016-02-10 17:43:00 +010089 struct amdgpu_ring *ring;
Lucas Stach1b1f42d2017-12-06 17:49:39 +010090 struct drm_sched_rq *rq;
Alex Deucherd38ceaf2015-04-20 16:55:21 -040091 const char *fw_name;
92 const struct common_firmware_header *hdr;
93 unsigned ucode_version, version_major, version_minor, binary_id;
94 int i, r;
95
Alex Deucherd38ceaf2015-04-20 16:55:21 -040096 switch (adev->asic_type) {
97#ifdef CONFIG_DRM_AMDGPU_CIK
98 case CHIP_BONAIRE:
99 fw_name = FIRMWARE_BONAIRE;
100 break;
101 case CHIP_KAVERI:
102 fw_name = FIRMWARE_KAVERI;
103 break;
104 case CHIP_KABINI:
105 fw_name = FIRMWARE_KABINI;
106 break;
107 case CHIP_HAWAII:
108 fw_name = FIRMWARE_HAWAII;
109 break;
110 case CHIP_MULLINS:
111 fw_name = FIRMWARE_MULLINS;
112 break;
113#endif
114 case CHIP_TONGA:
115 fw_name = FIRMWARE_TONGA;
116 break;
117 case CHIP_CARRIZO:
118 fw_name = FIRMWARE_CARRIZO;
119 break;
Alex Deucher188a9bc2015-07-27 14:24:14 -0400120 case CHIP_FIJI:
121 fw_name = FIRMWARE_FIJI;
122 break;
Samuel Licfaba562015-10-08 16:27:55 -0400123 case CHIP_STONEY:
124 fw_name = FIRMWARE_STONEY;
125 break;
Flora Cui2cc0c0b2016-03-14 18:33:29 -0400126 case CHIP_POLARIS10:
127 fw_name = FIRMWARE_POLARIS10;
Sonny Jiang1b4eeea2016-03-11 14:33:40 -0500128 break;
Flora Cui2cc0c0b2016-03-14 18:33:29 -0400129 case CHIP_POLARIS11:
130 fw_name = FIRMWARE_POLARIS11;
Sonny Jiang1b4eeea2016-03-11 14:33:40 -0500131 break;
Alex Deucher9aa52bc2017-09-01 16:37:21 -0400132 case CHIP_POLARIS12:
133 fw_name = FIRMWARE_POLARIS12;
134 break;
Leo Liuc1dc3562017-03-03 18:27:49 -0500135 case CHIP_VEGA10:
136 fw_name = FIRMWARE_VEGA10;
137 break;
Alex Deucher9aa52bc2017-09-01 16:37:21 -0400138 case CHIP_VEGA12:
139 fw_name = FIRMWARE_VEGA12;
Junwei Zhangc4642a42016-12-14 15:32:28 -0500140 break;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400141
142 default:
143 return -EINVAL;
144 }
145
146 r = request_firmware(&adev->vce.fw, fw_name, adev->dev);
147 if (r) {
148 dev_err(adev->dev, "amdgpu_vce: Can't load firmware \"%s\"\n",
149 fw_name);
150 return r;
151 }
152
153 r = amdgpu_ucode_validate(adev->vce.fw);
154 if (r) {
155 dev_err(adev->dev, "amdgpu_vce: Can't validate firmware \"%s\"\n",
156 fw_name);
157 release_firmware(adev->vce.fw);
158 adev->vce.fw = NULL;
159 return r;
160 }
161
162 hdr = (const struct common_firmware_header *)adev->vce.fw->data;
163
164 ucode_version = le32_to_cpu(hdr->ucode_version);
165 version_major = (ucode_version >> 20) & 0xfff;
166 version_minor = (ucode_version >> 8) & 0xfff;
167 binary_id = ucode_version & 0xff;
168 DRM_INFO("Found VCE firmware Version: %hhd.%hhd Binary ID: %hhd\n",
169 version_major, version_minor, binary_id);
170 adev->vce.fw_version = ((version_major << 24) | (version_minor << 16) |
171 (binary_id << 8));
172
Leo Liu78b3c832017-05-31 14:13:20 -0400173 r = amdgpu_bo_create_kernel(adev, size, PAGE_SIZE,
174 AMDGPU_GEM_DOMAIN_VRAM, &adev->vce.vcpu_bo,
175 &adev->vce.gpu_addr, &adev->vce.cpu_addr);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400176 if (r) {
177 dev_err(adev->dev, "(%d) failed to allocate VCE bo\n", r);
178 return r;
179 }
180
Christian Königc5949892016-02-10 17:43:00 +0100181 ring = &adev->vce.ring[0];
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100182 rq = &ring->sched.sched_rq[DRM_SCHED_PRIORITY_NORMAL];
183 r = drm_sched_entity_init(&ring->sched, &adev->vce.entity,
Monk Liub3eebe32017-10-23 12:23:29 +0800184 rq, amdgpu_sched_jobs, NULL);
Christian Königc5949892016-02-10 17:43:00 +0100185 if (r != 0) {
186 DRM_ERROR("Failed setting up VCE run queue.\n");
187 return r;
188 }
189
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400190 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i) {
191 atomic_set(&adev->vce.handles[i], 0);
192 adev->vce.filp[i] = NULL;
193 }
194
Christian Königebff4852016-07-20 16:53:36 +0200195 INIT_DELAYED_WORK(&adev->vce.idle_work, amdgpu_vce_idle_work_handler);
196 mutex_init(&adev->vce.idle_mutex);
197
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400198 return 0;
199}
200
201/**
202 * amdgpu_vce_fini - free memory
203 *
204 * @adev: amdgpu_device pointer
205 *
206 * Last step on VCE teardown, free firmware memory
207 */
208int amdgpu_vce_sw_fini(struct amdgpu_device *adev)
209{
Grazvydas Ignotas4cd00d32016-09-25 23:34:49 +0300210 unsigned i;
211
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400212 if (adev->vce.vcpu_bo == NULL)
213 return 0;
214
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100215 drm_sched_entity_fini(&adev->vce.ring[0].sched, &adev->vce.entity);
Christian Königc5949892016-02-10 17:43:00 +0100216
Leo Liu78b3c832017-05-31 14:13:20 -0400217 amdgpu_bo_free_kernel(&adev->vce.vcpu_bo, &adev->vce.gpu_addr,
218 (void **)&adev->vce.cpu_addr);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400219
Grazvydas Ignotas4cd00d32016-09-25 23:34:49 +0300220 for (i = 0; i < adev->vce.num_rings; i++)
221 amdgpu_ring_fini(&adev->vce.ring[i]);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400222
223 release_firmware(adev->vce.fw);
Christian Königebff4852016-07-20 16:53:36 +0200224 mutex_destroy(&adev->vce.idle_mutex);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400225
226 return 0;
227}
228
229/**
230 * amdgpu_vce_suspend - unpin VCE fw memory
231 *
232 * @adev: amdgpu_device pointer
233 *
234 */
235int amdgpu_vce_suspend(struct amdgpu_device *adev)
236{
237 int i;
238
239 if (adev->vce.vcpu_bo == NULL)
240 return 0;
241
242 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i)
243 if (atomic_read(&adev->vce.handles[i]))
244 break;
245
246 if (i == AMDGPU_MAX_VCE_HANDLES)
247 return 0;
248
Rex Zhu85cc88f2016-04-12 19:25:52 +0800249 cancel_delayed_work_sync(&adev->vce.idle_work);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400250 /* TODO: suspending running encoding sessions isn't supported */
251 return -EINVAL;
252}
253
254/**
255 * amdgpu_vce_resume - pin VCE fw memory
256 *
257 * @adev: amdgpu_device pointer
258 *
259 */
260int amdgpu_vce_resume(struct amdgpu_device *adev)
261{
262 void *cpu_addr;
263 const struct common_firmware_header *hdr;
264 unsigned offset;
265 int r;
266
267 if (adev->vce.vcpu_bo == NULL)
268 return -EINVAL;
269
270 r = amdgpu_bo_reserve(adev->vce.vcpu_bo, false);
271 if (r) {
272 dev_err(adev->dev, "(%d) failed to reserve VCE bo\n", r);
273 return r;
274 }
275
276 r = amdgpu_bo_kmap(adev->vce.vcpu_bo, &cpu_addr);
277 if (r) {
278 amdgpu_bo_unreserve(adev->vce.vcpu_bo);
279 dev_err(adev->dev, "(%d) VCE map failed\n", r);
280 return r;
281 }
282
283 hdr = (const struct common_firmware_header *)adev->vce.fw->data;
284 offset = le32_to_cpu(hdr->ucode_array_offset_bytes);
Christian König7b4d3e22016-08-23 11:18:59 +0200285 memcpy_toio(cpu_addr, adev->vce.fw->data + offset,
286 adev->vce.fw->size - offset);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400287
288 amdgpu_bo_kunmap(adev->vce.vcpu_bo);
289
290 amdgpu_bo_unreserve(adev->vce.vcpu_bo);
291
292 return 0;
293}
294
295/**
296 * amdgpu_vce_idle_work_handler - power off VCE
297 *
298 * @work: pointer to work structure
299 *
300 * power of VCE when it's not used any more
301 */
302static void amdgpu_vce_idle_work_handler(struct work_struct *work)
303{
304 struct amdgpu_device *adev =
305 container_of(work, struct amdgpu_device, vce.idle_work.work);
Alex Deucher24c5fe52016-09-26 15:19:14 -0400306 unsigned i, count = 0;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400307
Alex Deucher24c5fe52016-09-26 15:19:14 -0400308 for (i = 0; i < adev->vce.num_rings; i++)
309 count += amdgpu_fence_count_emitted(&adev->vce.ring[i]);
310
311 if (count == 0) {
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400312 if (adev->pm.dpm_enabled) {
313 amdgpu_dpm_enable_vce(adev, false);
314 } else {
315 amdgpu_asic_set_vce_clocks(adev, 0, 0);
Alex Deucher2990a1f2017-12-15 16:18:00 -0500316 amdgpu_device_ip_set_powergating_state(adev, AMD_IP_BLOCK_TYPE_VCE,
317 AMD_PG_STATE_GATE);
318 amdgpu_device_ip_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_VCE,
319 AMD_CG_STATE_GATE);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400320 }
321 } else {
Christian König182830a2016-07-01 17:43:57 +0200322 schedule_delayed_work(&adev->vce.idle_work, VCE_IDLE_TIMEOUT);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400323 }
324}
325
326/**
Christian Königebff4852016-07-20 16:53:36 +0200327 * amdgpu_vce_ring_begin_use - power up VCE
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400328 *
Christian Königebff4852016-07-20 16:53:36 +0200329 * @ring: amdgpu ring
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400330 *
331 * Make sure VCE is powerd up when we want to use it
332 */
Christian Königebff4852016-07-20 16:53:36 +0200333void amdgpu_vce_ring_begin_use(struct amdgpu_ring *ring)
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400334{
Christian Königebff4852016-07-20 16:53:36 +0200335 struct amdgpu_device *adev = ring->adev;
336 bool set_clocks;
Christian König182830a2016-07-01 17:43:57 +0200337
Xiangliang Yud9af2252017-03-07 14:45:25 +0800338 if (amdgpu_sriov_vf(adev))
339 return;
340
Christian Königebff4852016-07-20 16:53:36 +0200341 mutex_lock(&adev->vce.idle_mutex);
342 set_clocks = !cancel_delayed_work_sync(&adev->vce.idle_work);
Christian König182830a2016-07-01 17:43:57 +0200343 if (set_clocks) {
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400344 if (adev->pm.dpm_enabled) {
345 amdgpu_dpm_enable_vce(adev, true);
346 } else {
347 amdgpu_asic_set_vce_clocks(adev, 53300, 40000);
Alex Deucher2990a1f2017-12-15 16:18:00 -0500348 amdgpu_device_ip_set_clockgating_state(adev, AMD_IP_BLOCK_TYPE_VCE,
349 AMD_CG_STATE_UNGATE);
350 amdgpu_device_ip_set_powergating_state(adev, AMD_IP_BLOCK_TYPE_VCE,
351 AMD_PG_STATE_UNGATE);
Rex Zhu28ed5502017-01-25 17:35:14 +0800352
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400353 }
354 }
Christian Königebff4852016-07-20 16:53:36 +0200355 mutex_unlock(&adev->vce.idle_mutex);
356}
357
358/**
359 * amdgpu_vce_ring_end_use - power VCE down
360 *
361 * @ring: amdgpu ring
362 *
363 * Schedule work to power VCE down again
364 */
365void amdgpu_vce_ring_end_use(struct amdgpu_ring *ring)
366{
Monk Liu14a80322018-01-19 20:29:17 +0800367 if (!amdgpu_sriov_vf(ring->adev))
368 schedule_delayed_work(&ring->adev->vce.idle_work, VCE_IDLE_TIMEOUT);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400369}
370
371/**
372 * amdgpu_vce_free_handles - free still open VCE handles
373 *
374 * @adev: amdgpu_device pointer
375 * @filp: drm file pointer
376 *
377 * Close all VCE handles still open by this file pointer
378 */
379void amdgpu_vce_free_handles(struct amdgpu_device *adev, struct drm_file *filp)
380{
381 struct amdgpu_ring *ring = &adev->vce.ring[0];
382 int i, r;
383 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i) {
384 uint32_t handle = atomic_read(&adev->vce.handles[i]);
Christian König182830a2016-07-01 17:43:57 +0200385
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400386 if (!handle || adev->vce.filp[i] != filp)
387 continue;
388
Christian König9f2ade32016-02-03 16:50:56 +0100389 r = amdgpu_vce_get_destroy_msg(ring, handle, false, NULL);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400390 if (r)
391 DRM_ERROR("Error destroying VCE handle (%d)!\n", r);
392
393 adev->vce.filp[i] = NULL;
394 atomic_set(&adev->vce.handles[i], 0);
395 }
396}
397
398/**
399 * amdgpu_vce_get_create_msg - generate a VCE create msg
400 *
401 * @adev: amdgpu_device pointer
402 * @ring: ring we should submit the msg to
403 * @handle: VCE session handle to use
404 * @fence: optional fence to return
405 *
406 * Open up a stream for HW test
407 */
408int amdgpu_vce_get_create_msg(struct amdgpu_ring *ring, uint32_t handle,
Chris Wilsonf54d1862016-10-25 13:00:45 +0100409 struct dma_fence **fence)
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400410{
411 const unsigned ib_size_dw = 1024;
Christian Königd71518b2016-02-01 12:20:25 +0100412 struct amdgpu_job *job;
413 struct amdgpu_ib *ib;
Chris Wilsonf54d1862016-10-25 13:00:45 +0100414 struct dma_fence *f = NULL;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400415 uint64_t dummy;
416 int i, r;
417
Christian Königd71518b2016-02-01 12:20:25 +0100418 r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
419 if (r)
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400420 return r;
Christian Königd71518b2016-02-01 12:20:25 +0100421
422 ib = &job->ibs[0];
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400423
Chunming Zhou81287652015-07-03 14:18:26 +0800424 dummy = ib->gpu_addr + 1024;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400425
426 /* stitch together an VCE create msg */
Chunming Zhou81287652015-07-03 14:18:26 +0800427 ib->length_dw = 0;
428 ib->ptr[ib->length_dw++] = 0x0000000c; /* len */
429 ib->ptr[ib->length_dw++] = 0x00000001; /* session cmd */
430 ib->ptr[ib->length_dw++] = handle;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400431
Leo Liud66f8e42015-11-18 11:57:33 -0500432 if ((ring->adev->vce.fw_version >> 24) >= 52)
433 ib->ptr[ib->length_dw++] = 0x00000040; /* len */
434 else
435 ib->ptr[ib->length_dw++] = 0x00000030; /* len */
Chunming Zhou81287652015-07-03 14:18:26 +0800436 ib->ptr[ib->length_dw++] = 0x01000001; /* create cmd */
437 ib->ptr[ib->length_dw++] = 0x00000000;
438 ib->ptr[ib->length_dw++] = 0x00000042;
439 ib->ptr[ib->length_dw++] = 0x0000000a;
440 ib->ptr[ib->length_dw++] = 0x00000001;
441 ib->ptr[ib->length_dw++] = 0x00000080;
442 ib->ptr[ib->length_dw++] = 0x00000060;
443 ib->ptr[ib->length_dw++] = 0x00000100;
444 ib->ptr[ib->length_dw++] = 0x00000100;
445 ib->ptr[ib->length_dw++] = 0x0000000c;
446 ib->ptr[ib->length_dw++] = 0x00000000;
Leo Liud66f8e42015-11-18 11:57:33 -0500447 if ((ring->adev->vce.fw_version >> 24) >= 52) {
448 ib->ptr[ib->length_dw++] = 0x00000000;
449 ib->ptr[ib->length_dw++] = 0x00000000;
450 ib->ptr[ib->length_dw++] = 0x00000000;
451 ib->ptr[ib->length_dw++] = 0x00000000;
452 }
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400453
Chunming Zhou81287652015-07-03 14:18:26 +0800454 ib->ptr[ib->length_dw++] = 0x00000014; /* len */
455 ib->ptr[ib->length_dw++] = 0x05000005; /* feedback buffer */
456 ib->ptr[ib->length_dw++] = upper_32_bits(dummy);
457 ib->ptr[ib->length_dw++] = dummy;
458 ib->ptr[ib->length_dw++] = 0x00000001;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400459
Chunming Zhou81287652015-07-03 14:18:26 +0800460 for (i = ib->length_dw; i < ib_size_dw; ++i)
461 ib->ptr[i] = 0x0;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400462
Junwei Zhang50ddc752017-01-23 16:30:38 +0800463 r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
Chris Wilsonf54d1862016-10-25 13:00:45 +0100464 job->fence = dma_fence_get(f);
Chunming Zhou81287652015-07-03 14:18:26 +0800465 if (r)
466 goto err;
Christian König9f2ade32016-02-03 16:50:56 +0100467
468 amdgpu_job_free(job);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400469 if (fence)
Chris Wilsonf54d1862016-10-25 13:00:45 +0100470 *fence = dma_fence_get(f);
471 dma_fence_put(f);
Chunming Zhoucadf97b2016-01-15 11:25:00 +0800472 return 0;
Christian Königd71518b2016-02-01 12:20:25 +0100473
Chunming Zhou81287652015-07-03 14:18:26 +0800474err:
Christian Königd71518b2016-02-01 12:20:25 +0100475 amdgpu_job_free(job);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400476 return r;
477}
478
479/**
480 * amdgpu_vce_get_destroy_msg - generate a VCE destroy msg
481 *
482 * @adev: amdgpu_device pointer
483 * @ring: ring we should submit the msg to
484 * @handle: VCE session handle to use
485 * @fence: optional fence to return
486 *
487 * Close up a stream for HW test or if userspace failed to do so
488 */
489int amdgpu_vce_get_destroy_msg(struct amdgpu_ring *ring, uint32_t handle,
Chris Wilsonf54d1862016-10-25 13:00:45 +0100490 bool direct, struct dma_fence **fence)
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400491{
492 const unsigned ib_size_dw = 1024;
Christian Königd71518b2016-02-01 12:20:25 +0100493 struct amdgpu_job *job;
494 struct amdgpu_ib *ib;
Chris Wilsonf54d1862016-10-25 13:00:45 +0100495 struct dma_fence *f = NULL;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400496 int i, r;
497
Christian Königd71518b2016-02-01 12:20:25 +0100498 r = amdgpu_job_alloc_with_ib(ring->adev, ib_size_dw * 4, &job);
499 if (r)
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400500 return r;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400501
Christian Königd71518b2016-02-01 12:20:25 +0100502 ib = &job->ibs[0];
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400503
504 /* stitch together an VCE destroy msg */
Chunming Zhou81287652015-07-03 14:18:26 +0800505 ib->length_dw = 0;
506 ib->ptr[ib->length_dw++] = 0x0000000c; /* len */
507 ib->ptr[ib->length_dw++] = 0x00000001; /* session cmd */
508 ib->ptr[ib->length_dw++] = handle;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400509
Rex Zhu99453a92016-07-21 20:46:55 +0800510 ib->ptr[ib->length_dw++] = 0x00000020; /* len */
511 ib->ptr[ib->length_dw++] = 0x00000002; /* task info */
512 ib->ptr[ib->length_dw++] = 0xffffffff; /* next task info, set to 0xffffffff if no */
513 ib->ptr[ib->length_dw++] = 0x00000001; /* destroy session */
514 ib->ptr[ib->length_dw++] = 0x00000000;
515 ib->ptr[ib->length_dw++] = 0x00000000;
516 ib->ptr[ib->length_dw++] = 0xffffffff; /* feedback is not needed, set to 0xffffffff and firmware will not output feedback */
517 ib->ptr[ib->length_dw++] = 0x00000000;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400518
Chunming Zhou81287652015-07-03 14:18:26 +0800519 ib->ptr[ib->length_dw++] = 0x00000008; /* len */
520 ib->ptr[ib->length_dw++] = 0x02000001; /* destroy cmd */
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400521
Chunming Zhou81287652015-07-03 14:18:26 +0800522 for (i = ib->length_dw; i < ib_size_dw; ++i)
523 ib->ptr[i] = 0x0;
Christian König9f2ade32016-02-03 16:50:56 +0100524
525 if (direct) {
Junwei Zhang50ddc752017-01-23 16:30:38 +0800526 r = amdgpu_ib_schedule(ring, 1, ib, NULL, &f);
Chris Wilsonf54d1862016-10-25 13:00:45 +0100527 job->fence = dma_fence_get(f);
Christian König9f2ade32016-02-03 16:50:56 +0100528 if (r)
529 goto err;
530
531 amdgpu_job_free(job);
532 } else {
Christian Königc5949892016-02-10 17:43:00 +0100533 r = amdgpu_job_submit(job, ring, &ring->adev->vce.entity,
Christian König9f2ade32016-02-03 16:50:56 +0100534 AMDGPU_FENCE_OWNER_UNDEFINED, &f);
535 if (r)
536 goto err;
537 }
538
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400539 if (fence)
Chris Wilsonf54d1862016-10-25 13:00:45 +0100540 *fence = dma_fence_get(f);
541 dma_fence_put(f);
Chunming Zhoucadf97b2016-01-15 11:25:00 +0800542 return 0;
Christian Königd71518b2016-02-01 12:20:25 +0100543
Chunming Zhou81287652015-07-03 14:18:26 +0800544err:
Christian Königd71518b2016-02-01 12:20:25 +0100545 amdgpu_job_free(job);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400546 return r;
547}
548
549/**
Christian König23594312017-11-17 11:09:43 +0100550 * amdgpu_vce_cs_validate_bo - make sure not to cross 4GB boundary
551 *
552 * @p: parser context
553 * @lo: address of lower dword
554 * @hi: address of higher dword
555 * @size: minimum size
556 * @index: bs/fb index
557 *
558 * Make sure that no BO cross a 4GB boundary.
559 */
560static int amdgpu_vce_validate_bo(struct amdgpu_cs_parser *p, uint32_t ib_idx,
561 int lo, int hi, unsigned size, int32_t index)
562{
563 int64_t offset = ((uint64_t)size) * ((int64_t)index);
Christian König19be5572017-04-12 14:24:39 +0200564 struct ttm_operation_ctx ctx = { false, false };
Christian König23594312017-11-17 11:09:43 +0100565 struct amdgpu_bo_va_mapping *mapping;
566 unsigned i, fpfn, lpfn;
567 struct amdgpu_bo *bo;
568 uint64_t addr;
569 int r;
570
571 addr = ((uint64_t)amdgpu_get_ib_value(p, ib_idx, lo)) |
572 ((uint64_t)amdgpu_get_ib_value(p, ib_idx, hi)) << 32;
573 if (index >= 0) {
574 addr += offset;
575 fpfn = PAGE_ALIGN(offset) >> PAGE_SHIFT;
576 lpfn = 0x100000000ULL >> PAGE_SHIFT;
577 } else {
578 fpfn = 0;
579 lpfn = (0x100000000ULL - PAGE_ALIGN(offset)) >> PAGE_SHIFT;
580 }
581
582 r = amdgpu_cs_find_mapping(p, addr, &bo, &mapping);
583 if (r) {
584 DRM_ERROR("Can't find BO for addr 0x%010Lx %d %d %d %d\n",
585 addr, lo, hi, size, index);
586 return r;
587 }
588
589 for (i = 0; i < bo->placement.num_placement; ++i) {
590 bo->placements[i].fpfn = max(bo->placements[i].fpfn, fpfn);
Christian König4c63abb2018-01-16 11:00:12 +0100591 bo->placements[i].lpfn = bo->placements[i].lpfn ?
592 min(bo->placements[i].lpfn, lpfn) : lpfn;
Christian König23594312017-11-17 11:09:43 +0100593 }
Christian König19be5572017-04-12 14:24:39 +0200594 return ttm_bo_validate(&bo->tbo, &bo->placement, &ctx);
Christian König23594312017-11-17 11:09:43 +0100595}
596
597
598/**
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400599 * amdgpu_vce_cs_reloc - command submission relocation
600 *
601 * @p: parser context
602 * @lo: address of lower dword
603 * @hi: address of higher dword
Christian Königf1689ec2015-06-11 20:56:18 +0200604 * @size: minimum size
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400605 *
606 * Patch relocation inside command stream with real buffer address
607 */
Christian Königf1689ec2015-06-11 20:56:18 +0200608static int amdgpu_vce_cs_reloc(struct amdgpu_cs_parser *p, uint32_t ib_idx,
Christian Königdc783302015-06-12 14:16:20 +0200609 int lo, int hi, unsigned size, uint32_t index)
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400610{
611 struct amdgpu_bo_va_mapping *mapping;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400612 struct amdgpu_bo *bo;
613 uint64_t addr;
Christian König9cca0b82017-09-06 16:15:28 +0200614 int r;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400615
Christian Königdc783302015-06-12 14:16:20 +0200616 if (index == 0xffffffff)
617 index = 0;
618
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400619 addr = ((uint64_t)amdgpu_get_ib_value(p, ib_idx, lo)) |
620 ((uint64_t)amdgpu_get_ib_value(p, ib_idx, hi)) << 32;
Christian Königdc783302015-06-12 14:16:20 +0200621 addr += ((uint64_t)size) * ((uint64_t)index);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400622
Christian König9cca0b82017-09-06 16:15:28 +0200623 r = amdgpu_cs_find_mapping(p, addr, &bo, &mapping);
624 if (r) {
Christian Königdc783302015-06-12 14:16:20 +0200625 DRM_ERROR("Can't find BO for addr 0x%010Lx %d %d %d %d\n",
626 addr, lo, hi, size, index);
Christian König9cca0b82017-09-06 16:15:28 +0200627 return r;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400628 }
629
Christian Königf1689ec2015-06-11 20:56:18 +0200630 if ((addr + (uint64_t)size) >
Christian Königa9f87f62017-03-30 14:03:59 +0200631 (mapping->last + 1) * AMDGPU_GPU_PAGE_SIZE) {
Christian Königf1689ec2015-06-11 20:56:18 +0200632 DRM_ERROR("BO to small for addr 0x%010Lx %d %d\n",
633 addr, lo, hi);
634 return -EINVAL;
635 }
636
Christian Königa9f87f62017-03-30 14:03:59 +0200637 addr -= mapping->start * AMDGPU_GPU_PAGE_SIZE;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400638 addr += amdgpu_bo_gpu_offset(bo);
Christian Königdc783302015-06-12 14:16:20 +0200639 addr -= ((uint64_t)size) * ((uint64_t)index);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400640
Christian König7270f832016-01-31 11:00:41 +0100641 amdgpu_set_ib_value(p, ib_idx, lo, lower_32_bits(addr));
642 amdgpu_set_ib_value(p, ib_idx, hi, upper_32_bits(addr));
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400643
644 return 0;
645}
646
647/**
Christian Königf1689ec2015-06-11 20:56:18 +0200648 * amdgpu_vce_validate_handle - validate stream handle
649 *
650 * @p: parser context
651 * @handle: handle to validate
Christian König2f4b9362015-06-11 21:33:55 +0200652 * @allocated: allocated a new handle?
Christian Königf1689ec2015-06-11 20:56:18 +0200653 *
654 * Validates the handle and return the found session index or -EINVAL
655 * we we don't have another free session index.
656 */
657static int amdgpu_vce_validate_handle(struct amdgpu_cs_parser *p,
Christian Könige5223212016-07-01 22:19:25 +0200658 uint32_t handle, uint32_t *allocated)
Christian Königf1689ec2015-06-11 20:56:18 +0200659{
660 unsigned i;
661
662 /* validate the handle */
663 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i) {
Christian König2f4b9362015-06-11 21:33:55 +0200664 if (atomic_read(&p->adev->vce.handles[i]) == handle) {
665 if (p->adev->vce.filp[i] != p->filp) {
666 DRM_ERROR("VCE handle collision detected!\n");
667 return -EINVAL;
668 }
Christian Königf1689ec2015-06-11 20:56:18 +0200669 return i;
Christian König2f4b9362015-06-11 21:33:55 +0200670 }
Christian Königf1689ec2015-06-11 20:56:18 +0200671 }
672
673 /* handle not found try to alloc a new one */
674 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i) {
675 if (!atomic_cmpxchg(&p->adev->vce.handles[i], 0, handle)) {
676 p->adev->vce.filp[i] = p->filp;
677 p->adev->vce.img_size[i] = 0;
Christian Könige5223212016-07-01 22:19:25 +0200678 *allocated |= 1 << i;
Christian Königf1689ec2015-06-11 20:56:18 +0200679 return i;
680 }
681 }
682
683 DRM_ERROR("No more free VCE handles!\n");
684 return -EINVAL;
685}
686
687/**
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400688 * amdgpu_vce_cs_parse - parse and validate the command stream
689 *
690 * @p: parser context
691 *
692 */
693int amdgpu_vce_ring_parse_cs(struct amdgpu_cs_parser *p, uint32_t ib_idx)
694{
Christian König50838c82016-02-03 13:44:52 +0100695 struct amdgpu_ib *ib = &p->job->ibs[ib_idx];
Christian Königdc783302015-06-12 14:16:20 +0200696 unsigned fb_idx = 0, bs_idx = 0;
Christian Königf1689ec2015-06-11 20:56:18 +0200697 int session_idx = -1;
Christian Könige5223212016-07-01 22:19:25 +0200698 uint32_t destroyed = 0;
699 uint32_t created = 0;
700 uint32_t allocated = 0;
Christian Königf1689ec2015-06-11 20:56:18 +0200701 uint32_t tmp, handle = 0;
702 uint32_t *size = &tmp;
Christian König23594312017-11-17 11:09:43 +0100703 unsigned idx;
704 int i, r = 0;
Christian Königc855e252016-09-05 17:00:57 +0200705
Christian König45088ef2016-10-05 16:49:19 +0200706 p->job->vm = NULL;
707 ib->gpu_addr = amdgpu_sa_bo_gpu_addr(ib->sa_bo);
708
Christian König23594312017-11-17 11:09:43 +0100709 for (idx = 0; idx < ib->length_dw;) {
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400710 uint32_t len = amdgpu_get_ib_value(p, ib_idx, idx);
711 uint32_t cmd = amdgpu_get_ib_value(p, ib_idx, idx + 1);
712
713 if ((len < 8) || (len & 3)) {
714 DRM_ERROR("invalid VCE command length (%d)!\n", len);
Christian König2f4b9362015-06-11 21:33:55 +0200715 r = -EINVAL;
716 goto out;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400717 }
718
719 switch (cmd) {
Christian König23594312017-11-17 11:09:43 +0100720 case 0x00000002: /* task info */
721 fb_idx = amdgpu_get_ib_value(p, ib_idx, idx + 6);
722 bs_idx = amdgpu_get_ib_value(p, ib_idx, idx + 7);
723 break;
724
725 case 0x03000001: /* encode */
726 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 10,
727 idx + 9, 0, 0);
728 if (r)
729 goto out;
730
731 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 12,
732 idx + 11, 0, 0);
733 if (r)
734 goto out;
735 break;
736
737 case 0x05000001: /* context buffer */
738 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 3,
739 idx + 2, 0, 0);
740 if (r)
741 goto out;
742 break;
743
744 case 0x05000004: /* video bitstream buffer */
745 tmp = amdgpu_get_ib_value(p, ib_idx, idx + 4);
746 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 3, idx + 2,
747 tmp, bs_idx);
748 if (r)
749 goto out;
750 break;
751
752 case 0x05000005: /* feedback buffer */
753 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 3, idx + 2,
754 4096, fb_idx);
755 if (r)
756 goto out;
757 break;
James Zhu1eb15472018-04-03 10:41:32 -0400758
759 case 0x0500000d: /* MV buffer */
760 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 3,
761 idx + 2, 0, 0);
762 if (r)
763 goto out;
764
765 r = amdgpu_vce_validate_bo(p, ib_idx, idx + 8,
766 idx + 7, 0, 0);
767 if (r)
768 goto out;
769 break;
Christian König23594312017-11-17 11:09:43 +0100770 }
771
772 idx += len / 4;
773 }
774
775 for (idx = 0; idx < ib->length_dw;) {
776 uint32_t len = amdgpu_get_ib_value(p, ib_idx, idx);
777 uint32_t cmd = amdgpu_get_ib_value(p, ib_idx, idx + 1);
778
779 switch (cmd) {
Christian König182830a2016-07-01 17:43:57 +0200780 case 0x00000001: /* session */
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400781 handle = amdgpu_get_ib_value(p, ib_idx, idx + 2);
Christian König2f4b9362015-06-11 21:33:55 +0200782 session_idx = amdgpu_vce_validate_handle(p, handle,
783 &allocated);
Christian Könige5223212016-07-01 22:19:25 +0200784 if (session_idx < 0) {
785 r = session_idx;
786 goto out;
787 }
Christian Königf1689ec2015-06-11 20:56:18 +0200788 size = &p->adev->vce.img_size[session_idx];
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400789 break;
790
Christian König182830a2016-07-01 17:43:57 +0200791 case 0x00000002: /* task info */
Christian Königdc783302015-06-12 14:16:20 +0200792 fb_idx = amdgpu_get_ib_value(p, ib_idx, idx + 6);
793 bs_idx = amdgpu_get_ib_value(p, ib_idx, idx + 7);
Christian Königf1689ec2015-06-11 20:56:18 +0200794 break;
795
Christian König182830a2016-07-01 17:43:57 +0200796 case 0x01000001: /* create */
Christian Könige5223212016-07-01 22:19:25 +0200797 created |= 1 << session_idx;
798 if (destroyed & (1 << session_idx)) {
799 destroyed &= ~(1 << session_idx);
800 allocated |= 1 << session_idx;
801
802 } else if (!(allocated & (1 << session_idx))) {
Christian König2f4b9362015-06-11 21:33:55 +0200803 DRM_ERROR("Handle already in use!\n");
804 r = -EINVAL;
805 goto out;
806 }
807
Christian Königf1689ec2015-06-11 20:56:18 +0200808 *size = amdgpu_get_ib_value(p, ib_idx, idx + 8) *
809 amdgpu_get_ib_value(p, ib_idx, idx + 10) *
810 8 * 3 / 2;
811 break;
812
Christian König182830a2016-07-01 17:43:57 +0200813 case 0x04000001: /* config extension */
814 case 0x04000002: /* pic control */
815 case 0x04000005: /* rate control */
816 case 0x04000007: /* motion estimation */
817 case 0x04000008: /* rdo */
818 case 0x04000009: /* vui */
819 case 0x05000002: /* auxiliary buffer */
Alex Deucher4f827782016-09-21 14:57:06 -0400820 case 0x05000009: /* clock table */
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400821 break;
822
Alex Deucher5eeda8a2016-09-23 17:22:42 -0400823 case 0x0500000c: /* hw config */
824 switch (p->adev->asic_type) {
825#ifdef CONFIG_DRM_AMDGPU_CIK
826 case CHIP_KAVERI:
827 case CHIP_MULLINS:
828#endif
829 case CHIP_CARRIZO:
830 break;
831 default:
832 r = -EINVAL;
833 goto out;
834 }
835 break;
836
Christian König182830a2016-07-01 17:43:57 +0200837 case 0x03000001: /* encode */
Christian Königf1689ec2015-06-11 20:56:18 +0200838 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 10, idx + 9,
Christian Königdc783302015-06-12 14:16:20 +0200839 *size, 0);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400840 if (r)
Christian König2f4b9362015-06-11 21:33:55 +0200841 goto out;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400842
Christian Königf1689ec2015-06-11 20:56:18 +0200843 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 12, idx + 11,
Christian Königdc783302015-06-12 14:16:20 +0200844 *size / 3, 0);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400845 if (r)
Christian König2f4b9362015-06-11 21:33:55 +0200846 goto out;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400847 break;
848
Christian König182830a2016-07-01 17:43:57 +0200849 case 0x02000001: /* destroy */
Christian Könige5223212016-07-01 22:19:25 +0200850 destroyed |= 1 << session_idx;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400851 break;
852
Christian König182830a2016-07-01 17:43:57 +0200853 case 0x05000001: /* context buffer */
Christian Königf1689ec2015-06-11 20:56:18 +0200854 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 3, idx + 2,
Christian Königdc783302015-06-12 14:16:20 +0200855 *size * 2, 0);
Christian Königf1689ec2015-06-11 20:56:18 +0200856 if (r)
Christian König2f4b9362015-06-11 21:33:55 +0200857 goto out;
Christian Königf1689ec2015-06-11 20:56:18 +0200858 break;
859
Christian König182830a2016-07-01 17:43:57 +0200860 case 0x05000004: /* video bitstream buffer */
Christian Königf1689ec2015-06-11 20:56:18 +0200861 tmp = amdgpu_get_ib_value(p, ib_idx, idx + 4);
862 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 3, idx + 2,
Christian Königdc783302015-06-12 14:16:20 +0200863 tmp, bs_idx);
Christian Königf1689ec2015-06-11 20:56:18 +0200864 if (r)
Christian König2f4b9362015-06-11 21:33:55 +0200865 goto out;
Christian Königf1689ec2015-06-11 20:56:18 +0200866 break;
867
Christian König182830a2016-07-01 17:43:57 +0200868 case 0x05000005: /* feedback buffer */
Christian Königf1689ec2015-06-11 20:56:18 +0200869 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 3, idx + 2,
Christian Königdc783302015-06-12 14:16:20 +0200870 4096, fb_idx);
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400871 if (r)
Christian König2f4b9362015-06-11 21:33:55 +0200872 goto out;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400873 break;
874
James Zhu1eb15472018-04-03 10:41:32 -0400875 case 0x0500000d: /* MV buffer */
876 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 3,
877 idx + 2, *size, 0);
878 if (r)
879 goto out;
880
881 r = amdgpu_vce_cs_reloc(p, ib_idx, idx + 8,
882 idx + 7, *size / 12, 0);
883 if (r)
884 goto out;
885 break;
886
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400887 default:
888 DRM_ERROR("invalid VCE command (0x%x)!\n", cmd);
Christian König2f4b9362015-06-11 21:33:55 +0200889 r = -EINVAL;
890 goto out;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400891 }
892
Christian Königf1689ec2015-06-11 20:56:18 +0200893 if (session_idx == -1) {
894 DRM_ERROR("no session command at start of IB\n");
Christian König2f4b9362015-06-11 21:33:55 +0200895 r = -EINVAL;
896 goto out;
Christian Königf1689ec2015-06-11 20:56:18 +0200897 }
898
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400899 idx += len / 4;
900 }
901
Christian Könige5223212016-07-01 22:19:25 +0200902 if (allocated & ~created) {
Christian König2f4b9362015-06-11 21:33:55 +0200903 DRM_ERROR("New session without create command!\n");
904 r = -ENOENT;
905 }
906
907out:
Christian Könige5223212016-07-01 22:19:25 +0200908 if (!r) {
909 /* No error, free all destroyed handle slots */
910 tmp = destroyed;
911 } else {
912 /* Error during parsing, free all allocated handle slots */
913 tmp = allocated;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400914 }
915
Christian Könige5223212016-07-01 22:19:25 +0200916 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i)
917 if (tmp & (1 << i))
918 atomic_set(&p->adev->vce.handles[i], 0);
919
Christian König2f4b9362015-06-11 21:33:55 +0200920 return r;
Alex Deucherd38ceaf2015-04-20 16:55:21 -0400921}
922
923/**
Christian König98614702016-10-10 15:23:32 +0200924 * amdgpu_vce_cs_parse_vm - parse the command stream in VM mode
925 *
926 * @p: parser context
927 *
928 */
929int amdgpu_vce_ring_parse_cs_vm(struct amdgpu_cs_parser *p, uint32_t ib_idx)
930{
931 struct amdgpu_ib *ib = &p->job->ibs[ib_idx];
932 int session_idx = -1;
933 uint32_t destroyed = 0;
934 uint32_t created = 0;
935 uint32_t allocated = 0;
936 uint32_t tmp, handle = 0;
937 int i, r = 0, idx = 0;
938
939 while (idx < ib->length_dw) {
940 uint32_t len = amdgpu_get_ib_value(p, ib_idx, idx);
941 uint32_t cmd = amdgpu_get_ib_value(p, ib_idx, idx + 1);
942
943 if ((len < 8) || (len & 3)) {
944 DRM_ERROR("invalid VCE command length (%d)!\n", len);
945 r = -EINVAL;
946 goto out;
947 }
948
949 switch (cmd) {
950 case 0x00000001: /* session */
951 handle = amdgpu_get_ib_value(p, ib_idx, idx + 2);
952 session_idx = amdgpu_vce_validate_handle(p, handle,
953 &allocated);
954 if (session_idx < 0) {
955 r = session_idx;
956 goto out;
957 }
958 break;
959
960 case 0x01000001: /* create */
961 created |= 1 << session_idx;
962 if (destroyed & (1 << session_idx)) {
963 destroyed &= ~(1 << session_idx);
964 allocated |= 1 << session_idx;
965
966 } else if (!(allocated & (1 << session_idx))) {
967 DRM_ERROR("Handle already in use!\n");
968 r = -EINVAL;
969 goto out;
970 }
971
972 break;
973
974 case 0x02000001: /* destroy */
975 destroyed |= 1 << session_idx;
976 break;
977
978 default:
979 break;
980 }
981
982 if (session_idx == -1) {
983 DRM_ERROR("no session command at start of IB\n");
984 r = -EINVAL;
985 goto out;
986 }
987
988 idx += len / 4;
989 }
990
991 if (allocated & ~created) {
992 DRM_ERROR("New session without create command!\n");
993 r = -ENOENT;
994 }
995
996out:
997 if (!r) {
998 /* No error, free all destroyed handle slots */
999 tmp = destroyed;
1000 amdgpu_ib_free(p->adev, ib, NULL);
1001 } else {
1002 /* Error during parsing, free all allocated handle slots */
1003 tmp = allocated;
1004 }
1005
1006 for (i = 0; i < AMDGPU_MAX_VCE_HANDLES; ++i)
1007 if (tmp & (1 << i))
1008 atomic_set(&p->adev->vce.handles[i], 0);
1009
1010 return r;
1011}
1012
1013/**
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001014 * amdgpu_vce_ring_emit_ib - execute indirect buffer
1015 *
1016 * @ring: engine to use
1017 * @ib: the IB to execute
1018 *
1019 */
Christian Königd88bf582016-05-06 17:50:03 +02001020void amdgpu_vce_ring_emit_ib(struct amdgpu_ring *ring, struct amdgpu_ib *ib,
Christian Königc4f46f22017-12-18 17:08:25 +01001021 unsigned vmid, bool ctx_switch)
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001022{
1023 amdgpu_ring_write(ring, VCE_CMD_IB);
1024 amdgpu_ring_write(ring, lower_32_bits(ib->gpu_addr));
1025 amdgpu_ring_write(ring, upper_32_bits(ib->gpu_addr));
1026 amdgpu_ring_write(ring, ib->length_dw);
1027}
1028
1029/**
1030 * amdgpu_vce_ring_emit_fence - add a fence command to the ring
1031 *
1032 * @ring: engine to use
1033 * @fence: the fence
1034 *
1035 */
1036void amdgpu_vce_ring_emit_fence(struct amdgpu_ring *ring, u64 addr, u64 seq,
Chunming Zhou890ee232015-06-01 14:35:03 +08001037 unsigned flags)
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001038{
Chunming Zhou890ee232015-06-01 14:35:03 +08001039 WARN_ON(flags & AMDGPU_FENCE_FLAG_64BIT);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001040
1041 amdgpu_ring_write(ring, VCE_CMD_FENCE);
1042 amdgpu_ring_write(ring, addr);
1043 amdgpu_ring_write(ring, upper_32_bits(addr));
1044 amdgpu_ring_write(ring, seq);
1045 amdgpu_ring_write(ring, VCE_CMD_TRAP);
1046 amdgpu_ring_write(ring, VCE_CMD_END);
1047}
1048
1049/**
1050 * amdgpu_vce_ring_test_ring - test if VCE ring is working
1051 *
1052 * @ring: the engine to test on
1053 *
1054 */
1055int amdgpu_vce_ring_test_ring(struct amdgpu_ring *ring)
1056{
1057 struct amdgpu_device *adev = ring->adev;
1058 uint32_t rptr = amdgpu_ring_get_rptr(ring);
1059 unsigned i;
Xiangliang Yua2f537e2017-04-06 14:43:48 +08001060 int r, timeout = adev->usec_timeout;
1061
Frank Mina1b90222017-06-12 11:02:09 +08001062 /* skip ring test for sriov*/
Xiangliang Yua2f537e2017-04-06 14:43:48 +08001063 if (amdgpu_sriov_vf(adev))
Frank Mina1b90222017-06-12 11:02:09 +08001064 return 0;
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001065
Christian Königa27de352016-01-21 11:28:53 +01001066 r = amdgpu_ring_alloc(ring, 16);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001067 if (r) {
1068 DRM_ERROR("amdgpu: vce failed to lock ring %d (%d).\n",
1069 ring->idx, r);
1070 return r;
1071 }
1072 amdgpu_ring_write(ring, VCE_CMD_END);
Christian Königa27de352016-01-21 11:28:53 +01001073 amdgpu_ring_commit(ring);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001074
Xiangliang Yua2f537e2017-04-06 14:43:48 +08001075 for (i = 0; i < timeout; i++) {
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001076 if (amdgpu_ring_get_rptr(ring) != rptr)
1077 break;
1078 DRM_UDELAY(1);
1079 }
1080
Xiangliang Yua2f537e2017-04-06 14:43:48 +08001081 if (i < timeout) {
pding9953b722017-10-26 09:30:38 +08001082 DRM_DEBUG("ring test on %d succeeded in %d usecs\n",
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001083 ring->idx, i);
1084 } else {
1085 DRM_ERROR("amdgpu: ring %d test failed\n",
1086 ring->idx);
1087 r = -ETIMEDOUT;
1088 }
1089
1090 return r;
1091}
1092
1093/**
1094 * amdgpu_vce_ring_test_ib - test if VCE IBs are working
1095 *
1096 * @ring: the engine to test on
1097 *
1098 */
Christian Königbbec97a2016-07-05 21:07:17 +02001099int amdgpu_vce_ring_test_ib(struct amdgpu_ring *ring, long timeout)
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001100{
Chris Wilsonf54d1862016-10-25 13:00:45 +01001101 struct dma_fence *fence = NULL;
Christian Königbbec97a2016-07-05 21:07:17 +02001102 long r;
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001103
Alex Deucher6f0359f2016-08-24 17:15:33 -04001104 /* skip vce ring1/2 ib test for now, since it's not reliable */
1105 if (ring != &ring->adev->vce.ring[0])
Leo Liu898e50d2015-09-04 15:08:55 -04001106 return 0;
1107
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001108 r = amdgpu_vce_get_create_msg(ring, 1, NULL);
1109 if (r) {
Christian Königbbec97a2016-07-05 21:07:17 +02001110 DRM_ERROR("amdgpu: failed to get create msg (%ld).\n", r);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001111 goto error;
1112 }
1113
Christian König9f2ade32016-02-03 16:50:56 +01001114 r = amdgpu_vce_get_destroy_msg(ring, 1, true, &fence);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001115 if (r) {
Christian Königbbec97a2016-07-05 21:07:17 +02001116 DRM_ERROR("amdgpu: failed to get destroy ib (%ld).\n", r);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001117 goto error;
1118 }
1119
Chris Wilsonf54d1862016-10-25 13:00:45 +01001120 r = dma_fence_wait_timeout(fence, false, timeout);
Christian Königbbec97a2016-07-05 21:07:17 +02001121 if (r == 0) {
1122 DRM_ERROR("amdgpu: IB test timed out.\n");
1123 r = -ETIMEDOUT;
1124 } else if (r < 0) {
1125 DRM_ERROR("amdgpu: fence wait failed (%ld).\n", r);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001126 } else {
pding9953b722017-10-26 09:30:38 +08001127 DRM_DEBUG("ib test on ring %d succeeded\n", ring->idx);
Christian Königbbec97a2016-07-05 21:07:17 +02001128 r = 0;
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001129 }
1130error:
Chris Wilsonf54d1862016-10-25 13:00:45 +01001131 dma_fence_put(fence);
Alex Deucherd38ceaf2015-04-20 16:55:21 -04001132 return r;
1133}