/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */
#include <linux/kthread.h>
#include <linux/wait.h>
#include <linux/sched.h>
#include <drm/drmP.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"

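/*
 * Scheduler timeout callback: the job has been running longer than the
 * ring's timeout limit.  Log the last signaled and last emitted fence
 * sequence numbers for the ring, then trigger GPU recovery.
 */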
static void amdgpu_job_timedout(struct drm_sched_job *s_job)
{
	struct amdgpu_job *job = container_of(s_job, struct amdgpu_job, base);

	DRM_ERROR("ring %s timeout, last signaled seq=%u, last emitted seq=%u\n",
		  job->base.sched->name,
		  atomic_read(&job->ring->fence_drv.last_seq),
		  job->ring->fence_drv.sync_seq);

	amdgpu_device_gpu_recover(job->adev, job, false);
}

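/*
 * Allocate a job and its IB array in a single allocation; the IBs are
 * placed directly behind the struct amdgpu_job.  The sync objects are
 * initialized here, and the current VRAM-lost counter is snapshotted so
 * the job can be skipped later if VRAM contents are lost before it runs.
 */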
int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
		     struct amdgpu_job **job, struct amdgpu_vm *vm)
{
	size_t size = sizeof(struct amdgpu_job);

	if (num_ibs == 0)
		return -EINVAL;

	size += sizeof(struct amdgpu_ib) * num_ibs;

	*job = kzalloc(size, GFP_KERNEL);
	if (!*job)
		return -ENOMEM;

	(*job)->adev = adev;
	(*job)->vm = vm;
	(*job)->ibs = (void *)&(*job)[1];
	(*job)->num_ibs = num_ibs;

	amdgpu_sync_create(&(*job)->sync);
	amdgpu_sync_create(&(*job)->sched_sync);
	(*job)->vram_lost_counter = atomic_read(&adev->vram_lost_counter);

	return 0;
}

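/*
 * Convenience wrapper for kernel-internal submissions: allocate a job
 * carrying a single IB of the given size, without a VM.  If the IB
 * allocation fails, the job is freed again before returning.
 */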
int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
			     struct amdgpu_job **job)
{
	int r;

	r = amdgpu_job_alloc(adev, 1, job, NULL);
	if (r)
		return r;

	r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]);
	if (r)
		kfree(*job);
	else
		(*job)->vm_pd_addr = adev->gart.table_addr;

	return r;
}

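/*
 * Free the job's IBs.  They are freed against the scheduler's
 * "finished" fence when one exists, so the IB memory cannot be reused
 * before the hardware has actually finished with it.
 */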
void amdgpu_job_free_resources(struct amdgpu_job *job)
{
	struct dma_fence *f;
	unsigned i;

	/* use sched fence if available */
	f = job->base.s_fence ? &job->base.s_fence->finished : job->fence;

	for (i = 0; i < job->num_ibs; ++i)
		amdgpu_ib_free(job->adev, &job->ibs[i], f);
}

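/*
 * Scheduler free callback, called once the scheduler is completely done
 * with the job: drop the ring priority reference, the hardware fence
 * and the sync objects, then free the job itself.
 */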
static void amdgpu_job_free_cb(struct drm_sched_job *s_job)
{
	struct amdgpu_job *job = container_of(s_job, struct amdgpu_job, base);

	amdgpu_ring_priority_put(job->ring, s_job->s_priority);
	dma_fence_put(job->fence);
	amdgpu_sync_free(&job->sync);
	amdgpu_sync_free(&job->sched_sync);
	kfree(job);
}

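/*
 * Free a job that was never pushed to the scheduler, e.g. on an error
 * path before submission.
 */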
void amdgpu_job_free(struct amdgpu_job *job)
{
	amdgpu_job_free_resources(job);

	dma_fence_put(job->fence);
	amdgpu_sync_free(&job->sync);
	amdgpu_sync_free(&job->sched_sync);
	kfree(job);
}

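/*
 * Hand the job over to the scheduler.  After drm_sched_entity_push_job()
 * the scheduler owns the job and may run it at any time, so the caller
 * only receives a reference to the finished fence and must not touch
 * the job afterwards.
 */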
int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring,
		      struct drm_sched_entity *entity, void *owner,
		      struct dma_fence **f)
{
	int r;

	job->ring = ring;

	if (!f)
		return -EINVAL;

	r = drm_sched_job_init(&job->base, &ring->sched, entity, owner);
	if (r)
		return r;

	job->owner = owner;
	job->fence_ctx = entity->fence_context;
	*f = dma_fence_get(&job->base.s_fence->finished);
	amdgpu_job_free_resources(job);
	amdgpu_ring_priority_get(job->ring, job->base.s_priority);
	drm_sched_entity_push_job(&job->base, entity);

	return 0;
}

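/*
 * Scheduler dependency callback: return the next fence the job still
 * has to wait for, or NULL once it is ready to run.  An explicitly
 * synced fence that the scheduler would otherwise optimize away is
 * recorded in sched_sync so a pipeline sync can still be emitted for
 * it.  When all other dependencies are resolved, a VM ID is grabbed;
 * that may add further fences to the sync object, which are returned
 * first.
 */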
static struct dma_fence *amdgpu_job_dependency(struct drm_sched_job *sched_job,
					       struct drm_sched_entity *s_entity)
{
	struct amdgpu_job *job = to_amdgpu_job(sched_job);
	struct amdgpu_vm *vm = job->vm;
	bool explicit = false;
	int r;
	struct dma_fence *fence = amdgpu_sync_get_fence(&job->sync, &explicit);

	if (fence && explicit) {
		if (drm_sched_dependency_optimized(fence, s_entity)) {
			r = amdgpu_sync_fence(job->adev, &job->sched_sync, fence, false);
			if (r)
				DRM_ERROR("Error adding fence to sync (%d)\n", r);
		}
	}

	while (fence == NULL && vm && !job->vmid) {
		struct amdgpu_ring *ring = job->ring;

		r = amdgpu_vmid_grab(vm, ring, &job->sync,
				     &job->base.s_fence->finished,
				     job);
		if (r)
			DRM_ERROR("Error getting VM ID (%d)\n", r);

		fence = amdgpu_sync_get_fence(&job->sync, NULL);
	}

	return fence;
}

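/*
 * Scheduler run callback: all dependencies have signaled, so submit the
 * job's IBs to the ring.  If VRAM contents were lost since the job was
 * allocated, -ECANCELED is set on the finished fence and the IBs are
 * skipped instead of being scheduled.
 */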
static struct dma_fence *amdgpu_job_run(struct drm_sched_job *sched_job)
{
	struct dma_fence *fence = NULL, *finished;
	struct amdgpu_device *adev;
	struct amdgpu_job *job;
	int r;

	if (!sched_job) {
		DRM_ERROR("job is null\n");
		return NULL;
	}
	job = to_amdgpu_job(sched_job);
	finished = &job->base.s_fence->finished;
	adev = job->adev;

	BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL));

	trace_amdgpu_sched_run_job(job);

	if (job->vram_lost_counter != atomic_read(&adev->vram_lost_counter))
		dma_fence_set_error(finished, -ECANCELED); /* skip IB as well if VRAM lost */

	if (finished->error < 0) {
		DRM_INFO("Skip scheduling IBs!\n");
	} else {
		r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs, job,
				       &fence);
		if (r)
			DRM_ERROR("Error scheduling IBs (%d)\n", r);
	}
	/* if gpu reset, hw fence will be replaced here */
	dma_fence_put(job->fence);
	job->fence = dma_fence_get(fence);

	amdgpu_job_free_resources(job);
	return fence;
}

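/* Entry points used by the GPU scheduler to drive amdgpu jobs. */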
const struct drm_sched_backend_ops amdgpu_sched_ops = {
	.dependency = amdgpu_job_dependency,
	.run_job = amdgpu_job_run,
	.timedout_job = amdgpu_job_timedout,
	.free_job = amdgpu_job_free_cb
};