blob: 391e2f7c03aacdfae679057204e02e10e756cb8a [file] [log] [blame]
/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 *
 */
24#include <linux/kthread.h>
25#include <linux/wait.h>
26#include <linux/sched.h>
27#include <drm/drmP.h>
28#include "amdgpu.h"
Chunming Zhou7034dec2015-11-11 14:56:00 +080029#include "amdgpu_trace.h"
Chunming Zhouc1b69ed2015-07-21 13:45:14 +080030
Lucas Stach1b1f42d2017-12-06 17:49:39 +010031static void amdgpu_job_timedout(struct drm_sched_job *s_job)
Monk Liu0de24792016-03-04 18:51:02 +080032{
Christian König3320b8d2018-07-13 15:08:44 +020033 struct amdgpu_ring *ring = to_amdgpu_ring(s_job->sched);
34 struct amdgpu_job *job = to_amdgpu_job(s_job);
Christian König0e51a772016-05-18 14:19:32 +020035
Christian Königf024e882018-07-13 14:01:08 +020036 DRM_ERROR("ring %s timeout, signaled seq=%u, emitted seq=%u\n",
Christian König3320b8d2018-07-13 15:08:44 +020037 job->base.sched->name, atomic_read(&ring->fence_drv.last_seq),
38 ring->fence_drv.sync_seq);
Monk Liu4fbf87e22017-05-05 15:09:42 +080039
Christian Königa1917b72018-07-13 17:15:54 +020040 amdgpu_device_gpu_recover(ring->adev, job, false);
Monk Liu0de24792016-03-04 18:51:02 +080041}
42
Christian König50838c82016-02-03 13:44:52 +010043int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
Monk Liuc5637832016-04-19 20:11:32 +080044 struct amdgpu_job **job, struct amdgpu_vm *vm)
Christian König50838c82016-02-03 13:44:52 +010045{
46 size_t size = sizeof(struct amdgpu_job);
47
48 if (num_ibs == 0)
49 return -EINVAL;
50
51 size += sizeof(struct amdgpu_ib) * num_ibs;
52
53 *job = kzalloc(size, GFP_KERNEL);
54 if (!*job)
55 return -ENOMEM;
56
Christian Königa1917b72018-07-13 17:15:54 +020057 /*
58 * Initialize the scheduler to at least some ring so that we always
59 * have a pointer to adev.
60 */
61 (*job)->base.sched = &adev->rings[0]->sched;
Monk Liuc5637832016-04-19 20:11:32 +080062 (*job)->vm = vm;
Christian König50838c82016-02-03 13:44:52 +010063 (*job)->ibs = (void *)&(*job)[1];
64 (*job)->num_ibs = num_ibs;
Christian König50838c82016-02-03 13:44:52 +010065
Christian Könige86f9ce2016-02-08 12:13:05 +010066 amdgpu_sync_create(&(*job)->sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +080067 amdgpu_sync_create(&(*job)->sched_sync);
Monk Liuc70b78a2017-10-16 20:02:08 +080068 (*job)->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
Christian Könige86f9ce2016-02-08 12:13:05 +010069
Christian König50838c82016-02-03 13:44:52 +010070 return 0;
71}
72
Christian Königd71518b2016-02-01 12:20:25 +010073int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
74 struct amdgpu_job **job)
75{
76 int r;
77
Monk Liuc5637832016-04-19 20:11:32 +080078 r = amdgpu_job_alloc(adev, 1, job, NULL);
Christian Königd71518b2016-02-01 12:20:25 +010079 if (r)
80 return r;
81
82 r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]);
83 if (r)
84 kfree(*job);
Christian Königdf264f92017-06-28 15:41:17 +020085 else
86 (*job)->vm_pd_addr = adev->gart.table_addr;
Christian Königd71518b2016-02-01 12:20:25 +010087
88 return r;
89}
90
Christian Königa5fb4ec2016-06-29 15:10:31 +020091void amdgpu_job_free_resources(struct amdgpu_job *job)
Christian König50838c82016-02-03 13:44:52 +010092{
Christian Königa1917b72018-07-13 17:15:54 +020093 struct amdgpu_ring *ring = to_amdgpu_ring(job->base.sched);
Chris Wilsonf54d1862016-10-25 13:00:45 +010094 struct dma_fence *f;
Christian König1ab0d212016-05-18 13:09:47 +020095 unsigned i;
96
Monk Liu676d8c22016-03-17 13:57:09 +080097 /* use sched fence if available */
Christian König6fc13672016-05-20 12:53:52 +020098 f = job->base.s_fence ? &job->base.s_fence->finished : job->fence;
Christian König50838c82016-02-03 13:44:52 +010099
100 for (i = 0; i < job->num_ibs; ++i)
Christian Königa1917b72018-07-13 17:15:54 +0200101 amdgpu_ib_free(ring->adev, &job->ibs[i], f);
Christian Königd71518b2016-02-01 12:20:25 +0100102}
103
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100104static void amdgpu_job_free_cb(struct drm_sched_job *s_job)
Monk Liub6723c82016-03-10 12:14:44 +0800105{
Christian König3320b8d2018-07-13 15:08:44 +0200106 struct amdgpu_ring *ring = to_amdgpu_ring(s_job->sched);
107 struct amdgpu_job *job = to_amdgpu_job(s_job);
Christian Königc5f74f72016-05-19 09:54:15 +0200108
Christian König3320b8d2018-07-13 15:08:44 +0200109 amdgpu_ring_priority_put(ring, s_job->s_priority);
Chris Wilsonf54d1862016-10-25 13:00:45 +0100110 dma_fence_put(job->fence);
Christian Königa79a5bd2016-06-29 13:29:57 +0200111 amdgpu_sync_free(&job->sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800112 amdgpu_sync_free(&job->sched_sync);
Monk Liub6723c82016-03-10 12:14:44 +0800113 kfree(job);
114}
115
Christian König1e24e312016-05-18 13:12:12 +0200116void amdgpu_job_free(struct amdgpu_job *job)
117{
118 amdgpu_job_free_resources(job);
Christian Königa79a5bd2016-06-29 13:29:57 +0200119
Chris Wilsonf54d1862016-10-25 13:00:45 +0100120 dma_fence_put(job->fence);
Christian Königa79a5bd2016-06-29 13:29:57 +0200121 amdgpu_sync_free(&job->sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800122 amdgpu_sync_free(&job->sched_sync);
Christian König1e24e312016-05-18 13:12:12 +0200123 kfree(job);
124}
125
Christian König0e28b102018-07-13 13:54:56 +0200126int amdgpu_job_submit(struct amdgpu_job *job, struct drm_sched_entity *entity,
127 void *owner, struct dma_fence **f)
Christian Königd71518b2016-02-01 12:20:25 +0100128{
Christian Königb5286802018-07-16 14:58:48 +0200129 enum drm_sched_priority priority;
130 struct amdgpu_ring *ring;
Monk Liue6869412016-03-07 12:49:55 +0800131 int r;
Christian Königd71518b2016-02-01 12:20:25 +0100132
Monk Liue6869412016-03-07 12:49:55 +0800133 if (!f)
134 return -EINVAL;
135
Nayan Deshmukhcdc50172018-07-20 17:51:05 +0530136 r = drm_sched_job_init(&job->base, entity, owner);
Monk Liue6869412016-03-07 12:49:55 +0800137 if (r)
138 return r;
Christian Königd71518b2016-02-01 12:20:25 +0100139
140 job->owner = owner;
Chris Wilsonf54d1862016-10-25 13:00:45 +0100141 *f = dma_fence_get(&job->base.s_fence->finished);
Christian Königa5fb4ec2016-06-29 15:10:31 +0200142 amdgpu_job_free_resources(job);
Christian Königb5286802018-07-16 14:58:48 +0200143 priority = job->base.s_priority;
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100144 drm_sched_entity_push_job(&job->base, entity);
Christian Königd71518b2016-02-01 12:20:25 +0100145
Nayan Deshmukh068c3302018-07-20 17:51:06 +0530146 ring = to_amdgpu_ring(entity->rq->sched);
Christian Königb5286802018-07-16 14:58:48 +0200147 amdgpu_ring_priority_get(ring, priority);
148
Christian Königd71518b2016-02-01 12:20:25 +0100149 return 0;
Christian König50838c82016-02-03 13:44:52 +0100150}
151
Christian Königee913fd2018-07-13 16:29:10 +0200152int amdgpu_job_submit_direct(struct amdgpu_job *job, struct amdgpu_ring *ring,
153 struct dma_fence **fence)
154{
155 int r;
156
157 job->base.sched = &ring->sched;
158 r = amdgpu_ib_schedule(ring, job->num_ibs, job->ibs, NULL, fence);
159 job->fence = dma_fence_get(*fence);
160 if (r)
161 return r;
162
163 amdgpu_job_free(job);
164 return 0;
165}
166
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100167static struct dma_fence *amdgpu_job_dependency(struct drm_sched_job *sched_job,
168 struct drm_sched_entity *s_entity)
Christian Könige61235d2015-08-25 11:05:36 +0200169{
Nayan Deshmukh068c3302018-07-20 17:51:06 +0530170 struct amdgpu_ring *ring = to_amdgpu_ring(s_entity->rq->sched);
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800171 struct amdgpu_job *job = to_amdgpu_job(sched_job);
Monk Liuc5637832016-04-19 20:11:32 +0800172 struct amdgpu_vm *vm = job->vm;
Christian Königf024e882018-07-13 14:01:08 +0200173 struct dma_fence *fence;
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500174 bool explicit = false;
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800175 int r;
Christian König8d0a7ce2015-11-03 20:58:50 +0100176
Christian Königf024e882018-07-13 14:01:08 +0200177 fence = amdgpu_sync_get_fence(&job->sync, &explicit);
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500178 if (fence && explicit) {
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100179 if (drm_sched_dependency_optimized(fence, s_entity)) {
Christian Königa1917b72018-07-13 17:15:54 +0200180 r = amdgpu_sync_fence(ring->adev, &job->sched_sync,
181 fence, false);
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500182 if (r)
Christian Königf024e882018-07-13 14:01:08 +0200183 DRM_ERROR("Error adding fence (%d)\n", r);
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500184 }
Chunming Zhoua340c7b2017-05-18 15:19:03 +0800185 }
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500186
Christian Königc4f46f22017-12-18 17:08:25 +0100187 while (fence == NULL && vm && !job->vmid) {
Christian König620f7742017-12-18 16:53:03 +0100188 r = amdgpu_vmid_grab(vm, ring, &job->sync,
189 &job->base.s_fence->finished,
190 job);
Christian König94dd0a42016-01-18 17:01:42 +0100191 if (r)
Christian König8d0a7ce2015-11-03 20:58:50 +0100192 DRM_ERROR("Error getting VM ID (%d)\n", r);
Christian König8d0a7ce2015-11-03 20:58:50 +0100193
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500194 fence = amdgpu_sync_get_fence(&job->sync, NULL);
Christian König8d0a7ce2015-11-03 20:58:50 +0100195 }
196
197 return fence;
Christian Könige61235d2015-08-25 11:05:36 +0200198}
199
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100200static struct dma_fence *amdgpu_job_run(struct drm_sched_job *sched_job)
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800201{
Christian König3320b8d2018-07-13 15:08:44 +0200202 struct amdgpu_ring *ring = to_amdgpu_ring(sched_job->sched);
Monk Liu48f05f22017-10-25 16:21:08 +0800203 struct dma_fence *fence = NULL, *finished;
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800204 struct amdgpu_job *job;
Christian Königbd755d02015-08-24 14:57:26 +0200205 int r;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800206
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800207 job = to_amdgpu_job(sched_job);
Monk Liu48f05f22017-10-25 16:21:08 +0800208 finished = &job->base.s_fence->finished;
Christian Könige86f9ce2016-02-08 12:13:05 +0100209
Christian König1fbb2e92016-06-01 10:47:36 +0200210 BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL));
Christian Könige86f9ce2016-02-08 12:13:05 +0100211
Chunming Zhou7034dec2015-11-11 14:56:00 +0800212 trace_amdgpu_sched_run_job(job);
Monk Liu48f05f22017-10-25 16:21:08 +0800213
Christian Königa1917b72018-07-13 17:15:54 +0200214 if (job->vram_lost_counter != atomic_read(&ring->adev->vram_lost_counter))
Monk Liu48f05f22017-10-25 16:21:08 +0800215 dma_fence_set_error(finished, -ECANCELED);/* skip IB as well if VRAM lost */
216
217 if (finished->error < 0) {
218 DRM_INFO("Skip scheduling IBs!\n");
Christian König14e47f92017-10-09 15:04:41 +0200219 } else {
Christian König3320b8d2018-07-13 15:08:44 +0200220 r = amdgpu_ib_schedule(ring, job->num_ibs, job->ibs, job,
Christian König14e47f92017-10-09 15:04:41 +0200221 &fence);
Chunming Zhou15d73ce2017-05-16 14:34:27 +0800222 if (r)
223 DRM_ERROR("Error scheduling IBs (%d)\n", r);
224 }
Chunming Zhouc7c5fbc2016-06-30 17:30:42 +0800225 /* if gpu reset, hw fence will be replaced here */
Chris Wilsonf54d1862016-10-25 13:00:45 +0100226 dma_fence_put(job->fence);
227 job->fence = dma_fence_get(fence);
Andres Rodriguezb2ff0e82017-02-20 17:53:19 -0500228
Christian König22a77cf2016-07-05 14:48:17 +0200229 amdgpu_job_free_resources(job);
Christian Königec72b802016-02-01 11:56:35 +0100230 return fence;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800231}
232
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100233const struct drm_sched_backend_ops amdgpu_sched_ops = {
Christian König0856cab2016-02-01 12:31:01 +0100234 .dependency = amdgpu_job_dependency,
235 .run_job = amdgpu_job_run,
Christian König0e51a772016-05-18 14:19:32 +0200236 .timedout_job = amdgpu_job_timedout,
Christian Königc5f74f72016-05-19 09:54:15 +0200237 .free_job = amdgpu_job_free_cb
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800238};