blob: 9b1c54ace5834772f0b4a0d4887780d899eb96f3 [file] [log] [blame]
Chunming Zhouc1b69ed2015-07-21 13:45:14 +08001/*
2 * Copyright 2015 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 *
23 */
24#include <linux/kthread.h>
25#include <linux/wait.h>
26#include <linux/sched.h>
27#include <drm/drmP.h>
28#include "amdgpu.h"
Chunming Zhou7034dec2015-11-11 14:56:00 +080029#include "amdgpu_trace.h"
Chunming Zhouc1b69ed2015-07-21 13:45:14 +080030
Lucas Stach1b1f42d2017-12-06 17:49:39 +010031static void amdgpu_job_timedout(struct drm_sched_job *s_job)
Monk Liu0de24792016-03-04 18:51:02 +080032{
Christian König3320b8d2018-07-13 15:08:44 +020033 struct amdgpu_ring *ring = to_amdgpu_ring(s_job->sched);
34 struct amdgpu_job *job = to_amdgpu_job(s_job);
Christian König0e51a772016-05-18 14:19:32 +020035
Monk Liu0de24792016-03-04 18:51:02 +080036 DRM_ERROR("ring %s timeout, last signaled seq=%u, last emitted seq=%u\n",
Christian König3320b8d2018-07-13 15:08:44 +020037 job->base.sched->name, atomic_read(&ring->fence_drv.last_seq),
38 ring->fence_drv.sync_seq);
Monk Liu4fbf87e22017-05-05 15:09:42 +080039
Christian Königa1917b72018-07-13 17:15:54 +020040 amdgpu_device_gpu_recover(ring->adev, job, false);
Monk Liu0de24792016-03-04 18:51:02 +080041}
42
Christian König50838c82016-02-03 13:44:52 +010043int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
Monk Liuc5637832016-04-19 20:11:32 +080044 struct amdgpu_job **job, struct amdgpu_vm *vm)
Christian König50838c82016-02-03 13:44:52 +010045{
46 size_t size = sizeof(struct amdgpu_job);
47
48 if (num_ibs == 0)
49 return -EINVAL;
50
51 size += sizeof(struct amdgpu_ib) * num_ibs;
52
53 *job = kzalloc(size, GFP_KERNEL);
54 if (!*job)
55 return -ENOMEM;
56
Christian Königa1917b72018-07-13 17:15:54 +020057 /*
58 * Initialize the scheduler to at least some ring so that we always
59 * have a pointer to adev.
60 */
61 (*job)->base.sched = &adev->rings[0]->sched;
Monk Liuc5637832016-04-19 20:11:32 +080062 (*job)->vm = vm;
Christian König50838c82016-02-03 13:44:52 +010063 (*job)->ibs = (void *)&(*job)[1];
64 (*job)->num_ibs = num_ibs;
Christian König50838c82016-02-03 13:44:52 +010065
Christian Könige86f9ce2016-02-08 12:13:05 +010066 amdgpu_sync_create(&(*job)->sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +080067 amdgpu_sync_create(&(*job)->sched_sync);
Monk Liuc70b78a2017-10-16 20:02:08 +080068 (*job)->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
Christian Könige86f9ce2016-02-08 12:13:05 +010069
Christian König50838c82016-02-03 13:44:52 +010070 return 0;
71}
72
Christian Königd71518b2016-02-01 12:20:25 +010073int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
74 struct amdgpu_job **job)
75{
76 int r;
77
Monk Liuc5637832016-04-19 20:11:32 +080078 r = amdgpu_job_alloc(adev, 1, job, NULL);
Christian Königd71518b2016-02-01 12:20:25 +010079 if (r)
80 return r;
81
82 r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]);
83 if (r)
84 kfree(*job);
Christian Königdf264f92017-06-28 15:41:17 +020085 else
86 (*job)->vm_pd_addr = adev->gart.table_addr;
Christian Königd71518b2016-02-01 12:20:25 +010087
88 return r;
89}
90
Christian Königa5fb4ec2016-06-29 15:10:31 +020091void amdgpu_job_free_resources(struct amdgpu_job *job)
Christian König50838c82016-02-03 13:44:52 +010092{
Christian Königa1917b72018-07-13 17:15:54 +020093 struct amdgpu_ring *ring = to_amdgpu_ring(job->base.sched);
Chris Wilsonf54d1862016-10-25 13:00:45 +010094 struct dma_fence *f;
Christian König1ab0d212016-05-18 13:09:47 +020095 unsigned i;
96
Monk Liu676d8c22016-03-17 13:57:09 +080097 /* use sched fence if available */
Christian König6fc13672016-05-20 12:53:52 +020098 f = job->base.s_fence ? &job->base.s_fence->finished : job->fence;
Christian König50838c82016-02-03 13:44:52 +010099
100 for (i = 0; i < job->num_ibs; ++i)
Christian Königa1917b72018-07-13 17:15:54 +0200101 amdgpu_ib_free(ring->adev, &job->ibs[i], f);
Christian Königd71518b2016-02-01 12:20:25 +0100102}
103
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100104static void amdgpu_job_free_cb(struct drm_sched_job *s_job)
Monk Liub6723c82016-03-10 12:14:44 +0800105{
Christian König3320b8d2018-07-13 15:08:44 +0200106 struct amdgpu_ring *ring = to_amdgpu_ring(s_job->sched);
107 struct amdgpu_job *job = to_amdgpu_job(s_job);
Christian Königc5f74f72016-05-19 09:54:15 +0200108
Christian König3320b8d2018-07-13 15:08:44 +0200109 amdgpu_ring_priority_put(ring, s_job->s_priority);
Chris Wilsonf54d1862016-10-25 13:00:45 +0100110 dma_fence_put(job->fence);
Christian Königa79a5bd2016-06-29 13:29:57 +0200111 amdgpu_sync_free(&job->sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800112 amdgpu_sync_free(&job->sched_sync);
Monk Liub6723c82016-03-10 12:14:44 +0800113 kfree(job);
114}
115
Christian König1e24e312016-05-18 13:12:12 +0200116void amdgpu_job_free(struct amdgpu_job *job)
117{
118 amdgpu_job_free_resources(job);
Christian Königa79a5bd2016-06-29 13:29:57 +0200119
Chris Wilsonf54d1862016-10-25 13:00:45 +0100120 dma_fence_put(job->fence);
Christian Königa79a5bd2016-06-29 13:29:57 +0200121 amdgpu_sync_free(&job->sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800122 amdgpu_sync_free(&job->sched_sync);
Christian König1e24e312016-05-18 13:12:12 +0200123 kfree(job);
124}
125
Christian König0e28b102018-07-13 13:54:56 +0200126int amdgpu_job_submit(struct amdgpu_job *job, struct drm_sched_entity *entity,
127 void *owner, struct dma_fence **f)
Christian Königd71518b2016-02-01 12:20:25 +0100128{
Christian König3320b8d2018-07-13 15:08:44 +0200129 struct amdgpu_ring *ring = to_amdgpu_ring(entity->sched);
Monk Liue6869412016-03-07 12:49:55 +0800130 int r;
Christian Königd71518b2016-02-01 12:20:25 +0100131
Monk Liue6869412016-03-07 12:49:55 +0800132 if (!f)
133 return -EINVAL;
134
Christian König0e28b102018-07-13 13:54:56 +0200135 r = drm_sched_job_init(&job->base, entity->sched, entity, owner);
Monk Liue6869412016-03-07 12:49:55 +0800136 if (r)
137 return r;
Christian Königd71518b2016-02-01 12:20:25 +0100138
139 job->owner = owner;
Chris Wilsonf54d1862016-10-25 13:00:45 +0100140 *f = dma_fence_get(&job->base.s_fence->finished);
Christian Königa5fb4ec2016-06-29 15:10:31 +0200141 amdgpu_job_free_resources(job);
Christian König3320b8d2018-07-13 15:08:44 +0200142 amdgpu_ring_priority_get(ring, job->base.s_priority);
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100143 drm_sched_entity_push_job(&job->base, entity);
Christian Königd71518b2016-02-01 12:20:25 +0100144
145 return 0;
Christian König50838c82016-02-03 13:44:52 +0100146}
147
Christian Königee913fd2018-07-13 16:29:10 +0200148int amdgpu_job_submit_direct(struct amdgpu_job *job, struct amdgpu_ring *ring,
149 struct dma_fence **fence)
150{
151 int r;
152
153 job->base.sched = &ring->sched;
154 r = amdgpu_ib_schedule(ring, job->num_ibs, job->ibs, NULL, fence);
155 job->fence = dma_fence_get(*fence);
156 if (r)
157 return r;
158
159 amdgpu_job_free(job);
160 return 0;
161}
162
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100163static struct dma_fence *amdgpu_job_dependency(struct drm_sched_job *sched_job,
164 struct drm_sched_entity *s_entity)
Christian Könige61235d2015-08-25 11:05:36 +0200165{
Christian König3320b8d2018-07-13 15:08:44 +0200166 struct amdgpu_ring *ring = to_amdgpu_ring(s_entity->sched);
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800167 struct amdgpu_job *job = to_amdgpu_job(sched_job);
Monk Liuc5637832016-04-19 20:11:32 +0800168 struct amdgpu_vm *vm = job->vm;
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500169 bool explicit = false;
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800170 int r;
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500171 struct dma_fence *fence = amdgpu_sync_get_fence(&job->sync, &explicit);
Christian König8d0a7ce2015-11-03 20:58:50 +0100172
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500173 if (fence && explicit) {
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100174 if (drm_sched_dependency_optimized(fence, s_entity)) {
Christian Königa1917b72018-07-13 17:15:54 +0200175 r = amdgpu_sync_fence(ring->adev, &job->sched_sync,
176 fence, false);
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500177 if (r)
178 DRM_ERROR("Error adding fence to sync (%d)\n", r);
179 }
Chunming Zhoua340c7b2017-05-18 15:19:03 +0800180 }
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500181
Christian Königc4f46f22017-12-18 17:08:25 +0100182 while (fence == NULL && vm && !job->vmid) {
Christian König620f7742017-12-18 16:53:03 +0100183 r = amdgpu_vmid_grab(vm, ring, &job->sync,
184 &job->base.s_fence->finished,
185 job);
Christian König94dd0a42016-01-18 17:01:42 +0100186 if (r)
Christian König8d0a7ce2015-11-03 20:58:50 +0100187 DRM_ERROR("Error getting VM ID (%d)\n", r);
Christian König8d0a7ce2015-11-03 20:58:50 +0100188
Andrey Grodzovskycebb52b2017-11-13 14:47:52 -0500189 fence = amdgpu_sync_get_fence(&job->sync, NULL);
Christian König8d0a7ce2015-11-03 20:58:50 +0100190 }
191
192 return fence;
Christian Könige61235d2015-08-25 11:05:36 +0200193}
194
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100195static struct dma_fence *amdgpu_job_run(struct drm_sched_job *sched_job)
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800196{
Christian König3320b8d2018-07-13 15:08:44 +0200197 struct amdgpu_ring *ring = to_amdgpu_ring(sched_job->sched);
Monk Liu48f05f22017-10-25 16:21:08 +0800198 struct dma_fence *fence = NULL, *finished;
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800199 struct amdgpu_job *job;
Christian Königbd755d02015-08-24 14:57:26 +0200200 int r;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800201
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800202 if (!sched_job) {
Chunming Zhou4cef9262015-08-05 19:52:14 +0800203 DRM_ERROR("job is null\n");
Christian König6f0e54a2015-08-05 21:22:10 +0200204 return NULL;
Chunming Zhou4cef9262015-08-05 19:52:14 +0800205 }
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800206 job = to_amdgpu_job(sched_job);
Monk Liu48f05f22017-10-25 16:21:08 +0800207 finished = &job->base.s_fence->finished;
Christian Könige86f9ce2016-02-08 12:13:05 +0100208
Christian König1fbb2e92016-06-01 10:47:36 +0200209 BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL));
Christian Könige86f9ce2016-02-08 12:13:05 +0100210
Chunming Zhou7034dec2015-11-11 14:56:00 +0800211 trace_amdgpu_sched_run_job(job);
Monk Liu48f05f22017-10-25 16:21:08 +0800212
Christian Königa1917b72018-07-13 17:15:54 +0200213 if (job->vram_lost_counter != atomic_read(&ring->adev->vram_lost_counter))
Monk Liu48f05f22017-10-25 16:21:08 +0800214 dma_fence_set_error(finished, -ECANCELED);/* skip IB as well if VRAM lost */
215
216 if (finished->error < 0) {
217 DRM_INFO("Skip scheduling IBs!\n");
Christian König14e47f92017-10-09 15:04:41 +0200218 } else {
Christian König3320b8d2018-07-13 15:08:44 +0200219 r = amdgpu_ib_schedule(ring, job->num_ibs, job->ibs, job,
Christian König14e47f92017-10-09 15:04:41 +0200220 &fence);
Chunming Zhou15d73ce2017-05-16 14:34:27 +0800221 if (r)
222 DRM_ERROR("Error scheduling IBs (%d)\n", r);
223 }
Chunming Zhouc7c5fbc2016-06-30 17:30:42 +0800224 /* if gpu reset, hw fence will be replaced here */
Chris Wilsonf54d1862016-10-25 13:00:45 +0100225 dma_fence_put(job->fence);
226 job->fence = dma_fence_get(fence);
Andres Rodriguezb2ff0e82017-02-20 17:53:19 -0500227
Christian König22a77cf2016-07-05 14:48:17 +0200228 amdgpu_job_free_resources(job);
Christian Königec72b802016-02-01 11:56:35 +0100229 return fence;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800230}
231
Lucas Stach1b1f42d2017-12-06 17:49:39 +0100232const struct drm_sched_backend_ops amdgpu_sched_ops = {
Christian König0856cab2016-02-01 12:31:01 +0100233 .dependency = amdgpu_job_dependency,
234 .run_job = amdgpu_job_run,
Christian König0e51a772016-05-18 14:19:32 +0200235 .timedout_job = amdgpu_job_timedout,
Christian Königc5f74f72016-05-19 09:54:15 +0200236 .free_job = amdgpu_job_free_cb
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800237};