/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 *
 */
24#include <linux/kthread.h>
25#include <linux/wait.h>
26#include <linux/sched.h>
27#include <drm/drmP.h>
28#include "amdgpu.h"
Chunming Zhou7034dec2015-11-11 14:56:00 +080029#include "amdgpu_trace.h"
Chunming Zhouc1b69ed2015-07-21 13:45:14 +080030
Christian König0e51a772016-05-18 14:19:32 +020031static void amdgpu_job_timedout(struct amd_sched_job *s_job)
Monk Liu0de24792016-03-04 18:51:02 +080032{
Christian König0e51a772016-05-18 14:19:32 +020033 struct amdgpu_job *job = container_of(s_job, struct amdgpu_job, base);
34
Monk Liu0de24792016-03-04 18:51:02 +080035 DRM_ERROR("ring %s timeout, last signaled seq=%u, last emitted seq=%u\n",
Christian König0e51a772016-05-18 14:19:32 +020036 job->base.sched->name,
37 atomic_read(&job->ring->fence_drv.last_seq),
38 job->ring->fence_drv.sync_seq);
Monk Liu4fbf87e22017-05-05 15:09:42 +080039
40 if (amdgpu_sriov_vf(job->adev))
Monk Liu7225f872017-04-26 14:51:54 +080041 amdgpu_sriov_gpu_reset(job->adev, job);
Monk Liu4fbf87e22017-05-05 15:09:42 +080042 else
43 amdgpu_gpu_reset(job->adev);
Monk Liu0de24792016-03-04 18:51:02 +080044}
45
Christian König50838c82016-02-03 13:44:52 +010046int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
Monk Liuc5637832016-04-19 20:11:32 +080047 struct amdgpu_job **job, struct amdgpu_vm *vm)
Christian König50838c82016-02-03 13:44:52 +010048{
49 size_t size = sizeof(struct amdgpu_job);
50
51 if (num_ibs == 0)
52 return -EINVAL;
53
54 size += sizeof(struct amdgpu_ib) * num_ibs;
55
56 *job = kzalloc(size, GFP_KERNEL);
57 if (!*job)
58 return -ENOMEM;
59
60 (*job)->adev = adev;
Monk Liuc5637832016-04-19 20:11:32 +080061 (*job)->vm = vm;
Christian König50838c82016-02-03 13:44:52 +010062 (*job)->ibs = (void *)&(*job)[1];
63 (*job)->num_ibs = num_ibs;
Christian König14e47f92017-10-09 15:04:41 +020064 (*job)->vram_lost_counter = atomic_read(&adev->vram_lost_counter);
Christian König50838c82016-02-03 13:44:52 +010065
Christian Könige86f9ce2016-02-08 12:13:05 +010066 amdgpu_sync_create(&(*job)->sync);
Chunming Zhoua340c7b2017-05-18 15:19:03 +080067 amdgpu_sync_create(&(*job)->dep_sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +080068 amdgpu_sync_create(&(*job)->sched_sync);
Christian Könige86f9ce2016-02-08 12:13:05 +010069
Christian König50838c82016-02-03 13:44:52 +010070 return 0;
71}
72
Christian Königd71518b2016-02-01 12:20:25 +010073int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
74 struct amdgpu_job **job)
75{
76 int r;
77
Monk Liuc5637832016-04-19 20:11:32 +080078 r = amdgpu_job_alloc(adev, 1, job, NULL);
Christian Königd71518b2016-02-01 12:20:25 +010079 if (r)
80 return r;
81
82 r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]);
83 if (r)
84 kfree(*job);
Christian Königdf264f92017-06-28 15:41:17 +020085 else
86 (*job)->vm_pd_addr = adev->gart.table_addr;
Christian Königd71518b2016-02-01 12:20:25 +010087
88 return r;
89}
90
Christian Königa5fb4ec2016-06-29 15:10:31 +020091void amdgpu_job_free_resources(struct amdgpu_job *job)
Christian König50838c82016-02-03 13:44:52 +010092{
Chris Wilsonf54d1862016-10-25 13:00:45 +010093 struct dma_fence *f;
Christian König1ab0d212016-05-18 13:09:47 +020094 unsigned i;
95
Monk Liu676d8c22016-03-17 13:57:09 +080096 /* use sched fence if available */
Christian König6fc13672016-05-20 12:53:52 +020097 f = job->base.s_fence ? &job->base.s_fence->finished : job->fence;
Christian König50838c82016-02-03 13:44:52 +010098
99 for (i = 0; i < job->num_ibs; ++i)
Christian König1ab0d212016-05-18 13:09:47 +0200100 amdgpu_ib_free(job->adev, &job->ibs[i], f);
Christian Königd71518b2016-02-01 12:20:25 +0100101}
102
Baoyou Xie761c2e82016-09-03 13:57:14 +0800103static void amdgpu_job_free_cb(struct amd_sched_job *s_job)
Monk Liub6723c82016-03-10 12:14:44 +0800104{
Christian Königc5f74f72016-05-19 09:54:15 +0200105 struct amdgpu_job *job = container_of(s_job, struct amdgpu_job, base);
106
Andres Rodriguezb2ff0e82017-02-20 17:53:19 -0500107 amdgpu_ring_priority_put(job->ring, amd_sched_get_job_priority(s_job));
Chris Wilsonf54d1862016-10-25 13:00:45 +0100108 dma_fence_put(job->fence);
Christian Königa79a5bd2016-06-29 13:29:57 +0200109 amdgpu_sync_free(&job->sync);
Chunming Zhoua340c7b2017-05-18 15:19:03 +0800110 amdgpu_sync_free(&job->dep_sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800111 amdgpu_sync_free(&job->sched_sync);
Monk Liub6723c82016-03-10 12:14:44 +0800112 kfree(job);
113}
114
Christian König1e24e312016-05-18 13:12:12 +0200115void amdgpu_job_free(struct amdgpu_job *job)
116{
117 amdgpu_job_free_resources(job);
Christian Königa79a5bd2016-06-29 13:29:57 +0200118
Chris Wilsonf54d1862016-10-25 13:00:45 +0100119 dma_fence_put(job->fence);
Christian Königa79a5bd2016-06-29 13:29:57 +0200120 amdgpu_sync_free(&job->sync);
Chunming Zhoua340c7b2017-05-18 15:19:03 +0800121 amdgpu_sync_free(&job->dep_sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800122 amdgpu_sync_free(&job->sched_sync);
Christian König1e24e312016-05-18 13:12:12 +0200123 kfree(job);
124}
125
Christian Königd71518b2016-02-01 12:20:25 +0100126int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring,
Christian König2bd9ccf2016-02-01 12:53:58 +0100127 struct amd_sched_entity *entity, void *owner,
Chris Wilsonf54d1862016-10-25 13:00:45 +0100128 struct dma_fence **f)
Christian Königd71518b2016-02-01 12:20:25 +0100129{
Monk Liue6869412016-03-07 12:49:55 +0800130 int r;
Christian Königd71518b2016-02-01 12:20:25 +0100131 job->ring = ring;
Christian Königd71518b2016-02-01 12:20:25 +0100132
Monk Liue6869412016-03-07 12:49:55 +0800133 if (!f)
134 return -EINVAL;
135
Christian König595a9cd2016-06-30 10:52:03 +0200136 r = amd_sched_job_init(&job->base, &ring->sched, entity, owner);
Monk Liue6869412016-03-07 12:49:55 +0800137 if (r)
138 return r;
Christian Königd71518b2016-02-01 12:20:25 +0100139
140 job->owner = owner;
Monk Liu3aecd242016-08-25 15:40:48 +0800141 job->fence_ctx = entity->fence_context;
Chris Wilsonf54d1862016-10-25 13:00:45 +0100142 *f = dma_fence_get(&job->base.s_fence->finished);
Christian Königa5fb4ec2016-06-29 15:10:31 +0200143 amdgpu_job_free_resources(job);
Andres Rodriguezb2ff0e82017-02-20 17:53:19 -0500144 amdgpu_ring_priority_get(job->ring,
145 amd_sched_get_job_priority(&job->base));
Christian Königd71518b2016-02-01 12:20:25 +0100146 amd_sched_entity_push_job(&job->base);
147
148 return 0;
Christian König50838c82016-02-03 13:44:52 +0100149}
150
Chris Wilsonf54d1862016-10-25 13:00:45 +0100151static struct dma_fence *amdgpu_job_dependency(struct amd_sched_job *sched_job)
Christian Könige61235d2015-08-25 11:05:36 +0200152{
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800153 struct amdgpu_job *job = to_amdgpu_job(sched_job);
Monk Liuc5637832016-04-19 20:11:32 +0800154 struct amdgpu_vm *vm = job->vm;
Christian König8d0a7ce2015-11-03 20:58:50 +0100155
Chunming Zhoua340c7b2017-05-18 15:19:03 +0800156 struct dma_fence *fence = amdgpu_sync_get_fence(&job->dep_sync);
Chunming Zhoudf83d1e2017-05-09 15:50:22 +0800157 int r;
Christian König8d0a7ce2015-11-03 20:58:50 +0100158
Chunming Zhoua340c7b2017-05-18 15:19:03 +0800159 if (amd_sched_dependency_optimized(fence, sched_job->s_entity)) {
160 r = amdgpu_sync_fence(job->adev, &job->sched_sync, fence);
161 if (r)
162 DRM_ERROR("Error adding fence to sync (%d)\n", r);
163 }
164 if (!fence)
165 fence = amdgpu_sync_get_fence(&job->sync);
Chunming Zhou6c98d312017-04-21 17:58:42 +0800166 while (fence == NULL && vm && !job->vm_id) {
Christian Königb07c60c2016-01-31 12:29:04 +0100167 struct amdgpu_ring *ring = job->ring;
Christian König8d0a7ce2015-11-03 20:58:50 +0100168
Christian Könige86f9ce2016-02-08 12:13:05 +0100169 r = amdgpu_vm_grab_id(vm, ring, &job->sync,
Christian König6fc13672016-05-20 12:53:52 +0200170 &job->base.s_fence->finished,
Chunming Zhoufd53be32016-07-01 17:59:01 +0800171 job);
Christian König94dd0a42016-01-18 17:01:42 +0100172 if (r)
Christian König8d0a7ce2015-11-03 20:58:50 +0100173 DRM_ERROR("Error getting VM ID (%d)\n", r);
Christian König8d0a7ce2015-11-03 20:58:50 +0100174
Christian Könige86f9ce2016-02-08 12:13:05 +0100175 fence = amdgpu_sync_get_fence(&job->sync);
Christian König8d0a7ce2015-11-03 20:58:50 +0100176 }
177
178 return fence;
Christian Könige61235d2015-08-25 11:05:36 +0200179}
180
Chris Wilsonf54d1862016-10-25 13:00:45 +0100181static struct dma_fence *amdgpu_job_run(struct amd_sched_job *sched_job)
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800182{
Chris Wilsonf54d1862016-10-25 13:00:45 +0100183 struct dma_fence *fence = NULL;
Christian König14e47f92017-10-09 15:04:41 +0200184 struct amdgpu_device *adev;
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800185 struct amdgpu_job *job;
Christian Königbd755d02015-08-24 14:57:26 +0200186 int r;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800187
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800188 if (!sched_job) {
Chunming Zhou4cef9262015-08-05 19:52:14 +0800189 DRM_ERROR("job is null\n");
Christian König6f0e54a2015-08-05 21:22:10 +0200190 return NULL;
Chunming Zhou4cef9262015-08-05 19:52:14 +0800191 }
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800192 job = to_amdgpu_job(sched_job);
Christian König14e47f92017-10-09 15:04:41 +0200193 adev = job->adev;
Christian Könige86f9ce2016-02-08 12:13:05 +0100194
Christian König1fbb2e92016-06-01 10:47:36 +0200195 BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL));
Christian Könige86f9ce2016-02-08 12:13:05 +0100196
Chunming Zhou7034dec2015-11-11 14:56:00 +0800197 trace_amdgpu_sched_run_job(job);
Chunming Zhou15d73ce2017-05-16 14:34:27 +0800198 /* skip ib schedule when vram is lost */
Christian König14e47f92017-10-09 15:04:41 +0200199 if (job->vram_lost_counter != atomic_read(&adev->vram_lost_counter)) {
Chunming Zhou15d73ce2017-05-16 14:34:27 +0800200 DRM_ERROR("Skip scheduling IBs!\n");
Christian König14e47f92017-10-09 15:04:41 +0200201 } else {
202 r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs, job,
203 &fence);
Chunming Zhou15d73ce2017-05-16 14:34:27 +0800204 if (r)
205 DRM_ERROR("Error scheduling IBs (%d)\n", r);
206 }
Chunming Zhouc7c5fbc2016-06-30 17:30:42 +0800207 /* if gpu reset, hw fence will be replaced here */
Chris Wilsonf54d1862016-10-25 13:00:45 +0100208 dma_fence_put(job->fence);
209 job->fence = dma_fence_get(fence);
Andres Rodriguezb2ff0e82017-02-20 17:53:19 -0500210
Christian König22a77cf2016-07-05 14:48:17 +0200211 amdgpu_job_free_resources(job);
Christian Königec72b802016-02-01 11:56:35 +0100212 return fence;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800213}
214
Nils Wallménius62250a92016-04-10 16:30:00 +0200215const struct amd_sched_backend_ops amdgpu_sched_ops = {
Christian König0856cab2016-02-01 12:31:01 +0100216 .dependency = amdgpu_job_dependency,
217 .run_job = amdgpu_job_run,
Christian König0e51a772016-05-18 14:19:32 +0200218 .timedout_job = amdgpu_job_timedout,
Christian Königc5f74f72016-05-19 09:54:15 +0200219 .free_job = amdgpu_job_free_cb
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800220};