blob: 917c6f3bfa0949a648fa870ce9295ddf71be3f38 [file] [log] [blame]
/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 *
 */
#include <linux/kernel.h>
#include <linux/kthread.h>
#include <linux/wait.h>
#include <linux/sched.h>
#include <drm/drmP.h>
#include "amdgpu.h"
#include "amdgpu_trace.h"
Chunming Zhouc1b69ed2015-07-21 13:45:14 +080030
Monk Liue472d252016-03-03 19:00:50 +080031static void amdgpu_job_free_handler(struct work_struct *ws)
32{
33 struct amdgpu_job *job = container_of(ws, struct amdgpu_job, base.work_free_job);
Monk Liub6723c82016-03-10 12:14:44 +080034 amd_sched_job_put(&job->base);
Monk Liue472d252016-03-03 19:00:50 +080035}
36
Monk Liu0de24792016-03-04 18:51:02 +080037void amdgpu_job_timeout_func(struct work_struct *work)
38{
39 struct amdgpu_job *job = container_of(work, struct amdgpu_job, base.work_tdr.work);
40 DRM_ERROR("ring %s timeout, last signaled seq=%u, last emitted seq=%u\n",
41 job->base.sched->name,
42 (uint32_t)atomic_read(&job->ring->fence_drv.last_seq),
43 job->ring->fence_drv.sync_seq);
Monk Liub6723c82016-03-10 12:14:44 +080044
45 amd_sched_job_put(&job->base);
Monk Liu0de24792016-03-04 18:51:02 +080046}
47
Christian König50838c82016-02-03 13:44:52 +010048int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs,
Monk Liuc5637832016-04-19 20:11:32 +080049 struct amdgpu_job **job, struct amdgpu_vm *vm)
Christian König50838c82016-02-03 13:44:52 +010050{
51 size_t size = sizeof(struct amdgpu_job);
52
53 if (num_ibs == 0)
54 return -EINVAL;
55
56 size += sizeof(struct amdgpu_ib) * num_ibs;
57
58 *job = kzalloc(size, GFP_KERNEL);
59 if (!*job)
60 return -ENOMEM;
61
62 (*job)->adev = adev;
Monk Liuc5637832016-04-19 20:11:32 +080063 (*job)->vm = vm;
Christian König50838c82016-02-03 13:44:52 +010064 (*job)->ibs = (void *)&(*job)[1];
65 (*job)->num_ibs = num_ibs;
Monk Liue472d252016-03-03 19:00:50 +080066 INIT_WORK(&(*job)->base.work_free_job, amdgpu_job_free_handler);
Christian König50838c82016-02-03 13:44:52 +010067
Christian Könige86f9ce2016-02-08 12:13:05 +010068 amdgpu_sync_create(&(*job)->sync);
69
Christian König50838c82016-02-03 13:44:52 +010070 return 0;
71}
72
Christian Königd71518b2016-02-01 12:20:25 +010073int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size,
74 struct amdgpu_job **job)
75{
76 int r;
77
Monk Liuc5637832016-04-19 20:11:32 +080078 r = amdgpu_job_alloc(adev, 1, job, NULL);
Christian Königd71518b2016-02-01 12:20:25 +010079 if (r)
80 return r;
81
82 r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]);
83 if (r)
84 kfree(*job);
85
86 return r;
87}
88
Christian König50838c82016-02-03 13:44:52 +010089void amdgpu_job_free(struct amdgpu_job *job)
90{
91 unsigned i;
Monk Liu676d8c22016-03-17 13:57:09 +080092 struct fence *f;
93 /* use sched fence if available */
94 f = (job->base.s_fence)? &job->base.s_fence->base : job->fence;
Christian König50838c82016-02-03 13:44:52 +010095
96 for (i = 0; i < job->num_ibs; ++i)
Monk Liu676d8c22016-03-17 13:57:09 +080097 amdgpu_sa_bo_free(job->adev, &job->ibs[i].sa_bo, f);
Monk Liu73cfa5f2016-03-17 13:48:13 +080098 fence_put(job->fence);
Christian König50838c82016-02-03 13:44:52 +010099
100 amdgpu_bo_unref(&job->uf.bo);
Christian Könige86f9ce2016-02-08 12:13:05 +0100101 amdgpu_sync_free(&job->sync);
Monk Liue472d252016-03-03 19:00:50 +0800102
103 if (!job->base.use_sched)
104 kfree(job);
Christian Königd71518b2016-02-01 12:20:25 +0100105}
106
Monk Liub6723c82016-03-10 12:14:44 +0800107void amdgpu_job_free_func(struct kref *refcount)
108{
109 struct amdgpu_job *job = container_of(refcount, struct amdgpu_job, base.refcount);
110 kfree(job);
111}
112
Christian Königd71518b2016-02-01 12:20:25 +0100113int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring,
Christian König2bd9ccf2016-02-01 12:53:58 +0100114 struct amd_sched_entity *entity, void *owner,
115 struct fence **f)
Christian Königd71518b2016-02-01 12:20:25 +0100116{
Monk Liue6869412016-03-07 12:49:55 +0800117 struct fence *fence;
118 int r;
Christian Königd71518b2016-02-01 12:20:25 +0100119 job->ring = ring;
Christian Königd71518b2016-02-01 12:20:25 +0100120
Monk Liue6869412016-03-07 12:49:55 +0800121 if (!f)
122 return -EINVAL;
123
Monk Liu0de24792016-03-04 18:51:02 +0800124 r = amd_sched_job_init(&job->base, &ring->sched,
Monk Liub6723c82016-03-10 12:14:44 +0800125 entity,
Monk Liu0de24792016-03-04 18:51:02 +0800126 amdgpu_job_timeout_func,
Monk Liub6723c82016-03-10 12:14:44 +0800127 amdgpu_job_free_func,
128 owner, &fence);
Monk Liue6869412016-03-07 12:49:55 +0800129 if (r)
130 return r;
Christian Königd71518b2016-02-01 12:20:25 +0100131
132 job->owner = owner;
Monk Liue6869412016-03-07 12:49:55 +0800133 *f = fence_get(fence);
Christian Königd71518b2016-02-01 12:20:25 +0100134 amd_sched_entity_push_job(&job->base);
135
136 return 0;
Christian König50838c82016-02-03 13:44:52 +0100137}
138
Christian König0856cab2016-02-01 12:31:01 +0100139static struct fence *amdgpu_job_dependency(struct amd_sched_job *sched_job)
Christian Könige61235d2015-08-25 11:05:36 +0200140{
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800141 struct amdgpu_job *job = to_amdgpu_job(sched_job);
Monk Liuc5637832016-04-19 20:11:32 +0800142 struct amdgpu_vm *vm = job->vm;
Christian König8d0a7ce2015-11-03 20:58:50 +0100143
Christian Könige86f9ce2016-02-08 12:13:05 +0100144 struct fence *fence = amdgpu_sync_get_fence(&job->sync);
Christian König8d0a7ce2015-11-03 20:58:50 +0100145
Christian König4ff37a82016-02-26 16:18:26 +0100146 if (fence == NULL && vm && !job->ibs->vm_id) {
Christian Königb07c60c2016-01-31 12:29:04 +0100147 struct amdgpu_ring *ring = job->ring;
Christian König4ff37a82016-02-26 16:18:26 +0100148 unsigned i, vm_id;
149 uint64_t vm_pd_addr;
Christian König8d0a7ce2015-11-03 20:58:50 +0100150 int r;
151
Christian Könige86f9ce2016-02-08 12:13:05 +0100152 r = amdgpu_vm_grab_id(vm, ring, &job->sync,
Christian König4ff37a82016-02-26 16:18:26 +0100153 &job->base.s_fence->base,
154 &vm_id, &vm_pd_addr);
Christian König94dd0a42016-01-18 17:01:42 +0100155 if (r)
Christian König8d0a7ce2015-11-03 20:58:50 +0100156 DRM_ERROR("Error getting VM ID (%d)\n", r);
Christian König4ff37a82016-02-26 16:18:26 +0100157 else {
158 for (i = 0; i < job->num_ibs; ++i) {
159 job->ibs[i].vm_id = vm_id;
160 job->ibs[i].vm_pd_addr = vm_pd_addr;
161 }
162 }
Christian König8d0a7ce2015-11-03 20:58:50 +0100163
Christian Könige86f9ce2016-02-08 12:13:05 +0100164 fence = amdgpu_sync_get_fence(&job->sync);
Christian König8d0a7ce2015-11-03 20:58:50 +0100165 }
166
167 return fence;
Christian Könige61235d2015-08-25 11:05:36 +0200168}
169
Christian König0856cab2016-02-01 12:31:01 +0100170static struct fence *amdgpu_job_run(struct amd_sched_job *sched_job)
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800171{
Christian Königec72b802016-02-01 11:56:35 +0100172 struct fence *fence = NULL;
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800173 struct amdgpu_job *job;
Christian Königbd755d02015-08-24 14:57:26 +0200174 int r;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800175
Junwei Zhang4c7eb912015-09-09 09:05:55 +0800176 if (!sched_job) {
Chunming Zhou4cef9262015-08-05 19:52:14 +0800177 DRM_ERROR("job is null\n");
Christian König6f0e54a2015-08-05 21:22:10 +0200178 return NULL;
Chunming Zhou4cef9262015-08-05 19:52:14 +0800179 }
Junwei Zhanga6db8a32015-09-09 09:21:19 +0800180 job = to_amdgpu_job(sched_job);
Christian Könige86f9ce2016-02-08 12:13:05 +0100181
182 r = amdgpu_sync_wait(&job->sync);
183 if (r) {
184 DRM_ERROR("failed to sync wait (%d)\n", r);
185 return NULL;
186 }
187
Chunming Zhou7034dec2015-11-11 14:56:00 +0800188 trace_amdgpu_sched_run_job(job);
Christian König336d1f52016-02-16 10:57:10 +0100189 r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs,
Monk Liuc5637832016-04-19 20:11:32 +0800190 job->sync.last_vm_update, job, &fence);
Christian König1886d1a2015-08-31 17:28:28 +0200191 if (r) {
192 DRM_ERROR("Error scheduling IBs (%d)\n", r);
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800193 goto err;
Christian König1886d1a2015-08-31 17:28:28 +0200194 }
195
Christian König1886d1a2015-08-31 17:28:28 +0200196err:
Monk Liu73cfa5f2016-03-17 13:48:13 +0800197 job->fence = fence;
Christian Königd71518b2016-02-01 12:20:25 +0100198 amdgpu_job_free(job);
Christian Königec72b802016-02-01 11:56:35 +0100199 return fence;
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800200}
201
Nils Wallménius62250a92016-04-10 16:30:00 +0200202const struct amd_sched_backend_ops amdgpu_sched_ops = {
Christian König0856cab2016-02-01 12:31:01 +0100203 .dependency = amdgpu_job_dependency,
204 .run_job = amdgpu_job_run,
Monk Liu0de24792016-03-04 18:51:02 +0800205 .begin_job = amd_sched_job_begin,
206 .finish_job = amd_sched_job_finish,
Chunming Zhouc1b69ed2015-07-21 13:45:14 +0800207};