Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright 2015 Advanced Micro Devices, Inc. |
| 3 | * |
| 4 | * Permission is hereby granted, free of charge, to any person obtaining a |
| 5 | * copy of this software and associated documentation files (the "Software"), |
| 6 | * to deal in the Software without restriction, including without limitation |
| 7 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
| 8 | * and/or sell copies of the Software, and to permit persons to whom the |
| 9 | * Software is furnished to do so, subject to the following conditions: |
| 10 | * |
| 11 | * The above copyright notice and this permission notice shall be included in |
| 12 | * all copies or substantial portions of the Software. |
| 13 | * |
| 14 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
| 15 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
| 16 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
| 17 | * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR |
| 18 | * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, |
| 19 | * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR |
| 20 | * OTHER DEALINGS IN THE SOFTWARE. |
| 21 | * |
| 22 | * |
| 23 | */ |
| 24 | #include <linux/kthread.h> |
| 25 | #include <linux/wait.h> |
| 26 | #include <linux/sched.h> |
| 27 | #include <drm/drmP.h> |
| 28 | #include "amdgpu.h" |
Chunming Zhou | 7034dec | 2015-11-11 14:56:00 +0800 | [diff] [blame] | 29 | #include "amdgpu_trace.h" |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 30 | |
Monk Liu | e472d25 | 2016-03-03 19:00:50 +0800 | [diff] [blame] | 31 | static void amdgpu_job_free_handler(struct work_struct *ws) |
| 32 | { |
| 33 | struct amdgpu_job *job = container_of(ws, struct amdgpu_job, base.work_free_job); |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 34 | amd_sched_job_put(&job->base); |
Monk Liu | e472d25 | 2016-03-03 19:00:50 +0800 | [diff] [blame] | 35 | } |
| 36 | |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 37 | void amdgpu_job_timeout_func(struct work_struct *work) |
| 38 | { |
| 39 | struct amdgpu_job *job = container_of(work, struct amdgpu_job, base.work_tdr.work); |
| 40 | DRM_ERROR("ring %s timeout, last signaled seq=%u, last emitted seq=%u\n", |
| 41 | job->base.sched->name, |
| 42 | (uint32_t)atomic_read(&job->ring->fence_drv.last_seq), |
| 43 | job->ring->fence_drv.sync_seq); |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 44 | |
| 45 | amd_sched_job_put(&job->base); |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 46 | } |
| 47 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 48 | int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs, |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame^] | 49 | struct amdgpu_job **job, struct amdgpu_vm *vm) |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 50 | { |
| 51 | size_t size = sizeof(struct amdgpu_job); |
| 52 | |
| 53 | if (num_ibs == 0) |
| 54 | return -EINVAL; |
| 55 | |
| 56 | size += sizeof(struct amdgpu_ib) * num_ibs; |
| 57 | |
| 58 | *job = kzalloc(size, GFP_KERNEL); |
| 59 | if (!*job) |
| 60 | return -ENOMEM; |
| 61 | |
| 62 | (*job)->adev = adev; |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame^] | 63 | (*job)->vm = vm; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 64 | (*job)->ibs = (void *)&(*job)[1]; |
| 65 | (*job)->num_ibs = num_ibs; |
Monk Liu | e472d25 | 2016-03-03 19:00:50 +0800 | [diff] [blame] | 66 | INIT_WORK(&(*job)->base.work_free_job, amdgpu_job_free_handler); |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 67 | |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 68 | amdgpu_sync_create(&(*job)->sync); |
| 69 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 70 | return 0; |
| 71 | } |
| 72 | |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 73 | int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size, |
| 74 | struct amdgpu_job **job) |
| 75 | { |
| 76 | int r; |
| 77 | |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame^] | 78 | r = amdgpu_job_alloc(adev, 1, job, NULL); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 79 | if (r) |
| 80 | return r; |
| 81 | |
| 82 | r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]); |
| 83 | if (r) |
| 84 | kfree(*job); |
| 85 | |
| 86 | return r; |
| 87 | } |
| 88 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 89 | void amdgpu_job_free(struct amdgpu_job *job) |
| 90 | { |
| 91 | unsigned i; |
Monk Liu | 676d8c2 | 2016-03-17 13:57:09 +0800 | [diff] [blame] | 92 | struct fence *f; |
| 93 | /* use sched fence if available */ |
| 94 | f = (job->base.s_fence)? &job->base.s_fence->base : job->fence; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 95 | |
| 96 | for (i = 0; i < job->num_ibs; ++i) |
Monk Liu | 676d8c2 | 2016-03-17 13:57:09 +0800 | [diff] [blame] | 97 | amdgpu_sa_bo_free(job->adev, &job->ibs[i].sa_bo, f); |
Monk Liu | 73cfa5f | 2016-03-17 13:48:13 +0800 | [diff] [blame] | 98 | fence_put(job->fence); |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 99 | |
| 100 | amdgpu_bo_unref(&job->uf.bo); |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 101 | amdgpu_sync_free(&job->sync); |
Monk Liu | e472d25 | 2016-03-03 19:00:50 +0800 | [diff] [blame] | 102 | |
| 103 | if (!job->base.use_sched) |
| 104 | kfree(job); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 105 | } |
| 106 | |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 107 | void amdgpu_job_free_func(struct kref *refcount) |
| 108 | { |
| 109 | struct amdgpu_job *job = container_of(refcount, struct amdgpu_job, base.refcount); |
| 110 | kfree(job); |
| 111 | } |
| 112 | |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 113 | int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring, |
Christian König | 2bd9ccf | 2016-02-01 12:53:58 +0100 | [diff] [blame] | 114 | struct amd_sched_entity *entity, void *owner, |
| 115 | struct fence **f) |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 116 | { |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 117 | struct fence *fence; |
| 118 | int r; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 119 | job->ring = ring; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 120 | |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 121 | if (!f) |
| 122 | return -EINVAL; |
| 123 | |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 124 | r = amd_sched_job_init(&job->base, &ring->sched, |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 125 | entity, |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 126 | amdgpu_job_timeout_func, |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 127 | amdgpu_job_free_func, |
| 128 | owner, &fence); |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 129 | if (r) |
| 130 | return r; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 131 | |
| 132 | job->owner = owner; |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 133 | *f = fence_get(fence); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 134 | amd_sched_entity_push_job(&job->base); |
| 135 | |
| 136 | return 0; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 137 | } |
| 138 | |
Christian König | 0856cab | 2016-02-01 12:31:01 +0100 | [diff] [blame] | 139 | static struct fence *amdgpu_job_dependency(struct amd_sched_job *sched_job) |
Christian König | e61235d | 2015-08-25 11:05:36 +0200 | [diff] [blame] | 140 | { |
Junwei Zhang | a6db8a3 | 2015-09-09 09:21:19 +0800 | [diff] [blame] | 141 | struct amdgpu_job *job = to_amdgpu_job(sched_job); |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame^] | 142 | struct amdgpu_vm *vm = job->vm; |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 143 | |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 144 | struct fence *fence = amdgpu_sync_get_fence(&job->sync); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 145 | |
Christian König | 4ff37a8 | 2016-02-26 16:18:26 +0100 | [diff] [blame] | 146 | if (fence == NULL && vm && !job->ibs->vm_id) { |
Christian König | b07c60c | 2016-01-31 12:29:04 +0100 | [diff] [blame] | 147 | struct amdgpu_ring *ring = job->ring; |
Christian König | 4ff37a8 | 2016-02-26 16:18:26 +0100 | [diff] [blame] | 148 | unsigned i, vm_id; |
| 149 | uint64_t vm_pd_addr; |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 150 | int r; |
| 151 | |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 152 | r = amdgpu_vm_grab_id(vm, ring, &job->sync, |
Christian König | 4ff37a8 | 2016-02-26 16:18:26 +0100 | [diff] [blame] | 153 | &job->base.s_fence->base, |
| 154 | &vm_id, &vm_pd_addr); |
Christian König | 94dd0a4 | 2016-01-18 17:01:42 +0100 | [diff] [blame] | 155 | if (r) |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 156 | DRM_ERROR("Error getting VM ID (%d)\n", r); |
Christian König | 4ff37a8 | 2016-02-26 16:18:26 +0100 | [diff] [blame] | 157 | else { |
| 158 | for (i = 0; i < job->num_ibs; ++i) { |
| 159 | job->ibs[i].vm_id = vm_id; |
| 160 | job->ibs[i].vm_pd_addr = vm_pd_addr; |
| 161 | } |
| 162 | } |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 163 | |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 164 | fence = amdgpu_sync_get_fence(&job->sync); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 165 | } |
| 166 | |
| 167 | return fence; |
Christian König | e61235d | 2015-08-25 11:05:36 +0200 | [diff] [blame] | 168 | } |
| 169 | |
Christian König | 0856cab | 2016-02-01 12:31:01 +0100 | [diff] [blame] | 170 | static struct fence *amdgpu_job_run(struct amd_sched_job *sched_job) |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 171 | { |
Christian König | ec72b80 | 2016-02-01 11:56:35 +0100 | [diff] [blame] | 172 | struct fence *fence = NULL; |
Junwei Zhang | 4c7eb91 | 2015-09-09 09:05:55 +0800 | [diff] [blame] | 173 | struct amdgpu_job *job; |
Christian König | bd755d0 | 2015-08-24 14:57:26 +0200 | [diff] [blame] | 174 | int r; |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 175 | |
Junwei Zhang | 4c7eb91 | 2015-09-09 09:05:55 +0800 | [diff] [blame] | 176 | if (!sched_job) { |
Chunming Zhou | 4cef926 | 2015-08-05 19:52:14 +0800 | [diff] [blame] | 177 | DRM_ERROR("job is null\n"); |
Christian König | 6f0e54a | 2015-08-05 21:22:10 +0200 | [diff] [blame] | 178 | return NULL; |
Chunming Zhou | 4cef926 | 2015-08-05 19:52:14 +0800 | [diff] [blame] | 179 | } |
Junwei Zhang | a6db8a3 | 2015-09-09 09:21:19 +0800 | [diff] [blame] | 180 | job = to_amdgpu_job(sched_job); |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 181 | |
| 182 | r = amdgpu_sync_wait(&job->sync); |
| 183 | if (r) { |
| 184 | DRM_ERROR("failed to sync wait (%d)\n", r); |
| 185 | return NULL; |
| 186 | } |
| 187 | |
Chunming Zhou | 7034dec | 2015-11-11 14:56:00 +0800 | [diff] [blame] | 188 | trace_amdgpu_sched_run_job(job); |
Christian König | 336d1f5 | 2016-02-16 10:57:10 +0100 | [diff] [blame] | 189 | r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs, |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame^] | 190 | job->sync.last_vm_update, job, &fence); |
Christian König | 1886d1a | 2015-08-31 17:28:28 +0200 | [diff] [blame] | 191 | if (r) { |
| 192 | DRM_ERROR("Error scheduling IBs (%d)\n", r); |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 193 | goto err; |
Christian König | 1886d1a | 2015-08-31 17:28:28 +0200 | [diff] [blame] | 194 | } |
| 195 | |
Christian König | 1886d1a | 2015-08-31 17:28:28 +0200 | [diff] [blame] | 196 | err: |
Monk Liu | 73cfa5f | 2016-03-17 13:48:13 +0800 | [diff] [blame] | 197 | job->fence = fence; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 198 | amdgpu_job_free(job); |
Christian König | ec72b80 | 2016-02-01 11:56:35 +0100 | [diff] [blame] | 199 | return fence; |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 200 | } |
| 201 | |
Nils Wallménius | 62250a9 | 2016-04-10 16:30:00 +0200 | [diff] [blame] | 202 | const struct amd_sched_backend_ops amdgpu_sched_ops = { |
Christian König | 0856cab | 2016-02-01 12:31:01 +0100 | [diff] [blame] | 203 | .dependency = amdgpu_job_dependency, |
| 204 | .run_job = amdgpu_job_run, |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 205 | .begin_job = amd_sched_job_begin, |
| 206 | .finish_job = amd_sched_job_finish, |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 207 | }; |