/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 *
 */
| 24 | #include <linux/kthread.h> |
| 25 | #include <linux/wait.h> |
| 26 | #include <linux/sched.h> |
| 27 | #include <drm/drmP.h> |
| 28 | #include "amdgpu.h" |
Chunming Zhou | 7034dec | 2015-11-11 14:56:00 +0800 | [diff] [blame] | 29 | #include "amdgpu_trace.h" |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 30 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 31 | static void amdgpu_job_timedout(struct drm_sched_job *s_job) |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 32 | { |
Christian König | 3320b8d | 2018-07-13 15:08:44 +0200 | [diff] [blame] | 33 | struct amdgpu_ring *ring = to_amdgpu_ring(s_job->sched); |
| 34 | struct amdgpu_job *job = to_amdgpu_job(s_job); |
Christian König | 0e51a77 | 2016-05-18 14:19:32 +0200 | [diff] [blame] | 35 | |
Christian König | f024e88 | 2018-07-13 14:01:08 +0200 | [diff] [blame] | 36 | DRM_ERROR("ring %s timeout, signaled seq=%u, emitted seq=%u\n", |
Christian König | 3320b8d | 2018-07-13 15:08:44 +0200 | [diff] [blame] | 37 | job->base.sched->name, atomic_read(&ring->fence_drv.last_seq), |
| 38 | ring->fence_drv.sync_seq); |
Monk Liu | 4fbf87e2 | 2017-05-05 15:09:42 +0800 | [diff] [blame] | 39 | |
Christian König | a1917b7 | 2018-07-13 17:15:54 +0200 | [diff] [blame] | 40 | amdgpu_device_gpu_recover(ring->adev, job, false); |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 41 | } |
| 42 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 43 | int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs, |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 44 | struct amdgpu_job **job, struct amdgpu_vm *vm) |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 45 | { |
| 46 | size_t size = sizeof(struct amdgpu_job); |
| 47 | |
| 48 | if (num_ibs == 0) |
| 49 | return -EINVAL; |
| 50 | |
| 51 | size += sizeof(struct amdgpu_ib) * num_ibs; |
| 52 | |
| 53 | *job = kzalloc(size, GFP_KERNEL); |
| 54 | if (!*job) |
| 55 | return -ENOMEM; |
| 56 | |
Christian König | a1917b7 | 2018-07-13 17:15:54 +0200 | [diff] [blame] | 57 | /* |
| 58 | * Initialize the scheduler to at least some ring so that we always |
| 59 | * have a pointer to adev. |
| 60 | */ |
| 61 | (*job)->base.sched = &adev->rings[0]->sched; |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 62 | (*job)->vm = vm; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 63 | (*job)->ibs = (void *)&(*job)[1]; |
| 64 | (*job)->num_ibs = num_ibs; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 65 | |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 66 | amdgpu_sync_create(&(*job)->sync); |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 67 | amdgpu_sync_create(&(*job)->sched_sync); |
Monk Liu | c70b78a | 2017-10-16 20:02:08 +0800 | [diff] [blame] | 68 | (*job)->vram_lost_counter = atomic_read(&adev->vram_lost_counter); |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 69 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 70 | return 0; |
| 71 | } |
| 72 | |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 73 | int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size, |
| 74 | struct amdgpu_job **job) |
| 75 | { |
| 76 | int r; |
| 77 | |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 78 | r = amdgpu_job_alloc(adev, 1, job, NULL); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 79 | if (r) |
| 80 | return r; |
| 81 | |
| 82 | r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]); |
| 83 | if (r) |
| 84 | kfree(*job); |
Christian König | df264f9 | 2017-06-28 15:41:17 +0200 | [diff] [blame] | 85 | else |
| 86 | (*job)->vm_pd_addr = adev->gart.table_addr; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 87 | |
| 88 | return r; |
| 89 | } |
| 90 | |
Christian König | a5fb4ec | 2016-06-29 15:10:31 +0200 | [diff] [blame] | 91 | void amdgpu_job_free_resources(struct amdgpu_job *job) |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 92 | { |
Christian König | a1917b7 | 2018-07-13 17:15:54 +0200 | [diff] [blame] | 93 | struct amdgpu_ring *ring = to_amdgpu_ring(job->base.sched); |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 94 | struct dma_fence *f; |
Christian König | 1ab0d21 | 2016-05-18 13:09:47 +0200 | [diff] [blame] | 95 | unsigned i; |
| 96 | |
Monk Liu | 676d8c2 | 2016-03-17 13:57:09 +0800 | [diff] [blame] | 97 | /* use sched fence if available */ |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 98 | f = job->base.s_fence ? &job->base.s_fence->finished : job->fence; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 99 | |
| 100 | for (i = 0; i < job->num_ibs; ++i) |
Christian König | a1917b7 | 2018-07-13 17:15:54 +0200 | [diff] [blame] | 101 | amdgpu_ib_free(ring->adev, &job->ibs[i], f); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 102 | } |
| 103 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 104 | static void amdgpu_job_free_cb(struct drm_sched_job *s_job) |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 105 | { |
Christian König | 3320b8d | 2018-07-13 15:08:44 +0200 | [diff] [blame] | 106 | struct amdgpu_ring *ring = to_amdgpu_ring(s_job->sched); |
| 107 | struct amdgpu_job *job = to_amdgpu_job(s_job); |
Christian König | c5f74f7 | 2016-05-19 09:54:15 +0200 | [diff] [blame] | 108 | |
Christian König | 3320b8d | 2018-07-13 15:08:44 +0200 | [diff] [blame] | 109 | amdgpu_ring_priority_put(ring, s_job->s_priority); |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 110 | dma_fence_put(job->fence); |
Christian König | a79a5bd | 2016-06-29 13:29:57 +0200 | [diff] [blame] | 111 | amdgpu_sync_free(&job->sync); |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 112 | amdgpu_sync_free(&job->sched_sync); |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 113 | kfree(job); |
| 114 | } |
| 115 | |
Christian König | 1e24e31 | 2016-05-18 13:12:12 +0200 | [diff] [blame] | 116 | void amdgpu_job_free(struct amdgpu_job *job) |
| 117 | { |
| 118 | amdgpu_job_free_resources(job); |
Christian König | a79a5bd | 2016-06-29 13:29:57 +0200 | [diff] [blame] | 119 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 120 | dma_fence_put(job->fence); |
Christian König | a79a5bd | 2016-06-29 13:29:57 +0200 | [diff] [blame] | 121 | amdgpu_sync_free(&job->sync); |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 122 | amdgpu_sync_free(&job->sched_sync); |
Christian König | 1e24e31 | 2016-05-18 13:12:12 +0200 | [diff] [blame] | 123 | kfree(job); |
| 124 | } |
| 125 | |
Christian König | 0e28b10 | 2018-07-13 13:54:56 +0200 | [diff] [blame] | 126 | int amdgpu_job_submit(struct amdgpu_job *job, struct drm_sched_entity *entity, |
| 127 | void *owner, struct dma_fence **f) |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 128 | { |
Christian König | b528680 | 2018-07-16 14:58:48 +0200 | [diff] [blame] | 129 | enum drm_sched_priority priority; |
| 130 | struct amdgpu_ring *ring; |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 131 | int r; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 132 | |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 133 | if (!f) |
| 134 | return -EINVAL; |
| 135 | |
Nayan Deshmukh | cdc5017 | 2018-07-20 17:51:05 +0530 | [diff] [blame] | 136 | r = drm_sched_job_init(&job->base, entity, owner); |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 137 | if (r) |
| 138 | return r; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 139 | |
| 140 | job->owner = owner; |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 141 | *f = dma_fence_get(&job->base.s_fence->finished); |
Christian König | a5fb4ec | 2016-06-29 15:10:31 +0200 | [diff] [blame] | 142 | amdgpu_job_free_resources(job); |
Christian König | b528680 | 2018-07-16 14:58:48 +0200 | [diff] [blame] | 143 | priority = job->base.s_priority; |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 144 | drm_sched_entity_push_job(&job->base, entity); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 145 | |
Nayan Deshmukh | 068c330 | 2018-07-20 17:51:06 +0530 | [diff] [blame] | 146 | ring = to_amdgpu_ring(entity->rq->sched); |
Christian König | b528680 | 2018-07-16 14:58:48 +0200 | [diff] [blame] | 147 | amdgpu_ring_priority_get(ring, priority); |
| 148 | |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 149 | return 0; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 150 | } |
| 151 | |
Christian König | ee913fd | 2018-07-13 16:29:10 +0200 | [diff] [blame] | 152 | int amdgpu_job_submit_direct(struct amdgpu_job *job, struct amdgpu_ring *ring, |
| 153 | struct dma_fence **fence) |
| 154 | { |
| 155 | int r; |
| 156 | |
| 157 | job->base.sched = &ring->sched; |
| 158 | r = amdgpu_ib_schedule(ring, job->num_ibs, job->ibs, NULL, fence); |
| 159 | job->fence = dma_fence_get(*fence); |
| 160 | if (r) |
| 161 | return r; |
| 162 | |
| 163 | amdgpu_job_free(job); |
| 164 | return 0; |
| 165 | } |
| 166 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 167 | static struct dma_fence *amdgpu_job_dependency(struct drm_sched_job *sched_job, |
| 168 | struct drm_sched_entity *s_entity) |
Christian König | e61235d | 2015-08-25 11:05:36 +0200 | [diff] [blame] | 169 | { |
Nayan Deshmukh | 068c330 | 2018-07-20 17:51:06 +0530 | [diff] [blame] | 170 | struct amdgpu_ring *ring = to_amdgpu_ring(s_entity->rq->sched); |
Junwei Zhang | a6db8a3 | 2015-09-09 09:21:19 +0800 | [diff] [blame] | 171 | struct amdgpu_job *job = to_amdgpu_job(sched_job); |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 172 | struct amdgpu_vm *vm = job->vm; |
Christian König | f024e88 | 2018-07-13 14:01:08 +0200 | [diff] [blame] | 173 | struct dma_fence *fence; |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 174 | bool explicit = false; |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 175 | int r; |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 176 | |
Christian König | f024e88 | 2018-07-13 14:01:08 +0200 | [diff] [blame] | 177 | fence = amdgpu_sync_get_fence(&job->sync, &explicit); |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 178 | if (fence && explicit) { |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 179 | if (drm_sched_dependency_optimized(fence, s_entity)) { |
Christian König | a1917b7 | 2018-07-13 17:15:54 +0200 | [diff] [blame] | 180 | r = amdgpu_sync_fence(ring->adev, &job->sched_sync, |
| 181 | fence, false); |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 182 | if (r) |
Christian König | f024e88 | 2018-07-13 14:01:08 +0200 | [diff] [blame] | 183 | DRM_ERROR("Error adding fence (%d)\n", r); |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 184 | } |
Chunming Zhou | a340c7b | 2017-05-18 15:19:03 +0800 | [diff] [blame] | 185 | } |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 186 | |
Christian König | c4f46f2 | 2017-12-18 17:08:25 +0100 | [diff] [blame] | 187 | while (fence == NULL && vm && !job->vmid) { |
Christian König | 620f774 | 2017-12-18 16:53:03 +0100 | [diff] [blame] | 188 | r = amdgpu_vmid_grab(vm, ring, &job->sync, |
| 189 | &job->base.s_fence->finished, |
| 190 | job); |
Christian König | 94dd0a4 | 2016-01-18 17:01:42 +0100 | [diff] [blame] | 191 | if (r) |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 192 | DRM_ERROR("Error getting VM ID (%d)\n", r); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 193 | |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 194 | fence = amdgpu_sync_get_fence(&job->sync, NULL); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 195 | } |
| 196 | |
| 197 | return fence; |
Christian König | e61235d | 2015-08-25 11:05:36 +0200 | [diff] [blame] | 198 | } |
| 199 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 200 | static struct dma_fence *amdgpu_job_run(struct drm_sched_job *sched_job) |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 201 | { |
Christian König | 3320b8d | 2018-07-13 15:08:44 +0200 | [diff] [blame] | 202 | struct amdgpu_ring *ring = to_amdgpu_ring(sched_job->sched); |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 203 | struct dma_fence *fence = NULL, *finished; |
Junwei Zhang | 4c7eb91 | 2015-09-09 09:05:55 +0800 | [diff] [blame] | 204 | struct amdgpu_job *job; |
Christian König | bd755d0 | 2015-08-24 14:57:26 +0200 | [diff] [blame] | 205 | int r; |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 206 | |
Junwei Zhang | a6db8a3 | 2015-09-09 09:21:19 +0800 | [diff] [blame] | 207 | job = to_amdgpu_job(sched_job); |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 208 | finished = &job->base.s_fence->finished; |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 209 | |
Christian König | 1fbb2e9 | 2016-06-01 10:47:36 +0200 | [diff] [blame] | 210 | BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL)); |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 211 | |
Chunming Zhou | 7034dec | 2015-11-11 14:56:00 +0800 | [diff] [blame] | 212 | trace_amdgpu_sched_run_job(job); |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 213 | |
Christian König | a1917b7 | 2018-07-13 17:15:54 +0200 | [diff] [blame] | 214 | if (job->vram_lost_counter != atomic_read(&ring->adev->vram_lost_counter)) |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 215 | dma_fence_set_error(finished, -ECANCELED);/* skip IB as well if VRAM lost */ |
| 216 | |
| 217 | if (finished->error < 0) { |
| 218 | DRM_INFO("Skip scheduling IBs!\n"); |
Christian König | 14e47f9 | 2017-10-09 15:04:41 +0200 | [diff] [blame] | 219 | } else { |
Christian König | 3320b8d | 2018-07-13 15:08:44 +0200 | [diff] [blame] | 220 | r = amdgpu_ib_schedule(ring, job->num_ibs, job->ibs, job, |
Christian König | 14e47f9 | 2017-10-09 15:04:41 +0200 | [diff] [blame] | 221 | &fence); |
Chunming Zhou | 15d73ce | 2017-05-16 14:34:27 +0800 | [diff] [blame] | 222 | if (r) |
| 223 | DRM_ERROR("Error scheduling IBs (%d)\n", r); |
| 224 | } |
Chunming Zhou | c7c5fbc | 2016-06-30 17:30:42 +0800 | [diff] [blame] | 225 | /* if gpu reset, hw fence will be replaced here */ |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 226 | dma_fence_put(job->fence); |
| 227 | job->fence = dma_fence_get(fence); |
Andres Rodriguez | b2ff0e8 | 2017-02-20 17:53:19 -0500 | [diff] [blame] | 228 | |
Christian König | 22a77cf | 2016-07-05 14:48:17 +0200 | [diff] [blame] | 229 | amdgpu_job_free_resources(job); |
Christian König | ec72b80 | 2016-02-01 11:56:35 +0100 | [diff] [blame] | 230 | return fence; |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 231 | } |
| 232 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 233 | const struct drm_sched_backend_ops amdgpu_sched_ops = { |
Christian König | 0856cab | 2016-02-01 12:31:01 +0100 | [diff] [blame] | 234 | .dependency = amdgpu_job_dependency, |
| 235 | .run_job = amdgpu_job_run, |
Christian König | 0e51a77 | 2016-05-18 14:19:32 +0200 | [diff] [blame] | 236 | .timedout_job = amdgpu_job_timedout, |
Christian König | c5f74f7 | 2016-05-19 09:54:15 +0200 | [diff] [blame] | 237 | .free_job = amdgpu_job_free_cb |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 238 | }; |