/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 *
 */
| 24 | #include <linux/kthread.h> |
| 25 | #include <linux/wait.h> |
| 26 | #include <linux/sched.h> |
| 27 | #include <drm/drmP.h> |
| 28 | #include "amdgpu.h" |
Chunming Zhou | 7034dec | 2015-11-11 14:56:00 +0800 | [diff] [blame] | 29 | #include "amdgpu_trace.h" |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 30 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 31 | static void amdgpu_job_timedout(struct drm_sched_job *s_job) |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 32 | { |
Christian König | 0e51a77 | 2016-05-18 14:19:32 +0200 | [diff] [blame] | 33 | struct amdgpu_job *job = container_of(s_job, struct amdgpu_job, base); |
| 34 | |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 35 | DRM_ERROR("ring %s timeout, last signaled seq=%u, last emitted seq=%u\n", |
Christian König | 0e51a77 | 2016-05-18 14:19:32 +0200 | [diff] [blame] | 36 | job->base.sched->name, |
| 37 | atomic_read(&job->ring->fence_drv.last_seq), |
| 38 | job->ring->fence_drv.sync_seq); |
Monk Liu | 4fbf87e2 | 2017-05-05 15:09:42 +0800 | [diff] [blame] | 39 | |
Alex Deucher | 5f152b5 | 2017-12-15 16:40:49 -0500 | [diff] [blame] | 40 | amdgpu_device_gpu_recover(job->adev, job, false); |
Monk Liu | 0de2479 | 2016-03-04 18:51:02 +0800 | [diff] [blame] | 41 | } |
| 42 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 43 | int amdgpu_job_alloc(struct amdgpu_device *adev, unsigned num_ibs, |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 44 | struct amdgpu_job **job, struct amdgpu_vm *vm) |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 45 | { |
| 46 | size_t size = sizeof(struct amdgpu_job); |
| 47 | |
| 48 | if (num_ibs == 0) |
| 49 | return -EINVAL; |
| 50 | |
| 51 | size += sizeof(struct amdgpu_ib) * num_ibs; |
| 52 | |
| 53 | *job = kzalloc(size, GFP_KERNEL); |
| 54 | if (!*job) |
| 55 | return -ENOMEM; |
| 56 | |
| 57 | (*job)->adev = adev; |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 58 | (*job)->vm = vm; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 59 | (*job)->ibs = (void *)&(*job)[1]; |
| 60 | (*job)->num_ibs = num_ibs; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 61 | |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 62 | amdgpu_sync_create(&(*job)->sync); |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 63 | amdgpu_sync_create(&(*job)->sched_sync); |
Monk Liu | c70b78a | 2017-10-16 20:02:08 +0800 | [diff] [blame] | 64 | (*job)->vram_lost_counter = atomic_read(&adev->vram_lost_counter); |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 65 | |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 66 | return 0; |
| 67 | } |
| 68 | |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 69 | int amdgpu_job_alloc_with_ib(struct amdgpu_device *adev, unsigned size, |
| 70 | struct amdgpu_job **job) |
| 71 | { |
| 72 | int r; |
| 73 | |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 74 | r = amdgpu_job_alloc(adev, 1, job, NULL); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 75 | if (r) |
| 76 | return r; |
| 77 | |
| 78 | r = amdgpu_ib_get(adev, NULL, size, &(*job)->ibs[0]); |
| 79 | if (r) |
| 80 | kfree(*job); |
Christian König | df264f9 | 2017-06-28 15:41:17 +0200 | [diff] [blame] | 81 | else |
| 82 | (*job)->vm_pd_addr = adev->gart.table_addr; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 83 | |
| 84 | return r; |
| 85 | } |
| 86 | |
Christian König | a5fb4ec | 2016-06-29 15:10:31 +0200 | [diff] [blame] | 87 | void amdgpu_job_free_resources(struct amdgpu_job *job) |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 88 | { |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 89 | struct dma_fence *f; |
Christian König | 1ab0d21 | 2016-05-18 13:09:47 +0200 | [diff] [blame] | 90 | unsigned i; |
| 91 | |
Monk Liu | 676d8c2 | 2016-03-17 13:57:09 +0800 | [diff] [blame] | 92 | /* use sched fence if available */ |
Christian König | 6fc1367 | 2016-05-20 12:53:52 +0200 | [diff] [blame] | 93 | f = job->base.s_fence ? &job->base.s_fence->finished : job->fence; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 94 | |
| 95 | for (i = 0; i < job->num_ibs; ++i) |
Christian König | 1ab0d21 | 2016-05-18 13:09:47 +0200 | [diff] [blame] | 96 | amdgpu_ib_free(job->adev, &job->ibs[i], f); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 97 | } |
| 98 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 99 | static void amdgpu_job_free_cb(struct drm_sched_job *s_job) |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 100 | { |
Christian König | c5f74f7 | 2016-05-19 09:54:15 +0200 | [diff] [blame] | 101 | struct amdgpu_job *job = container_of(s_job, struct amdgpu_job, base); |
| 102 | |
Andrey Grodzovsky | d1f6dc1 | 2017-10-19 14:29:46 -0400 | [diff] [blame] | 103 | amdgpu_ring_priority_put(job->ring, s_job->s_priority); |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 104 | dma_fence_put(job->fence); |
Christian König | a79a5bd | 2016-06-29 13:29:57 +0200 | [diff] [blame] | 105 | amdgpu_sync_free(&job->sync); |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 106 | amdgpu_sync_free(&job->sched_sync); |
Monk Liu | b6723c8 | 2016-03-10 12:14:44 +0800 | [diff] [blame] | 107 | kfree(job); |
| 108 | } |
| 109 | |
Christian König | 1e24e31 | 2016-05-18 13:12:12 +0200 | [diff] [blame] | 110 | void amdgpu_job_free(struct amdgpu_job *job) |
| 111 | { |
| 112 | amdgpu_job_free_resources(job); |
Christian König | a79a5bd | 2016-06-29 13:29:57 +0200 | [diff] [blame] | 113 | |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 114 | dma_fence_put(job->fence); |
Christian König | a79a5bd | 2016-06-29 13:29:57 +0200 | [diff] [blame] | 115 | amdgpu_sync_free(&job->sync); |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 116 | amdgpu_sync_free(&job->sched_sync); |
Christian König | 1e24e31 | 2016-05-18 13:12:12 +0200 | [diff] [blame] | 117 | kfree(job); |
| 118 | } |
| 119 | |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 120 | int amdgpu_job_submit(struct amdgpu_job *job, struct amdgpu_ring *ring, |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 121 | struct drm_sched_entity *entity, void *owner, |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 122 | struct dma_fence **f) |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 123 | { |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 124 | int r; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 125 | job->ring = ring; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 126 | |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 127 | if (!f) |
| 128 | return -EINVAL; |
| 129 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 130 | r = drm_sched_job_init(&job->base, &ring->sched, entity, owner); |
Monk Liu | e686941 | 2016-03-07 12:49:55 +0800 | [diff] [blame] | 131 | if (r) |
| 132 | return r; |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 133 | |
| 134 | job->owner = owner; |
Monk Liu | 3aecd24 | 2016-08-25 15:40:48 +0800 | [diff] [blame] | 135 | job->fence_ctx = entity->fence_context; |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 136 | *f = dma_fence_get(&job->base.s_fence->finished); |
Christian König | a5fb4ec | 2016-06-29 15:10:31 +0200 | [diff] [blame] | 137 | amdgpu_job_free_resources(job); |
Andrey Grodzovsky | d1f6dc1 | 2017-10-19 14:29:46 -0400 | [diff] [blame] | 138 | amdgpu_ring_priority_get(job->ring, job->base.s_priority); |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 139 | drm_sched_entity_push_job(&job->base, entity); |
Christian König | d71518b | 2016-02-01 12:20:25 +0100 | [diff] [blame] | 140 | |
| 141 | return 0; |
Christian König | 50838c8 | 2016-02-03 13:44:52 +0100 | [diff] [blame] | 142 | } |
| 143 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 144 | static struct dma_fence *amdgpu_job_dependency(struct drm_sched_job *sched_job, |
| 145 | struct drm_sched_entity *s_entity) |
Christian König | e61235d | 2015-08-25 11:05:36 +0200 | [diff] [blame] | 146 | { |
Junwei Zhang | a6db8a3 | 2015-09-09 09:21:19 +0800 | [diff] [blame] | 147 | struct amdgpu_job *job = to_amdgpu_job(sched_job); |
Monk Liu | c563783 | 2016-04-19 20:11:32 +0800 | [diff] [blame] | 148 | struct amdgpu_vm *vm = job->vm; |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 149 | bool explicit = false; |
Chunming Zhou | df83d1e | 2017-05-09 15:50:22 +0800 | [diff] [blame] | 150 | int r; |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 151 | struct dma_fence *fence = amdgpu_sync_get_fence(&job->sync, &explicit); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 152 | |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 153 | if (fence && explicit) { |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 154 | if (drm_sched_dependency_optimized(fence, s_entity)) { |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 155 | r = amdgpu_sync_fence(job->adev, &job->sched_sync, fence, false); |
| 156 | if (r) |
| 157 | DRM_ERROR("Error adding fence to sync (%d)\n", r); |
| 158 | } |
Chunming Zhou | a340c7b | 2017-05-18 15:19:03 +0800 | [diff] [blame] | 159 | } |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 160 | |
Christian König | c4f46f2 | 2017-12-18 17:08:25 +0100 | [diff] [blame] | 161 | while (fence == NULL && vm && !job->vmid) { |
Christian König | b07c60c | 2016-01-31 12:29:04 +0100 | [diff] [blame] | 162 | struct amdgpu_ring *ring = job->ring; |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 163 | |
Christian König | 620f774 | 2017-12-18 16:53:03 +0100 | [diff] [blame] | 164 | r = amdgpu_vmid_grab(vm, ring, &job->sync, |
| 165 | &job->base.s_fence->finished, |
| 166 | job); |
Christian König | 94dd0a4 | 2016-01-18 17:01:42 +0100 | [diff] [blame] | 167 | if (r) |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 168 | DRM_ERROR("Error getting VM ID (%d)\n", r); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 169 | |
Andrey Grodzovsky | cebb52b | 2017-11-13 14:47:52 -0500 | [diff] [blame] | 170 | fence = amdgpu_sync_get_fence(&job->sync, NULL); |
Christian König | 8d0a7ce | 2015-11-03 20:58:50 +0100 | [diff] [blame] | 171 | } |
| 172 | |
| 173 | return fence; |
Christian König | e61235d | 2015-08-25 11:05:36 +0200 | [diff] [blame] | 174 | } |
| 175 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 176 | static struct dma_fence *amdgpu_job_run(struct drm_sched_job *sched_job) |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 177 | { |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 178 | struct dma_fence *fence = NULL, *finished; |
Christian König | 14e47f9 | 2017-10-09 15:04:41 +0200 | [diff] [blame] | 179 | struct amdgpu_device *adev; |
Junwei Zhang | 4c7eb91 | 2015-09-09 09:05:55 +0800 | [diff] [blame] | 180 | struct amdgpu_job *job; |
Christian König | bd755d0 | 2015-08-24 14:57:26 +0200 | [diff] [blame] | 181 | int r; |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 182 | |
Junwei Zhang | 4c7eb91 | 2015-09-09 09:05:55 +0800 | [diff] [blame] | 183 | if (!sched_job) { |
Chunming Zhou | 4cef926 | 2015-08-05 19:52:14 +0800 | [diff] [blame] | 184 | DRM_ERROR("job is null\n"); |
Christian König | 6f0e54a | 2015-08-05 21:22:10 +0200 | [diff] [blame] | 185 | return NULL; |
Chunming Zhou | 4cef926 | 2015-08-05 19:52:14 +0800 | [diff] [blame] | 186 | } |
Junwei Zhang | a6db8a3 | 2015-09-09 09:21:19 +0800 | [diff] [blame] | 187 | job = to_amdgpu_job(sched_job); |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 188 | finished = &job->base.s_fence->finished; |
Christian König | 14e47f9 | 2017-10-09 15:04:41 +0200 | [diff] [blame] | 189 | adev = job->adev; |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 190 | |
Christian König | 1fbb2e9 | 2016-06-01 10:47:36 +0200 | [diff] [blame] | 191 | BUG_ON(amdgpu_sync_peek_fence(&job->sync, NULL)); |
Christian König | e86f9ce | 2016-02-08 12:13:05 +0100 | [diff] [blame] | 192 | |
Chunming Zhou | 7034dec | 2015-11-11 14:56:00 +0800 | [diff] [blame] | 193 | trace_amdgpu_sched_run_job(job); |
Monk Liu | 48f05f2 | 2017-10-25 16:21:08 +0800 | [diff] [blame] | 194 | |
| 195 | if (job->vram_lost_counter != atomic_read(&adev->vram_lost_counter)) |
| 196 | dma_fence_set_error(finished, -ECANCELED);/* skip IB as well if VRAM lost */ |
| 197 | |
| 198 | if (finished->error < 0) { |
| 199 | DRM_INFO("Skip scheduling IBs!\n"); |
Christian König | 14e47f9 | 2017-10-09 15:04:41 +0200 | [diff] [blame] | 200 | } else { |
| 201 | r = amdgpu_ib_schedule(job->ring, job->num_ibs, job->ibs, job, |
| 202 | &fence); |
Chunming Zhou | 15d73ce | 2017-05-16 14:34:27 +0800 | [diff] [blame] | 203 | if (r) |
| 204 | DRM_ERROR("Error scheduling IBs (%d)\n", r); |
| 205 | } |
Chunming Zhou | c7c5fbc | 2016-06-30 17:30:42 +0800 | [diff] [blame] | 206 | /* if gpu reset, hw fence will be replaced here */ |
Chris Wilson | f54d186 | 2016-10-25 13:00:45 +0100 | [diff] [blame] | 207 | dma_fence_put(job->fence); |
| 208 | job->fence = dma_fence_get(fence); |
Andres Rodriguez | b2ff0e8 | 2017-02-20 17:53:19 -0500 | [diff] [blame] | 209 | |
Christian König | 22a77cf | 2016-07-05 14:48:17 +0200 | [diff] [blame] | 210 | amdgpu_job_free_resources(job); |
Christian König | ec72b80 | 2016-02-01 11:56:35 +0100 | [diff] [blame] | 211 | return fence; |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 212 | } |
| 213 | |
Lucas Stach | 1b1f42d | 2017-12-06 17:49:39 +0100 | [diff] [blame] | 214 | const struct drm_sched_backend_ops amdgpu_sched_ops = { |
Christian König | 0856cab | 2016-02-01 12:31:01 +0100 | [diff] [blame] | 215 | .dependency = amdgpu_job_dependency, |
| 216 | .run_job = amdgpu_job_run, |
Christian König | 0e51a77 | 2016-05-18 14:19:32 +0200 | [diff] [blame] | 217 | .timedout_job = amdgpu_job_timedout, |
Christian König | c5f74f7 | 2016-05-19 09:54:15 +0200 | [diff] [blame] | 218 | .free_job = amdgpu_job_free_cb |
Chunming Zhou | c1b69ed | 2015-07-21 13:45:14 +0800 | [diff] [blame] | 219 | }; |