/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 */
#include <linux/kthread.h>
#include <linux/wait.h>
#include <linux/sched.h>
#include <uapi/linux/sched/types.h>
#include <drm/drmP.h>
#include "gpu_scheduler.h"

#include "spsc_queue.h"

#define CREATE_TRACE_POINTS
#include "gpu_sched_trace.h"

#define to_amd_sched_job(sched_job) \
		container_of((sched_job), struct amd_sched_job, queue_node)

static bool amd_sched_entity_is_ready(struct amd_sched_entity *entity);
static void amd_sched_wakeup(struct amd_gpu_scheduler *sched);
static void amd_sched_process_job(struct dma_fence *f, struct dma_fence_cb *cb);

/* Initialize a given run queue struct */
static void amd_sched_rq_init(struct amd_sched_rq *rq)
{
	spin_lock_init(&rq->lock);
	INIT_LIST_HEAD(&rq->entities);
	rq->current_entity = NULL;
}

static void amd_sched_rq_add_entity(struct amd_sched_rq *rq,
				    struct amd_sched_entity *entity)
{
	if (!list_empty(&entity->list))
		return;
	spin_lock(&rq->lock);
	list_add_tail(&entity->list, &rq->entities);
	spin_unlock(&rq->lock);
}

static void amd_sched_rq_remove_entity(struct amd_sched_rq *rq,
				       struct amd_sched_entity *entity)
{
	if (list_empty(&entity->list))
		return;
	spin_lock(&rq->lock);
	list_del_init(&entity->list);
	if (rq->current_entity == entity)
		rq->current_entity = NULL;
	spin_unlock(&rq->lock);
}

/**
 * Select an entity that could provide a job to run
 *
 * @rq The run queue to check.
 *
 * Try to find a ready entity; returns NULL if none is found. The scan
 * continues after the last selected entity, so entities are served
 * round-robin.
 */
static struct amd_sched_entity *
amd_sched_rq_select_entity(struct amd_sched_rq *rq)
{
	struct amd_sched_entity *entity;

	spin_lock(&rq->lock);

	entity = rq->current_entity;
	if (entity) {
		list_for_each_entry_continue(entity, &rq->entities, list) {
			if (amd_sched_entity_is_ready(entity)) {
				rq->current_entity = entity;
				spin_unlock(&rq->lock);
				return entity;
			}
		}
	}

	list_for_each_entry(entity, &rq->entities, list) {
		if (amd_sched_entity_is_ready(entity)) {
			rq->current_entity = entity;
			spin_unlock(&rq->lock);
			return entity;
		}

		if (entity == rq->current_entity)
			break;
	}

	spin_unlock(&rq->lock);

	return NULL;
}

/**
 * Initialize a context entity that the scheduler uses to submit to a HW ring.
 *
 * @sched The pointer to the scheduler
 * @entity The pointer to a valid amd_sched_entity
 * @rq The run queue this entity belongs to
 * @jobs The max number of jobs in the job queue
 * @guilty Caller-owned atomic flag, set when this entity is marked guilty of a hang
 *
 * return 0 on success, negative error code on failure
 */
int amd_sched_entity_init(struct amd_gpu_scheduler *sched,
			  struct amd_sched_entity *entity,
			  struct amd_sched_rq *rq,
			  uint32_t jobs, atomic_t *guilty)
{
	if (!(sched && entity && rq))
		return -EINVAL;

	memset(entity, 0, sizeof(struct amd_sched_entity));
	INIT_LIST_HEAD(&entity->list);
	entity->rq = rq;
	entity->sched = sched;
	entity->guilty = guilty;

	spin_lock_init(&entity->rq_lock);
	spin_lock_init(&entity->queue_lock);
	spsc_queue_init(&entity->job_queue);

	atomic_set(&entity->fence_seq, 0);
	entity->fence_context = dma_fence_context_alloc(2);

	return 0;
}

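/*
 * Usage sketch (illustrative only): a client typically creates one entity per
 * run queue it submits to and tears it down with amd_sched_entity_fini().
 * The queue depth of 32 and the caller-owned guilty flag are assumptions,
 * not requirements of this file.
 *
 *	static atomic_t guilty = ATOMIC_INIT(0);
 *	struct amd_sched_entity entity;
 *	struct amd_sched_rq *rq = &sched->sched_rq[AMD_SCHED_PRIORITY_MIN];
 *	int r;
 *
 *	r = amd_sched_entity_init(sched, &entity, rq, 32, &guilty);
 *	if (r)
 *		return r;
 *	...
 *	amd_sched_entity_fini(sched, &entity);
 */
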
/**
 * Query if entity is initialized
 *
 * @sched Pointer to scheduler instance
 * @entity The pointer to a valid scheduler entity
 *
 * return true if entity is initialized, false otherwise
 */
static bool amd_sched_entity_is_initialized(struct amd_gpu_scheduler *sched,
					    struct amd_sched_entity *entity)
{
	return entity->sched == sched &&
		entity->rq != NULL;
}

/**
 * Check if entity is idle
 *
 * @entity The pointer to a valid scheduler entity
 *
 * Return true if the entity doesn't have any unscheduled jobs.
 */
static bool amd_sched_entity_is_idle(struct amd_sched_entity *entity)
{
	rmb();
	if (spsc_queue_peek(&entity->job_queue) == NULL)
		return true;

	return false;
}

/**
 * Check if entity is ready
 *
 * @entity The pointer to a valid scheduler entity
 *
 * Return true if the entity can provide a job.
 */
static bool amd_sched_entity_is_ready(struct amd_sched_entity *entity)
{
	if (spsc_queue_peek(&entity->job_queue) == NULL)
		return false;

	if (READ_ONCE(entity->dependency))
		return false;

	return true;
}

/**
 * Destroy a context entity
 *
 * @sched Pointer to scheduler instance
 * @entity The pointer to a valid scheduler entity
 *
 * Cleanup and free the allocated resources.
 */
void amd_sched_entity_fini(struct amd_gpu_scheduler *sched,
			   struct amd_sched_entity *entity)
{
	int r;

	if (!amd_sched_entity_is_initialized(sched, entity))
		return;
	/**
	 * The client will not queue more IBs during this fini; consume
	 * existing queued IBs or discard them on SIGKILL.
	 */
	if ((current->flags & PF_SIGNALED) && current->exit_code == SIGKILL)
		r = -ERESTARTSYS;
	else
		r = wait_event_killable(sched->job_scheduled,
					amd_sched_entity_is_idle(entity));
	amd_sched_entity_set_rq(entity, NULL);
	if (r) {
		struct amd_sched_job *job;

		/* Park the kernel thread for a moment to make sure it isn't
		 * processing our entity.
		 */
		kthread_park(sched->thread);
		kthread_unpark(sched->thread);
		while ((job = to_amd_sched_job(spsc_queue_pop(&entity->job_queue)))) {
			struct amd_sched_fence *s_fence = job->s_fence;

			amd_sched_fence_scheduled(s_fence);
			dma_fence_set_error(&s_fence->finished, -ESRCH);
			amd_sched_fence_finished(s_fence);
			dma_fence_put(&s_fence->finished);
			sched->ops->free_job(job);
		}
	}
}

static void amd_sched_entity_wakeup(struct dma_fence *f, struct dma_fence_cb *cb)
{
	struct amd_sched_entity *entity =
		container_of(cb, struct amd_sched_entity, cb);
	entity->dependency = NULL;
	dma_fence_put(f);
	amd_sched_wakeup(entity->sched);
}

static void amd_sched_entity_clear_dep(struct dma_fence *f, struct dma_fence_cb *cb)
{
	struct amd_sched_entity *entity =
		container_of(cb, struct amd_sched_entity, cb);
	entity->dependency = NULL;
	dma_fence_put(f);
}

void amd_sched_entity_set_rq(struct amd_sched_entity *entity,
			     struct amd_sched_rq *rq)
{
	if (entity->rq == rq)
		return;

	spin_lock(&entity->rq_lock);

	if (entity->rq)
		amd_sched_rq_remove_entity(entity->rq, entity);

	entity->rq = rq;
	if (rq)
		amd_sched_rq_add_entity(rq, entity);

	spin_unlock(&entity->rq_lock);
}

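/*
 * Usage sketch (illustrative only): since the sched_rq array is indexed by
 * priority, a driver can change an entity's effective priority by moving it
 * to another run queue. The helper below is hypothetical, assuming the
 * amd_sched_priority enum from gpu_scheduler.h.
 *
 *	static void example_set_priority(struct amd_gpu_scheduler *sched,
 *					 struct amd_sched_entity *entity,
 *					 enum amd_sched_priority prio)
 *	{
 *		amd_sched_entity_set_rq(entity, &sched->sched_rq[prio]);
 *	}
 */
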
bool amd_sched_dependency_optimized(struct dma_fence *fence,
				    struct amd_sched_entity *entity)
{
	struct amd_gpu_scheduler *sched = entity->sched;
	struct amd_sched_fence *s_fence;

	if (!fence || dma_fence_is_signaled(fence))
		return false;
	if (fence->context == entity->fence_context)
		return true;
	s_fence = to_amd_sched_fence(fence);
	if (s_fence && s_fence->sched == sched)
		return true;

	return false;
}

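/*
 * Usage sketch (illustrative only): a driver can consult this before adding
 * an explicit pipeline sync, skipping it when the scheduler will already
 * order the work. The need_pipe_sync flag is a hypothetical caller-side
 * variable, not part of this file.
 *
 *	if (fence && !amd_sched_dependency_optimized(fence, entity))
 *		need_pipe_sync = true;
 */
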
static bool amd_sched_entity_add_dependency_cb(struct amd_sched_entity *entity)
{
	struct amd_gpu_scheduler *sched = entity->sched;
	struct dma_fence *fence = entity->dependency;
	struct amd_sched_fence *s_fence;

	if (fence->context == entity->fence_context) {
		/* We can ignore fences from ourselves */
		dma_fence_put(entity->dependency);
		return false;
	}

	s_fence = to_amd_sched_fence(fence);
	if (s_fence && s_fence->sched == sched) {

		/*
		 * Fence is from the same scheduler, only need to wait for
		 * it to be scheduled
		 */
		fence = dma_fence_get(&s_fence->scheduled);
		dma_fence_put(entity->dependency);
		entity->dependency = fence;
		if (!dma_fence_add_callback(fence, &entity->cb,
					    amd_sched_entity_clear_dep))
			return true;

		/* Ignore it when it is already scheduled */
		dma_fence_put(fence);
		return false;
	}

	if (!dma_fence_add_callback(entity->dependency, &entity->cb,
				    amd_sched_entity_wakeup))
		return true;

	dma_fence_put(entity->dependency);
	return false;
}

static struct amd_sched_job *
amd_sched_entity_pop_job(struct amd_sched_entity *entity)
{
	struct amd_gpu_scheduler *sched = entity->sched;
	struct amd_sched_job *sched_job = to_amd_sched_job(
						spsc_queue_peek(&entity->job_queue));

	if (!sched_job)
		return NULL;

	while ((entity->dependency = sched->ops->dependency(sched_job, entity)))
		if (amd_sched_entity_add_dependency_cb(entity))
			return NULL;

	/* skip jobs from an entity that was marked guilty */
	if (entity->guilty && atomic_read(entity->guilty))
		dma_fence_set_error(&sched_job->s_fence->finished, -ECANCELED);

	spsc_queue_pop(&entity->job_queue);
	return sched_job;
}

/**
 * Submit a job to the entity's job queue
 *
 * @sched_job The pointer to the job to submit
 * @entity The entity the job is pushed into
 *
 * If this is the first job in the queue, also add the entity to the run
 * queue and wake up the scheduler.
 */
void amd_sched_entity_push_job(struct amd_sched_job *sched_job,
			       struct amd_sched_entity *entity)
{
	struct amd_gpu_scheduler *sched = sched_job->sched;
	bool first = false;

	trace_amd_sched_job(sched_job, entity);

	spin_lock(&entity->queue_lock);
	first = spsc_queue_push(&entity->job_queue, &sched_job->queue_node);

	spin_unlock(&entity->queue_lock);

	/* first job wakes up scheduler */
	if (first) {
		/* Add the entity to the run queue */
		spin_lock(&entity->rq_lock);
		amd_sched_rq_add_entity(entity->rq, entity);
		spin_unlock(&entity->rq_lock);
		amd_sched_wakeup(sched);
	}
}

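/*
 * Submission sketch (illustrative only): a driver usually embeds an
 * amd_sched_job in its own job structure, initializes it with
 * amd_sched_job_init() (defined below) and then pushes it to an entity.
 * struct my_job and my_setup_ib() are hypothetical driver-side names.
 *
 *	struct my_job {
 *		struct amd_sched_job base;
 *	};
 *
 *	int example_submit(struct amd_gpu_scheduler *sched,
 *			   struct amd_sched_entity *entity,
 *			   struct my_job *job, void *owner)
 *	{
 *		int r = amd_sched_job_init(&job->base, sched, entity, owner);
 *
 *		if (r)
 *			return r;
 *		my_setup_ib(job);
 *		amd_sched_entity_push_job(&job->base, entity);
 *		return 0;
 *	}
 */
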
/* job_finish is called after the hw fence is signaled */
static void amd_sched_job_finish(struct work_struct *work)
{
	struct amd_sched_job *s_job = container_of(work, struct amd_sched_job,
						   finish_work);
	struct amd_gpu_scheduler *sched = s_job->sched;

	/* remove job from ring_mirror_list */
	spin_lock(&sched->job_list_lock);
	list_del_init(&s_job->node);
	if (sched->timeout != MAX_SCHEDULE_TIMEOUT) {
		struct amd_sched_job *next;

		spin_unlock(&sched->job_list_lock);
		cancel_delayed_work_sync(&s_job->work_tdr);
		spin_lock(&sched->job_list_lock);

		/* queue TDR for next job */
		next = list_first_entry_or_null(&sched->ring_mirror_list,
						struct amd_sched_job, node);

		if (next)
			schedule_delayed_work(&next->work_tdr, sched->timeout);
	}
	spin_unlock(&sched->job_list_lock);
	dma_fence_put(&s_job->s_fence->finished);
	sched->ops->free_job(s_job);
}

static void amd_sched_job_finish_cb(struct dma_fence *f,
				    struct dma_fence_cb *cb)
{
	struct amd_sched_job *job = container_of(cb, struct amd_sched_job,
						 finish_cb);
	schedule_work(&job->finish_work);
}

static void amd_sched_job_begin(struct amd_sched_job *s_job)
{
	struct amd_gpu_scheduler *sched = s_job->sched;

	dma_fence_add_callback(&s_job->s_fence->finished, &s_job->finish_cb,
			       amd_sched_job_finish_cb);

	spin_lock(&sched->job_list_lock);
	list_add_tail(&s_job->node, &sched->ring_mirror_list);
	if (sched->timeout != MAX_SCHEDULE_TIMEOUT &&
	    list_first_entry_or_null(&sched->ring_mirror_list,
				     struct amd_sched_job, node) == s_job)
		schedule_delayed_work(&s_job->work_tdr, sched->timeout);
	spin_unlock(&sched->job_list_lock);
}

static void amd_sched_job_timedout(struct work_struct *work)
{
	struct amd_sched_job *job = container_of(work, struct amd_sched_job,
						 work_tdr.work);

	job->sched->ops->timedout_job(job);
}

void amd_sched_hw_job_reset(struct amd_gpu_scheduler *sched, struct amd_sched_job *bad)
{
	struct amd_sched_job *s_job;
	struct amd_sched_entity *entity, *tmp;
	int i;

	spin_lock(&sched->job_list_lock);
	list_for_each_entry_reverse(s_job, &sched->ring_mirror_list, node) {
		if (s_job->s_fence->parent &&
		    dma_fence_remove_callback(s_job->s_fence->parent,
					      &s_job->s_fence->cb)) {
			dma_fence_put(s_job->s_fence->parent);
			s_job->s_fence->parent = NULL;
			atomic_dec(&sched->hw_rq_count);
		}
	}
	spin_unlock(&sched->job_list_lock);

	if (bad) {
		/* Don't increase @bad's karma if it's from the KERNEL RQ,
		 * because a GPU hang can sometimes corrupt kernel jobs (like
		 * VM updates), but kernel jobs are always considered good.
		 */
		for (i = AMD_SCHED_PRIORITY_MIN; i < AMD_SCHED_PRIORITY_KERNEL; i++) {
			struct amd_sched_rq *rq = &sched->sched_rq[i];

			spin_lock(&rq->lock);
			list_for_each_entry_safe(entity, tmp, &rq->entities, list) {
				if (bad->s_fence->scheduled.context == entity->fence_context) {
					if (atomic_inc_return(&bad->karma) > bad->sched->hang_limit)
						if (entity->guilty)
							atomic_set(entity->guilty, 1);
					break;
				}
			}
			spin_unlock(&rq->lock);
			if (&entity->list != &rq->entities)
				break;
		}
	}
}

void amd_sched_job_kickout(struct amd_sched_job *s_job)
{
	struct amd_gpu_scheduler *sched = s_job->sched;

	spin_lock(&sched->job_list_lock);
	list_del_init(&s_job->node);
	spin_unlock(&sched->job_list_lock);
}

void amd_sched_job_recovery(struct amd_gpu_scheduler *sched)
{
	struct amd_sched_job *s_job, *tmp;
	bool found_guilty = false;
	int r;

	spin_lock(&sched->job_list_lock);
	s_job = list_first_entry_or_null(&sched->ring_mirror_list,
					 struct amd_sched_job, node);
	if (s_job && sched->timeout != MAX_SCHEDULE_TIMEOUT)
		schedule_delayed_work(&s_job->work_tdr, sched->timeout);

	list_for_each_entry_safe(s_job, tmp, &sched->ring_mirror_list, node) {
		struct amd_sched_fence *s_fence = s_job->s_fence;
		struct dma_fence *fence;
		uint64_t guilty_context;

		if (!found_guilty && atomic_read(&s_job->karma) > sched->hang_limit) {
			found_guilty = true;
			guilty_context = s_job->s_fence->scheduled.context;
		}

		if (found_guilty && s_job->s_fence->scheduled.context == guilty_context)
			dma_fence_set_error(&s_fence->finished, -ECANCELED);

		spin_unlock(&sched->job_list_lock);
		fence = sched->ops->run_job(s_job);
		atomic_inc(&sched->hw_rq_count);
		if (fence) {
			s_fence->parent = dma_fence_get(fence);
			r = dma_fence_add_callback(fence, &s_fence->cb,
						   amd_sched_process_job);
			if (r == -ENOENT)
				amd_sched_process_job(fence, &s_fence->cb);
			else if (r)
				DRM_ERROR("fence add callback failed (%d)\n",
					  r);
			dma_fence_put(fence);
		} else {
			amd_sched_process_job(NULL, &s_fence->cb);
		}
		spin_lock(&sched->job_list_lock);
	}
	spin_unlock(&sched->job_list_lock);
}

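/*
 * Recovery flow sketch (illustrative only; modeled on how the amdgpu driver
 * is expected to use these helpers at this point, so treat the exact
 * ordering as an assumption). my_reset_hw() stands in for the driver's
 * actual ASIC reset:
 *
 *	kthread_park(sched->thread);
 *	amd_sched_hw_job_reset(sched, bad_job);
 *	amd_sched_job_kickout(bad_job);
 *	my_reset_hw();
 *	amd_sched_job_recovery(sched);
 *	kthread_unpark(sched->thread);
 */
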
/* init a sched_job with basic fields */
int amd_sched_job_init(struct amd_sched_job *job,
		       struct amd_gpu_scheduler *sched,
		       struct amd_sched_entity *entity,
		       void *owner)
{
	job->sched = sched;
	job->s_priority = entity->rq - sched->sched_rq;
	job->s_fence = amd_sched_fence_create(entity, owner);
	if (!job->s_fence)
		return -ENOMEM;
	job->id = atomic64_inc_return(&sched->job_id_count);

	INIT_WORK(&job->finish_work, amd_sched_job_finish);
	INIT_LIST_HEAD(&job->node);
	INIT_DELAYED_WORK(&job->work_tdr, amd_sched_job_timedout);

	return 0;
}

/**
 * Return true if we can push more jobs to the hw.
 */
static bool amd_sched_ready(struct amd_gpu_scheduler *sched)
{
	return atomic_read(&sched->hw_rq_count) <
		sched->hw_submission_limit;
}

/**
 * Wake up the scheduler when it is ready
 */
static void amd_sched_wakeup(struct amd_gpu_scheduler *sched)
{
	if (amd_sched_ready(sched))
		wake_up_interruptible(&sched->wake_up_worker);
}

/**
 * Select next entity to process
 */
static struct amd_sched_entity *
amd_sched_select_entity(struct amd_gpu_scheduler *sched)
{
	struct amd_sched_entity *entity;
	int i;

	if (!amd_sched_ready(sched))
		return NULL;

	/* Kernel run queue has higher priority than normal run queue */
	for (i = AMD_SCHED_PRIORITY_MAX - 1; i >= AMD_SCHED_PRIORITY_MIN; i--) {
		entity = amd_sched_rq_select_entity(&sched->sched_rq[i]);
		if (entity)
			break;
	}

	return entity;
}

static void amd_sched_process_job(struct dma_fence *f, struct dma_fence_cb *cb)
{
	struct amd_sched_fence *s_fence =
		container_of(cb, struct amd_sched_fence, cb);
	struct amd_gpu_scheduler *sched = s_fence->sched;

	dma_fence_get(&s_fence->finished);
	atomic_dec(&sched->hw_rq_count);
	amd_sched_fence_finished(s_fence);

	trace_amd_sched_process_job(s_fence);
	dma_fence_put(&s_fence->finished);
	wake_up_interruptible(&sched->wake_up_worker);
}

static bool amd_sched_blocked(struct amd_gpu_scheduler *sched)
{
	if (kthread_should_park()) {
		kthread_parkme();
		return true;
	}

	return false;
}

static int amd_sched_main(void *param)
{
	struct sched_param sparam = {.sched_priority = 1};
	struct amd_gpu_scheduler *sched = (struct amd_gpu_scheduler *)param;
	int r;

	sched_setscheduler(current, SCHED_FIFO, &sparam);

	while (!kthread_should_stop()) {
		struct amd_sched_entity *entity = NULL;
		struct amd_sched_fence *s_fence;
		struct amd_sched_job *sched_job;
		struct dma_fence *fence;

		wait_event_interruptible(sched->wake_up_worker,
					 (!amd_sched_blocked(sched) &&
					  (entity = amd_sched_select_entity(sched))) ||
					 kthread_should_stop());

		if (!entity)
			continue;

		sched_job = amd_sched_entity_pop_job(entity);
		if (!sched_job)
			continue;

		s_fence = sched_job->s_fence;

		atomic_inc(&sched->hw_rq_count);
		amd_sched_job_begin(sched_job);

		fence = sched->ops->run_job(sched_job);
		amd_sched_fence_scheduled(s_fence);

		if (fence) {
			s_fence->parent = dma_fence_get(fence);
			r = dma_fence_add_callback(fence, &s_fence->cb,
						   amd_sched_process_job);
			if (r == -ENOENT)
				amd_sched_process_job(fence, &s_fence->cb);
			else if (r)
				DRM_ERROR("fence add callback failed (%d)\n",
					  r);
			dma_fence_put(fence);
		} else {
			amd_sched_process_job(NULL, &s_fence->cb);
		}

		wake_up(&sched->job_scheduled);
	}
	return 0;
}

/**
 * Init a gpu scheduler instance
 *
 * @sched The pointer to the scheduler
 * @ops The backend operations for this scheduler.
 * @hw_submission Number of hw submissions that can be in flight.
 * @hang_limit Number of hangs a job may cause before it is dropped and its
 *	entity is marked guilty.
 * @timeout Timeout for a job in jiffies; MAX_SCHEDULE_TIMEOUT disables the
 *	timeout handler.
 * @name Name used for debugging
 *
 * Return 0 on success, otherwise error code.
 */
int amd_sched_init(struct amd_gpu_scheduler *sched,
		   const struct amd_sched_backend_ops *ops,
		   unsigned hw_submission,
		   unsigned hang_limit,
		   long timeout,
		   const char *name)
{
	int i;

	sched->ops = ops;
	sched->hw_submission_limit = hw_submission;
	sched->name = name;
	sched->timeout = timeout;
	sched->hang_limit = hang_limit;
	for (i = AMD_SCHED_PRIORITY_MIN; i < AMD_SCHED_PRIORITY_MAX; i++)
		amd_sched_rq_init(&sched->sched_rq[i]);

	init_waitqueue_head(&sched->wake_up_worker);
	init_waitqueue_head(&sched->job_scheduled);
	INIT_LIST_HEAD(&sched->ring_mirror_list);
	spin_lock_init(&sched->job_list_lock);
	atomic_set(&sched->hw_rq_count, 0);
	atomic64_set(&sched->job_id_count, 0);

	/* Each scheduler will run on a separate kernel thread */
	sched->thread = kthread_run(amd_sched_main, sched, sched->name);
	if (IS_ERR(sched->thread)) {
		DRM_ERROR("Failed to create scheduler for %s.\n", name);
		return PTR_ERR(sched->thread);
	}

	return 0;
}

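/*
 * Setup sketch (illustrative only): a driver embeds one scheduler per ring,
 * provides the four backend callbacks this file invokes and then starts the
 * scheduler. The my_* implementations and the numeric limits are
 * assumptions, not part of this file.
 *
 *	static const struct amd_sched_backend_ops my_sched_ops = {
 *		.dependency	= my_dependency,
 *		.run_job	= my_run_job,
 *		.timedout_job	= my_timedout_job,
 *		.free_job	= my_free_job,
 *	};
 *
 *	r = amd_sched_init(&ring->sched, &my_sched_ops,
 *			   16, 2, msecs_to_jiffies(10000), ring->name);
 *	if (r)
 *		return r;
 */
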
/**
 * Destroy a gpu scheduler
 *
 * @sched The pointer to the scheduler
 */
void amd_sched_fini(struct amd_gpu_scheduler *sched)
{
	if (sched->thread)
		kthread_stop(sched->thread);
}