/*
 * Copyright 2015 Advanced Micro Devices, Inc.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
 * OTHER DEALINGS IN THE SOFTWARE.
 *
 */

#ifndef _GPU_SCHEDULER_H_
#define _GPU_SCHEDULER_H_

#include <linux/kfifo.h>
#include <linux/dma-fence.h>

struct amd_gpu_scheduler;
struct amd_sched_rq;

/**
 * A scheduler entity is a wrapper around a job queue or a group
 * of other entities. Entities take turns emitting jobs from their
 * job queues to the corresponding hardware ring, based on the
 * scheduling policy.
 */
struct amd_sched_entity {
	struct list_head list;
	struct amd_sched_rq *rq;
	struct amd_gpu_scheduler *sched;

	spinlock_t queue_lock;
	struct kfifo job_queue;

	atomic_t fence_seq;
	uint64_t fence_context;

	struct dma_fence *dependency;
	struct dma_fence_cb cb;
};
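
/*
 * Illustrative usage (a sketch; "ring", "ctx" and "jobs" are hypothetical
 * driver-side objects): an entity is typically created once per context
 * and ring, and bound to one of that ring's run queues:
 *
 *	struct amd_sched_rq *rq =
 *		&ring->sched.sched_rq[AMD_SCHED_PRIORITY_NORMAL];
 *	r = amd_sched_entity_init(&ring->sched, &ctx->entity, rq, jobs);
 */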

/**
 * A run queue is a set of entities scheduling command submissions for
 * one specific ring. It implements the scheduling policy that selects
 * the next entity to emit commands from.
 */
struct amd_sched_rq {
	spinlock_t lock;
	struct list_head entities;
	struct amd_sched_entity *current_entity;
};
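
/*
 * Entity selection starts from @current_entity and walks @entities in
 * round-robin order, so runnable entities on the same run queue take
 * turns on the ring.
 */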

struct amd_sched_fence {
	struct dma_fence scheduled;
	struct dma_fence finished;
	struct dma_fence_cb cb;
	struct dma_fence *parent;
	struct amd_gpu_scheduler *sched;
	spinlock_t lock;
	void *owner;
};
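
/*
 * @scheduled signals once the scheduler has popped the job from its entity
 * and submitted it to the hardware ring; @finished signals once the
 * hardware has completed it. @parent holds the hardware fence returned by
 * the driver's run_job() callback.
 */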

struct amd_sched_job {
	struct amd_gpu_scheduler *sched;
	struct amd_sched_entity *s_entity;
	struct amd_sched_fence *s_fence;
	struct dma_fence_cb finish_cb;
	struct work_struct finish_work;
	struct list_head node;
	struct delayed_work work_tdr;
	uint64_t id;
	atomic_t karma;
};
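
/*
 * @node links the job into amd_gpu_scheduler::ring_mirror_list while it is
 * in flight, so hung jobs can be found and re-submitted after a hardware
 * reset; @work_tdr is the delayed work that invokes the driver's
 * timedout_job() callback when the scheduler timeout expires.
 */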

extern const struct dma_fence_ops amd_sched_fence_ops_scheduled;
extern const struct dma_fence_ops amd_sched_fence_ops_finished;
static inline struct amd_sched_fence *to_amd_sched_fence(struct dma_fence *f)
{
	if (f->ops == &amd_sched_fence_ops_scheduled)
		return container_of(f, struct amd_sched_fence, scheduled);

	if (f->ops == &amd_sched_fence_ops_finished)
		return container_of(f, struct amd_sched_fence, finished);

	return NULL;
}

static inline bool amd_sched_invalidate_job(struct amd_sched_job *s_job,
					    int threshold)
{
	return (s_job && atomic_inc_return(&s_job->karma) > threshold);
}
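
/*
 * Intended for the GPU reset path: each reset attempt bumps the hung job's
 * karma, and once it crosses the threshold the job is considered guilty
 * and can be dropped via amd_sched_job_kickout() instead of re-submitted.
 */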

/**
 * The backend operations called by the scheduler; these functions
 * must be implemented by the driver.
 */
struct amd_sched_backend_ops {
	struct dma_fence *(*dependency)(struct amd_sched_job *sched_job);
	struct dma_fence *(*run_job)(struct amd_sched_job *sched_job);
	void (*timedout_job)(struct amd_sched_job *sched_job);
	void (*free_job)(struct amd_sched_job *sched_job);
};
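
/*
 * A minimal driver-side sketch (all my_* names are hypothetical):
 *
 *	static struct dma_fence *my_run_job(struct amd_sched_job *sched_job)
 *	{
 *		return my_hw_submit(sched_job);	// hypothetical HW submit,
 *						// returns the HW fence
 *	}
 *
 *	static const struct amd_sched_backend_ops my_sched_ops = {
 *		.dependency	= my_dependency,
 *		.run_job	= my_run_job,
 *		.timedout_job	= my_timedout_job,
 *		.free_job	= my_free_job,
 *	};
 *
 * dependency() is called repeatedly and each returned fence is waited on;
 * only when it returns NULL is the job handed to run_job().
 */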

enum amd_sched_priority {
	AMD_SCHED_PRIORITY_MIN,
	AMD_SCHED_PRIORITY_LOW = AMD_SCHED_PRIORITY_MIN,
	AMD_SCHED_PRIORITY_NORMAL,
	AMD_SCHED_PRIORITY_HIGH_SW,
	AMD_SCHED_PRIORITY_HIGH_HW,
	AMD_SCHED_PRIORITY_KERNEL,
	AMD_SCHED_PRIORITY_MAX
};
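
/*
 * Each priority level has its own run queue in
 * amd_gpu_scheduler::sched_rq[] below; the scheduler serves the
 * higher-priority queues first when picking the next entity.
 */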

/**
 * One scheduler is implemented for each hardware ring.
 */
struct amd_gpu_scheduler {
	const struct amd_sched_backend_ops *ops;
	uint32_t hw_submission_limit;
	long timeout;
	const char *name;
	struct amd_sched_rq sched_rq[AMD_SCHED_PRIORITY_MAX];
	wait_queue_head_t wake_up_worker;
	wait_queue_head_t job_scheduled;
	atomic_t hw_rq_count;
	atomic64_t job_id_count;
	struct task_struct *thread;
	struct list_head ring_mirror_list;
	spinlock_t job_list_lock;
};

int amd_sched_init(struct amd_gpu_scheduler *sched,
		   const struct amd_sched_backend_ops *ops,
		   uint32_t hw_submission, long timeout, const char *name);
void amd_sched_fini(struct amd_gpu_scheduler *sched);

int amd_sched_entity_init(struct amd_gpu_scheduler *sched,
			  struct amd_sched_entity *entity,
			  struct amd_sched_rq *rq,
			  uint32_t jobs);
void amd_sched_entity_fini(struct amd_gpu_scheduler *sched,
			   struct amd_sched_entity *entity);
void amd_sched_entity_push_job(struct amd_sched_job *sched_job);

int amd_sched_fence_slab_init(void);
void amd_sched_fence_slab_fini(void);

struct amd_sched_fence *amd_sched_fence_create(
	struct amd_sched_entity *s_entity, void *owner);
void amd_sched_fence_scheduled(struct amd_sched_fence *fence);
void amd_sched_fence_finished(struct amd_sched_fence *fence);
int amd_sched_job_init(struct amd_sched_job *job,
		       struct amd_gpu_scheduler *sched,
		       struct amd_sched_entity *entity,
		       void *owner);
void amd_sched_hw_job_reset(struct amd_gpu_scheduler *sched);
void amd_sched_job_recovery(struct amd_gpu_scheduler *sched);
bool amd_sched_dependency_optimized(struct dma_fence *fence,
				    struct amd_sched_entity *entity);
void amd_sched_job_kickout(struct amd_sched_job *s_job);
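
/*
 * Typical driver flow, sketched under the assumption of one scheduler per
 * ring ("sched", "entity", "job", "my_sched_ops" and friends are the
 * caller's objects; error handling omitted):
 *
 *	amd_sched_fence_slab_init();
 *	amd_sched_init(&sched, &my_sched_ops, hw_submission, timeout, "gfx");
 *	amd_sched_entity_init(&sched, &entity,
 *			      &sched.sched_rq[AMD_SCHED_PRIORITY_NORMAL],
 *			      jobs);
 *
 *	amd_sched_job_init(&job, &sched, &entity, owner);
 *	amd_sched_entity_push_job(&job);
 *
 *	amd_sched_entity_fini(&sched, &entity);
 *	amd_sched_fini(&sched);
 *	amd_sched_fence_slab_fini();
 */
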
#endif