blob: 4c2c5adbc53746666e31ff2c3e05b76533ec778d [file] [log] [blame]
Jammy Zhoua72ce6f2015-05-22 18:55:07 +08001/*
2 * Copyright 2015 Advanced Micro Devices, Inc.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice shall be included in
12 * all copies or substantial portions of the Software.
13 *
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20 * OTHER DEALINGS IN THE SOFTWARE.
21 *
22 *
23 */
24#include <linux/kthread.h>
25#include <linux/wait.h>
26#include <linux/sched.h>
27#include <drm/drmP.h>
28#include "gpu_scheduler.h"
29
30/* Initialize a given run queue struct */
31static void init_rq(struct amd_run_queue *rq)
32{
33 INIT_LIST_HEAD(&rq->head.list);
34 rq->head.belongto_rq = rq;
35 mutex_init(&rq->lock);
36 atomic_set(&rq->nr_entity, 0);
37 rq->current_entity = &rq->head;
38}
39
40/* Note: caller must hold the lock or in a atomic context */
41static void rq_remove_entity(struct amd_run_queue *rq,
42 struct amd_sched_entity *entity)
43{
44 if (rq->current_entity == entity)
45 rq->current_entity = list_entry(entity->list.prev,
46 typeof(*entity), list);
47 list_del_init(&entity->list);
48 atomic_dec(&rq->nr_entity);
49}
50
51static void rq_add_entity(struct amd_run_queue *rq,
52 struct amd_sched_entity *entity)
53{
54 list_add_tail(&entity->list, &rq->head.list);
55 atomic_inc(&rq->nr_entity);
56}
57
58/**
59 * Select next entity from a specified run queue with round robin policy.
60 * It could return the same entity as current one if current is the only
61 * available one in the queue. Return NULL if nothing available.
62 */
63static struct amd_sched_entity *rq_select_entity(struct amd_run_queue *rq)
64{
65 struct amd_sched_entity *p = rq->current_entity;
66 int i = atomic_read(&rq->nr_entity) + 1; /*real count + dummy head*/
67 while (i) {
68 p = list_entry(p->list.next, typeof(*p), list);
69 if (!rq->check_entity_status(p)) {
70 rq->current_entity = p;
71 break;
72 }
73 i--;
74 }
75 return i ? p : NULL;
76}
77
78static bool context_entity_is_waiting(struct amd_context_entity *entity)
79{
80 /* TODO: sync obj for multi-ring synchronization */
81 return false;
82}
83
84static int gpu_entity_check_status(struct amd_sched_entity *entity)
85{
86 struct amd_context_entity *tmp = NULL;
87
88 if (entity == &entity->belongto_rq->head)
89 return -1;
90
91 tmp = container_of(entity, typeof(*tmp), generic_entity);
92 if (kfifo_is_empty(&tmp->job_queue) ||
93 context_entity_is_waiting(tmp))
94 return -1;
95
96 return 0;
97}
98
99/**
100 * Note: This function should only been called inside scheduler main
101 * function for thread safety, there is no other protection here.
102 * return ture if scheduler has something ready to run.
103 *
104 * For active_hw_rq, there is only one producer(scheduler thread) and
105 * one consumer(ISR). It should be safe to use this function in scheduler
106 * main thread to decide whether to continue emit more IBs.
107*/
108static bool is_scheduler_ready(struct amd_gpu_scheduler *sched)
109{
Chunming Zhou4cef9262015-08-05 19:52:14 +0800110 unsigned long flags;
111 bool full;
112 spin_lock_irqsave(&sched->queue_lock, flags);
113 full = atomic64_read(&sched->hw_rq_count) <
114 sched->hw_submission_limit ? true : false;
115 spin_unlock_irqrestore(&sched->queue_lock, flags);
116
117 return full;
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800118}
119
120/**
121 * Select next entity from the kernel run queue, if not available,
122 * return null.
123*/
124static struct amd_context_entity *kernel_rq_select_context(
125 struct amd_gpu_scheduler *sched)
126{
127 struct amd_sched_entity *sched_entity = NULL;
128 struct amd_context_entity *tmp = NULL;
129 struct amd_run_queue *rq = &sched->kernel_rq;
130
131 mutex_lock(&rq->lock);
132 sched_entity = rq_select_entity(rq);
133 if (sched_entity)
134 tmp = container_of(sched_entity,
135 typeof(*tmp),
136 generic_entity);
137 mutex_unlock(&rq->lock);
138 return tmp;
139}
140
141/**
142 * Select next entity containing real IB submissions
143*/
144static struct amd_context_entity *select_context(
145 struct amd_gpu_scheduler *sched)
146{
147 struct amd_context_entity *wake_entity = NULL;
148 struct amd_context_entity *tmp;
149 struct amd_run_queue *rq;
150
151 if (!is_scheduler_ready(sched))
152 return NULL;
153
154 /* Kernel run queue has higher priority than normal run queue*/
155 tmp = kernel_rq_select_context(sched);
156 if (tmp != NULL)
157 goto exit;
158
159 WARN_ON(offsetof(struct amd_context_entity, generic_entity) != 0);
160
161 rq = &sched->sched_rq;
162 mutex_lock(&rq->lock);
163 tmp = container_of(rq_select_entity(rq),
164 typeof(*tmp), generic_entity);
165 mutex_unlock(&rq->lock);
166exit:
167 if (sched->current_entity && (sched->current_entity != tmp))
168 wake_entity = sched->current_entity;
169 sched->current_entity = tmp;
170 if (wake_entity)
171 wake_up(&wake_entity->wait_queue);
172 return tmp;
173}
174
175/**
176 * Init a context entity used by scheduler when submit to HW ring.
177 *
178 * @sched The pointer to the scheduler
179 * @entity The pointer to a valid amd_context_entity
180 * @parent The parent entity of this amd_context_entity
181 * @rq The run queue this entity belongs
Christian König0e89d0c2015-08-04 16:58:36 +0200182 * @kernel If this is an entity for the kernel
Jammy Zhou1333f722015-07-30 16:36:58 +0800183 * @jobs The max number of jobs in the job queue
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800184 *
185 * return 0 if succeed. negative error code on failure
186*/
187int amd_context_entity_init(struct amd_gpu_scheduler *sched,
188 struct amd_context_entity *entity,
189 struct amd_sched_entity *parent,
190 struct amd_run_queue *rq,
Jammy Zhou1333f722015-07-30 16:36:58 +0800191 uint32_t jobs)
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800192{
193 uint64_t seq_ring = 0;
194
195 if (!(sched && entity && rq))
196 return -EINVAL;
197
198 memset(entity, 0, sizeof(struct amd_context_entity));
199 seq_ring = ((uint64_t)sched->ring_id) << 60;
200 spin_lock_init(&entity->lock);
201 entity->generic_entity.belongto_rq = rq;
202 entity->generic_entity.parent = parent;
203 entity->scheduler = sched;
204 init_waitqueue_head(&entity->wait_queue);
205 init_waitqueue_head(&entity->wait_emit);
206 if(kfifo_alloc(&entity->job_queue,
Jammy Zhou1333f722015-07-30 16:36:58 +0800207 jobs * sizeof(void *),
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800208 GFP_KERNEL))
209 return -EINVAL;
210
211 spin_lock_init(&entity->queue_lock);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800212 atomic64_set(&entity->last_emitted_v_seq, seq_ring);
213 atomic64_set(&entity->last_queued_v_seq, seq_ring);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800214
215 /* Add the entity to the run queue */
216 mutex_lock(&rq->lock);
217 rq_add_entity(rq, &entity->generic_entity);
218 mutex_unlock(&rq->lock);
219 return 0;
220}
221
222/**
223 * Query if entity is initialized
224 *
225 * @sched Pointer to scheduler instance
226 * @entity The pointer to a valid scheduler entity
227 *
228 * return true if entity is initialized, false otherwise
229*/
230static bool is_context_entity_initialized(struct amd_gpu_scheduler *sched,
231 struct amd_context_entity *entity)
232{
233 return entity->scheduler == sched &&
234 entity->generic_entity.belongto_rq != NULL;
235}
236
237static bool is_context_entity_idle(struct amd_gpu_scheduler *sched,
238 struct amd_context_entity *entity)
239{
240 /**
241 * Idle means no pending IBs, and the entity is not
242 * currently being used.
243 */
244 barrier();
245 if ((sched->current_entity != entity) &&
246 kfifo_is_empty(&entity->job_queue))
247 return true;
248
249 return false;
250}
251
252/**
253 * Destroy a context entity
254 *
255 * @sched Pointer to scheduler instance
256 * @entity The pointer to a valid scheduler entity
257 *
258 * return 0 if succeed. negative error code on failure
259 */
260int amd_context_entity_fini(struct amd_gpu_scheduler *sched,
261 struct amd_context_entity *entity)
262{
263 int r = 0;
264 struct amd_run_queue *rq = entity->generic_entity.belongto_rq;
265
266 if (!is_context_entity_initialized(sched, entity))
267 return 0;
268
269 /**
270 * The client will not queue more IBs during this fini, consume existing
271 * queued IBs
272 */
273 r = wait_event_timeout(
274 entity->wait_queue,
275 is_context_entity_idle(sched, entity),
276 msecs_to_jiffies(AMD_GPU_WAIT_IDLE_TIMEOUT_IN_MS)
277 ) ? 0 : -1;
278
279 if (r) {
280 if (entity->is_pending)
Christian König0e89d0c2015-08-04 16:58:36 +0200281 DRM_INFO("Entity %p is in waiting state during fini,\
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800282 all pending ibs will be canceled.\n",
Christian König0e89d0c2015-08-04 16:58:36 +0200283 entity);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800284 }
285
286 mutex_lock(&rq->lock);
287 rq_remove_entity(rq, &entity->generic_entity);
288 mutex_unlock(&rq->lock);
289 kfifo_free(&entity->job_queue);
290 return r;
291}
292
293/**
294 * Submit a normal job to the job queue
295 *
296 * @sched The pointer to the scheduler
297 * @c_entity The pointer to amd_context_entity
298 * @job The pointer to job required to submit
Chunming Zhou80de5912015-08-05 19:07:08 +0800299 * return 0 if succeed. -1 if failed.
300 * -2 indicate queue is full for this client, client should wait untill
301 * scheduler consum some queued command.
302 * -1 other fail.
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800303*/
Chunming Zhou80de5912015-08-05 19:07:08 +0800304int amd_sched_push_job(struct amd_gpu_scheduler *sched,
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800305 struct amd_context_entity *c_entity,
306 void *job)
307{
308 while (kfifo_in_spinlocked(&c_entity->job_queue, &job, sizeof(void *),
309 &c_entity->queue_lock) != sizeof(void *)) {
310 /**
311 * Current context used up all its IB slots
312 * wait here, or need to check whether GPU is hung
313 */
314 schedule();
315 }
316
317 wake_up_interruptible(&sched->wait_queue);
Chunming Zhou80de5912015-08-05 19:07:08 +0800318 return 0;
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800319}
320
321/**
Christian König1d7dd222015-07-31 14:31:49 +0200322 * Wait for a virtual sequence number to be emitted.
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800323 *
324 * @c_entity The pointer to a valid context entity
325 * @seq The virtual sequence number to wait
326 * @intr Interruptible or not
327 * @timeout Timeout in ms, wait infinitely if <0
328 * @emit wait for emit or signal
329 *
330 * return =0 signaled , <0 failed
331*/
Christian König1d7dd222015-07-31 14:31:49 +0200332int amd_sched_wait_emit(struct amd_context_entity *c_entity,
333 uint64_t seq,
334 bool intr,
335 long timeout)
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800336{
Christian König1d7dd222015-07-31 14:31:49 +0200337 atomic64_t *v_seq = &c_entity->last_emitted_v_seq;
338 wait_queue_head_t *wait_queue = &c_entity->wait_emit;
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800339
340 if (intr && (timeout < 0)) {
341 wait_event_interruptible(
342 *wait_queue,
343 seq <= atomic64_read(v_seq));
344 return 0;
345 } else if (intr && (timeout >= 0)) {
346 wait_event_interruptible_timeout(
347 *wait_queue,
348 seq <= atomic64_read(v_seq),
349 msecs_to_jiffies(timeout));
350 return (seq <= atomic64_read(v_seq)) ?
351 0 : -1;
352 } else if (!intr && (timeout < 0)) {
353 wait_event(
354 *wait_queue,
355 seq <= atomic64_read(v_seq));
356 return 0;
357 } else if (!intr && (timeout >= 0)) {
358 wait_event_timeout(
359 *wait_queue,
360 seq <= atomic64_read(v_seq),
361 msecs_to_jiffies(timeout));
362 return (seq <= atomic64_read(v_seq)) ?
363 0 : -1;
364 }
365 return 0;
366}
367
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800368static int amd_sched_main(void *param)
369{
370 int r;
371 void *job;
372 struct sched_param sparam = {.sched_priority = 1};
373 struct amd_context_entity *c_entity = NULL;
374 struct amd_gpu_scheduler *sched = (struct amd_gpu_scheduler *)param;
375
376 sched_setscheduler(current, SCHED_FIFO, &sparam);
377
378 while (!kthread_should_stop()) {
Chunming Zhou4cef9262015-08-05 19:52:14 +0800379 struct amd_sched_job *sched_job = NULL;
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800380 wait_event_interruptible(sched->wait_queue,
381 is_scheduler_ready(sched) &&
382 (c_entity = select_context(sched)));
383 r = kfifo_out(&c_entity->job_queue, &job, sizeof(void *));
384 if (r != sizeof(void *))
385 continue;
386 r = sched->ops->prepare_job(sched, c_entity, job);
Chunming Zhou4cef9262015-08-05 19:52:14 +0800387 if (!r) {
388 unsigned long flags;
389 sched_job = kzalloc(sizeof(struct amd_sched_job),
390 GFP_KERNEL);
391 if (!sched_job) {
392 WARN(true, "No memory to allocate\n");
393 continue;
394 }
395 sched_job->job = job;
396 sched_job->sched = sched;
397 spin_lock_irqsave(&sched->queue_lock, flags);
398 list_add_tail(&sched_job->list, &sched->active_hw_rq);
399 atomic64_inc(&sched->hw_rq_count);
400 spin_unlock_irqrestore(&sched->queue_lock, flags);
401 }
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800402 mutex_lock(&sched->sched_lock);
Chunming Zhou4cef9262015-08-05 19:52:14 +0800403 sched->ops->run_job(sched, c_entity, sched_job);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800404 mutex_unlock(&sched->sched_lock);
405 }
406 return 0;
407}
408
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800409/**
410 * ISR to handle EOP inetrrupts
411 *
412 * @sched: gpu scheduler
413 *
414*/
Chunming Zhou4cef9262015-08-05 19:52:14 +0800415void amd_sched_process_job(struct amd_sched_job *sched_job)
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800416{
Chunming Zhou4cef9262015-08-05 19:52:14 +0800417 unsigned long flags;
418 struct amd_gpu_scheduler *sched;
419 if (!sched_job)
420 return;
421 sched = sched_job->sched;
422 spin_lock_irqsave(&sched->queue_lock, flags);
423 list_del(&sched_job->list);
424 atomic64_dec(&sched->hw_rq_count);
425 spin_unlock_irqrestore(&sched->queue_lock, flags);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800426
Chunming Zhou4cef9262015-08-05 19:52:14 +0800427 sched->ops->process_job(sched, sched_job->job);
428 kfree(sched_job);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800429 wake_up_interruptible(&sched->wait_queue);
430}
431
432/**
433 * Create a gpu scheduler
434 *
435 * @device The device context for this scheduler
436 * @ops The backend operations for this scheduler.
437 * @id The scheduler is per ring, here is ring id.
438 * @granularity The minumum ms unit the scheduler will scheduled.
439 * @preemption Indicate whether this ring support preemption, 0 is no.
440 *
441 * return the pointer to scheduler for success, otherwise return NULL
442*/
443struct amd_gpu_scheduler *amd_sched_create(void *device,
444 struct amd_sched_backend_ops *ops,
445 unsigned ring,
446 unsigned granularity,
Jammy Zhou4afcb302015-07-30 16:44:05 +0800447 unsigned preemption,
448 unsigned hw_submission)
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800449{
450 struct amd_gpu_scheduler *sched;
451 char name[20] = "gpu_sched[0]";
452
453 sched = kzalloc(sizeof(struct amd_gpu_scheduler), GFP_KERNEL);
454 if (!sched)
455 return NULL;
456
457 sched->device = device;
458 sched->ops = ops;
459 sched->granularity = granularity;
460 sched->ring_id = ring;
461 sched->preemption = preemption;
Chunming Zhou4cef9262015-08-05 19:52:14 +0800462 sched->hw_submission_limit = hw_submission;
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800463 snprintf(name, sizeof(name), "gpu_sched[%d]", ring);
464 mutex_init(&sched->sched_lock);
465 spin_lock_init(&sched->queue_lock);
466 init_rq(&sched->sched_rq);
467 sched->sched_rq.check_entity_status = gpu_entity_check_status;
468
469 init_rq(&sched->kernel_rq);
470 sched->kernel_rq.check_entity_status = gpu_entity_check_status;
471
472 init_waitqueue_head(&sched->wait_queue);
Chunming Zhou4cef9262015-08-05 19:52:14 +0800473 INIT_LIST_HEAD(&sched->active_hw_rq);
474 atomic64_set(&sched->hw_rq_count, 0);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800475 /* Each scheduler will run on a seperate kernel thread */
476 sched->thread = kthread_create(amd_sched_main, sched, name);
477 if (sched->thread) {
478 wake_up_process(sched->thread);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800479 return sched;
480 }
481
482 DRM_ERROR("Failed to create scheduler for id %d.\n", ring);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800483 kfree(sched);
484 return NULL;
485}
486
487/**
488 * Destroy a gpu scheduler
489 *
490 * @sched The pointer to the scheduler
491 *
492 * return 0 if succeed. -1 if failed.
493 */
494int amd_sched_destroy(struct amd_gpu_scheduler *sched)
495{
496 kthread_stop(sched->thread);
Jammy Zhoua72ce6f2015-05-22 18:55:07 +0800497 kfree(sched);
498 return 0;
499}
500
Jammy Zhouf95b7e32015-07-31 17:18:15 +0800501/**
502 * Update emitted sequence and wake up the waiters, called by run_job
503 * in driver side
504 *
505 * @entity The context entity
506 * @seq The sequence number for the latest emitted job
507*/
508void amd_sched_emit(struct amd_context_entity *c_entity, uint64_t seq)
509{
510 atomic64_set(&c_entity->last_emitted_v_seq, seq);
511 wake_up_all(&c_entity->wait_emit);
512}
Jammy Zhou27f66422015-08-03 10:27:57 +0800513
514/**
515 * Get next queued sequence number
516 *
517 * @entity The context entity
518 *
519 * return the next queued sequence number
520*/
521uint64_t amd_sched_next_queued_seq(struct amd_context_entity *c_entity)
522{
523 return atomic64_read(&c_entity->last_queued_v_seq) + 1;
524}