blob: 07d0d095c62a4d64add130ae0c3c70b8d3bccd11 [file] [log] [blame]
/* sched.c - SPU scheduler.
 *
 * Copyright (C) IBM 2005
 * Author: Mark Nutter <mnutter@us.ibm.com>
 *
 * 2006-03-31	NUMA domains added.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2, or (at your option)
 * any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */
22
Arnd Bergmann3b3d22c2005-12-05 22:52:24 -050023#undef DEBUG
24
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050025#include <linux/module.h>
26#include <linux/errno.h>
27#include <linux/sched.h>
28#include <linux/kernel.h>
29#include <linux/mm.h>
30#include <linux/completion.h>
31#include <linux/vmalloc.h>
32#include <linux/smp.h>
33#include <linux/smp_lock.h>
34#include <linux/stddef.h>
35#include <linux/unistd.h>
Mark Nuttera68cf982006-10-04 17:26:12 +020036#include <linux/numa.h>
37#include <linux/mutex.h>
Arnd Bergmann86767272006-10-04 17:26:21 +020038#include <linux/notifier.h>
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050039
40#include <asm/io.h>
41#include <asm/mmu_context.h>
42#include <asm/spu.h>
43#include <asm/spu_csa.h>
Geoff Levanda91942a2006-06-19 20:33:30 +020044#include <asm/spu_priv1.h>
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050045#include "spufs.h"
46
Arnd Bergmann7945a4a2005-12-09 19:04:16 +010047#define SPU_MIN_TIMESLICE (100 * HZ / 1000)
Arnd Bergmann2a911f02005-12-05 22:52:26 -050048
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050049#define SPU_BITMAP_SIZE (((MAX_PRIO+BITS_PER_LONG)/BITS_PER_LONG)+1)
50struct spu_prio_array {
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050051 unsigned long bitmap[SPU_BITMAP_SIZE];
Christoph Hellwig079cdb62007-02-13 21:54:23 +010052 struct list_head runq[MAX_PRIO];
53 spinlock_t runq_lock;
Mark Nuttera68cf982006-10-04 17:26:12 +020054 struct list_head active_list[MAX_NUMNODES];
55 struct mutex active_mutex[MAX_NUMNODES];
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050056};
57
Mark Nuttera68cf982006-10-04 17:26:12 +020058static struct spu_prio_array *spu_prio;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050059
Mark Nuttera68cf982006-10-04 17:26:12 +020060static inline int node_allowed(int node)
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050061{
Mark Nuttera68cf982006-10-04 17:26:12 +020062 cpumask_t mask;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050063
Mark Nuttera68cf982006-10-04 17:26:12 +020064 if (!nr_cpus_node(node))
65 return 0;
66 mask = node_to_cpumask(node);
67 if (!cpus_intersects(mask, current->cpus_allowed))
68 return 0;
69 return 1;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -050070}
71
Christoph Hellwig202557d2007-02-13 21:36:49 +010072/**
73 * spu_add_to_active_list - add spu to active list
74 * @spu: spu to add to the active list
75 */
76static void spu_add_to_active_list(struct spu *spu)
77{
78 mutex_lock(&spu_prio->active_mutex[spu->node]);
79 list_add_tail(&spu->list, &spu_prio->active_list[spu->node]);
80 mutex_unlock(&spu_prio->active_mutex[spu->node]);
81}
82
83/**
84 * spu_remove_from_active_list - remove spu from active list
85 * @spu: spu to remove from the active list
86 *
87 * This function removes an spu from the active list. If the spu was
88 * found on the active list the function returns 1, else it doesn't do
89 * anything and returns 0.
90 */
91static int spu_remove_from_active_list(struct spu *spu)
92{
93 int node = spu->node;
94 struct spu *tmp;
95 int rc = 0;
96
97 mutex_lock(&spu_prio->active_mutex[node]);
98 list_for_each_entry(tmp, &spu_prio->active_list[node], list) {
99 if (tmp == spu) {
100 list_del_init(&spu->list);
101 rc = 1;
102 break;
103 }
104 }
105 mutex_unlock(&spu_prio->active_mutex[node]);
106 return rc;
107}
108
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500109static inline void mm_needs_global_tlbie(struct mm_struct *mm)
110{
Mark Nuttera68cf982006-10-04 17:26:12 +0200111 int nr = (NR_CPUS > 1) ? NR_CPUS : NR_CPUS + 1;
112
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500113 /* Global TLBIE broadcast required with SPEs. */
Mark Nuttera68cf982006-10-04 17:26:12 +0200114 __cpus_setall(&mm->cpu_vm_mask, nr);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500115}
116
Arnd Bergmann86767272006-10-04 17:26:21 +0200117static BLOCKING_NOTIFIER_HEAD(spu_switch_notifier);
118
119static void spu_switch_notify(struct spu *spu, struct spu_context *ctx)
120{
121 blocking_notifier_call_chain(&spu_switch_notifier,
122 ctx ? ctx->object_id : 0, spu);
123}
124
125int spu_switch_event_register(struct notifier_block * n)
126{
127 return blocking_notifier_chain_register(&spu_switch_notifier, n);
128}
129
130int spu_switch_event_unregister(struct notifier_block * n)
131{
132 return blocking_notifier_chain_unregister(&spu_switch_notifier, n);
133}
134
Christoph Hellwig202557d2007-02-13 21:36:49 +0100135/**
136 * spu_bind_context - bind spu context to physical spu
137 * @spu: physical spu to bind to
138 * @ctx: context to bind
139 */
140static void spu_bind_context(struct spu *spu, struct spu_context *ctx)
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500141{
Mark Nuttera68cf982006-10-04 17:26:12 +0200142 pr_debug("%s: pid=%d SPU=%d NODE=%d\n", __FUNCTION__, current->pid,
143 spu->number, spu->node);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500144 spu->ctx = ctx;
145 spu->flags = 0;
146 ctx->spu = spu;
147 ctx->ops = &spu_hw_ops;
148 spu->pid = current->pid;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500149 spu->mm = ctx->owner;
150 mm_needs_global_tlbie(spu->mm);
151 spu->ibox_callback = spufs_ibox_callback;
152 spu->wbox_callback = spufs_wbox_callback;
Arnd Bergmann51104592005-12-05 22:52:25 -0500153 spu->stop_callback = spufs_stop_callback;
Arnd Bergmanna33a7d72006-03-23 00:00:11 +0100154 spu->mfc_callback = spufs_mfc_callback;
Arnd Bergmann9add11d2006-10-04 17:26:14 +0200155 spu->dma_callback = spufs_dma_callback;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500156 mb();
Arnd Bergmann51104592005-12-05 22:52:25 -0500157 spu_unmap_mappings(ctx);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500158 spu_restore(&ctx->csa, spu);
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500159 spu->timestamp = jiffies;
Mark Nuttera68cf982006-10-04 17:26:12 +0200160 spu_cpu_affinity_set(spu, raw_smp_processor_id());
Arnd Bergmann86767272006-10-04 17:26:21 +0200161 spu_switch_notify(spu, ctx);
Christoph Hellwig202557d2007-02-13 21:36:49 +0100162 spu_add_to_active_list(spu);
Christoph Hellwig81998ba2007-02-13 21:36:48 +0100163 ctx->state = SPU_STATE_RUNNABLE;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500164}
165
Christoph Hellwig202557d2007-02-13 21:36:49 +0100166/**
167 * spu_unbind_context - unbind spu context from physical spu
168 * @spu: physical spu to unbind from
169 * @ctx: context to unbind
170 *
171 * If the spu was on the active list the function returns 1, else 0.
172 */
173static int spu_unbind_context(struct spu *spu, struct spu_context *ctx)
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500174{
Christoph Hellwig202557d2007-02-13 21:36:49 +0100175 int was_active = spu_remove_from_active_list(spu);
176
Mark Nuttera68cf982006-10-04 17:26:12 +0200177 pr_debug("%s: unbind pid=%d SPU=%d NODE=%d\n", __FUNCTION__,
178 spu->pid, spu->number, spu->node);
Christoph Hellwig202557d2007-02-13 21:36:49 +0100179
Arnd Bergmann86767272006-10-04 17:26:21 +0200180 spu_switch_notify(spu, NULL);
Arnd Bergmann51104592005-12-05 22:52:25 -0500181 spu_unmap_mappings(ctx);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500182 spu_save(&ctx->csa, spu);
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500183 spu->timestamp = jiffies;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500184 ctx->state = SPU_STATE_SAVED;
185 spu->ibox_callback = NULL;
186 spu->wbox_callback = NULL;
Arnd Bergmann51104592005-12-05 22:52:25 -0500187 spu->stop_callback = NULL;
Arnd Bergmanna33a7d72006-03-23 00:00:11 +0100188 spu->mfc_callback = NULL;
Arnd Bergmann9add11d2006-10-04 17:26:14 +0200189 spu->dma_callback = NULL;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500190 spu->mm = NULL;
191 spu->pid = 0;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500192 ctx->ops = &spu_backing_ops;
193 ctx->spu = NULL;
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500194 spu->flags = 0;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500195 spu->ctx = NULL;
Christoph Hellwig202557d2007-02-13 21:36:49 +0100196
197 return was_active;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500198}
199
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100200/**
201 * spu_add_to_rq - add a context to the runqueue
202 * @ctx: context to add
203 */
204static void spu_add_to_rq(struct spu_context *ctx)
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500205{
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100206 spin_lock(&spu_prio->runq_lock);
207 list_add_tail(&ctx->rq, &spu_prio->runq[ctx->prio]);
208 set_bit(ctx->prio, spu_prio->bitmap);
209 spin_unlock(&spu_prio->runq_lock);
Mark Nuttera68cf982006-10-04 17:26:12 +0200210}
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500211
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100212/**
213 * spu_del_from_rq - remove a context from the runqueue
214 * @ctx: context to remove
215 */
216static void spu_del_from_rq(struct spu_context *ctx)
Mark Nuttera68cf982006-10-04 17:26:12 +0200217{
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100218 spin_lock(&spu_prio->runq_lock);
219 list_del_init(&ctx->rq);
220 if (list_empty(&spu_prio->runq[ctx->prio]))
221 clear_bit(ctx->prio, spu_prio->bitmap);
222 spin_unlock(&spu_prio->runq_lock);
Mark Nuttera68cf982006-10-04 17:26:12 +0200223}
224
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100225/**
226 * spu_grab_context - remove one context from the runqueue
227 * @prio: priority of the context to be removed
228 *
229 * This function removes one context from the runqueue for priority @prio.
230 * If there is more than one context with the given priority the first
231 * task on the runqueue will be taken.
232 *
233 * Returns the spu_context it just removed.
234 *
235 * Must be called with spu_prio->runq_lock held.
236 */
237static struct spu_context *spu_grab_context(int prio)
Mark Nuttera68cf982006-10-04 17:26:12 +0200238{
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100239 struct list_head *rq = &spu_prio->runq[prio];
240
241 if (list_empty(rq))
242 return NULL;
243 return list_entry(rq->next, struct spu_context, rq);
244}
245
246static void spu_prio_wait(struct spu_context *ctx)
247{
Mark Nuttera68cf982006-10-04 17:26:12 +0200248 DEFINE_WAIT(wait);
249
Christoph Hellwig26bec672007-02-13 21:54:24 +0100250 set_bit(SPU_SCHED_WAKE, &ctx->sched_flags);
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100251 prepare_to_wait_exclusive(&ctx->stop_wq, &wait, TASK_INTERRUPTIBLE);
Mark Nuttera68cf982006-10-04 17:26:12 +0200252 if (!signal_pending(current)) {
Christoph Hellwig650f8b02007-02-13 21:36:50 +0100253 mutex_unlock(&ctx->state_mutex);
Mark Nuttera68cf982006-10-04 17:26:12 +0200254 schedule();
Christoph Hellwig650f8b02007-02-13 21:36:50 +0100255 mutex_lock(&ctx->state_mutex);
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500256 }
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100257 __set_current_state(TASK_RUNNING);
258 remove_wait_queue(&ctx->stop_wq, &wait);
Christoph Hellwig26bec672007-02-13 21:54:24 +0100259 clear_bit(SPU_SCHED_WAKE, &ctx->sched_flags);
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500260}
261
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100262/**
263 * spu_reschedule - try to find a runnable context for a spu
264 * @spu: spu available
265 *
266 * This function is called whenever a spu becomes idle. It looks for the
267 * most suitable runnable spu context and schedules it for execution.
268 */
269static void spu_reschedule(struct spu *spu)
Arnd Bergmann2a911f02005-12-05 22:52:26 -0500270{
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100271 int best;
272
273 spu_free(spu);
274
275 spin_lock(&spu_prio->runq_lock);
276 best = sched_find_first_bit(spu_prio->bitmap);
Mark Nuttera68cf982006-10-04 17:26:12 +0200277 if (best < MAX_PRIO) {
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100278 struct spu_context *ctx = spu_grab_context(best);
Christoph Hellwig26bec672007-02-13 21:54:24 +0100279 if (ctx && test_bit(SPU_SCHED_WAKE, &ctx->sched_flags))
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100280 wake_up(&ctx->stop_wq);
Arnd Bergmann51104592005-12-05 22:52:25 -0500281 }
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100282 spin_unlock(&spu_prio->runq_lock);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500283}
284
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100285static struct spu *spu_get_idle(struct spu_context *ctx)
Mark Nuttera68cf982006-10-04 17:26:12 +0200286{
287 struct spu *spu = NULL;
288 int node = cpu_to_node(raw_smp_processor_id());
289 int n;
290
291 for (n = 0; n < MAX_NUMNODES; n++, node++) {
292 node = (node < MAX_NUMNODES) ? node : 0;
293 if (!node_allowed(node))
294 continue;
295 spu = spu_alloc_node(node);
296 if (spu)
297 break;
298 }
299 return spu;
300}
301
/* The three externally callable interfaces
 * for the scheduler begin here.
 *
 *	spu_activate	- bind a context to SPU, waiting as needed.
 *	spu_deactivate	- unbind a context from its SPU.
 *	spu_yield	- yield an SPU if others are waiting.
 */
309
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100310/**
311 * spu_activate - find a free spu for a context and execute it
312 * @ctx: spu context to schedule
313 * @flags: flags (currently ignored)
314 *
315 * Tries to find a free spu to run @ctx. If no free spu is availble
316 * add the context to the runqueue so it gets woken up once an spu
317 * is available.
318 */
Christoph Hellwig26bec672007-02-13 21:54:24 +0100319int spu_activate(struct spu_context *ctx, unsigned long flags)
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500320{
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500321
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100322 if (ctx->spu)
323 return 0;
324
325 do {
326 struct spu *spu;
327
328 spu = spu_get_idle(ctx);
329 if (spu) {
Christoph Hellwig202557d2007-02-13 21:36:49 +0100330 spu_bind_context(spu, ctx);
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100331 return 0;
Mark Nuttera68cf982006-10-04 17:26:12 +0200332 }
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100333
334 spu_add_to_rq(ctx);
Christoph Hellwig26bec672007-02-13 21:54:24 +0100335 if (!(flags & SPU_ACTIVATE_NOWAKE))
336 spu_prio_wait(ctx);
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100337 spu_del_from_rq(ctx);
338 } while (!signal_pending(current));
339
340 return -ERESTARTSYS;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500341}
342
343void spu_deactivate(struct spu_context *ctx)
344{
345 struct spu *spu;
Christoph Hellwig202557d2007-02-13 21:36:49 +0100346 int was_active;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500347
348 spu = ctx->spu;
349 if (!spu)
350 return;
Christoph Hellwig202557d2007-02-13 21:36:49 +0100351 was_active = spu_unbind_context(spu, ctx);
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100352 if (was_active)
353 spu_reschedule(spu);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500354}
355
356void spu_yield(struct spu_context *ctx)
357{
358 struct spu *spu;
Arnd Bergmann51104592005-12-05 22:52:25 -0500359 int need_yield = 0;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500360
Christoph Hellwig650f8b02007-02-13 21:36:50 +0100361 if (mutex_trylock(&ctx->state_mutex)) {
Mark Nuttera68cf982006-10-04 17:26:12 +0200362 if ((spu = ctx->spu) != NULL) {
363 int best = sched_find_first_bit(spu_prio->bitmap);
364 if (best < MAX_PRIO) {
365 pr_debug("%s: yielding SPU %d NODE %d\n",
366 __FUNCTION__, spu->number, spu->node);
367 spu_deactivate(ctx);
Mark Nuttera68cf982006-10-04 17:26:12 +0200368 need_yield = 1;
Mark Nuttera68cf982006-10-04 17:26:12 +0200369 }
370 }
Christoph Hellwig650f8b02007-02-13 21:36:50 +0100371 mutex_unlock(&ctx->state_mutex);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500372 }
Arnd Bergmann51104592005-12-05 22:52:25 -0500373 if (unlikely(need_yield))
374 yield();
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500375}
376
377int __init spu_sched_init(void)
378{
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500379 int i;
380
Mark Nuttera68cf982006-10-04 17:26:12 +0200381 spu_prio = kzalloc(sizeof(struct spu_prio_array), GFP_KERNEL);
382 if (!spu_prio) {
383 printk(KERN_WARNING "%s: Unable to allocate priority queue.\n",
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500384 __FUNCTION__);
385 return 1;
386 }
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500387 for (i = 0; i < MAX_PRIO; i++) {
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100388 INIT_LIST_HEAD(&spu_prio->runq[i]);
Mark Nuttera68cf982006-10-04 17:26:12 +0200389 __clear_bit(i, spu_prio->bitmap);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500390 }
Mark Nuttera68cf982006-10-04 17:26:12 +0200391 __set_bit(MAX_PRIO, spu_prio->bitmap);
392 for (i = 0; i < MAX_NUMNODES; i++) {
393 mutex_init(&spu_prio->active_mutex[i]);
394 INIT_LIST_HEAD(&spu_prio->active_list[i]);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500395 }
Christoph Hellwig079cdb62007-02-13 21:54:23 +0100396 spin_lock_init(&spu_prio->runq_lock);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500397 return 0;
398}
399
400void __exit spu_sched_exit(void)
401{
Mark Nuttera68cf982006-10-04 17:26:12 +0200402 struct spu *spu, *tmp;
403 int node;
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500404
Mark Nuttera68cf982006-10-04 17:26:12 +0200405 for (node = 0; node < MAX_NUMNODES; node++) {
406 mutex_lock(&spu_prio->active_mutex[node]);
407 list_for_each_entry_safe(spu, tmp, &spu_prio->active_list[node],
408 list) {
409 list_del_init(&spu->list);
410 spu_free(spu);
411 }
412 mutex_unlock(&spu_prio->active_mutex[node]);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500413 }
Mark Nuttera68cf982006-10-04 17:26:12 +0200414 kfree(spu_prio);
Arnd Bergmann8b3d6662005-11-15 15:53:52 -0500415}