blob: c07961bedb75ea7a379176275022c3cca26bae53 [file] [log] [blame]
/*
 * Copyright (C) 2000 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
 * Copyright 2003 PathScale, Inc.
 * Licensed under the GPL
 */
6
Jeff Dikec5d4bb12008-02-04 22:31:14 -08007#include <linux/stddef.h>
8#include <linux/err.h>
9#include <linux/hardirq.h>
10#include <linux/gfp.h>
11#include <linux/mm.h>
12#include <linux/personality.h>
13#include <linux/proc_fs.h>
14#include <linux/ptrace.h>
15#include <linux/random.h>
16#include <linux/sched.h>
17#include <linux/tick.h>
18#include <linux/threads.h>
19#include <asm/current.h>
20#include <asm/pgtable.h>
21#include <asm/uaccess.h>
Jeff Dike4ff83ce2007-05-06 14:51:08 -070022#include "as-layout.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070023#include "kern_util.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include "os.h"
Jeff Dike77bf4402007-10-16 01:26:58 -070025#include "skas.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070026#include "tlb.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070027
Jeff Dikeba180fd2007-10-16 01:27:00 -070028/*
29 * This is a per-cpu array. A processor only modifies its entry and it only
Linus Torvalds1da177e2005-04-16 15:20:36 -070030 * cares about its entry, so it's OK if another processor is modifying its
31 * entry.
32 */
33struct cpu_task cpu_tasks[NR_CPUS] = { [0 ... NR_CPUS - 1] = { -1, NULL } };
34
Karol Swietlicki2dc58022008-02-04 22:31:03 -080035static inline int external_pid(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070036{
Jeff Dike77bf4402007-10-16 01:26:58 -070037 /* FIXME: Need to look up userspace_pid by cpu */
Jeff Dikeba180fd2007-10-16 01:27:00 -070038 return userspace_pid[0];
Linus Torvalds1da177e2005-04-16 15:20:36 -070039}
40
41int pid_to_processor_id(int pid)
42{
43 int i;
44
Jeff Dikec5d4bb12008-02-04 22:31:14 -080045 for (i = 0; i < ncpus; i++) {
Jeff Dikeba180fd2007-10-16 01:27:00 -070046 if (cpu_tasks[i].pid == pid)
Jeff Dike6e21aec2007-05-06 14:51:21 -070047 return i;
Linus Torvalds1da177e2005-04-16 15:20:36 -070048 }
Jeff Dike6e21aec2007-05-06 14:51:21 -070049 return -1;
Linus Torvalds1da177e2005-04-16 15:20:36 -070050}
51
/*
 * Release a stack previously obtained from alloc_stack().
 *
 * @stack: address of the first page of the stack
 * @order: allocation order, passed straight through to free_pages()
 */
void free_stack(unsigned long stack, int order)
{
	free_pages(stack, order);
}
56
57unsigned long alloc_stack(int order, int atomic)
58{
59 unsigned long page;
Al Viro53f9fc92005-10-21 03:22:24 -040060 gfp_t flags = GFP_KERNEL;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061
Paolo 'Blaisorblade' Giarrusso46db4a42005-09-22 21:44:20 -070062 if (atomic)
63 flags = GFP_ATOMIC;
Linus Torvalds1da177e2005-04-16 15:20:36 -070064 page = __get_free_pages(flags, order);
Jeff Dike5c8aace2007-10-16 01:26:46 -070065
Jeff Dike6e21aec2007-05-06 14:51:21 -070066 return page;
Linus Torvalds1da177e2005-04-16 15:20:36 -070067}
68
69int kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
70{
71 int pid;
72
73 current->thread.request.u.thread.proc = fn;
74 current->thread.request.u.thread.arg = arg;
Jeff Dikee0877f02005-06-25 14:55:21 -070075 pid = do_fork(CLONE_VM | CLONE_UNTRACED | flags, 0,
76 &current->thread.regs, 0, NULL, NULL);
Jeff Dike6e21aec2007-05-06 14:51:21 -070077 return pid;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078}
79
Jeff Dike6e21aec2007-05-06 14:51:21 -070080static inline void set_current(struct task_struct *task)
Linus Torvalds1da177e2005-04-16 15:20:36 -070081{
Al Viroca9bc0b2006-01-12 01:05:48 -080082 cpu_tasks[task_thread_info(task)->cpu] = ((struct cpu_task)
Karol Swietlicki2dc58022008-02-04 22:31:03 -080083 { external_pid(), task });
Linus Torvalds1da177e2005-04-16 15:20:36 -070084}
85
Karol Swietlicki291248f2008-02-04 22:30:49 -080086extern void arch_switch_to(struct task_struct *to);
Jeff Dike77bf4402007-10-16 01:26:58 -070087
Linus Torvalds1da177e2005-04-16 15:20:36 -070088void *_switch_to(void *prev, void *next, void *last)
89{
Jeff Dike995473a2006-09-27 01:50:40 -070090 struct task_struct *from = prev;
Karol Swietlicki291248f2008-02-04 22:30:49 -080091 struct task_struct *to = next;
Jeff Dikef6e34c62005-09-16 19:27:43 -070092
Jeff Dike995473a2006-09-27 01:50:40 -070093 to->thread.prev_sched = from;
94 set_current(to);
Jeff Dikef6e34c62005-09-16 19:27:43 -070095
Jeff Dike3eddddc2005-09-16 19:27:46 -070096 do {
Jeff Dike6aa802c2007-10-16 01:26:56 -070097 current->thread.saved_task = NULL;
Jeff Dike77bf4402007-10-16 01:26:58 -070098
Jeff Dikec5d4bb12008-02-04 22:31:14 -080099 switch_threads(&from->thread.switch_buf,
100 &to->thread.switch_buf);
Jeff Dike77bf4402007-10-16 01:26:58 -0700101
Karol Swietlicki291248f2008-02-04 22:30:49 -0800102 arch_switch_to(current);
Jeff Dike77bf4402007-10-16 01:26:58 -0700103
Jeff Dikeba180fd2007-10-16 01:27:00 -0700104 if (current->thread.saved_task)
Jeff Dike3eddddc2005-09-16 19:27:46 -0700105 show_regs(&(current->thread.regs));
Jeff Dikec5d4bb12008-02-04 22:31:14 -0800106 to = current->thread.saved_task;
107 from = current;
Karol Swietlicki291248f2008-02-04 22:30:49 -0800108 } while (current->thread.saved_task);
Jeff Dikef6e34c62005-09-16 19:27:43 -0700109
Jeff Dike6e21aec2007-05-06 14:51:21 -0700110 return current->thread.prev_sched;
Jeff Dikef6e34c62005-09-16 19:27:43 -0700111
Linus Torvalds1da177e2005-04-16 15:20:36 -0700112}
113
114void interrupt_end(void)
115{
Jeff Dikeba180fd2007-10-16 01:27:00 -0700116 if (need_resched())
Jeff Dike6e21aec2007-05-06 14:51:21 -0700117 schedule();
Jeff Dikeba180fd2007-10-16 01:27:00 -0700118 if (test_tsk_thread_flag(current, TIF_SIGPENDING))
Jeff Dike6e21aec2007-05-06 14:51:21 -0700119 do_signal();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120}
121
/* Intentionally empty: this file does no work when a thread exits. */
void exit_thread(void)
{
}
Jeff Dike995473a2006-09-27 01:50:40 -0700125
Linus Torvalds1da177e2005-04-16 15:20:36 -0700126void *get_current(void)
127{
Jeff Dike6e21aec2007-05-06 14:51:21 -0700128 return current;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700129}
130
Jeff Dike77bf4402007-10-16 01:26:58 -0700131extern void schedule_tail(struct task_struct *prev);
132
Jeff Dikeba180fd2007-10-16 01:27:00 -0700133/*
134 * This is called magically, by its address being stuffed in a jmp_buf
Jeff Dike77bf4402007-10-16 01:26:58 -0700135 * and being longjmp-d to.
136 */
137void new_thread_handler(void)
138{
139 int (*fn)(void *), n;
140 void *arg;
141
Jeff Dikeba180fd2007-10-16 01:27:00 -0700142 if (current->thread.prev_sched != NULL)
Jeff Dike77bf4402007-10-16 01:26:58 -0700143 schedule_tail(current->thread.prev_sched);
144 current->thread.prev_sched = NULL;
145
146 fn = current->thread.request.u.thread.proc;
147 arg = current->thread.request.u.thread.arg;
148
Jeff Dikeba180fd2007-10-16 01:27:00 -0700149 /*
150 * The return value is 1 if the kernel thread execs a process,
Jeff Dike77bf4402007-10-16 01:26:58 -0700151 * 0 if it just exits
152 */
153 n = run_kernel_thread(fn, arg, &current->thread.exec_buf);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700154 if (n == 1) {
Jeff Dike77bf4402007-10-16 01:26:58 -0700155 /* Handle any immediate reschedules or signals */
156 interrupt_end();
157 userspace(&current->thread.regs.regs);
158 }
159 else do_exit(0);
160}
161
162/* Called magically, see new_thread_handler above */
163void fork_handler(void)
164{
165 force_flush_all();
Jeff Dike77bf4402007-10-16 01:26:58 -0700166
167 schedule_tail(current->thread.prev_sched);
168
Jeff Dikeba180fd2007-10-16 01:27:00 -0700169 /*
170 * XXX: if interrupt_end() calls schedule, this call to
Jeff Dike77bf4402007-10-16 01:26:58 -0700171 * arch_switch_to isn't needed. We could want to apply this to
Jeff Dikeba180fd2007-10-16 01:27:00 -0700172 * improve performance. -bb
173 */
Karol Swietlicki291248f2008-02-04 22:30:49 -0800174 arch_switch_to(current);
Jeff Dike77bf4402007-10-16 01:26:58 -0700175
176 current->thread.prev_sched = NULL;
177
178 /* Handle any immediate reschedules or signals */
179 interrupt_end();
180
181 userspace(&current->thread.regs.regs);
182}
183
Linus Torvalds1da177e2005-04-16 15:20:36 -0700184int copy_thread(int nr, unsigned long clone_flags, unsigned long sp,
Jeff Dike995473a2006-09-27 01:50:40 -0700185 unsigned long stack_top, struct task_struct * p,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186 struct pt_regs *regs)
187{
Jeff Dike77bf4402007-10-16 01:26:58 -0700188 void (*handler)(void);
189 int ret = 0;
Paolo 'Blaisorblade' Giarrussoaa6758d2006-03-31 02:30:22 -0800190
Linus Torvalds1da177e2005-04-16 15:20:36 -0700191 p->thread = (struct thread_struct) INIT_THREAD;
Paolo 'Blaisorblade' Giarrussoaa6758d2006-03-31 02:30:22 -0800192
Jeff Dikeba180fd2007-10-16 01:27:00 -0700193 if (current->thread.forking) {
Jeff Dike77bf4402007-10-16 01:26:58 -0700194 memcpy(&p->thread.regs.regs, &regs->regs,
195 sizeof(p->thread.regs.regs));
Jeff Dike18baddd2007-10-16 01:27:07 -0700196 REGS_SET_SYSCALL_RETURN(p->thread.regs.regs.gp, 0);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700197 if (sp != 0)
Jeff Dike18baddd2007-10-16 01:27:07 -0700198 REGS_SP(p->thread.regs.regs.gp) = sp;
Paolo 'Blaisorblade' Giarrussoaa6758d2006-03-31 02:30:22 -0800199
Jeff Dike77bf4402007-10-16 01:26:58 -0700200 handler = fork_handler;
Paolo 'Blaisorblade' Giarrussoaa6758d2006-03-31 02:30:22 -0800201
Jeff Dike77bf4402007-10-16 01:26:58 -0700202 arch_copy_thread(&current->thread.arch, &p->thread.arch);
203 }
204 else {
Jeff Diked25f2e12008-02-04 22:30:57 -0800205 get_safe_registers(p->thread.regs.regs.gp);
Jeff Dike77bf4402007-10-16 01:26:58 -0700206 p->thread.request.u.thread = current->thread.request.u.thread;
207 handler = new_thread_handler;
208 }
Paolo 'Blaisorblade' Giarrussoaa6758d2006-03-31 02:30:22 -0800209
Jeff Dike77bf4402007-10-16 01:26:58 -0700210 new_thread(task_stack_page(p), &p->thread.switch_buf, handler);
211
212 if (current->thread.forking) {
213 clear_flushed_tls(p);
214
215 /*
216 * Set a new TLS for the child thread?
217 */
218 if (clone_flags & CLONE_SETTLS)
219 ret = arch_copy_tls(p);
220 }
221
Paolo 'Blaisorblade' Giarrussoaa6758d2006-03-31 02:30:22 -0800222 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223}
224
225void initial_thread_cb(void (*proc)(void *), void *arg)
226{
227 int save_kmalloc_ok = kmalloc_ok;
228
229 kmalloc_ok = 0;
Jeff Dike6aa802c2007-10-16 01:26:56 -0700230 initial_thread_cb_skas(proc, arg);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700231 kmalloc_ok = save_kmalloc_ok;
232}
Jeff Dike995473a2006-09-27 01:50:40 -0700233
/*
 * The idle loop; never returns.
 *
 * Each pass reschedules if needed, stops the scheduler tick, passes
 * the value returned by disable_timer() to idle_sleep(), and restarts
 * the tick afterwards.
 */
void default_idle(void)
{
	unsigned long long sleep_ns;

	/* endless idle loop with no priority at all */
	for (;;) {
		/*
		 * although we are an idle CPU, we do not want to
		 * get into the scheduler unnecessarily.
		 */
		if (need_resched())
			schedule();

		tick_nohz_stop_sched_tick();
		sleep_ns = disable_timer();
		idle_sleep(sleep_ns);
		tick_nohz_restart_sched_tick();
	}
}
254
255void cpu_idle(void)
256{
Jeff Dikea5a678c2008-02-04 22:30:54 -0800257 cpu_tasks[current_thread_info()->cpu].pid = os_getpid();
Jeff Dike77bf4402007-10-16 01:26:58 -0700258 default_idle();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700259}
260
/* Intentionally empty: neither @regs nor @u is touched. */
void dump_thread(struct pt_regs *regs, struct user *u)
{
}
264
/*
 * Return 1 when sleeping is not allowed: in atomic context, with
 * interrupts disabled, or in interrupt context.  Return 0 otherwise.
 */
int __cant_sleep(void)
{
	if (in_atomic())
		return 1;
	if (irqs_disabled())
		return 1;

	/* Is in_interrupt() really needed? */
	return in_interrupt() != 0;
}
269
Linus Torvalds1da177e2005-04-16 15:20:36 -0700270int user_context(unsigned long sp)
271{
272 unsigned long stack;
273
274 stack = sp & (PAGE_MASK << CONFIG_KERNEL_STACK_ORDER);
Jeff Dikea5a678c2008-02-04 22:30:54 -0800275 return stack != (unsigned long) current_thread_info();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276}
277
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278extern exitcall_t __uml_exitcall_begin, __uml_exitcall_end;
279
280void do_uml_exitcalls(void)
281{
282 exitcall_t *call;
283
284 call = &__uml_exitcall_end;
285 while (--call >= &__uml_exitcall_begin)
286 (*call)();
287}
288
WANG Congc0a92902008-02-04 22:30:41 -0800289char *uml_strdup(const char *string)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290{
Robert Lovedfe52242005-06-23 00:09:04 -0700291 return kstrdup(string, GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700292}
293
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294int copy_to_user_proc(void __user *to, void *from, int size)
295{
Jeff Dike6e21aec2007-05-06 14:51:21 -0700296 return copy_to_user(to, from, size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297}
298
299int copy_from_user_proc(void *to, void __user *from, int size)
300{
Jeff Dike6e21aec2007-05-06 14:51:21 -0700301 return copy_from_user(to, from, size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700302}
303
304int clear_user_proc(void __user *buf, int size)
305{
Jeff Dike6e21aec2007-05-06 14:51:21 -0700306 return clear_user(buf, size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700307}
308
309int strlen_user_proc(char __user *str)
310{
Jeff Dike6e21aec2007-05-06 14:51:21 -0700311 return strlen_user(str);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312}
313
/*
 * SMP part of SIGIO handling.
 *
 * With CONFIG_SMP, run IPI_handler() for the current CPU and return 1
 * on any CPU other than 0.  On CPU 0, and always without CONFIG_SMP,
 * return 0.
 */
int smp_sigio_handler(void)
{
#ifdef CONFIG_SMP
	int this_cpu = current_thread_info()->cpu;

	IPI_handler(this_cpu);
	if (this_cpu != 0)
		return 1;
#endif
	return 0;
}
324
Linus Torvalds1da177e2005-04-16 15:20:36 -0700325int cpu(void)
326{
Jeff Dikea5a678c2008-02-04 22:30:54 -0800327 return current_thread_info()->cpu;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328}
329
330static atomic_t using_sysemu = ATOMIC_INIT(0);
331int sysemu_supported;
332
333void set_using_sysemu(int value)
334{
335 if (value > sysemu_supported)
336 return;
337 atomic_set(&using_sysemu, value);
338}
339
340int get_using_sysemu(void)
341{
342 return atomic_read(&using_sysemu);
343}
344
345static int proc_read_sysemu(char *buf, char **start, off_t offset, int size,int *eof, void *data)
346{
Jeff Dikeba180fd2007-10-16 01:27:00 -0700347 if (snprintf(buf, size, "%d\n", get_using_sysemu()) < size)
348 /* No overflow */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349 *eof = 1;
350
351 return strlen(buf);
352}
353
Al Viro4d338e12006-03-31 02:30:15 -0800354static int proc_write_sysemu(struct file *file,const char __user *buf, unsigned long count,void *data)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700355{
356 char tmp[2];
357
358 if (copy_from_user(tmp, buf, 1))
359 return -EFAULT;
360
361 if (tmp[0] >= '0' && tmp[0] <= '2')
362 set_using_sysemu(tmp[0] - '0');
Jeff Dikeba180fd2007-10-16 01:27:00 -0700363 /* We use the first char, but pretend to write everything */
364 return count;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365}
366
367int __init make_proc_sysemu(void)
368{
369 struct proc_dir_entry *ent;
370 if (!sysemu_supported)
371 return 0;
372
373 ent = create_proc_entry("sysemu", 0600, &proc_root);
374
375 if (ent == NULL)
376 {
Christophe Lucas30f417c2005-07-28 21:16:12 -0700377 printk(KERN_WARNING "Failed to register /proc/sysemu\n");
Jeff Dike6e21aec2007-05-06 14:51:21 -0700378 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700379 }
380
381 ent->read_proc = proc_read_sysemu;
382 ent->write_proc = proc_write_sysemu;
383
384 return 0;
385}
386
387late_initcall(make_proc_sysemu);
388
389int singlestepping(void * t)
390{
391 struct task_struct *task = t ? t : current;
392
Jeff Dikec5d4bb12008-02-04 22:31:14 -0800393 if (!(task->ptrace & PT_DTRACE))
Jeff Dikeba180fd2007-10-16 01:27:00 -0700394 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700395
396 if (task->thread.singlestep_syscall)
Jeff Dikeba180fd2007-10-16 01:27:00 -0700397 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700398
399 return 2;
400}
401
Bodo Stroesserb8bd0222005-05-06 21:30:53 -0700402/*
403 * Only x86 and x86_64 have an arch_align_stack().
404 * All other arches have "#define arch_align_stack(x) (x)"
405 * in their asm/system.h
406 * As this is included in UML from asm-um/system-generic.h,
407 * we can use it to behave as the subarch does.
408 */
409#ifndef arch_align_stack
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410unsigned long arch_align_stack(unsigned long sp)
411{
Jeff Dike8f80e942006-09-25 23:33:01 -0700412 if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700413 sp -= get_random_int() % 8192;
414 return sp & ~0xf;
415}
Bodo Stroesserb8bd0222005-05-06 21:30:53 -0700416#endif
Jeff Dikec1127462008-02-04 22:30:36 -0800417
418unsigned long get_wchan(struct task_struct *p)
419{
420 unsigned long stack_page, sp, ip;
421 bool seen_sched = 0;
422
423 if ((p == NULL) || (p == current) || (p->state == TASK_RUNNING))
424 return 0;
425
426 stack_page = (unsigned long) task_stack_page(p);
427 /* Bail if the process has no kernel stack for some reason */
428 if (stack_page == 0)
429 return 0;
430
431 sp = p->thread.switch_buf->JB_SP;
432 /*
433 * Bail if the stack pointer is below the bottom of the kernel
434 * stack for some reason
435 */
436 if (sp < stack_page)
437 return 0;
438
439 while (sp < stack_page + THREAD_SIZE) {
440 ip = *((unsigned long *) sp);
441 if (in_sched_functions(ip))
442 /* Ignore everything until we're above the scheduler */
443 seen_sched = 1;
444 else if (kernel_text_address(ip) && seen_sched)
445 return ip;
446
447 sp += sizeof(unsigned long);
448 }
449
450 return 0;
451}
Jeff Dike8192ab42008-02-04 22:30:53 -0800452
453int elf_core_copy_fpregs(struct task_struct *t, elf_fpregset_t *fpu)
454{
455 int cpu = current_thread_info()->cpu;
456
457 return save_fp_registers(userspace_pid[cpu], (unsigned long *) fpu);
458}
459