blob: 7618085b416431379adafe2c1f7e65ea74c0b133 [file] [log] [blame]
/*
 * This file handles the architecture dependent parts of process handling.
 *
 * Copyright IBM Corp. 1999,2009
 *    Author(s): Martin Schwidefsky <schwidefsky@de.ibm.com>,
 *               Hartmut Penner <hp@de.ibm.com>,
 *               Denis Joseph Barrow,
 */
9
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include <linux/compiler.h>
11#include <linux/cpu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070012#include <linux/sched.h>
13#include <linux/kernel.h>
14#include <linux/mm.h>
Martin Schwidefsky638ad342011-10-30 15:17:13 +010015#include <linux/elfcore.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070016#include <linux/smp.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090017#include <linux/slab.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/interrupt.h>
Heiko Carstens5a62b192008-04-17 07:46:25 +020019#include <linux/tick.h>
Heiko Carstens9887a1f2011-01-12 09:55:28 +010020#include <linux/personality.h>
Heiko Carstens26689452009-01-14 14:14:36 +010021#include <linux/syscalls.h>
Heiko Carstens3e86a8c2009-09-22 22:58:42 +020022#include <linux/compat.h>
Martin Schwidefsky860dba42011-01-05 12:47:25 +010023#include <linux/kprobes.h>
Heiko Carstens9887a1f2011-01-12 09:55:28 +010024#include <linux/random.h>
Jan Glauber3af6fb62011-05-23 10:24:44 +020025#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include <asm/system.h>
27#include <asm/io.h>
28#include <asm/processor.h>
29#include <asm/irq.h>
30#include <asm/timer.h>
Heiko Carstensf5daba12009-03-26 15:24:01 +010031#include <asm/nmi.h>
Heiko Carstensda7f51c2011-01-05 12:48:09 +010032#include <asm/smp.h>
Heiko Carstensa8061702008-04-17 07:46:26 +020033#include "entry.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070034
Martin Schwidefsky94c12cc2006-09-28 16:56:43 +020035asmlinkage void ret_from_fork(void) asm ("ret_from_fork");
Linus Torvalds1da177e2005-04-16 15:20:36 -070036
37/*
38 * Return saved PC of a blocked thread. used in kernel/sched.
39 * resume in entry.S does not create a new stack frame, it
40 * just stores the registers %r6-%r15 to the frame given by
41 * schedule. We want to return the address of the caller of
42 * schedule, so we have to walk the backchain one time to
43 * find the frame schedule() store its return address.
44 */
45unsigned long thread_saved_pc(struct task_struct *tsk)
46{
Heiko Carstenseb33c192006-01-14 13:20:57 -080047 struct stack_frame *sf, *low, *high;
Linus Torvalds1da177e2005-04-16 15:20:36 -070048
Heiko Carstenseb33c192006-01-14 13:20:57 -080049 if (!tsk || !task_stack_page(tsk))
50 return 0;
51 low = task_stack_page(tsk);
52 high = (struct stack_frame *) task_pt_regs(tsk);
53 sf = (struct stack_frame *) (tsk->thread.ksp & PSW_ADDR_INSN);
54 if (sf <= low || sf > high)
55 return 0;
56 sf = (struct stack_frame *) (sf->back_chain & PSW_ADDR_INSN);
57 if (sf <= low || sf > high)
58 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070059 return sf->gprs[8];
60}
61
Linus Torvalds1da177e2005-04-16 15:20:36 -070062/*
63 * The idle loop on a S390...
64 */
Adrian Bunkcdb04522006-03-24 03:15:57 -080065static void default_idle(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070066{
Heiko Carstensda7f51c2011-01-05 12:48:09 +010067 if (cpu_is_offline(smp_processor_id()))
Linus Torvalds1da177e2005-04-16 15:20:36 -070068 cpu_die();
Heiko Carstens6931be02010-10-25 16:10:12 +020069 local_irq_disable();
70 if (need_resched()) {
71 local_irq_enable();
72 return;
73 }
Heiko Carstens77fa2242005-06-25 14:55:30 -070074 local_mcck_disable();
75 if (test_thread_flag(TIF_MCCK_PENDING)) {
76 local_mcck_enable();
77 local_irq_enable();
Heiko Carstens77fa2242005-06-25 14:55:30 -070078 return;
79 }
Heiko Carstens1f194a42006-07-03 00:24:46 -070080 trace_hardirqs_on();
Heiko Carstens632448f2008-11-14 18:18:04 +010081 /* Don't trace preempt off for idle. */
82 stop_critical_timings();
Martin Schwidefsky9cfb9b32008-12-31 15:11:41 +010083 /* Stop virtual timer and halt the cpu. */
84 vtime_stop_cpu();
85 /* Reenable preemption tracer. */
Heiko Carstens632448f2008-11-14 18:18:04 +010086 start_critical_timings();
Linus Torvalds1da177e2005-04-16 15:20:36 -070087}
88
89void cpu_idle(void)
90{
Nick Piggin5bfb5d62005-11-08 21:39:01 -080091 for (;;) {
Frederic Weisbecker1268fbc2011-11-17 18:48:14 +010092 tick_nohz_idle_enter();
93 rcu_idle_enter();
Heiko Carstensf36123042012-02-17 10:29:20 +010094 while (!need_resched() && !test_thread_flag(TIF_MCCK_PENDING))
Nick Piggin5bfb5d62005-11-08 21:39:01 -080095 default_idle();
Frederic Weisbecker1268fbc2011-11-17 18:48:14 +010096 rcu_idle_exit();
97 tick_nohz_idle_exit();
Heiko Carstensf36123042012-02-17 10:29:20 +010098 if (test_thread_flag(TIF_MCCK_PENDING))
99 s390_handle_mcck();
Thomas Gleixnerbd2f5532011-03-21 12:33:18 +0100100 schedule_preempt_disabled();
Nick Piggin5bfb5d62005-11-08 21:39:01 -0800101 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102}
103
Martin Schwidefsky860dba42011-01-05 12:47:25 +0100104extern void __kprobes kernel_thread_starter(void);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105
Martin Schwidefsky94c12cc2006-09-28 16:56:43 +0200106asm(
Martin Schwidefsky860dba42011-01-05 12:47:25 +0100107 ".section .kprobes.text, \"ax\"\n"
108 ".global kernel_thread_starter\n"
Linus Torvalds1da177e2005-04-16 15:20:36 -0700109 "kernel_thread_starter:\n"
110 " la 2,0(10)\n"
111 " basr 14,9\n"
112 " la 2,0\n"
Martin Schwidefsky860dba42011-01-05 12:47:25 +0100113 " br 11\n"
114 ".previous\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115
116int kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
117{
118 struct pt_regs regs;
119
120 memset(&regs, 0, sizeof(regs));
Martin Schwidefskyb50511e2011-10-30 15:16:50 +0100121 regs.psw.mask = psw_kernel_bits |
122 PSW_MASK_DAT | PSW_MASK_IO | PSW_MASK_EXT | PSW_MASK_MCHECK;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123 regs.psw.addr = (unsigned long) kernel_thread_starter | PSW_ADDR_AMODE;
124 regs.gprs[9] = (unsigned long) fn;
125 regs.gprs[10] = (unsigned long) arg;
126 regs.gprs[11] = (unsigned long) do_exit;
127 regs.orig_gpr2 = -1;
128
129 /* Ok, create the new process.. */
130 return do_fork(flags | CLONE_VM | CLONE_UNTRACED,
131 0, &regs, 0, NULL, NULL);
132}
Heiko Carstens1485c5c2009-03-26 15:24:04 +0100133EXPORT_SYMBOL(kernel_thread);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700134
/*
 * Free current thread data structures etc..
 *
 * Nothing needs to be done here, so the function is empty.
 */
void exit_thread(void)
{
	/* intentionally empty */
}
141
/*
 * Hook with no work to do in this file; the body is empty.
 */
void flush_thread(void)
{
	/* intentionally empty */
}
145
/*
 * Hook taking the task that died; @dead_task is not touched and the
 * body is empty.
 */
void release_thread(struct task_struct *dead_task)
{
	/* intentionally empty */
}
149
Alexey Dobriyan6f2c55b2009-04-02 16:56:59 -0700150int copy_thread(unsigned long clone_flags, unsigned long new_stackp,
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100151 unsigned long unused,
152 struct task_struct *p, struct pt_regs *regs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700153{
Heiko Carstens5168ce2c2009-03-26 15:23:53 +0100154 struct thread_info *ti;
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100155 struct fake_frame
156 {
157 struct stack_frame sf;
158 struct pt_regs childregs;
159 } *frame;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700160
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100161 frame = container_of(task_pt_regs(p), struct fake_frame, childregs);
162 p->thread.ksp = (unsigned long) frame;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700163 /* Store access registers to kernel stack of new process. */
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100164 frame->childregs = *regs;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700165 frame->childregs.gprs[2] = 0; /* child returns 0 on fork. */
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100166 frame->childregs.gprs[15] = new_stackp;
167 frame->sf.back_chain = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100169 /* new return point is ret_from_fork */
170 frame->sf.gprs[8] = (unsigned long) ret_from_fork;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700171
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100172 /* fake return stack for resume(), don't go back to schedule */
173 frame->sf.gprs[9] = (unsigned long) frame;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174
175 /* Save access registers to new thread structure. */
176 save_access_regs(&p->thread.acrs[0]);
177
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800178#ifndef CONFIG_64BIT
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100179 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700180 * save fprs to current->thread.fp_regs to merge them with
181 * the emulated registers and then copy the result to the child.
182 */
183 save_fp_regs(&current->thread.fp_regs);
184 memcpy(&p->thread.fp_regs, &current->thread.fp_regs,
185 sizeof(s390_fp_regs));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186 /* Set a new TLS ? */
187 if (clone_flags & CLONE_SETTLS)
188 p->thread.acrs[0] = regs->gprs[6];
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800189#else /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190 /* Save the fpu registers to new thread structure. */
191 save_fp_regs(&p->thread.fp_regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700192 /* Set a new TLS ? */
193 if (clone_flags & CLONE_SETTLS) {
Heiko Carstens77575912009-06-12 10:26:25 +0200194 if (is_compat_task()) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700195 p->thread.acrs[0] = (unsigned int) regs->gprs[6];
196 } else {
197 p->thread.acrs[0] = (unsigned int)(regs->gprs[6] >> 32);
198 p->thread.acrs[1] = (unsigned int) regs->gprs[6];
199 }
200 }
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800201#endif /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700202 /* start new process with ar4 pointing to the correct address space */
203 p->thread.mm_segment = get_fs();
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100204 /* Don't copy debug registers */
Martin Schwidefsky5e9a2692011-01-05 12:48:10 +0100205 memset(&p->thread.per_user, 0, sizeof(p->thread.per_user));
206 memset(&p->thread.per_event, 0, sizeof(p->thread.per_event));
Martin Schwidefskyf8d5faf2010-01-13 20:44:26 +0100207 clear_tsk_thread_flag(p, TIF_SINGLE_STEP);
Martin Schwidefsky5e9a2692011-01-05 12:48:10 +0100208 clear_tsk_thread_flag(p, TIF_PER_TRAP);
Heiko Carstens5168ce2c2009-03-26 15:23:53 +0100209 /* Initialize per thread user and system timer values */
210 ti = task_thread_info(p);
211 ti->user_timer = 0;
212 ti->system_timer = 0;
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100213 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700214}
215
Heiko Carstens26689452009-01-14 14:14:36 +0100216SYSCALL_DEFINE0(fork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700217{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200218 struct pt_regs *regs = task_pt_regs(current);
219 return do_fork(SIGCHLD, regs->gprs[15], regs, 0, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220}
221
Heiko Carstens2d70ca22009-09-22 22:58:41 +0200222SYSCALL_DEFINE4(clone, unsigned long, newsp, unsigned long, clone_flags,
223 int __user *, parent_tidptr, int __user *, child_tidptr)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700224{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200225 struct pt_regs *regs = task_pt_regs(current);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700226
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200227 if (!newsp)
228 newsp = regs->gprs[15];
229 return do_fork(clone_flags, newsp, regs, 0,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700230 parent_tidptr, child_tidptr);
231}
232
233/*
234 * This is trivial, and on the face of it looks like it
235 * could equally well be done in user mode.
236 *
237 * Not so, for quite unobvious reasons - register pressure.
238 * In user mode vfork() cannot have a stack frame, and if
239 * done by calling the "clone()" system call directly, you
240 * do not have enough call-clobbered registers to hold all
241 * the information you need.
242 */
Heiko Carstens26689452009-01-14 14:14:36 +0100243SYSCALL_DEFINE0(vfork)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700244{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200245 struct pt_regs *regs = task_pt_regs(current);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700246 return do_fork(CLONE_VFORK | CLONE_VM | SIGCHLD,
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200247 regs->gprs[15], regs, 0, NULL, NULL);
248}
249
250asmlinkage void execve_tail(void)
251{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200252 current->thread.fp_regs.fpc = 0;
253 if (MACHINE_HAS_IEEE)
254 asm volatile("sfpc %0,%0" : : "d" (0));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255}
256
257/*
258 * sys_execve() executes a new program.
259 */
David Howellsd7627462010-08-17 23:52:56 +0100260SYSCALL_DEFINE3(execve, const char __user *, name,
261 const char __user *const __user *, argv,
262 const char __user *const __user *, envp)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200264 struct pt_regs *regs = task_pt_regs(current);
265 char *filename;
Heiko Carstens3e86a8c2009-09-22 22:58:42 +0200266 long rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700267
Heiko Carstens3e86a8c2009-09-22 22:58:42 +0200268 filename = getname(name);
269 rc = PTR_ERR(filename);
270 if (IS_ERR(filename))
271 return rc;
272 rc = do_execve(filename, argv, envp, regs);
273 if (rc)
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200274 goto out;
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200275 execve_tail();
Heiko Carstens3e86a8c2009-09-22 22:58:42 +0200276 rc = regs->gprs[2];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700277out:
Heiko Carstens3e86a8c2009-09-22 22:58:42 +0200278 putname(filename);
279 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700280}
281
Linus Torvalds1da177e2005-04-16 15:20:36 -0700282/*
283 * fill in the FPU structure for a core dump.
284 */
285int dump_fpu (struct pt_regs * regs, s390_fp_regs *fpregs)
286{
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800287#ifndef CONFIG_64BIT
Heiko Carstenscbdc2292009-03-26 15:23:52 +0100288 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700289 * save fprs to current->thread.fp_regs to merge them with
290 * the emulated registers and then copy the result to the dump.
291 */
292 save_fp_regs(&current->thread.fp_regs);
293 memcpy(fpregs, &current->thread.fp_regs, sizeof(s390_fp_regs));
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800294#else /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700295 save_fp_regs(fpregs);
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800296#endif /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 return 1;
298}
Heiko Carstens1485c5c2009-03-26 15:24:04 +0100299EXPORT_SYMBOL(dump_fpu);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700300
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301unsigned long get_wchan(struct task_struct *p)
302{
303 struct stack_frame *sf, *low, *high;
304 unsigned long return_address;
305 int count;
306
Al Viro30af7122006-01-12 01:05:50 -0800307 if (!p || p == current || p->state == TASK_RUNNING || !task_stack_page(p))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700308 return 0;
Al Viro30af7122006-01-12 01:05:50 -0800309 low = task_stack_page(p);
310 high = (struct stack_frame *) task_pt_regs(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311 sf = (struct stack_frame *) (p->thread.ksp & PSW_ADDR_INSN);
312 if (sf <= low || sf > high)
313 return 0;
314 for (count = 0; count < 16; count++) {
315 sf = (struct stack_frame *) (sf->back_chain & PSW_ADDR_INSN);
316 if (sf <= low || sf > high)
317 return 0;
318 return_address = sf->gprs[8] & PSW_ADDR_INSN;
319 if (!in_sched_functions(return_address))
320 return return_address;
321 }
322 return 0;
323}
Heiko Carstens9887a1f2011-01-12 09:55:28 +0100324
325unsigned long arch_align_stack(unsigned long sp)
326{
327 if (!(current->personality & ADDR_NO_RANDOMIZE) && randomize_va_space)
328 sp -= get_random_int() & ~PAGE_MASK;
329 return sp & ~0xf;
330}
Heiko Carstens33519182011-01-12 09:55:30 +0100331
332static inline unsigned long brk_rnd(void)
333{
334 /* 8MB for 32bit, 1GB for 64bit */
335 if (is_32bit_task())
336 return (get_random_int() & 0x7ffUL) << PAGE_SHIFT;
337 else
338 return (get_random_int() & 0x3ffffUL) << PAGE_SHIFT;
339}
340
341unsigned long arch_randomize_brk(struct mm_struct *mm)
342{
343 unsigned long ret = PAGE_ALIGN(mm->brk + brk_rnd());
344
345 if (ret < mm->brk)
346 return mm->brk;
347 return ret;
348}
Heiko Carstensd2c9dfc2011-01-12 09:55:31 +0100349
350unsigned long randomize_et_dyn(unsigned long base)
351{
352 unsigned long ret = PAGE_ALIGN(base + brk_rnd());
353
354 if (!(current->flags & PF_RANDOMIZE))
355 return base;
356 if (ret < base)
357 return base;
358 return ret;
359}