blob: 6c34f14708a958ac622b74eca22eff0ecd35b5db [file] [log] [blame]
/*
 * Copyright (C) 2002 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
 * Licensed under the GPL
 */
5
6#include <stdlib.h>
Gennady Sharapovabaf6972006-01-18 17:42:46 -08007#include <unistd.h>
Gennady Sharapovabaf6972006-01-18 17:42:46 -08008#include <sched.h>
Jeff Dikeba180fd2007-10-16 01:27:00 -07009#include <errno.h>
10#include <string.h>
Gennady Sharapovabaf6972006-01-18 17:42:46 -080011#include <sys/mman.h>
Jeff Dikeba180fd2007-10-16 01:27:00 -070012#include <sys/ptrace.h>
13#include <sys/wait.h>
14#include <asm/unistd.h>
Jeff Dike16dd07b2007-05-06 14:51:48 -070015#include "as-layout.h"
Al Viro510c72a32011-08-18 20:08:29 +010016#include "init.h"
Jeff Dikeedea1382008-02-04 22:30:46 -080017#include "kern_util.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070018#include "mem.h"
19#include "os.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070020#include "proc_mm.h"
21#include "ptrace_user.h"
22#include "registers.h"
23#include "skas.h"
24#include "skas_ptrace.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070025#include "sysdep/stub.h"
Gennady Sharapovabaf6972006-01-18 17:42:46 -080026
/*
 * Report whether @pid equals the process group ID of the calling process.
 *
 * @fd and @data are accepted but not examined by this function.
 *
 * Returns 1 when @pid matches getpgrp(), 0 otherwise.
 */
int is_skas_winch(int pid, int fd, void *data)
{
	const int own_pgrp = getpgrp();

	return (own_pgrp == pid) ? 1 : 0;
}
31
Jeff Dikef30c2c92007-05-06 14:51:29 -070032static int ptrace_dump_regs(int pid)
33{
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080034 unsigned long regs[MAX_REG_NR];
35 int i;
Jeff Dikef30c2c92007-05-06 14:51:29 -070036
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080037 if (ptrace(PTRACE_GETREGS, pid, 0, regs) < 0)
38 return -errno;
Jeff Dikeba180fd2007-10-16 01:27:00 -070039
40 printk(UM_KERN_ERR "Stub registers -\n");
41 for (i = 0; i < ARRAY_SIZE(regs); i++)
42 printk(UM_KERN_ERR "\t%d - %lx\n", i, regs[i]);
Jeff Dikef30c2c92007-05-06 14:51:29 -070043
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080044 return 0;
Jeff Dikef30c2c92007-05-06 14:51:29 -070045}
46
/*
 * Bit mask (one bit per signal number) of the stop signals that are
 * harmless while the stub runs - on any of them the stub is simply
 * continued.  SIGWINCH will happen when UML is inside a detached screen.
 */
#define STUB_SIG_MASK ((1 << (SIGWINCH)) | (1 << (SIGVTALRM)))

/*
 * Bit mask of the signals the stub finishes with.  Stopping with anything
 * that is in neither mask is treated as an error.
 */
#define STUB_DONE_MASK (1 << (SIGTRAP))
Jeff Dike16dd07b2007-05-06 14:51:48 -070055
56void wait_stub_done(int pid)
Gennady Sharapovabaf6972006-01-18 17:42:46 -080057{
58 int n, status, err;
59
Jeff Dikeba180fd2007-10-16 01:27:00 -070060 while (1) {
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -080061 CATCH_EINTR(n = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dikeba180fd2007-10-16 01:27:00 -070062 if ((n < 0) || !WIFSTOPPED(status))
Jeff Dike16dd07b2007-05-06 14:51:48 -070063 goto bad_wait;
Gennady Sharapovabaf6972006-01-18 17:42:46 -080064
Jeff Dikeba180fd2007-10-16 01:27:00 -070065 if (((1 << WSTOPSIG(status)) & STUB_SIG_MASK) == 0)
Jeff Dike16dd07b2007-05-06 14:51:48 -070066 break;
67
68 err = ptrace(PTRACE_CONT, pid, 0, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080069 if (err) {
70 printk(UM_KERN_ERR "wait_stub_done : continue failed, "
71 "errno = %d\n", errno);
72 fatal_sigsegv();
73 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -080074 }
Jeff Dike16dd07b2007-05-06 14:51:48 -070075
Jeff Dikeba180fd2007-10-16 01:27:00 -070076 if (((1 << WSTOPSIG(status)) & STUB_DONE_MASK) != 0)
Jeff Dike16dd07b2007-05-06 14:51:48 -070077 return;
78
79bad_wait:
80 err = ptrace_dump_regs(pid);
Jeff Dikeba180fd2007-10-16 01:27:00 -070081 if (err)
82 printk(UM_KERN_ERR "Failed to get registers from stub, "
83 "errno = %d\n", -err);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080084 printk(UM_KERN_ERR "wait_stub_done : failed to wait for SIGTRAP, "
85 "pid = %d, n = %d, errno = %d, status = 0x%x\n", pid, n, errno,
86 status);
87 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -080088}
89
90extern unsigned long current_stub_stack(void);
91
WANG Cong99764fa2008-07-23 21:28:49 -070092static void get_skas_faultinfo(int pid, struct faultinfo *fi)
Gennady Sharapovabaf6972006-01-18 17:42:46 -080093{
94 int err;
95
Jeff Dikeba180fd2007-10-16 01:27:00 -070096 if (ptrace_faultinfo) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -080097 err = ptrace(PTRACE_FAULTINFO, pid, 0, fi);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080098 if (err) {
99 printk(UM_KERN_ERR "get_skas_faultinfo - "
100 "PTRACE_FAULTINFO failed, errno = %d\n", errno);
101 fatal_sigsegv();
102 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800103
104 /* Special handling for i386, which has different structs */
105 if (sizeof(struct ptrace_faultinfo) < sizeof(struct faultinfo))
106 memset((char *)fi + sizeof(struct ptrace_faultinfo), 0,
107 sizeof(struct faultinfo) -
108 sizeof(struct ptrace_faultinfo));
109 }
110 else {
Jeff Dike2f56deb2008-02-23 15:23:49 -0800111 unsigned long fpregs[FP_SIZE];
112
113 err = get_fp_registers(pid, fpregs);
114 if (err < 0) {
115 printk(UM_KERN_ERR "save_fp_registers returned %d\n",
116 err);
117 fatal_sigsegv();
118 }
Jeff Dike16dd07b2007-05-06 14:51:48 -0700119 err = ptrace(PTRACE_CONT, pid, 0, SIGSEGV);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800120 if (err) {
121 printk(UM_KERN_ERR "Failed to continue stub, pid = %d, "
122 "errno = %d\n", pid, errno);
123 fatal_sigsegv();
124 }
Jeff Dike16dd07b2007-05-06 14:51:48 -0700125 wait_stub_done(pid);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800126
Jeff Dikeba180fd2007-10-16 01:27:00 -0700127 /*
128 * faultinfo is prepared by the stub-segv-handler at start of
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800129 * the stub stack page. We just have to copy it.
130 */
131 memcpy(fi, (void *)current_stub_stack(), sizeof(*fi));
Jeff Dike2f56deb2008-02-23 15:23:49 -0800132
133 err = put_fp_registers(pid, fpregs);
134 if (err < 0) {
135 printk(UM_KERN_ERR "put_fp_registers returned %d\n",
136 err);
137 fatal_sigsegv();
138 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800139 }
140}
141
Jeff Dike77bf4402007-10-16 01:26:58 -0700142static void handle_segv(int pid, struct uml_pt_regs * regs)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800143{
Jeff Dike77bf4402007-10-16 01:26:58 -0700144 get_skas_faultinfo(pid, &regs->faultinfo);
145 segv(regs->faultinfo, 0, 1, NULL);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800146}
147
Jeff Dikeba180fd2007-10-16 01:27:00 -0700148/*
149 * To use the same value of using_sysemu as the caller, ask it that value
150 * (in local_using_sysemu
151 */
152static void handle_trap(int pid, struct uml_pt_regs *regs,
153 int local_using_sysemu)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800154{
155 int err, status;
156
Jeff Dikee06173b2008-02-04 22:31:12 -0800157 if ((UPT_IP(regs) >= STUB_START) && (UPT_IP(regs) < STUB_END))
158 fatal_sigsegv();
159
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800160 /* Mark this as a syscall */
Jeff Dike18baddd2007-10-16 01:27:07 -0700161 UPT_SYSCALL_NR(regs) = PT_SYSCALL_NR(regs->gp);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800162
163 if (!local_using_sysemu)
164 {
165 err = ptrace(PTRACE_POKEUSR, pid, PT_SYSCALL_NR_OFFSET,
166 __NR_getpid);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800167 if (err < 0) {
168 printk(UM_KERN_ERR "handle_trap - nullifying syscall "
169 "failed, errno = %d\n", errno);
170 fatal_sigsegv();
171 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800172
Jeff Dikeba180fd2007-10-16 01:27:00 -0700173 err = ptrace(PTRACE_SYSCALL, pid, 0, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800174 if (err < 0) {
175 printk(UM_KERN_ERR "handle_trap - continuing to end of "
176 "syscall failed, errno = %d\n", errno);
177 fatal_sigsegv();
178 }
Jeff Dikeba180fd2007-10-16 01:27:00 -0700179
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800180 CATCH_EINTR(err = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dikeba180fd2007-10-16 01:27:00 -0700181 if ((err < 0) || !WIFSTOPPED(status) ||
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800182 (WSTOPSIG(status) != SIGTRAP + 0x80)) {
183 err = ptrace_dump_regs(pid);
184 if (err)
185 printk(UM_KERN_ERR "Failed to get registers "
Jeff Dikeba180fd2007-10-16 01:27:00 -0700186 "from process, errno = %d\n", -err);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800187 printk(UM_KERN_ERR "handle_trap - failed to wait at "
188 "end of syscall, errno = %d, status = %d\n",
189 errno, status);
190 fatal_sigsegv();
191 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800192 }
193
194 handle_syscall(regs);
195}
196
197extern int __syscall_stub_start;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800198
199static int userspace_tramp(void *stack)
200{
201 void *addr;
Jeff Dike537ae942006-09-25 23:33:05 -0700202 int err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800203
204 ptrace(PTRACE_TRACEME, 0, 0, 0);
205
Lepton Wua24864a2007-10-16 01:27:35 -0700206 signal(SIGTERM, SIG_DFL);
Jeff Dikeee3d9bd2008-02-04 22:30:56 -0800207 signal(SIGWINCH, SIG_IGN);
Jeff Dikea2f018b2007-10-16 01:27:22 -0700208 err = set_interval();
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800209 if (err) {
210 printk(UM_KERN_ERR "userspace_tramp - setting timer failed, "
211 "errno = %d\n", err);
212 exit(1);
213 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800214
Jeff Dikeba180fd2007-10-16 01:27:00 -0700215 if (!proc_mm) {
216 /*
217 * This has a pte, but it can't be mapped in with the usual
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800218 * tlb_flush mechanism because this is part of that mechanism
219 */
Jeff Dike09ee0112006-01-18 17:42:48 -0800220 int fd;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700221 unsigned long long offset;
Jeff Dike09ee0112006-01-18 17:42:48 -0800222 fd = phys_mapping(to_phys(&__syscall_stub_start), &offset);
Jeff Dike54ae36f2007-10-16 01:27:33 -0700223 addr = mmap64((void *) STUB_CODE, UM_KERN_PAGE_SIZE,
Jeff Dike09ee0112006-01-18 17:42:48 -0800224 PROT_EXEC, MAP_FIXED | MAP_PRIVATE, fd, offset);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700225 if (addr == MAP_FAILED) {
Jeff Dike54ae36f2007-10-16 01:27:33 -0700226 printk(UM_KERN_ERR "mapping mmap stub at 0x%lx failed, "
227 "errno = %d\n", STUB_CODE, errno);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800228 exit(1);
229 }
230
Jeff Dikeba180fd2007-10-16 01:27:00 -0700231 if (stack != NULL) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800232 fd = phys_mapping(to_phys(stack), &offset);
Jeff Dike54ae36f2007-10-16 01:27:33 -0700233 addr = mmap((void *) STUB_DATA,
Jeff Dike1ffb9162007-05-06 14:51:22 -0700234 UM_KERN_PAGE_SIZE, PROT_READ | PROT_WRITE,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800235 MAP_FIXED | MAP_SHARED, fd, offset);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700236 if (addr == MAP_FAILED) {
237 printk(UM_KERN_ERR "mapping segfault stack "
Jeff Dike54ae36f2007-10-16 01:27:33 -0700238 "at 0x%lx failed, errno = %d\n",
239 STUB_DATA, errno);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800240 exit(1);
241 }
242 }
243 }
Jeff Dikeba180fd2007-10-16 01:27:00 -0700244 if (!ptrace_faultinfo && (stack != NULL)) {
Jeff Dike4b84c692006-09-25 23:33:04 -0700245 struct sigaction sa;
246
Jeff Dike54ae36f2007-10-16 01:27:33 -0700247 unsigned long v = STUB_CODE +
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800248 (unsigned long) stub_segv_handler -
249 (unsigned long) &__syscall_stub_start;
250
Jeff Dike54ae36f2007-10-16 01:27:33 -0700251 set_sigstack((void *) STUB_DATA, UM_KERN_PAGE_SIZE);
Jeff Dike4b84c692006-09-25 23:33:04 -0700252 sigemptyset(&sa.sa_mask);
Al Viro9b25fcb2011-08-18 20:04:09 +0100253 sa.sa_flags = SA_ONSTACK | SA_NODEFER | SA_SIGINFO;
254 sa.sa_sigaction = (void *) v;
Jeff Dike4b84c692006-09-25 23:33:04 -0700255 sa.sa_restorer = NULL;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800256 if (sigaction(SIGSEGV, &sa, NULL) < 0) {
257 printk(UM_KERN_ERR "userspace_tramp - setting SIGSEGV "
258 "handler failed - errno = %d\n", errno);
259 exit(1);
260 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800261 }
262
Jeff Dike512b6fb2007-10-16 01:27:11 -0700263 kill(os_getpid(), SIGSTOP);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700264 return 0;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800265}
266
/*
 * One slot per CPU, and NR_CPUS is pinned to 1 here.  Each element is set
 * once, and only accessed by a single processor anyway.
 */
#undef NR_CPUS
#define NR_CPUS 1

int userspace_pid[NR_CPUS];
271
272int start_userspace(unsigned long stub_stack)
273{
274 void *stack;
275 unsigned long sp;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800276 int pid, status, n, flags, err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800277
Jeff Dikec539ab72007-06-16 10:16:09 -0700278 stack = mmap(NULL, UM_KERN_PAGE_SIZE,
279 PROT_READ | PROT_WRITE | PROT_EXEC,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800280 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800281 if (stack == MAP_FAILED) {
282 err = -errno;
283 printk(UM_KERN_ERR "start_userspace : mmap failed, "
Jeff Dikeb5498832008-02-04 22:31:21 -0800284 "errno = %d\n", errno);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800285 return err;
286 }
287
Jeff Dikec539ab72007-06-16 10:16:09 -0700288 sp = (unsigned long) stack + UM_KERN_PAGE_SIZE - sizeof(void *);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800289
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800290 flags = CLONE_FILES;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700291 if (proc_mm)
292 flags |= CLONE_VM;
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800293 else
294 flags |= SIGCHLD;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700295
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800296 pid = clone(userspace_tramp, (void *) sp, flags, (void *) stub_stack);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800297 if (pid < 0) {
298 err = -errno;
299 printk(UM_KERN_ERR "start_userspace : clone failed, "
Jeff Dikeb5498832008-02-04 22:31:21 -0800300 "errno = %d\n", errno);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800301 return err;
302 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800303
304 do {
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800305 CATCH_EINTR(n = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800306 if (n < 0) {
307 err = -errno;
308 printk(UM_KERN_ERR "start_userspace : wait failed, "
Jeff Dikeb5498832008-02-04 22:31:21 -0800309 "errno = %d\n", errno);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800310 goto out_kill;
311 }
Jeff Dikeba180fd2007-10-16 01:27:00 -0700312 } while (WIFSTOPPED(status) && (WSTOPSIG(status) == SIGVTALRM));
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800313
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800314 if (!WIFSTOPPED(status) || (WSTOPSIG(status) != SIGSTOP)) {
315 err = -EINVAL;
316 printk(UM_KERN_ERR "start_userspace : expected SIGSTOP, got "
Jeff Dikeb5498832008-02-04 22:31:21 -0800317 "status = %d\n", status);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800318 goto out_kill;
319 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800320
Jeff Dikeba180fd2007-10-16 01:27:00 -0700321 if (ptrace(PTRACE_OLDSETOPTIONS, pid, NULL,
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800322 (void *) PTRACE_O_TRACESYSGOOD) < 0) {
323 err = -errno;
324 printk(UM_KERN_ERR "start_userspace : PTRACE_OLDSETOPTIONS "
325 "failed, errno = %d\n", errno);
326 goto out_kill;
327 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800328
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800329 if (munmap(stack, UM_KERN_PAGE_SIZE) < 0) {
330 err = -errno;
331 printk(UM_KERN_ERR "start_userspace : munmap failed, "
332 "errno = %d\n", errno);
333 goto out_kill;
334 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800335
Jeff Dikeba180fd2007-10-16 01:27:00 -0700336 return pid;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800337
338 out_kill:
339 os_kill_ptraced_process(pid, 1);
340 return err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800341}
342
Jeff Dike77bf4402007-10-16 01:26:58 -0700343void userspace(struct uml_pt_regs *regs)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800344{
Jeff Diked2753a6d2007-10-16 01:27:25 -0700345 struct itimerval timer;
346 unsigned long long nsecs, now;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800347 int err, status, op, pid = userspace_pid[0];
Jeff Dike2ea5bc52007-05-10 22:22:32 -0700348 /* To prevent races if using_sysemu changes under us.*/
349 int local_using_sysemu;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800350
Jeff Diked2753a6d2007-10-16 01:27:25 -0700351 if (getitimer(ITIMER_VIRTUAL, &timer))
Jeff Dike5134d8f2008-02-08 04:22:08 -0800352 printk(UM_KERN_ERR "Failed to get itimer, errno = %d\n", errno);
Jeff Dike1a805212007-10-16 01:27:28 -0700353 nsecs = timer.it_value.tv_sec * UM_NSEC_PER_SEC +
354 timer.it_value.tv_usec * UM_NSEC_PER_USEC;
Jeff Diked2753a6d2007-10-16 01:27:25 -0700355 nsecs += os_nsecs();
356
Jeff Dikeba180fd2007-10-16 01:27:00 -0700357 while (1) {
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800358 /*
359 * This can legitimately fail if the process loads a
360 * bogus value into a segment register. It will
361 * segfault and PTRACE_GETREGS will read that value
362 * out of the process. However, PTRACE_SETREGS will
363 * fail. In this case, there is nothing to do but
364 * just kill the process.
365 */
Jeff Diked25f2e12008-02-04 22:30:57 -0800366 if (ptrace(PTRACE_SETREGS, pid, 0, regs->gp))
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800367 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800368
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700369 if (put_fp_registers(pid, regs->fp))
370 fatal_sigsegv();
371
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800372 /* Now we set local_using_sysemu to be used for one loop */
373 local_using_sysemu = get_using_sysemu();
374
Jeff Dike2ea5bc52007-05-10 22:22:32 -0700375 op = SELECT_PTRACE_OPERATION(local_using_sysemu,
376 singlestepping(NULL));
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800377
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800378 if (ptrace(op, pid, 0, 0)) {
379 printk(UM_KERN_ERR "userspace - ptrace continue "
380 "failed, op = %d, errno = %d\n", op, errno);
381 fatal_sigsegv();
382 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800383
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800384 CATCH_EINTR(err = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800385 if (err < 0) {
386 printk(UM_KERN_ERR "userspace - wait failed, "
387 "errno = %d\n", errno);
388 fatal_sigsegv();
389 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800390
Jeff Dike77bf4402007-10-16 01:26:58 -0700391 regs->is_user = 1;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800392 if (ptrace(PTRACE_GETREGS, pid, 0, regs->gp)) {
393 printk(UM_KERN_ERR "userspace - PTRACE_GETREGS failed, "
394 "errno = %d\n", errno);
395 fatal_sigsegv();
396 }
Jeff Diked25f2e12008-02-04 22:30:57 -0800397
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700398 if (get_fp_registers(pid, regs->fp)) {
399 printk(UM_KERN_ERR "userspace - get_fp_registers failed, "
400 "errno = %d\n", errno);
401 fatal_sigsegv();
402 }
403
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800404 UPT_SYSCALL_NR(regs) = -1; /* Assume: It's not a syscall */
405
Jeff Dikeba180fd2007-10-16 01:27:00 -0700406 if (WIFSTOPPED(status)) {
Jeff Dike16dd07b2007-05-06 14:51:48 -0700407 int sig = WSTOPSIG(status);
Jeff Dike5134d8f2008-02-08 04:22:08 -0800408 switch (sig) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800409 case SIGSEGV:
Jeff Dikeba180fd2007-10-16 01:27:00 -0700410 if (PTRACE_FULL_FAULTINFO ||
411 !ptrace_faultinfo) {
412 get_skas_faultinfo(pid,
413 &regs->faultinfo);
Jeff Dike16dd07b2007-05-06 14:51:48 -0700414 (*sig_info[SIGSEGV])(SIGSEGV, regs);
415 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800416 else handle_segv(pid, regs);
417 break;
418 case SIGTRAP + 0x80:
419 handle_trap(pid, regs, local_using_sysemu);
420 break;
421 case SIGTRAP:
422 relay_signal(SIGTRAP, regs);
423 break;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800424 case SIGVTALRM:
Jeff Diked2753a6d2007-10-16 01:27:25 -0700425 now = os_nsecs();
Jeff Diked25f2e12008-02-04 22:30:57 -0800426 if (now < nsecs)
Jeff Diked2753a6d2007-10-16 01:27:25 -0700427 break;
428 block_signals();
429 (*sig_info[sig])(sig, regs);
430 unblock_signals();
Jeff Dike1a805212007-10-16 01:27:28 -0700431 nsecs = timer.it_value.tv_sec *
432 UM_NSEC_PER_SEC +
433 timer.it_value.tv_usec *
434 UM_NSEC_PER_USEC;
Jeff Diked2753a6d2007-10-16 01:27:25 -0700435 nsecs += os_nsecs();
436 break;
437 case SIGIO:
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800438 case SIGILL:
439 case SIGBUS:
440 case SIGFPE:
441 case SIGWINCH:
Jeff Dike16dd07b2007-05-06 14:51:48 -0700442 block_signals();
443 (*sig_info[sig])(sig, regs);
444 unblock_signals();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800445 break;
446 default:
Jeff Dike96cee302008-05-12 14:01:48 -0700447 printk(UM_KERN_ERR "userspace - child stopped "
Jeff Dikeba180fd2007-10-16 01:27:00 -0700448 "with signal %d\n", sig);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800449 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800450 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800451 pid = userspace_pid[0];
452 interrupt_end();
453
454 /* Avoid -ERESTARTSYS handling in host */
Jeff Dikeba180fd2007-10-16 01:27:00 -0700455 if (PT_SYSCALL_NR_OFFSET != PT_SYSCALL_RET_OFFSET)
Jeff Dike18baddd2007-10-16 01:27:07 -0700456 PT_SYSCALL_NR(regs->gp) = -1;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800457 }
458 }
459}
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800460
Jeff Dike16dd07b2007-05-06 14:51:48 -0700461static unsigned long thread_regs[MAX_REG_NR];
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700462static unsigned long thread_fp_regs[FP_SIZE];
Jeff Dike16dd07b2007-05-06 14:51:48 -0700463
464static int __init init_thread_regs(void)
465{
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700466 get_safe_registers(thread_regs, thread_fp_regs);
Jeff Dike16dd07b2007-05-06 14:51:48 -0700467 /* Set parent's instruction pointer to start of clone-stub */
Jeff Dike54ae36f2007-10-16 01:27:33 -0700468 thread_regs[REGS_IP_INDEX] = STUB_CODE +
Jeff Dike16dd07b2007-05-06 14:51:48 -0700469 (unsigned long) stub_clone_handler -
470 (unsigned long) &__syscall_stub_start;
Jeff Dike54ae36f2007-10-16 01:27:33 -0700471 thread_regs[REGS_SP_INDEX] = STUB_DATA + UM_KERN_PAGE_SIZE -
Jeff Dike16dd07b2007-05-06 14:51:48 -0700472 sizeof(void *);
473#ifdef __SIGNAL_FRAMESIZE
474 thread_regs[REGS_SP_INDEX] -= __SIGNAL_FRAMESIZE;
475#endif
476 return 0;
477}
478
479__initcall(init_thread_regs);
480
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800481int copy_context_skas0(unsigned long new_stack, int pid)
482{
Jeff Dike1a805212007-10-16 01:27:28 -0700483 struct timeval tv = { .tv_sec = 0, .tv_usec = UM_USEC_PER_SEC / UM_HZ };
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800484 int err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800485 unsigned long current_stack = current_stub_stack();
486 struct stub_data *data = (struct stub_data *) current_stack;
487 struct stub_data *child_data = (struct stub_data *) new_stack;
Jeff Dike0a7675a2007-10-16 01:27:05 -0700488 unsigned long long new_offset;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800489 int new_fd = phys_mapping(to_phys((void *)new_stack), &new_offset);
490
Jeff Dikeba180fd2007-10-16 01:27:00 -0700491 /*
492 * prepare offset and fd of child's stack as argument for parent's
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800493 * and child's mmap2 calls
494 */
495 *data = ((struct stub_data) { .offset = MMAP_OFFSET(new_offset),
496 .fd = new_fd,
497 .timer = ((struct itimerval)
Jeff Diked2753a6d2007-10-16 01:27:25 -0700498 { .it_value = tv,
499 .it_interval = tv }) });
500
Jeff Dike16dd07b2007-05-06 14:51:48 -0700501 err = ptrace_setregs(pid, thread_regs);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800502 if (err < 0) {
503 err = -errno;
504 printk(UM_KERN_ERR "copy_context_skas0 : PTRACE_SETREGS "
505 "failed, pid = %d, errno = %d\n", pid, -err);
506 return err;
507 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800508
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700509 err = put_fp_registers(pid, thread_fp_regs);
510 if (err < 0) {
511 printk(UM_KERN_ERR "copy_context_skas0 : put_fp_registers "
512 "failed, pid = %d, err = %d\n", pid, err);
513 return err;
514 }
515
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800516 /* set a well known return code for detection of child write failure */
517 child_data->err = 12345678;
518
Jeff Dikeba180fd2007-10-16 01:27:00 -0700519 /*
520 * Wait, until parent has finished its work: read child's pid from
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800521 * parent's stack, and check, if bad result.
522 */
Jeff Dike16dd07b2007-05-06 14:51:48 -0700523 err = ptrace(PTRACE_CONT, pid, 0, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800524 if (err) {
525 err = -errno;
526 printk(UM_KERN_ERR "Failed to continue new process, pid = %d, "
527 "errno = %d\n", pid, errno);
528 return err;
529 }
530
Jeff Dike16dd07b2007-05-06 14:51:48 -0700531 wait_stub_done(pid);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800532
533 pid = data->err;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800534 if (pid < 0) {
535 printk(UM_KERN_ERR "copy_context_skas0 - stub-parent reports "
536 "error %d\n", -pid);
537 return pid;
538 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800539
Jeff Dikeba180fd2007-10-16 01:27:00 -0700540 /*
541 * Wait, until child has finished too: read child's result from
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800542 * child's stack and check it.
543 */
Jeff Dike16dd07b2007-05-06 14:51:48 -0700544 wait_stub_done(pid);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800545 if (child_data->err != STUB_DATA) {
546 printk(UM_KERN_ERR "copy_context_skas0 - stub-child reports "
547 "error %ld\n", child_data->err);
548 err = child_data->err;
549 goto out_kill;
550 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800551
552 if (ptrace(PTRACE_OLDSETOPTIONS, pid, NULL,
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800553 (void *)PTRACE_O_TRACESYSGOOD) < 0) {
554 err = -errno;
555 printk(UM_KERN_ERR "copy_context_skas0 : PTRACE_OLDSETOPTIONS "
556 "failed, errno = %d\n", errno);
557 goto out_kill;
558 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800559
560 return pid;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800561
562 out_kill:
563 os_kill_ptraced_process(pid, 1);
564 return err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800565}
566
567/*
568 * This is used only, if stub pages are needed, while proc_mm is
Jeff Dikeef0470c2007-05-06 14:51:33 -0700569 * available. Opening /proc/mm creates a new mm_context, which lacks
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800570 * the stub-pages. Thus, we map them using /proc/mm-fd
571 */
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800572int map_stub_pages(int fd, unsigned long code, unsigned long data,
573 unsigned long stack)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800574{
575 struct proc_mm_op mmop;
576 int n;
Jeff Dike0a7675a2007-10-16 01:27:05 -0700577 unsigned long long code_offset;
Jeff Dike09ee0112006-01-18 17:42:48 -0800578 int code_fd = phys_mapping(to_phys((void *) &__syscall_stub_start),
579 &code_offset);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800580
581 mmop = ((struct proc_mm_op) { .op = MM_MMAP,
582 .u =
583 { .mmap =
584 { .addr = code,
Jeff Dikec539ab72007-06-16 10:16:09 -0700585 .len = UM_KERN_PAGE_SIZE,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800586 .prot = PROT_EXEC,
587 .flags = MAP_FIXED | MAP_PRIVATE,
Jeff Dike09ee0112006-01-18 17:42:48 -0800588 .fd = code_fd,
589 .offset = code_offset
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800590 } } });
Jeff Dikea61f3342007-05-06 14:51:35 -0700591 CATCH_EINTR(n = write(fd, &mmop, sizeof(mmop)));
Jeff Dikeba180fd2007-10-16 01:27:00 -0700592 if (n != sizeof(mmop)) {
Jeff Dikea61f3342007-05-06 14:51:35 -0700593 n = errno;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700594 printk(UM_KERN_ERR "mmap args - addr = 0x%lx, fd = %d, "
595 "offset = %llx\n", code, code_fd,
596 (unsigned long long) code_offset);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800597 printk(UM_KERN_ERR "map_stub_pages : /proc/mm map for code "
598 "failed, err = %d\n", n);
599 return -n;
Jeff Dikeb4cf95c2007-03-06 01:42:19 -0800600 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800601
Jeff Dikeba180fd2007-10-16 01:27:00 -0700602 if (stack) {
Jeff Dike0a7675a2007-10-16 01:27:05 -0700603 unsigned long long map_offset;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800604 int map_fd = phys_mapping(to_phys((void *)stack), &map_offset);
605 mmop = ((struct proc_mm_op)
606 { .op = MM_MMAP,
607 .u =
608 { .mmap =
609 { .addr = data,
Jeff Dikec539ab72007-06-16 10:16:09 -0700610 .len = UM_KERN_PAGE_SIZE,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800611 .prot = PROT_READ | PROT_WRITE,
612 .flags = MAP_FIXED | MAP_SHARED,
613 .fd = map_fd,
614 .offset = map_offset
615 } } });
Jeff Dikea61f3342007-05-06 14:51:35 -0700616 CATCH_EINTR(n = write(fd, &mmop, sizeof(mmop)));
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800617 if (n != sizeof(mmop)) {
618 n = errno;
619 printk(UM_KERN_ERR "map_stub_pages : /proc/mm map for "
620 "data failed, err = %d\n", n);
621 return -n;
622 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800623 }
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800624
625 return 0;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800626}
627
Jeff Dike3c917352006-09-27 01:50:40 -0700628void new_thread(void *stack, jmp_buf *buf, void (*handler)(void))
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800629{
Jeff Dike3c917352006-09-27 01:50:40 -0700630 (*buf)[0].JB_IP = (unsigned long) handler;
Jeff Dikee1a79c42007-05-10 22:22:31 -0700631 (*buf)[0].JB_SP = (unsigned long) stack + UM_THREAD_SIZE -
632 sizeof(void *);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800633}
634
/*
 * Values delivered through initial_jmpbuf; start_idle_thread() switches on
 * them.  INIT_JMP_NEW_THREAD is 0, i.e. the value of the direct setjmp
 * return.
 */
enum {
	INIT_JMP_NEW_THREAD	= 0,
	INIT_JMP_CALLBACK	= 1,
	INIT_JMP_HALT		= 2,
	INIT_JMP_REBOOT		= 3
};
Jeff Dikee2216fe2006-02-07 12:58:43 -0800639
/*
 * Save the current context in @me and jump to the context stored in @you.
 * Returns once something later jumps back to @me.
 */
void switch_threads(jmp_buf *me, jmp_buf *you)
{
	/* A non-zero result means we were just resumed: nothing more to do. */
	if (UML_SETJMP(me) != 0)
		return;

	UML_LONGJMP(you, 1);
}
645
Jeff Dikead28e0292006-04-18 22:21:41 -0700646static jmp_buf initial_jmpbuf;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800647
648/* XXX Make these percpu */
649static void (*cb_proc)(void *arg);
650static void *cb_arg;
Jeff Dikead28e0292006-04-18 22:21:41 -0700651static jmp_buf *cb_back;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800652
Jeff Dike3c917352006-09-27 01:50:40 -0700653int start_idle_thread(void *stack, jmp_buf *switch_buf)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800654{
Jeff Dikea5df0d12006-07-14 00:24:02 -0700655 int n;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800656
Al Viro00361682011-08-18 20:04:39 +0100657 set_handler(SIGWINCH);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800658
Jeff Dike77f6af72007-05-06 14:51:40 -0700659 /*
660 * Can't use UML_SETJMP or UML_LONGJMP here because they save
661 * and restore signals, with the possible side-effect of
662 * trying to handle any signals which came when they were
663 * blocked, which can't be done on this stack.
664 * Signals must be blocked when jumping back here and restored
665 * after returning to the jumper.
666 */
667 n = setjmp(initial_jmpbuf);
Jeff Dike5134d8f2008-02-08 04:22:08 -0800668 switch (n) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800669 case INIT_JMP_NEW_THREAD:
Jeff Dike3c917352006-09-27 01:50:40 -0700670 (*switch_buf)[0].JB_IP = (unsigned long) new_thread_handler;
671 (*switch_buf)[0].JB_SP = (unsigned long) stack +
Jeff Dikee1a79c42007-05-10 22:22:31 -0700672 UM_THREAD_SIZE - sizeof(void *);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800673 break;
674 case INIT_JMP_CALLBACK:
675 (*cb_proc)(cb_arg);
Jeff Dike77f6af72007-05-06 14:51:40 -0700676 longjmp(*cb_back, 1);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800677 break;
678 case INIT_JMP_HALT:
679 kmalloc_ok = 0;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700680 return 0;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800681 case INIT_JMP_REBOOT:
682 kmalloc_ok = 0;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700683 return 1;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800684 default:
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800685 printk(UM_KERN_ERR "Bad sigsetjmp return in "
686 "start_idle_thread - %d\n", n);
687 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800688 }
Jeff Dike77f6af72007-05-06 14:51:40 -0700689 longjmp(*switch_buf, 1);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800690}
691
692void initial_thread_cb_skas(void (*proc)(void *), void *arg)
693{
Jeff Dikead28e0292006-04-18 22:21:41 -0700694 jmp_buf here;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800695
696 cb_proc = proc;
697 cb_arg = arg;
698 cb_back = &here;
699
700 block_signals();
Jeff Dikeba180fd2007-10-16 01:27:00 -0700701 if (UML_SETJMP(&here) == 0)
Jeff Dikead28e0292006-04-18 22:21:41 -0700702 UML_LONGJMP(&initial_jmpbuf, INIT_JMP_CALLBACK);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800703 unblock_signals();
704
705 cb_proc = NULL;
706 cb_arg = NULL;
707 cb_back = NULL;
708}
709
710void halt_skas(void)
711{
712 block_signals();
Jeff Dikead28e0292006-04-18 22:21:41 -0700713 UML_LONGJMP(&initial_jmpbuf, INIT_JMP_HALT);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800714}
715
716void reboot_skas(void)
717{
718 block_signals();
Jeff Dikead28e0292006-04-18 22:21:41 -0700719 UML_LONGJMP(&initial_jmpbuf, INIT_JMP_REBOOT);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800720}
721
Jeff Dike77bf4402007-10-16 01:26:58 -0700722void __switch_mm(struct mm_id *mm_idp)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800723{
724 int err;
725
Jeff Dike77bf4402007-10-16 01:26:58 -0700726 /* FIXME: need cpu pid in __switch_mm */
Jeff Dikeba180fd2007-10-16 01:27:00 -0700727 if (proc_mm) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800728 err = ptrace(PTRACE_SWITCH_MM, userspace_pid[0], 0,
729 mm_idp->u.mm_fd);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800730 if (err) {
731 printk(UM_KERN_ERR "__switch_mm - PTRACE_SWITCH_MM "
732 "failed, errno = %d\n", errno);
733 fatal_sigsegv();
734 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800735 }
736 else userspace_pid[0] = mm_idp->u.pid;
737}