blob: 2687f1f3a709b06ce5661763a86a12d8ca488a12 [file] [log] [blame]
/*
 * Copyright (C) 2002- 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com)
 * Licensed under the GPL
 */
5
6#include <stdlib.h>
Gennady Sharapovabaf6972006-01-18 17:42:46 -08007#include <unistd.h>
Gennady Sharapovabaf6972006-01-18 17:42:46 -08008#include <sched.h>
Jeff Dikeba180fd2007-10-16 01:27:00 -07009#include <errno.h>
10#include <string.h>
Gennady Sharapovabaf6972006-01-18 17:42:46 -080011#include <sys/mman.h>
Jeff Dikeba180fd2007-10-16 01:27:00 -070012#include <sys/wait.h>
13#include <asm/unistd.h>
Jeff Dike16dd07b2007-05-06 14:51:48 -070014#include "as-layout.h"
Al Viro510c72a32011-08-18 20:08:29 +010015#include "init.h"
Jeff Dikeedea1382008-02-04 22:30:46 -080016#include "kern_util.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070017#include "mem.h"
18#include "os.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070019#include "proc_mm.h"
20#include "ptrace_user.h"
21#include "registers.h"
22#include "skas.h"
23#include "skas_ptrace.h"
Jeff Dikeba180fd2007-10-16 01:27:00 -070024#include "sysdep/stub.h"
Gennady Sharapovabaf6972006-01-18 17:42:46 -080025
/*
 * Report whether pid equals the process group id of the calling process.
 * The fd and data arguments are accepted but not used.
 * Returns 1 on a match and 0 otherwise.
 */
int is_skas_winch(int pid, int fd, void *data)
{
	int own_pgrp = getpgrp();

	return pid == own_pgrp;
}
30
Jeff Dikef30c2c92007-05-06 14:51:29 -070031static int ptrace_dump_regs(int pid)
32{
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080033 unsigned long regs[MAX_REG_NR];
34 int i;
Jeff Dikef30c2c92007-05-06 14:51:29 -070035
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080036 if (ptrace(PTRACE_GETREGS, pid, 0, regs) < 0)
37 return -errno;
Jeff Dikeba180fd2007-10-16 01:27:00 -070038
39 printk(UM_KERN_ERR "Stub registers -\n");
40 for (i = 0; i < ARRAY_SIZE(regs); i++)
41 printk(UM_KERN_ERR "\t%d - %lx\n", i, regs[i]);
Jeff Dikef30c2c92007-05-06 14:51:29 -070042
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080043 return 0;
Jeff Dikef30c2c92007-05-06 14:51:29 -070044}
45
/*
 * Bitmask of signals that are OK to receive in the stub - the waiter just
 * continues it.  SIGWINCH will happen when UML is inside a detached screen.
 */
#define STUB_SIG_MASK ((1 << SIGWINCH) | (1 << SIGVTALRM))

/* Bitmask of signals the stub finishes with - anything else is an error */
#define STUB_DONE_MASK (1 << SIGTRAP)
Jeff Dike16dd07b2007-05-06 14:51:48 -070054
55void wait_stub_done(int pid)
Gennady Sharapovabaf6972006-01-18 17:42:46 -080056{
57 int n, status, err;
58
Jeff Dikeba180fd2007-10-16 01:27:00 -070059 while (1) {
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -080060 CATCH_EINTR(n = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dikeba180fd2007-10-16 01:27:00 -070061 if ((n < 0) || !WIFSTOPPED(status))
Jeff Dike16dd07b2007-05-06 14:51:48 -070062 goto bad_wait;
Gennady Sharapovabaf6972006-01-18 17:42:46 -080063
Jeff Dikeba180fd2007-10-16 01:27:00 -070064 if (((1 << WSTOPSIG(status)) & STUB_SIG_MASK) == 0)
Jeff Dike16dd07b2007-05-06 14:51:48 -070065 break;
66
67 err = ptrace(PTRACE_CONT, pid, 0, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080068 if (err) {
69 printk(UM_KERN_ERR "wait_stub_done : continue failed, "
70 "errno = %d\n", errno);
71 fatal_sigsegv();
72 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -080073 }
Jeff Dike16dd07b2007-05-06 14:51:48 -070074
Jeff Dikeba180fd2007-10-16 01:27:00 -070075 if (((1 << WSTOPSIG(status)) & STUB_DONE_MASK) != 0)
Jeff Dike16dd07b2007-05-06 14:51:48 -070076 return;
77
78bad_wait:
79 err = ptrace_dump_regs(pid);
Jeff Dikeba180fd2007-10-16 01:27:00 -070080 if (err)
81 printk(UM_KERN_ERR "Failed to get registers from stub, "
82 "errno = %d\n", -err);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080083 printk(UM_KERN_ERR "wait_stub_done : failed to wait for SIGTRAP, "
84 "pid = %d, n = %d, errno = %d, status = 0x%x\n", pid, n, errno,
85 status);
86 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -080087}
88
/* Defined outside this file; its result is used here as the stub stack address. */
unsigned long current_stub_stack(void);
90
WANG Cong99764fa2008-07-23 21:28:49 -070091static void get_skas_faultinfo(int pid, struct faultinfo *fi)
Gennady Sharapovabaf6972006-01-18 17:42:46 -080092{
93 int err;
94
Jeff Dikeba180fd2007-10-16 01:27:00 -070095 if (ptrace_faultinfo) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -080096 err = ptrace(PTRACE_FAULTINFO, pid, 0, fi);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -080097 if (err) {
98 printk(UM_KERN_ERR "get_skas_faultinfo - "
99 "PTRACE_FAULTINFO failed, errno = %d\n", errno);
100 fatal_sigsegv();
101 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800102
103 /* Special handling for i386, which has different structs */
104 if (sizeof(struct ptrace_faultinfo) < sizeof(struct faultinfo))
105 memset((char *)fi + sizeof(struct ptrace_faultinfo), 0,
106 sizeof(struct faultinfo) -
107 sizeof(struct ptrace_faultinfo));
108 }
109 else {
Jeff Dike2f56deb2008-02-23 15:23:49 -0800110 unsigned long fpregs[FP_SIZE];
111
112 err = get_fp_registers(pid, fpregs);
113 if (err < 0) {
114 printk(UM_KERN_ERR "save_fp_registers returned %d\n",
115 err);
116 fatal_sigsegv();
117 }
Jeff Dike16dd07b2007-05-06 14:51:48 -0700118 err = ptrace(PTRACE_CONT, pid, 0, SIGSEGV);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800119 if (err) {
120 printk(UM_KERN_ERR "Failed to continue stub, pid = %d, "
121 "errno = %d\n", pid, errno);
122 fatal_sigsegv();
123 }
Jeff Dike16dd07b2007-05-06 14:51:48 -0700124 wait_stub_done(pid);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800125
Jeff Dikeba180fd2007-10-16 01:27:00 -0700126 /*
127 * faultinfo is prepared by the stub-segv-handler at start of
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800128 * the stub stack page. We just have to copy it.
129 */
130 memcpy(fi, (void *)current_stub_stack(), sizeof(*fi));
Jeff Dike2f56deb2008-02-23 15:23:49 -0800131
132 err = put_fp_registers(pid, fpregs);
133 if (err < 0) {
134 printk(UM_KERN_ERR "put_fp_registers returned %d\n",
135 err);
136 fatal_sigsegv();
137 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800138 }
139}
140
Jeff Dike77bf4402007-10-16 01:26:58 -0700141static void handle_segv(int pid, struct uml_pt_regs * regs)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800142{
Jeff Dike77bf4402007-10-16 01:26:58 -0700143 get_skas_faultinfo(pid, &regs->faultinfo);
144 segv(regs->faultinfo, 0, 1, NULL);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800145}
146
Jeff Dikeba180fd2007-10-16 01:27:00 -0700147/*
148 * To use the same value of using_sysemu as the caller, ask it that value
149 * (in local_using_sysemu
150 */
151static void handle_trap(int pid, struct uml_pt_regs *regs,
152 int local_using_sysemu)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800153{
154 int err, status;
155
Jeff Dikee06173b2008-02-04 22:31:12 -0800156 if ((UPT_IP(regs) >= STUB_START) && (UPT_IP(regs) < STUB_END))
157 fatal_sigsegv();
158
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800159 /* Mark this as a syscall */
Jeff Dike18baddd2007-10-16 01:27:07 -0700160 UPT_SYSCALL_NR(regs) = PT_SYSCALL_NR(regs->gp);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800161
162 if (!local_using_sysemu)
163 {
Al Viro966e8032011-08-18 20:12:19 +0100164 err = ptrace(PTRACE_POKEUSER, pid, PT_SYSCALL_NR_OFFSET,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800165 __NR_getpid);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800166 if (err < 0) {
167 printk(UM_KERN_ERR "handle_trap - nullifying syscall "
168 "failed, errno = %d\n", errno);
169 fatal_sigsegv();
170 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800171
Jeff Dikeba180fd2007-10-16 01:27:00 -0700172 err = ptrace(PTRACE_SYSCALL, pid, 0, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800173 if (err < 0) {
174 printk(UM_KERN_ERR "handle_trap - continuing to end of "
175 "syscall failed, errno = %d\n", errno);
176 fatal_sigsegv();
177 }
Jeff Dikeba180fd2007-10-16 01:27:00 -0700178
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800179 CATCH_EINTR(err = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dikeba180fd2007-10-16 01:27:00 -0700180 if ((err < 0) || !WIFSTOPPED(status) ||
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800181 (WSTOPSIG(status) != SIGTRAP + 0x80)) {
182 err = ptrace_dump_regs(pid);
183 if (err)
184 printk(UM_KERN_ERR "Failed to get registers "
Jeff Dikeba180fd2007-10-16 01:27:00 -0700185 "from process, errno = %d\n", -err);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800186 printk(UM_KERN_ERR "handle_trap - failed to wait at "
187 "end of syscall, errno = %d, status = %d\n",
188 errno, status);
189 fatal_sigsegv();
190 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800191 }
192
193 handle_syscall(regs);
194}
195
/* Defined outside this file; only its address is used here (start of the stub code). */
extern int __syscall_stub_start;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800197
198static int userspace_tramp(void *stack)
199{
200 void *addr;
Jeff Dike537ae942006-09-25 23:33:05 -0700201 int err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800202
203 ptrace(PTRACE_TRACEME, 0, 0, 0);
204
Lepton Wua24864a2007-10-16 01:27:35 -0700205 signal(SIGTERM, SIG_DFL);
Jeff Dikeee3d9bd2008-02-04 22:30:56 -0800206 signal(SIGWINCH, SIG_IGN);
Jeff Dikea2f018b2007-10-16 01:27:22 -0700207 err = set_interval();
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800208 if (err) {
209 printk(UM_KERN_ERR "userspace_tramp - setting timer failed, "
210 "errno = %d\n", err);
211 exit(1);
212 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800213
Jeff Dikeba180fd2007-10-16 01:27:00 -0700214 if (!proc_mm) {
215 /*
216 * This has a pte, but it can't be mapped in with the usual
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800217 * tlb_flush mechanism because this is part of that mechanism
218 */
Jeff Dike09ee0112006-01-18 17:42:48 -0800219 int fd;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700220 unsigned long long offset;
Jeff Dike09ee0112006-01-18 17:42:48 -0800221 fd = phys_mapping(to_phys(&__syscall_stub_start), &offset);
Jeff Dike54ae36f2007-10-16 01:27:33 -0700222 addr = mmap64((void *) STUB_CODE, UM_KERN_PAGE_SIZE,
Jeff Dike09ee0112006-01-18 17:42:48 -0800223 PROT_EXEC, MAP_FIXED | MAP_PRIVATE, fd, offset);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700224 if (addr == MAP_FAILED) {
Jeff Dike54ae36f2007-10-16 01:27:33 -0700225 printk(UM_KERN_ERR "mapping mmap stub at 0x%lx failed, "
226 "errno = %d\n", STUB_CODE, errno);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800227 exit(1);
228 }
229
Jeff Dikeba180fd2007-10-16 01:27:00 -0700230 if (stack != NULL) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800231 fd = phys_mapping(to_phys(stack), &offset);
Jeff Dike54ae36f2007-10-16 01:27:33 -0700232 addr = mmap((void *) STUB_DATA,
Jeff Dike1ffb9162007-05-06 14:51:22 -0700233 UM_KERN_PAGE_SIZE, PROT_READ | PROT_WRITE,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800234 MAP_FIXED | MAP_SHARED, fd, offset);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700235 if (addr == MAP_FAILED) {
236 printk(UM_KERN_ERR "mapping segfault stack "
Jeff Dike54ae36f2007-10-16 01:27:33 -0700237 "at 0x%lx failed, errno = %d\n",
238 STUB_DATA, errno);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800239 exit(1);
240 }
241 }
242 }
Jeff Dikeba180fd2007-10-16 01:27:00 -0700243 if (!ptrace_faultinfo && (stack != NULL)) {
Jeff Dike4b84c692006-09-25 23:33:04 -0700244 struct sigaction sa;
245
Jeff Dike54ae36f2007-10-16 01:27:33 -0700246 unsigned long v = STUB_CODE +
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800247 (unsigned long) stub_segv_handler -
248 (unsigned long) &__syscall_stub_start;
249
Jeff Dike54ae36f2007-10-16 01:27:33 -0700250 set_sigstack((void *) STUB_DATA, UM_KERN_PAGE_SIZE);
Jeff Dike4b84c692006-09-25 23:33:04 -0700251 sigemptyset(&sa.sa_mask);
Al Viro9b25fcb2011-08-18 20:04:09 +0100252 sa.sa_flags = SA_ONSTACK | SA_NODEFER | SA_SIGINFO;
253 sa.sa_sigaction = (void *) v;
Jeff Dike4b84c692006-09-25 23:33:04 -0700254 sa.sa_restorer = NULL;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800255 if (sigaction(SIGSEGV, &sa, NULL) < 0) {
256 printk(UM_KERN_ERR "userspace_tramp - setting SIGSEGV "
257 "handler failed - errno = %d\n", errno);
258 exit(1);
259 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800260 }
261
Jeff Dike512b6fb2007-10-16 01:27:11 -0700262 kill(os_getpid(), SIGSTOP);
Jeff Dikeba180fd2007-10-16 01:27:00 -0700263 return 0;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800264}
265
/*
 * Pid of the host process used to run userspace, one slot per CPU.
 * Each element set once, and only accessed by a single processor anyway.
 * NR_CPUS is forced to 1 for this file.
 */
#undef NR_CPUS
#define NR_CPUS 1
int userspace_pid[NR_CPUS];
270
271int start_userspace(unsigned long stub_stack)
272{
273 void *stack;
274 unsigned long sp;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800275 int pid, status, n, flags, err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800276
Jeff Dikec539ab72007-06-16 10:16:09 -0700277 stack = mmap(NULL, UM_KERN_PAGE_SIZE,
278 PROT_READ | PROT_WRITE | PROT_EXEC,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800279 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800280 if (stack == MAP_FAILED) {
281 err = -errno;
282 printk(UM_KERN_ERR "start_userspace : mmap failed, "
Jeff Dikeb5498832008-02-04 22:31:21 -0800283 "errno = %d\n", errno);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800284 return err;
285 }
286
Jeff Dikec539ab72007-06-16 10:16:09 -0700287 sp = (unsigned long) stack + UM_KERN_PAGE_SIZE - sizeof(void *);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800288
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800289 flags = CLONE_FILES;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700290 if (proc_mm)
291 flags |= CLONE_VM;
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800292 else
293 flags |= SIGCHLD;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700294
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800295 pid = clone(userspace_tramp, (void *) sp, flags, (void *) stub_stack);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800296 if (pid < 0) {
297 err = -errno;
298 printk(UM_KERN_ERR "start_userspace : clone failed, "
Jeff Dikeb5498832008-02-04 22:31:21 -0800299 "errno = %d\n", errno);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800300 return err;
301 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800302
303 do {
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800304 CATCH_EINTR(n = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800305 if (n < 0) {
306 err = -errno;
307 printk(UM_KERN_ERR "start_userspace : wait failed, "
Jeff Dikeb5498832008-02-04 22:31:21 -0800308 "errno = %d\n", errno);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800309 goto out_kill;
310 }
Jeff Dikeba180fd2007-10-16 01:27:00 -0700311 } while (WIFSTOPPED(status) && (WSTOPSIG(status) == SIGVTALRM));
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800312
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800313 if (!WIFSTOPPED(status) || (WSTOPSIG(status) != SIGSTOP)) {
314 err = -EINVAL;
315 printk(UM_KERN_ERR "start_userspace : expected SIGSTOP, got "
Jeff Dikeb5498832008-02-04 22:31:21 -0800316 "status = %d\n", status);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800317 goto out_kill;
318 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800319
Jeff Dikeba180fd2007-10-16 01:27:00 -0700320 if (ptrace(PTRACE_OLDSETOPTIONS, pid, NULL,
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800321 (void *) PTRACE_O_TRACESYSGOOD) < 0) {
322 err = -errno;
323 printk(UM_KERN_ERR "start_userspace : PTRACE_OLDSETOPTIONS "
324 "failed, errno = %d\n", errno);
325 goto out_kill;
326 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800327
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800328 if (munmap(stack, UM_KERN_PAGE_SIZE) < 0) {
329 err = -errno;
330 printk(UM_KERN_ERR "start_userspace : munmap failed, "
331 "errno = %d\n", errno);
332 goto out_kill;
333 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800334
Jeff Dikeba180fd2007-10-16 01:27:00 -0700335 return pid;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800336
337 out_kill:
338 os_kill_ptraced_process(pid, 1);
339 return err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800340}
341
Jeff Dike77bf4402007-10-16 01:26:58 -0700342void userspace(struct uml_pt_regs *regs)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800343{
Jeff Diked2753a6d2007-10-16 01:27:25 -0700344 struct itimerval timer;
345 unsigned long long nsecs, now;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800346 int err, status, op, pid = userspace_pid[0];
Jeff Dike2ea5bc52007-05-10 22:22:32 -0700347 /* To prevent races if using_sysemu changes under us.*/
348 int local_using_sysemu;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800349
Al Virob8a42092012-05-23 00:25:15 -0400350 /* Handle any immediate reschedules or signals */
351 interrupt_end();
352
Jeff Diked2753a6d2007-10-16 01:27:25 -0700353 if (getitimer(ITIMER_VIRTUAL, &timer))
Jeff Dike5134d8f2008-02-08 04:22:08 -0800354 printk(UM_KERN_ERR "Failed to get itimer, errno = %d\n", errno);
Jeff Dike1a805212007-10-16 01:27:28 -0700355 nsecs = timer.it_value.tv_sec * UM_NSEC_PER_SEC +
356 timer.it_value.tv_usec * UM_NSEC_PER_USEC;
Jeff Diked2753a6d2007-10-16 01:27:25 -0700357 nsecs += os_nsecs();
358
Jeff Dikeba180fd2007-10-16 01:27:00 -0700359 while (1) {
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800360 /*
361 * This can legitimately fail if the process loads a
362 * bogus value into a segment register. It will
363 * segfault and PTRACE_GETREGS will read that value
364 * out of the process. However, PTRACE_SETREGS will
365 * fail. In this case, there is nothing to do but
366 * just kill the process.
367 */
Jeff Diked25f2e12008-02-04 22:30:57 -0800368 if (ptrace(PTRACE_SETREGS, pid, 0, regs->gp))
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800369 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800370
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700371 if (put_fp_registers(pid, regs->fp))
372 fatal_sigsegv();
373
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800374 /* Now we set local_using_sysemu to be used for one loop */
375 local_using_sysemu = get_using_sysemu();
376
Jeff Dike2ea5bc52007-05-10 22:22:32 -0700377 op = SELECT_PTRACE_OPERATION(local_using_sysemu,
378 singlestepping(NULL));
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800379
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800380 if (ptrace(op, pid, 0, 0)) {
381 printk(UM_KERN_ERR "userspace - ptrace continue "
382 "failed, op = %d, errno = %d\n", op, errno);
383 fatal_sigsegv();
384 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800385
Stanislaw Gruszka4dbed852007-12-17 16:19:46 -0800386 CATCH_EINTR(err = waitpid(pid, &status, WUNTRACED | __WALL));
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800387 if (err < 0) {
388 printk(UM_KERN_ERR "userspace - wait failed, "
389 "errno = %d\n", errno);
390 fatal_sigsegv();
391 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800392
Jeff Dike77bf4402007-10-16 01:26:58 -0700393 regs->is_user = 1;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800394 if (ptrace(PTRACE_GETREGS, pid, 0, regs->gp)) {
395 printk(UM_KERN_ERR "userspace - PTRACE_GETREGS failed, "
396 "errno = %d\n", errno);
397 fatal_sigsegv();
398 }
Jeff Diked25f2e12008-02-04 22:30:57 -0800399
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700400 if (get_fp_registers(pid, regs->fp)) {
401 printk(UM_KERN_ERR "userspace - get_fp_registers failed, "
402 "errno = %d\n", errno);
403 fatal_sigsegv();
404 }
405
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800406 UPT_SYSCALL_NR(regs) = -1; /* Assume: It's not a syscall */
407
Jeff Dikeba180fd2007-10-16 01:27:00 -0700408 if (WIFSTOPPED(status)) {
Jeff Dike16dd07b2007-05-06 14:51:48 -0700409 int sig = WSTOPSIG(status);
Jeff Dike5134d8f2008-02-08 04:22:08 -0800410 switch (sig) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800411 case SIGSEGV:
Jeff Dikeba180fd2007-10-16 01:27:00 -0700412 if (PTRACE_FULL_FAULTINFO ||
413 !ptrace_faultinfo) {
414 get_skas_faultinfo(pid,
415 &regs->faultinfo);
Jeff Dike16dd07b2007-05-06 14:51:48 -0700416 (*sig_info[SIGSEGV])(SIGSEGV, regs);
417 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800418 else handle_segv(pid, regs);
419 break;
420 case SIGTRAP + 0x80:
421 handle_trap(pid, regs, local_using_sysemu);
422 break;
423 case SIGTRAP:
424 relay_signal(SIGTRAP, regs);
425 break;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800426 case SIGVTALRM:
Jeff Diked2753a6d2007-10-16 01:27:25 -0700427 now = os_nsecs();
Jeff Diked25f2e12008-02-04 22:30:57 -0800428 if (now < nsecs)
Jeff Diked2753a6d2007-10-16 01:27:25 -0700429 break;
430 block_signals();
431 (*sig_info[sig])(sig, regs);
432 unblock_signals();
Jeff Dike1a805212007-10-16 01:27:28 -0700433 nsecs = timer.it_value.tv_sec *
434 UM_NSEC_PER_SEC +
435 timer.it_value.tv_usec *
436 UM_NSEC_PER_USEC;
Jeff Diked2753a6d2007-10-16 01:27:25 -0700437 nsecs += os_nsecs();
438 break;
439 case SIGIO:
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800440 case SIGILL:
441 case SIGBUS:
442 case SIGFPE:
443 case SIGWINCH:
Jeff Dike16dd07b2007-05-06 14:51:48 -0700444 block_signals();
445 (*sig_info[sig])(sig, regs);
446 unblock_signals();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800447 break;
448 default:
Jeff Dike96cee302008-05-12 14:01:48 -0700449 printk(UM_KERN_ERR "userspace - child stopped "
Jeff Dikeba180fd2007-10-16 01:27:00 -0700450 "with signal %d\n", sig);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800451 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800452 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800453 pid = userspace_pid[0];
454 interrupt_end();
455
456 /* Avoid -ERESTARTSYS handling in host */
Jeff Dikeba180fd2007-10-16 01:27:00 -0700457 if (PT_SYSCALL_NR_OFFSET != PT_SYSCALL_RET_OFFSET)
Jeff Dike18baddd2007-10-16 01:27:07 -0700458 PT_SYSCALL_NR(regs->gp) = -1;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800459 }
460 }
461}
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800462
Jeff Dike16dd07b2007-05-06 14:51:48 -0700463static unsigned long thread_regs[MAX_REG_NR];
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700464static unsigned long thread_fp_regs[FP_SIZE];
Jeff Dike16dd07b2007-05-06 14:51:48 -0700465
466static int __init init_thread_regs(void)
467{
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700468 get_safe_registers(thread_regs, thread_fp_regs);
Jeff Dike16dd07b2007-05-06 14:51:48 -0700469 /* Set parent's instruction pointer to start of clone-stub */
Jeff Dike54ae36f2007-10-16 01:27:33 -0700470 thread_regs[REGS_IP_INDEX] = STUB_CODE +
Jeff Dike16dd07b2007-05-06 14:51:48 -0700471 (unsigned long) stub_clone_handler -
472 (unsigned long) &__syscall_stub_start;
Jeff Dike54ae36f2007-10-16 01:27:33 -0700473 thread_regs[REGS_SP_INDEX] = STUB_DATA + UM_KERN_PAGE_SIZE -
Jeff Dike16dd07b2007-05-06 14:51:48 -0700474 sizeof(void *);
475#ifdef __SIGNAL_FRAMESIZE
476 thread_regs[REGS_SP_INDEX] -= __SIGNAL_FRAMESIZE;
477#endif
478 return 0;
479}
480
481__initcall(init_thread_regs);
482
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800483int copy_context_skas0(unsigned long new_stack, int pid)
484{
Jeff Dike1a805212007-10-16 01:27:28 -0700485 struct timeval tv = { .tv_sec = 0, .tv_usec = UM_USEC_PER_SEC / UM_HZ };
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800486 int err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800487 unsigned long current_stack = current_stub_stack();
488 struct stub_data *data = (struct stub_data *) current_stack;
489 struct stub_data *child_data = (struct stub_data *) new_stack;
Jeff Dike0a7675a2007-10-16 01:27:05 -0700490 unsigned long long new_offset;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800491 int new_fd = phys_mapping(to_phys((void *)new_stack), &new_offset);
492
Jeff Dikeba180fd2007-10-16 01:27:00 -0700493 /*
494 * prepare offset and fd of child's stack as argument for parent's
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800495 * and child's mmap2 calls
496 */
497 *data = ((struct stub_data) { .offset = MMAP_OFFSET(new_offset),
498 .fd = new_fd,
499 .timer = ((struct itimerval)
Jeff Diked2753a6d2007-10-16 01:27:25 -0700500 { .it_value = tv,
501 .it_interval = tv }) });
502
Jeff Dike16dd07b2007-05-06 14:51:48 -0700503 err = ptrace_setregs(pid, thread_regs);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800504 if (err < 0) {
505 err = -errno;
506 printk(UM_KERN_ERR "copy_context_skas0 : PTRACE_SETREGS "
507 "failed, pid = %d, errno = %d\n", pid, -err);
508 return err;
509 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800510
Ingo van Lilfbfe9c82011-09-14 16:21:23 -0700511 err = put_fp_registers(pid, thread_fp_regs);
512 if (err < 0) {
513 printk(UM_KERN_ERR "copy_context_skas0 : put_fp_registers "
514 "failed, pid = %d, err = %d\n", pid, err);
515 return err;
516 }
517
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800518 /* set a well known return code for detection of child write failure */
519 child_data->err = 12345678;
520
Jeff Dikeba180fd2007-10-16 01:27:00 -0700521 /*
522 * Wait, until parent has finished its work: read child's pid from
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800523 * parent's stack, and check, if bad result.
524 */
Jeff Dike16dd07b2007-05-06 14:51:48 -0700525 err = ptrace(PTRACE_CONT, pid, 0, 0);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800526 if (err) {
527 err = -errno;
528 printk(UM_KERN_ERR "Failed to continue new process, pid = %d, "
529 "errno = %d\n", pid, errno);
530 return err;
531 }
532
Jeff Dike16dd07b2007-05-06 14:51:48 -0700533 wait_stub_done(pid);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800534
535 pid = data->err;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800536 if (pid < 0) {
537 printk(UM_KERN_ERR "copy_context_skas0 - stub-parent reports "
538 "error %d\n", -pid);
539 return pid;
540 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800541
Jeff Dikeba180fd2007-10-16 01:27:00 -0700542 /*
543 * Wait, until child has finished too: read child's result from
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800544 * child's stack and check it.
545 */
Jeff Dike16dd07b2007-05-06 14:51:48 -0700546 wait_stub_done(pid);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800547 if (child_data->err != STUB_DATA) {
548 printk(UM_KERN_ERR "copy_context_skas0 - stub-child reports "
549 "error %ld\n", child_data->err);
550 err = child_data->err;
551 goto out_kill;
552 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800553
554 if (ptrace(PTRACE_OLDSETOPTIONS, pid, NULL,
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800555 (void *)PTRACE_O_TRACESYSGOOD) < 0) {
556 err = -errno;
557 printk(UM_KERN_ERR "copy_context_skas0 : PTRACE_OLDSETOPTIONS "
558 "failed, errno = %d\n", errno);
559 goto out_kill;
560 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800561
562 return pid;
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800563
564 out_kill:
565 os_kill_ptraced_process(pid, 1);
566 return err;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800567}
568
569/*
570 * This is used only, if stub pages are needed, while proc_mm is
Jeff Dikeef0470c2007-05-06 14:51:33 -0700571 * available. Opening /proc/mm creates a new mm_context, which lacks
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800572 * the stub-pages. Thus, we map them using /proc/mm-fd
573 */
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800574int map_stub_pages(int fd, unsigned long code, unsigned long data,
575 unsigned long stack)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800576{
577 struct proc_mm_op mmop;
578 int n;
Jeff Dike0a7675a2007-10-16 01:27:05 -0700579 unsigned long long code_offset;
Jeff Dike09ee0112006-01-18 17:42:48 -0800580 int code_fd = phys_mapping(to_phys((void *) &__syscall_stub_start),
581 &code_offset);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800582
583 mmop = ((struct proc_mm_op) { .op = MM_MMAP,
584 .u =
585 { .mmap =
586 { .addr = code,
Jeff Dikec539ab72007-06-16 10:16:09 -0700587 .len = UM_KERN_PAGE_SIZE,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800588 .prot = PROT_EXEC,
589 .flags = MAP_FIXED | MAP_PRIVATE,
Jeff Dike09ee0112006-01-18 17:42:48 -0800590 .fd = code_fd,
591 .offset = code_offset
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800592 } } });
Jeff Dikea61f3342007-05-06 14:51:35 -0700593 CATCH_EINTR(n = write(fd, &mmop, sizeof(mmop)));
Jeff Dikeba180fd2007-10-16 01:27:00 -0700594 if (n != sizeof(mmop)) {
Jeff Dikea61f3342007-05-06 14:51:35 -0700595 n = errno;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700596 printk(UM_KERN_ERR "mmap args - addr = 0x%lx, fd = %d, "
597 "offset = %llx\n", code, code_fd,
598 (unsigned long long) code_offset);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800599 printk(UM_KERN_ERR "map_stub_pages : /proc/mm map for code "
600 "failed, err = %d\n", n);
601 return -n;
Jeff Dikeb4cf95c2007-03-06 01:42:19 -0800602 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800603
Jeff Dikeba180fd2007-10-16 01:27:00 -0700604 if (stack) {
Jeff Dike0a7675a2007-10-16 01:27:05 -0700605 unsigned long long map_offset;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800606 int map_fd = phys_mapping(to_phys((void *)stack), &map_offset);
607 mmop = ((struct proc_mm_op)
608 { .op = MM_MMAP,
609 .u =
610 { .mmap =
611 { .addr = data,
Jeff Dikec539ab72007-06-16 10:16:09 -0700612 .len = UM_KERN_PAGE_SIZE,
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800613 .prot = PROT_READ | PROT_WRITE,
614 .flags = MAP_FIXED | MAP_SHARED,
615 .fd = map_fd,
616 .offset = map_offset
617 } } });
Jeff Dikea61f3342007-05-06 14:51:35 -0700618 CATCH_EINTR(n = write(fd, &mmop, sizeof(mmop)));
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800619 if (n != sizeof(mmop)) {
620 n = errno;
621 printk(UM_KERN_ERR "map_stub_pages : /proc/mm map for "
622 "data failed, err = %d\n", n);
623 return -n;
624 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800625 }
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800626
627 return 0;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800628}
629
Jeff Dike3c917352006-09-27 01:50:40 -0700630void new_thread(void *stack, jmp_buf *buf, void (*handler)(void))
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800631{
Jeff Dike3c917352006-09-27 01:50:40 -0700632 (*buf)[0].JB_IP = (unsigned long) handler;
Jeff Dikee1a79c42007-05-10 22:22:31 -0700633 (*buf)[0].JB_SP = (unsigned long) stack + UM_THREAD_SIZE -
634 sizeof(void *);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800635}
636
/* Values delivered through initial_jmpbuf to start_idle_thread() */
enum {
	INIT_JMP_NEW_THREAD = 0,	/* direct return from setjmp */
	INIT_JMP_CALLBACK = 1,
	INIT_JMP_HALT = 2,
	INIT_JMP_REBOOT = 3
};
Jeff Dikee2216fe2006-02-07 12:58:43 -0800641
/*
 * Save the current context in *me and jump to the context in *you.
 * The function returns when something later jumps back to *me.
 */
void switch_threads(jmp_buf *me, jmp_buf *you)
{
	if (UML_SETJMP(me) != 0)
		return;

	UML_LONGJMP(you, 1);
}
647
/* Context saved by start_idle_thread(); target of callback/halt/reboot jumps */
static jmp_buf initial_jmpbuf;

/*
 * Callback request handed from initial_thread_cb_skas() to
 * start_idle_thread(): function, its argument, and where to jump back to.
 * XXX Make these percpu
 */
static void (*cb_proc)(void *arg);
static void *cb_arg;
static jmp_buf *cb_back;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800654
Jeff Dike3c917352006-09-27 01:50:40 -0700655int start_idle_thread(void *stack, jmp_buf *switch_buf)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800656{
Jeff Dikea5df0d12006-07-14 00:24:02 -0700657 int n;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800658
Al Viro00361682011-08-18 20:04:39 +0100659 set_handler(SIGWINCH);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800660
Jeff Dike77f6af72007-05-06 14:51:40 -0700661 /*
662 * Can't use UML_SETJMP or UML_LONGJMP here because they save
663 * and restore signals, with the possible side-effect of
664 * trying to handle any signals which came when they were
665 * blocked, which can't be done on this stack.
666 * Signals must be blocked when jumping back here and restored
667 * after returning to the jumper.
668 */
669 n = setjmp(initial_jmpbuf);
Jeff Dike5134d8f2008-02-08 04:22:08 -0800670 switch (n) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800671 case INIT_JMP_NEW_THREAD:
Jeff Dike3c917352006-09-27 01:50:40 -0700672 (*switch_buf)[0].JB_IP = (unsigned long) new_thread_handler;
673 (*switch_buf)[0].JB_SP = (unsigned long) stack +
Jeff Dikee1a79c42007-05-10 22:22:31 -0700674 UM_THREAD_SIZE - sizeof(void *);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800675 break;
676 case INIT_JMP_CALLBACK:
677 (*cb_proc)(cb_arg);
Jeff Dike77f6af72007-05-06 14:51:40 -0700678 longjmp(*cb_back, 1);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800679 break;
680 case INIT_JMP_HALT:
681 kmalloc_ok = 0;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700682 return 0;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800683 case INIT_JMP_REBOOT:
684 kmalloc_ok = 0;
Jeff Dikeba180fd2007-10-16 01:27:00 -0700685 return 1;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800686 default:
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800687 printk(UM_KERN_ERR "Bad sigsetjmp return in "
688 "start_idle_thread - %d\n", n);
689 fatal_sigsegv();
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800690 }
Jeff Dike77f6af72007-05-06 14:51:40 -0700691 longjmp(*switch_buf, 1);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800692}
693
694void initial_thread_cb_skas(void (*proc)(void *), void *arg)
695{
Jeff Dikead28e022006-04-18 22:21:41 -0700696 jmp_buf here;
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800697
698 cb_proc = proc;
699 cb_arg = arg;
700 cb_back = &here;
701
702 block_signals();
Jeff Dikeba180fd2007-10-16 01:27:00 -0700703 if (UML_SETJMP(&here) == 0)
Jeff Dikead28e022006-04-18 22:21:41 -0700704 UML_LONGJMP(&initial_jmpbuf, INIT_JMP_CALLBACK);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800705 unblock_signals();
706
707 cb_proc = NULL;
708 cb_arg = NULL;
709 cb_back = NULL;
710}
711
712void halt_skas(void)
713{
714 block_signals();
Jeff Dikead28e022006-04-18 22:21:41 -0700715 UML_LONGJMP(&initial_jmpbuf, INIT_JMP_HALT);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800716}
717
718void reboot_skas(void)
719{
720 block_signals();
Jeff Dikead28e022006-04-18 22:21:41 -0700721 UML_LONGJMP(&initial_jmpbuf, INIT_JMP_REBOOT);
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800722}
723
Jeff Dike77bf4402007-10-16 01:26:58 -0700724void __switch_mm(struct mm_id *mm_idp)
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800725{
726 int err;
727
Jeff Dike77bf4402007-10-16 01:26:58 -0700728 /* FIXME: need cpu pid in __switch_mm */
Jeff Dikeba180fd2007-10-16 01:27:00 -0700729 if (proc_mm) {
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800730 err = ptrace(PTRACE_SWITCH_MM, userspace_pid[0], 0,
731 mm_idp->u.mm_fd);
Jeff Dike3e6f2ac2008-02-04 22:30:58 -0800732 if (err) {
733 printk(UM_KERN_ERR "__switch_mm - PTRACE_SWITCH_MM "
734 "failed, errno = %d\n", errno);
735 fatal_sigsegv();
736 }
Gennady Sharapovabaf6972006-01-18 17:42:46 -0800737 }
738 else userspace_pid[0] = mm_idp->u.pid;
739}