blob: 1e06436f07c21db67d893e757fb242dd03943317 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * arch/s390/kernel/process.c
3 *
4 * S390 version
5 * Copyright (C) 1999 IBM Deutschland Entwicklung GmbH, IBM Corporation
6 * Author(s): Martin Schwidefsky (schwidefsky@de.ibm.com),
7 * Hartmut Penner (hp@de.ibm.com),
8 * Denis Joseph Barrow (djbarrow@de.ibm.com,barrow_dj@yahoo.com),
9 *
10 * Derived from "arch/i386/kernel/process.c"
11 * Copyright (C) 1995, Linus Torvalds
12 */
13
/*
 * This file handles the architecture-dependent parts of process handling.
 */
17
Linus Torvalds1da177e2005-04-16 15:20:36 -070018#include <linux/compiler.h>
19#include <linux/cpu.h>
20#include <linux/errno.h>
21#include <linux/sched.h>
22#include <linux/kernel.h>
23#include <linux/mm.h>
Alexey Dobriyan4e950f62007-07-30 02:36:13 +040024#include <linux/fs.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070025#include <linux/smp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include <linux/stddef.h>
27#include <linux/unistd.h>
28#include <linux/ptrace.h>
29#include <linux/slab.h>
30#include <linux/vmalloc.h>
31#include <linux/user.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#include <linux/interrupt.h>
33#include <linux/delay.h>
34#include <linux/reboot.h>
35#include <linux/init.h>
36#include <linux/module.h>
37#include <linux/notifier.h>
Heiko Carstens5c699712008-01-26 14:11:01 +010038#include <linux/utsname.h>
Heiko Carstens5a62b192008-04-17 07:46:25 +020039#include <linux/tick.h>
Heiko Carstensa8061702008-04-17 07:46:26 +020040#include <linux/elfcore.h>
Martin Schwidefsky6f430922008-12-31 15:11:40 +010041#include <linux/kernel_stat.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070042#include <asm/uaccess.h>
43#include <asm/pgtable.h>
44#include <asm/system.h>
45#include <asm/io.h>
46#include <asm/processor.h>
47#include <asm/irq.h>
48#include <asm/timer.h>
Heiko Carstensfae8b222007-10-22 12:52:39 +020049#include <asm/cpu.h>
Heiko Carstensa8061702008-04-17 07:46:26 +020050#include "entry.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -070051
Martin Schwidefsky94c12cc2006-09-28 16:56:43 +020052asmlinkage void ret_from_fork(void) asm ("ret_from_fork");
Linus Torvalds1da177e2005-04-16 15:20:36 -070053
54/*
55 * Return saved PC of a blocked thread. used in kernel/sched.
56 * resume in entry.S does not create a new stack frame, it
57 * just stores the registers %r6-%r15 to the frame given by
58 * schedule. We want to return the address of the caller of
59 * schedule, so we have to walk the backchain one time to
60 * find the frame schedule() store its return address.
61 */
62unsigned long thread_saved_pc(struct task_struct *tsk)
63{
Heiko Carstenseb33c192006-01-14 13:20:57 -080064 struct stack_frame *sf, *low, *high;
Linus Torvalds1da177e2005-04-16 15:20:36 -070065
Heiko Carstenseb33c192006-01-14 13:20:57 -080066 if (!tsk || !task_stack_page(tsk))
67 return 0;
68 low = task_stack_page(tsk);
69 high = (struct stack_frame *) task_pt_regs(tsk);
70 sf = (struct stack_frame *) (tsk->thread.ksp & PSW_ADDR_INSN);
71 if (sf <= low || sf > high)
72 return 0;
73 sf = (struct stack_frame *) (sf->back_chain & PSW_ADDR_INSN);
74 if (sf <= low || sf > high)
75 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070076 return sf->gprs[8];
77}
78
Josef 'Jeff' Sipek3e972392008-08-21 19:46:31 +020079DEFINE_PER_CPU(struct s390_idle_data, s390_idle) = {
80 .lock = __SPIN_LOCK_UNLOCKED(s390_idle.lock)
81};
Linus Torvalds1da177e2005-04-16 15:20:36 -070082
Heiko Carstens43ca5c32008-04-17 07:46:23 +020083void s390_idle_leave(void)
84{
Heiko Carstensfae8b222007-10-22 12:52:39 +020085 struct s390_idle_data *idle;
Martin Schwidefsky6f430922008-12-31 15:11:40 +010086 unsigned long long idle_time;
Heiko Carstensfae8b222007-10-22 12:52:39 +020087
88 idle = &__get_cpu_var(s390_idle);
Martin Schwidefsky6f430922008-12-31 15:11:40 +010089 idle_time = S390_lowcore.int_clock - idle->idle_enter;
Heiko Carstensfae8b222007-10-22 12:52:39 +020090 spin_lock(&idle->lock);
Martin Schwidefsky6f430922008-12-31 15:11:40 +010091 idle->idle_time += idle_time;
92 idle->idle_enter = 0ULL;
93 idle->idle_count++;
Heiko Carstensfae8b222007-10-22 12:52:39 +020094 spin_unlock(&idle->lock);
Martin Schwidefsky6f430922008-12-31 15:11:40 +010095 vtime_start_cpu_timer();
Linus Torvalds1da177e2005-04-16 15:20:36 -070096}
97
Heiko Carstens77fa2242005-06-25 14:55:30 -070098extern void s390_handle_mcck(void);
Linus Torvalds1da177e2005-04-16 15:20:36 -070099/*
100 * The idle loop on a S390...
101 */
Adrian Bunkcdb04522006-03-24 03:15:57 -0800102static void default_idle(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700103{
Martin Schwidefsky6f430922008-12-31 15:11:40 +0100104 struct s390_idle_data *idle = &__get_cpu_var(s390_idle);
105 unsigned long addr;
106 psw_t psw;
107
Linus Torvalds1da177e2005-04-16 15:20:36 -0700108 /* CPU is going idle. */
Nick Piggin64c7c8f2005-11-08 21:39:04 -0800109 local_irq_disable();
110 if (need_resched()) {
111 local_irq_enable();
112 return;
113 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114#ifdef CONFIG_HOTPLUG_CPU
Heiko Carstens43ca5c32008-04-17 07:46:23 +0200115 if (cpu_is_offline(smp_processor_id())) {
Heiko Carstens1fca2512006-02-17 13:52:46 -0800116 preempt_enable_no_resched();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700117 cpu_die();
Heiko Carstens1fca2512006-02-17 13:52:46 -0800118 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700119#endif
Heiko Carstens77fa2242005-06-25 14:55:30 -0700120 local_mcck_disable();
121 if (test_thread_flag(TIF_MCCK_PENDING)) {
122 local_mcck_enable();
Heiko Carstens43ca5c32008-04-17 07:46:23 +0200123 s390_idle_leave();
Heiko Carstens77fa2242005-06-25 14:55:30 -0700124 local_irq_enable();
125 s390_handle_mcck();
126 return;
127 }
Heiko Carstens1f194a42006-07-03 00:24:46 -0700128 trace_hardirqs_on();
Heiko Carstens632448f2008-11-14 18:18:04 +0100129 /* Don't trace preempt off for idle. */
130 stop_critical_timings();
Martin Schwidefsky6f430922008-12-31 15:11:40 +0100131 vtime_stop_cpu_timer();
132
133 /*
134 * The inline assembly is equivalent to
135 * idle->idle_enter = get_clock();
136 * __load_psw_mask(psw_kernel_bits | PSW_MASK_WAIT |
137 * PSW_MASK_IO | PSW_MASK_EXT);
138 * The difference is that the inline assembly makes sure that
139 * the stck instruction is right before the lpsw instruction.
140 * This is done to increase the precision.
141 */
142
Heiko Carstens77fa2242005-06-25 14:55:30 -0700143 /* Wait for external, I/O or machine check interrupt. */
Martin Schwidefsky6f430922008-12-31 15:11:40 +0100144 psw.mask = psw_kernel_bits|PSW_MASK_WAIT|PSW_MASK_IO|PSW_MASK_EXT;
145#ifndef __s390x__
146 asm volatile(
147 " basr %0,0\n"
148 "0: ahi %0,1f-0b\n"
149 " st %0,4(%2)\n"
150 " stck 0(%3)\n"
151 " lpsw 0(%2)\n"
152 "1:"
153 : "=&d" (addr), "=m" (idle->idle_enter)
154 : "a" (&psw), "a" (&idle->idle_enter), "m" (psw)
155 : "memory", "cc");
156#else /* __s390x__ */
157 asm volatile(
158 " larl %0,1f\n"
159 " stg %0,8(%2)\n"
160 " stck 0(%3)\n"
161 " lpswe 0(%2)\n"
162 "1:"
163 : "=&d" (addr), "=m" (idle->idle_enter)
164 : "a" (&psw), "a" (&idle->idle_enter), "m" (psw)
165 : "memory", "cc");
166#endif /* __s390x__ */
Heiko Carstens632448f2008-11-14 18:18:04 +0100167 start_critical_timings();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700168}
169
/*
 * Idle loop entry point; never returns.
 *
 * Each round stops the scheduler tick, calls default_idle() until a
 * reschedule is requested, restarts the tick and then calls schedule().
 * Preemption is enabled (without rescheduling) right before schedule()
 * and disabled again afterwards, so the function presumably expects to
 * be entered with preemption disabled - confirm against the caller.
 */
void cpu_idle(void)
{
	while (1) {
		tick_nohz_stop_sched_tick(1);
		while (!need_resched()) {
			default_idle();
		}
		tick_nohz_restart_sched_tick();

		preempt_enable_no_resched();
		schedule();
		preempt_disable();
	}
}
182
Linus Torvalds1da177e2005-04-16 15:20:36 -0700183extern void kernel_thread_starter(void);
184
Martin Schwidefsky94c12cc2006-09-28 16:56:43 +0200185asm(
186 ".align 4\n"
Linus Torvalds1da177e2005-04-16 15:20:36 -0700187 "kernel_thread_starter:\n"
188 " la 2,0(10)\n"
189 " basr 14,9\n"
190 " la 2,0\n"
191 " br 11\n");
192
193int kernel_thread(int (*fn)(void *), void * arg, unsigned long flags)
194{
195 struct pt_regs regs;
196
197 memset(&regs, 0, sizeof(regs));
Gerald Schaeferc1821c22007-02-05 21:18:17 +0100198 regs.psw.mask = psw_kernel_bits | PSW_MASK_IO | PSW_MASK_EXT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199 regs.psw.addr = (unsigned long) kernel_thread_starter | PSW_ADDR_AMODE;
200 regs.gprs[9] = (unsigned long) fn;
201 regs.gprs[10] = (unsigned long) arg;
202 regs.gprs[11] = (unsigned long) do_exit;
203 regs.orig_gpr2 = -1;
204
205 /* Ok, create the new process.. */
206 return do_fork(flags | CLONE_VM | CLONE_UNTRACED,
207 0, &regs, 0, NULL, NULL);
208}
209
/*
 * Free current thread data structures etc.
 *
 * Intentionally empty: this implementation has nothing to release.
 */
void exit_thread(void)
{
	/* nothing to do */
}
216
217void flush_thread(void)
218{
219 clear_used_math();
220 clear_tsk_thread_flag(current, TIF_USEDFPU);
221}
222
/*
 * Release per-thread resources of @dead_task.
 *
 * Intentionally empty: this implementation has nothing to release.
 */
void release_thread(struct task_struct *dead_task)
{
	/* nothing to do */
}
226
227int copy_thread(int nr, unsigned long clone_flags, unsigned long new_stackp,
228 unsigned long unused,
229 struct task_struct * p, struct pt_regs * regs)
230{
231 struct fake_frame
232 {
233 struct stack_frame sf;
234 struct pt_regs childregs;
235 } *frame;
236
Al Viroc7584fb2006-01-12 01:05:49 -0800237 frame = container_of(task_pt_regs(p), struct fake_frame, childregs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238 p->thread.ksp = (unsigned long) frame;
239 /* Store access registers to kernel stack of new process. */
240 frame->childregs = *regs;
241 frame->childregs.gprs[2] = 0; /* child returns 0 on fork. */
242 frame->childregs.gprs[15] = new_stackp;
243 frame->sf.back_chain = 0;
244
245 /* new return point is ret_from_fork */
246 frame->sf.gprs[8] = (unsigned long) ret_from_fork;
247
248 /* fake return stack for resume(), don't go back to schedule */
249 frame->sf.gprs[9] = (unsigned long) frame;
250
251 /* Save access registers to new thread structure. */
252 save_access_regs(&p->thread.acrs[0]);
253
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800254#ifndef CONFIG_64BIT
Linus Torvalds1da177e2005-04-16 15:20:36 -0700255 /*
256 * save fprs to current->thread.fp_regs to merge them with
257 * the emulated registers and then copy the result to the child.
258 */
259 save_fp_regs(&current->thread.fp_regs);
260 memcpy(&p->thread.fp_regs, &current->thread.fp_regs,
261 sizeof(s390_fp_regs));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700262 /* Set a new TLS ? */
263 if (clone_flags & CLONE_SETTLS)
264 p->thread.acrs[0] = regs->gprs[6];
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800265#else /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700266 /* Save the fpu registers to new thread structure. */
267 save_fp_regs(&p->thread.fp_regs);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268 /* Set a new TLS ? */
269 if (clone_flags & CLONE_SETTLS) {
270 if (test_thread_flag(TIF_31BIT)) {
271 p->thread.acrs[0] = (unsigned int) regs->gprs[6];
272 } else {
273 p->thread.acrs[0] = (unsigned int)(regs->gprs[6] >> 32);
274 p->thread.acrs[1] = (unsigned int) regs->gprs[6];
275 }
276 }
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800277#endif /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700278 /* start new process with ar4 pointing to the correct address space */
279 p->thread.mm_segment = get_fs();
280 /* Don't copy debug registers */
281 memset(&p->thread.per_info,0,sizeof(p->thread.per_info));
282
283 return 0;
284}
285
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200286asmlinkage long sys_fork(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700287{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200288 struct pt_regs *regs = task_pt_regs(current);
289 return do_fork(SIGCHLD, regs->gprs[15], regs, 0, NULL, NULL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700290}
291
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200292asmlinkage long sys_clone(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200294 struct pt_regs *regs = task_pt_regs(current);
295 unsigned long clone_flags;
296 unsigned long newsp;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700297 int __user *parent_tidptr, *child_tidptr;
298
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200299 clone_flags = regs->gprs[3];
300 newsp = regs->orig_gpr2;
301 parent_tidptr = (int __user *) regs->gprs[4];
302 child_tidptr = (int __user *) regs->gprs[5];
303 if (!newsp)
304 newsp = regs->gprs[15];
305 return do_fork(clone_flags, newsp, regs, 0,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 parent_tidptr, child_tidptr);
307}
308
309/*
310 * This is trivial, and on the face of it looks like it
311 * could equally well be done in user mode.
312 *
313 * Not so, for quite unobvious reasons - register pressure.
314 * In user mode vfork() cannot have a stack frame, and if
315 * done by calling the "clone()" system call directly, you
316 * do not have enough call-clobbered registers to hold all
317 * the information you need.
318 */
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200319asmlinkage long sys_vfork(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700320{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200321 struct pt_regs *regs = task_pt_regs(current);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322 return do_fork(CLONE_VFORK | CLONE_VM | SIGCHLD,
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200323 regs->gprs[15], regs, 0, NULL, NULL);
324}
325
326asmlinkage void execve_tail(void)
327{
328 task_lock(current);
329 current->ptrace &= ~PT_DTRACE;
330 task_unlock(current);
331 current->thread.fp_regs.fpc = 0;
332 if (MACHINE_HAS_IEEE)
333 asm volatile("sfpc %0,%0" : : "d" (0));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700334}
335
336/*
337 * sys_execve() executes a new program.
338 */
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200339asmlinkage long sys_execve(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340{
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200341 struct pt_regs *regs = task_pt_regs(current);
342 char *filename;
343 unsigned long result;
344 int rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700345
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200346 filename = getname((char __user *) regs->orig_gpr2);
347 if (IS_ERR(filename)) {
348 result = PTR_ERR(filename);
349 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350 }
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200351 rc = do_execve(filename, (char __user * __user *) regs->gprs[3],
352 (char __user * __user *) regs->gprs[4], regs);
353 if (rc) {
354 result = rc;
355 goto out_putname;
356 }
357 execve_tail();
358 result = regs->gprs[2];
359out_putname:
360 putname(filename);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700361out:
Martin Schwidefsky03ff9a22007-04-27 16:01:40 +0200362 return result;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363}
364
Linus Torvalds1da177e2005-04-16 15:20:36 -0700365/*
366 * fill in the FPU structure for a core dump.
367 */
368int dump_fpu (struct pt_regs * regs, s390_fp_regs *fpregs)
369{
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800370#ifndef CONFIG_64BIT
Linus Torvalds1da177e2005-04-16 15:20:36 -0700371 /*
372 * save fprs to current->thread.fp_regs to merge them with
373 * the emulated registers and then copy the result to the dump.
374 */
375 save_fp_regs(&current->thread.fp_regs);
376 memcpy(fpregs, &current->thread.fp_regs, sizeof(s390_fp_regs));
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800377#else /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378 save_fp_regs(fpregs);
Martin Schwidefsky347a8dc2006-01-06 00:19:28 -0800379#endif /* CONFIG_64BIT */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700380 return 1;
381}
382
Linus Torvalds1da177e2005-04-16 15:20:36 -0700383unsigned long get_wchan(struct task_struct *p)
384{
385 struct stack_frame *sf, *low, *high;
386 unsigned long return_address;
387 int count;
388
Al Viro30af7122006-01-12 01:05:50 -0800389 if (!p || p == current || p->state == TASK_RUNNING || !task_stack_page(p))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390 return 0;
Al Viro30af7122006-01-12 01:05:50 -0800391 low = task_stack_page(p);
392 high = (struct stack_frame *) task_pt_regs(p);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393 sf = (struct stack_frame *) (p->thread.ksp & PSW_ADDR_INSN);
394 if (sf <= low || sf > high)
395 return 0;
396 for (count = 0; count < 16; count++) {
397 sf = (struct stack_frame *) (sf->back_chain & PSW_ADDR_INSN);
398 if (sf <= low || sf > high)
399 return 0;
400 return_address = sf->gprs[8] & PSW_ADDR_INSN;
401 if (!in_sched_functions(return_address))
402 return return_address;
403 }
404 return 0;
405}
406