blob: 5da744204d100661f3ff35502800335702652ca4 [file] [log] [blame]
/*
 * linux/arch/i386/kernel/sysenter.c
 *
 * (C) Copyright 2002 Linus Torvalds
 * Portions based on the vdso-randomization code from exec-shield:
 * Copyright(C) 2005-2006, Red Hat, Inc., Ingo Molnar
 *
 * This file contains the needed initializations to support sysenter.
 */
10
11#include <linux/init.h>
12#include <linux/smp.h>
13#include <linux/thread_info.h>
14#include <linux/sched.h>
15#include <linux/gfp.h>
16#include <linux/string.h>
17#include <linux/elf.h>
Ingo Molnare6e54942006-06-27 02:53:50 -070018#include <linux/mm.h>
19#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020
21#include <asm/cpufeature.h>
22#include <asm/msr.h>
23#include <asm/pgtable.h>
24#include <asm/unistd.h>
25
Ingo Molnare6e54942006-06-27 02:53:50 -070026/*
27 * Should the kernel map a VDSO page into processes and pass its
28 * address down to glibc upon exec()?
29 */
Andi Kleen3bbf5472006-12-07 02:14:08 +010030#ifdef CONFIG_PARAVIRT
31unsigned int __read_mostly vdso_enabled = 0;
32#else
Ingo Molnare6e54942006-06-27 02:53:50 -070033unsigned int __read_mostly vdso_enabled = 1;
Andi Kleen3bbf5472006-12-07 02:14:08 +010034#endif
Ingo Molnare6e54942006-06-27 02:53:50 -070035
36EXPORT_SYMBOL_GPL(vdso_enabled);
37
38static int __init vdso_setup(char *s)
39{
40 vdso_enabled = simple_strtoul(s, NULL, 0);
41
42 return 1;
43}
44
45__setup("vdso=", vdso_setup);
46
Linus Torvalds1da177e2005-04-16 15:20:36 -070047extern asmlinkage void sysenter_entry(void);
48
Li Shaohua6fe940d2005-06-25 14:54:53 -070049void enable_sep_cpu(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070050{
51 int cpu = get_cpu();
52 struct tss_struct *tss = &per_cpu(init_tss, cpu);
53
Li Shaohua6fe940d2005-06-25 14:54:53 -070054 if (!boot_cpu_has(X86_FEATURE_SEP)) {
55 put_cpu();
56 return;
57 }
58
Linus Torvalds1da177e2005-04-16 15:20:36 -070059 tss->ss1 = __KERNEL_CS;
60 tss->esp1 = sizeof(struct tss_struct) + (unsigned long) tss;
61 wrmsr(MSR_IA32_SYSENTER_CS, __KERNEL_CS, 0);
62 wrmsr(MSR_IA32_SYSENTER_ESP, tss->esp1, 0);
63 wrmsr(MSR_IA32_SYSENTER_EIP, (unsigned long) sysenter_entry, 0);
64 put_cpu();
65}
66
/*
 * Start/end markers of the two ELF DSO images (int80 and sysenter
 * flavours).  The symbols themselves are defined by vsyscall.o.
 */
extern const char vsyscall_int80_start;
extern const char vsyscall_int80_end;
extern const char vsyscall_sysenter_start;
extern const char vsyscall_sysenter_end;

/* Page that sysenter_setup() allocates and copies the chosen image into. */
static void *syscall_page;
Linus Torvalds1da177e2005-04-16 15:20:36 -070074
Li Shaohua6fe940d2005-06-25 14:54:53 -070075int __init sysenter_setup(void)
Linus Torvalds1da177e2005-04-16 15:20:36 -070076{
Ingo Molnare6e54942006-06-27 02:53:50 -070077 syscall_page = (void *)get_zeroed_page(GFP_ATOMIC);
Linus Torvalds1da177e2005-04-16 15:20:36 -070078
Ingo Molnare6e54942006-06-27 02:53:50 -070079#ifdef CONFIG_COMPAT_VDSO
80 __set_fixmap(FIX_VDSO, __pa(syscall_page), PAGE_READONLY);
81 printk("Compat vDSO mapped to %08lx.\n", __fix_to_virt(FIX_VDSO));
Ingo Molnare6e54942006-06-27 02:53:50 -070082#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -070083
84 if (!boot_cpu_has(X86_FEATURE_SEP)) {
Ingo Molnare6e54942006-06-27 02:53:50 -070085 memcpy(syscall_page,
Linus Torvalds1da177e2005-04-16 15:20:36 -070086 &vsyscall_int80_start,
87 &vsyscall_int80_end - &vsyscall_int80_start);
88 return 0;
89 }
90
Ingo Molnare6e54942006-06-27 02:53:50 -070091 memcpy(syscall_page,
Linus Torvalds1da177e2005-04-16 15:20:36 -070092 &vsyscall_sysenter_start,
93 &vsyscall_sysenter_end - &vsyscall_sysenter_start);
94
Linus Torvalds1da177e2005-04-16 15:20:36 -070095 return 0;
96}
Ingo Molnare6e54942006-06-27 02:53:50 -070097
Roland McGratha1f3bb92007-01-26 00:56:46 -080098#ifndef CONFIG_COMPAT_VDSO
Ingo Molnare6e54942006-06-27 02:53:50 -070099static struct page *syscall_nopage(struct vm_area_struct *vma,
100 unsigned long adr, int *type)
101{
102 struct page *p = virt_to_page(adr - vma->vm_start + syscall_page);
103 get_page(p);
104 return p;
105}
106
107/* Prevent VMA merging */
108static void syscall_vma_close(struct vm_area_struct *vma)
109{
110}
111
112static struct vm_operations_struct syscall_vm_ops = {
113 .close = syscall_vma_close,
114 .nopage = syscall_nopage,
115};
116
117/* Defined in vsyscall-sysenter.S */
118extern void SYSENTER_RETURN;
119
120/* Setup a VMA at program startup for the vsyscall page */
121int arch_setup_additional_pages(struct linux_binprm *bprm, int exstack)
122{
123 struct vm_area_struct *vma;
124 struct mm_struct *mm = current->mm;
125 unsigned long addr;
126 int ret;
127
128 down_write(&mm->mmap_sem);
129 addr = get_unmapped_area(NULL, 0, PAGE_SIZE, 0, 0);
130 if (IS_ERR_VALUE(addr)) {
131 ret = addr;
132 goto up_fail;
133 }
134
Christoph Lametere94b1762006-12-06 20:33:17 -0800135 vma = kmem_cache_zalloc(vm_area_cachep, GFP_KERNEL);
Ingo Molnare6e54942006-06-27 02:53:50 -0700136 if (!vma) {
137 ret = -ENOMEM;
138 goto up_fail;
139 }
140
141 vma->vm_start = addr;
142 vma->vm_end = addr + PAGE_SIZE;
143 /* MAYWRITE to allow gdb to COW and set breakpoints */
144 vma->vm_flags = VM_READ|VM_EXEC|VM_MAYREAD|VM_MAYEXEC|VM_MAYWRITE;
Roland McGrathf47aef52007-01-26 00:56:49 -0800145 /*
146 * Make sure the vDSO gets into every core dump.
147 * Dumping its contents makes post-mortem fully interpretable later
148 * without matching up the same kernel and hardware config to see
149 * what PC values meant.
150 */
151 vma->vm_flags |= VM_ALWAYSDUMP;
Ingo Molnare6e54942006-06-27 02:53:50 -0700152 vma->vm_flags |= mm->def_flags;
153 vma->vm_page_prot = protection_map[vma->vm_flags & 7];
154 vma->vm_ops = &syscall_vm_ops;
155 vma->vm_mm = mm;
156
157 ret = insert_vm_struct(mm, vma);
pageexec@freemail.hu79bc79b2006-06-28 20:44:16 +0200158 if (unlikely(ret)) {
159 kmem_cache_free(vm_area_cachep, vma);
160 goto up_fail;
161 }
Ingo Molnare6e54942006-06-27 02:53:50 -0700162
163 current->mm->context.vdso = (void *)addr;
164 current_thread_info()->sysenter_return =
165 (void *)VDSO_SYM(&SYSENTER_RETURN);
166 mm->total_vm++;
167up_fail:
168 up_write(&mm->mmap_sem);
169 return ret;
Ingo Molnare6e54942006-06-27 02:53:50 -0700170}
171
172const char *arch_vma_name(struct vm_area_struct *vma)
173{
174 if (vma->vm_mm && vma->vm_start == (long)vma->vm_mm->context.vdso)
175 return "[vdso]";
176 return NULL;
177}
178
/*
 * Gate-area hooks for the !CONFIG_COMPAT_VDSO build: all three are
 * stubs that report "no gate area".
 */

/* Always returns NULL; @tsk is ignored. */
struct vm_area_struct *get_gate_vma(struct task_struct *tsk)
{
	return NULL;
}

/* Always returns 0; @task and @addr are ignored. */
int in_gate_area(struct task_struct *task, unsigned long addr)
{
	return 0;
}

/* Always returns 0; @addr is ignored. */
int in_gate_area_no_task(unsigned long addr)
{
	return 0;
}
Roland McGratha1f3bb92007-01-26 00:56:46 -0800193#endif