blob: 59f1fa1559151029d99f077d0861cd6bfd17392d [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/* Copyright 2002,2003 Andi Kleen, SuSE Labs */
2
/* vsyscall handling for 32-bit processes. Map a stub page into the process
   on demand, because 32-bit code cannot reach the kernel's fixmaps. */
5
6#include <linux/mm.h>
7#include <linux/string.h>
8#include <linux/kernel.h>
9#include <linux/gfp.h>
10#include <linux/init.h>
11#include <linux/stringify.h>
Andi Kleen1e014412005-04-16 15:24:55 -070012#include <linux/security.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <asm/proto.h>
14#include <asm/tlbflush.h>
15#include <asm/ia32_unistd.h>
16
/*
 * Start/end symbols bracketing the two stub code images; they are defined
 * outside this file. init_syscall32() copies one of the images into
 * syscall32_page.
 */
extern unsigned char syscall32_syscall[];
extern unsigned char syscall32_syscall_end[];
extern unsigned char syscall32_sysenter[];
extern unsigned char syscall32_sysenter_end[];

/* Declared here but not referenced anywhere in this file. */
extern int sysctl_vsyscall32;

/* Kernel page holding the stub; allocated and filled by init_syscall32(). */
char *syscall32_page;

/*
 * Stub selector: negative until syscall32_cpu_init() decides, then
 * greater than zero to pick the SYSENTER image, otherwise the SYSCALL image.
 */
static int use_sysenter = -1;

23
Andi Kleen1e014412005-04-16 15:24:55 -070024static struct page *
25syscall32_nopage(struct vm_area_struct *vma, unsigned long adr, int *type)
26{
27 struct page *p = virt_to_page(adr - vma->vm_start + syscall32_page);
28 get_page(p);
29 return p;
Linus Torvalds1da177e2005-04-16 15:20:36 -070030}
31
/*
 * Deliberately a no-op. It is installed as the ->close hook only so that
 * this VMA is not merged with its neighbours.
 */
static void syscall32_vma_close(struct vm_area_struct *vma)
{
	/* nothing to release */
}
36
37static struct vm_operations_struct syscall32_vm_ops = {
38 .close = syscall32_vma_close,
39 .nopage = syscall32_nopage,
40};
41
42struct linux_binprm;
43
44/* Setup a VMA at program startup for the vsyscall page */
45int syscall32_setup_pages(struct linux_binprm *bprm, int exstack)
46{
47 int npages = (VSYSCALL32_END - VSYSCALL32_BASE) >> PAGE_SHIFT;
48 struct vm_area_struct *vma;
49 struct mm_struct *mm = current->mm;
Siddha, Suresh B9fb17592005-07-15 19:17:44 -070050 int ret;
Andi Kleen1e014412005-04-16 15:24:55 -070051
Christoph Lametere94b1762006-12-06 20:33:17 -080052 vma = kmem_cache_alloc(vm_area_cachep, GFP_KERNEL);
Andi Kleen1e014412005-04-16 15:24:55 -070053 if (!vma)
54 return -ENOMEM;
Andi Kleen1e014412005-04-16 15:24:55 -070055
56 memset(vma, 0, sizeof(struct vm_area_struct));
57 /* Could randomize here */
58 vma->vm_start = VSYSCALL32_BASE;
59 vma->vm_end = VSYSCALL32_END;
60 /* MAYWRITE to allow gdb to COW and set breakpoints */
Hugh Dickins2fd4ef82005-09-14 06:13:02 +010061 vma->vm_flags = VM_READ|VM_EXEC|VM_MAYREAD|VM_MAYEXEC|VM_MAYWRITE;
Roland McGrathe03f0ca2007-01-26 00:56:50 -080062 /*
63 * Make sure the vDSO gets into every core dump.
64 * Dumping its contents makes post-mortem fully interpretable later
65 * without matching up the same kernel and hardware config to see
66 * what PC values meant.
67 */
68 vma->vm_flags |= VM_ALWAYSDUMP;
Andi Kleen1e014412005-04-16 15:24:55 -070069 vma->vm_flags |= mm->def_flags;
70 vma->vm_page_prot = protection_map[vma->vm_flags & 7];
71 vma->vm_ops = &syscall32_vm_ops;
72 vma->vm_mm = mm;
73
74 down_write(&mm->mmap_sem);
Siddha, Suresh B9fb17592005-07-15 19:17:44 -070075 if ((ret = insert_vm_struct(mm, vma))) {
76 up_write(&mm->mmap_sem);
77 kmem_cache_free(vm_area_cachep, vma);
78 return ret;
79 }
Andi Kleen1e014412005-04-16 15:24:55 -070080 mm->total_vm += npages;
81 up_write(&mm->mmap_sem);
82 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070083}
84
Roland McGrathc6330902007-01-26 00:56:52 -080085const char *arch_vma_name(struct vm_area_struct *vma)
86{
87 if (vma->vm_start == VSYSCALL32_BASE &&
88 vma->vm_mm && vma->vm_mm->task_size == IA32_PAGE_OFFSET)
89 return "[vdso]";
90 return NULL;
91}
92
Linus Torvalds1da177e2005-04-16 15:20:36 -070093static int __init init_syscall32(void)
94{
95 syscall32_page = (void *)get_zeroed_page(GFP_KERNEL);
96 if (!syscall32_page)
97 panic("Cannot allocate syscall32 page");
Linus Torvalds1da177e2005-04-16 15:20:36 -070098 if (use_sysenter > 0) {
99 memcpy(syscall32_page, syscall32_sysenter,
100 syscall32_sysenter_end - syscall32_sysenter);
101 } else {
102 memcpy(syscall32_page, syscall32_syscall,
103 syscall32_syscall_end - syscall32_syscall);
104 }
105 return 0;
106}
107
108__initcall(init_syscall32);
109
110/* May not be __init: called during resume */
111void syscall32_cpu_init(void)
112{
113 if (use_sysenter < 0)
114 use_sysenter = (boot_cpu_data.x86_vendor == X86_VENDOR_INTEL);
115
116 /* Load these always in case some future AMD CPU supports
117 SYSENTER from compat mode too. */
118 checking_wrmsrl(MSR_IA32_SYSENTER_CS, (u64)__KERNEL_CS);
119 checking_wrmsrl(MSR_IA32_SYSENTER_ESP, 0ULL);
120 checking_wrmsrl(MSR_IA32_SYSENTER_EIP, (u64)ia32_sysenter_target);
121
122 wrmsrl(MSR_CSTAR, ia32_cstar_target);
123}