| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 1 | /* | 
|  | 2 | * Copyright (C) 2002 - 2007 Jeff Dike (jdike@{addtoit,linux.intel}.com) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 3 | * Licensed under the GPL | 
|  | 4 | */ | 
|  | 5 |  | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 6 | #include "linux/mm.h" | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 7 | #include "linux/sched.h" | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 8 | #include "asm/pgalloc.h" | 
|  | 9 | #include "asm/pgtable.h" | 
| Jeff Dike | 54ae36f | 2007-10-16 01:27:33 -0700 | [diff] [blame] | 10 | #include "as-layout.h" | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 11 | #include "os.h" | 
|  | 12 | #include "skas.h" | 
|  | 13 |  | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 14 | extern int __syscall_stub_start; | 
|  | 15 |  | 
|  | 16 | static int init_stub_pte(struct mm_struct *mm, unsigned long proc, | 
|  | 17 | unsigned long kernel) | 
|  | 18 | { | 
|  | 19 | pgd_t *pgd; | 
|  | 20 | pud_t *pud; | 
|  | 21 | pmd_t *pmd; | 
|  | 22 | pte_t *pte; | 
|  | 23 |  | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 24 | pgd = pgd_offset(mm, proc); | 
|  | 25 | pud = pud_alloc(mm, pgd, proc); | 
|  | 26 | if (!pud) | 
|  | 27 | goto out; | 
|  | 28 |  | 
|  | 29 | pmd = pmd_alloc(mm, pud, proc); | 
|  | 30 | if (!pmd) | 
|  | 31 | goto out_pmd; | 
|  | 32 |  | 
|  | 33 | pte = pte_alloc_map(mm, pmd, proc); | 
|  | 34 | if (!pte) | 
|  | 35 | goto out_pte; | 
|  | 36 |  | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 37 | /* | 
|  | 38 | * There's an interaction between the skas0 stub pages, stack | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 39 | * randomization, and the BUG at the end of exit_mmap.  exit_mmap | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 40 | * checks that the number of page tables freed is the same as had | 
|  | 41 | * been allocated.  If the stack is on the last page table page, | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 42 | * then the stack pte page will be freed, and if not, it won't.  To | 
|  | 43 | * avoid having to know where the stack is, or if the process mapped | 
|  | 44 | * something at the top of its address space for some other reason, | 
|  | 45 | * we set TASK_SIZE to end at the start of the last page table. | 
|  | 46 | * This keeps exit_mmap off the last page, but introduces a leak | 
|  | 47 | * of that page.  So, we hang onto it here and free it in | 
|  | 48 | * destroy_context_skas. | 
|  | 49 | */ | 
|  | 50 |  | 
| Jeff Dike | 6c738ff | 2007-10-16 01:27:06 -0700 | [diff] [blame] | 51 | mm->context.last_page_table = pmd_page_vaddr(*pmd); | 
| Jeff Dike | 7ef9390 | 2005-09-03 15:57:52 -0700 | [diff] [blame] | 52 | #ifdef CONFIG_3_LEVEL_PGTABLES | 
| Jeff Dike | 6c738ff | 2007-10-16 01:27:06 -0700 | [diff] [blame] | 53 | mm->context.last_pmd = (unsigned long) __va(pud_val(*pud)); | 
| Jeff Dike | 7ef9390 | 2005-09-03 15:57:52 -0700 | [diff] [blame] | 54 | #endif | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 55 |  | 
|  | 56 | *pte = mk_pte(virt_to_page(kernel), __pgprot(_PAGE_PRESENT)); | 
| Paolo 'Blaisorblade' Giarrusso | 21c935e | 2006-10-11 01:21:32 -0700 | [diff] [blame] | 57 | *pte = pte_mkread(*pte); | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 58 | return 0; | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 59 |  | 
|  | 60 | out_pmd: | 
|  | 61 | pud_free(pud); | 
|  | 62 | out_pte: | 
|  | 63 | pmd_free(pmd); | 
|  | 64 | out: | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 65 | return -ENOMEM; | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 66 | } | 
|  | 67 |  | 
| Jeff Dike | 77bf440 | 2007-10-16 01:26:58 -0700 | [diff] [blame] | 68 | int init_new_context(struct task_struct *task, struct mm_struct *mm) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 69 | { | 
| Jeff Dike | 6c738ff | 2007-10-16 01:27:06 -0700 | [diff] [blame] | 70 | struct mm_context *from_mm = NULL; | 
|  | 71 | struct mm_context *to_mm = &mm->context; | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 72 | unsigned long stack = 0; | 
| Bodo Stroesser | 12919aa | 2006-01-18 17:42:39 -0800 | [diff] [blame] | 73 | int ret = -ENOMEM; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 74 |  | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 75 | if (skas_needs_stub) { | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 76 | stack = get_zeroed_page(GFP_KERNEL); | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 77 | if (stack == 0) | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 78 | goto out; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 79 |  | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 80 | /* | 
|  | 81 | * This zeros the entry that pgd_alloc didn't, needed since | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 82 | * we are about to reinitialize it, and want mm.nr_ptes to | 
|  | 83 | * be accurate. | 
|  | 84 | */ | 
|  | 85 | mm->pgd[USER_PTRS_PER_PGD] = __pgd(0); | 
|  | 86 |  | 
| Jeff Dike | 54ae36f | 2007-10-16 01:27:33 -0700 | [diff] [blame] | 87 | ret = init_stub_pte(mm, STUB_CODE, | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 88 | (unsigned long) &__syscall_stub_start); | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 89 | if (ret) | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 90 | goto out_free; | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 91 |  | 
| Jeff Dike | 54ae36f | 2007-10-16 01:27:33 -0700 | [diff] [blame] | 92 | ret = init_stub_pte(mm, STUB_DATA, stack); | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 93 | if (ret) | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 94 | goto out_free; | 
|  | 95 |  | 
|  | 96 | mm->nr_ptes--; | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 97 | } | 
| Bodo Stroesser | 858259c | 2005-11-07 00:58:55 -0800 | [diff] [blame] | 98 |  | 
|  | 99 | to_mm->id.stack = stack; | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 100 | if (current->mm != NULL && current->mm != &init_mm) | 
| Jeff Dike | 6c738ff | 2007-10-16 01:27:06 -0700 | [diff] [blame] | 101 | from_mm = ¤t->mm->context; | 
| Bodo Stroesser | 9786a8f | 2005-07-07 17:56:50 -0700 | [diff] [blame] | 102 |  | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 103 | if (proc_mm) { | 
| Bodo Stroesser | 12919aa | 2006-01-18 17:42:39 -0800 | [diff] [blame] | 104 | ret = new_mm(stack); | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 105 | if (ret < 0) { | 
|  | 106 | printk(KERN_ERR "init_new_context_skas - " | 
|  | 107 | "new_mm failed, errno = %d\n", ret); | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 108 | goto out_free; | 
|  | 109 | } | 
| Bodo Stroesser | 858259c | 2005-11-07 00:58:55 -0800 | [diff] [blame] | 110 | to_mm->id.u.mm_fd = ret; | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 111 | } | 
|  | 112 | else { | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 113 | if (from_mm) | 
| Bodo Stroesser | 858259c | 2005-11-07 00:58:55 -0800 | [diff] [blame] | 114 | to_mm->id.u.pid = copy_context_skas0(stack, | 
|  | 115 | from_mm->id.u.pid); | 
|  | 116 | else to_mm->id.u.pid = start_userspace(stack); | 
|  | 117 | } | 
|  | 118 |  | 
|  | 119 | ret = init_new_ldt(to_mm, from_mm); | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 120 | if (ret < 0) { | 
|  | 121 | printk(KERN_ERR "init_new_context_skas - init_ldt" | 
| Bodo Stroesser | 858259c | 2005-11-07 00:58:55 -0800 | [diff] [blame] | 122 | " failed, errno = %d\n", ret); | 
|  | 123 | goto out_free; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 124 | } | 
|  | 125 |  | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 126 | return 0; | 
|  | 127 |  | 
|  | 128 | out_free: | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 129 | if (to_mm->id.stack != 0) | 
| Bodo Stroesser | 858259c | 2005-11-07 00:58:55 -0800 | [diff] [blame] | 130 | free_page(to_mm->id.stack); | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 131 | out: | 
|  | 132 | return ret; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 133 | } | 
|  | 134 |  | 
| Jeff Dike | 77bf440 | 2007-10-16 01:26:58 -0700 | [diff] [blame] | 135 | void destroy_context(struct mm_struct *mm) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 136 | { | 
| Jeff Dike | 6c738ff | 2007-10-16 01:27:06 -0700 | [diff] [blame] | 137 | struct mm_context *mmu = &mm->context; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 138 |  | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 139 | if (proc_mm) | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 140 | os_close_file(mmu->id.u.mm_fd); | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 141 | else | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 142 | os_kill_ptraced_process(mmu->id.u.pid, 1); | 
| Bodo Stroesser | 8b51304 | 2005-09-03 15:57:49 -0700 | [diff] [blame] | 143 |  | 
| Jeff Dike | ba180fd | 2007-10-16 01:27:00 -0700 | [diff] [blame] | 144 | if (!proc_mm || !ptrace_faultinfo) { | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 145 | free_page(mmu->id.stack); | 
| Hugh Dickins | 4c21e2f | 2005-10-29 18:16:40 -0700 | [diff] [blame] | 146 | pte_lock_deinit(virt_to_page(mmu->last_page_table)); | 
| Jeff Dike | 7ef9390 | 2005-09-03 15:57:52 -0700 | [diff] [blame] | 147 | pte_free_kernel((pte_t *) mmu->last_page_table); | 
| Christoph Lameter | df849a1 | 2006-06-30 01:55:38 -0700 | [diff] [blame] | 148 | dec_zone_page_state(virt_to_page(mmu->last_page_table), NR_PAGETABLE); | 
| Jeff Dike | 7ef9390 | 2005-09-03 15:57:52 -0700 | [diff] [blame] | 149 | #ifdef CONFIG_3_LEVEL_PGTABLES | 
|  | 150 | pmd_free((pmd_t *) mmu->last_pmd); | 
|  | 151 | #endif | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 152 | } | 
| Jeff Dike | 28078e8 | 2007-10-16 01:27:08 -0700 | [diff] [blame] | 153 |  | 
|  | 154 | free_ldt(mmu); | 
| Jeff Dike | d67b569 | 2005-07-07 17:56:49 -0700 | [diff] [blame] | 155 | } |