blob: 77038d8e9bfd3da7a19140615bffea99a9745171 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001#ifndef _X86_64_PGTABLE_H
2#define _X86_64_PGTABLE_H
3
Randy Dunlap6df95fd2007-05-08 00:31:11 -07004#include <linux/const.h>
Vivek Goyal9d291e72007-05-02 19:27:06 +02005#ifndef __ASSEMBLY__
6
/*
 * This file contains the functions and defines necessary to modify and use
 * the x86-64 page table tree.
 */
11#include <asm/processor.h>
Jiri Slaby1977f032007-10-18 23:40:25 -070012#include <linux/bitops.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070013#include <linux/threads.h>
14#include <asm/pda.h>
15
16extern pud_t level3_kernel_pgt[512];
Linus Torvalds1da177e2005-04-16 15:20:36 -070017extern pud_t level3_ident_pgt[512];
18extern pmd_t level2_kernel_pgt[512];
19extern pgd_t init_level4_pgt[];
Linus Torvalds1da177e2005-04-16 15:20:36 -070020
Linus Torvaldse3ebadd2007-05-07 08:44:24 -070021#define swapper_pg_dir init_level4_pgt
Linus Torvalds1da177e2005-04-16 15:20:36 -070022
Linus Torvalds1da177e2005-04-16 15:20:36 -070023extern void paging_init(void);
24extern void clear_kernel_mapping(unsigned long addr, unsigned long size);
25
Linus Torvalds1da177e2005-04-16 15:20:36 -070026/*
27 * ZERO_PAGE is a global shared page that is always zero: used
28 * for zero-mapped memory areas etc..
29 */
30extern unsigned long empty_zero_page[PAGE_SIZE/sizeof(unsigned long)];
Linus Torvaldse3ebadd2007-05-07 08:44:24 -070031#define ZERO_PAGE(vaddr) (virt_to_page(empty_zero_page))
Linus Torvalds1da177e2005-04-16 15:20:36 -070032
Vivek Goyal9d291e72007-05-02 19:27:06 +020033#endif /* !__ASSEMBLY__ */
34
/*
 * PGDIR_SHIFT determines what a top-level page table entry can map:
 * 2^39 bytes (512 GiB) per entry, 512 entries per table.
 */
#define PGDIR_SHIFT	39
#define PTRS_PER_PGD	512

/*
 * 3rd level page: each PUD entry maps 2^30 bytes (1 GiB).
 */
#define PUD_SHIFT	30
#define PTRS_PER_PUD	512

/*
 * PMD_SHIFT determines the size of the area a middle-level
 * page table can map: 2^21 bytes (2 MiB) per entry.
 */
#define PMD_SHIFT	21
#define PTRS_PER_PMD	512

/*
 * entries per page directory level
 */
#define PTRS_PER_PTE	512
58
Vivek Goyal9d291e72007-05-02 19:27:06 +020059#ifndef __ASSEMBLY__
60
/*
 * Diagnostic helpers: print the source location, the address of the
 * offending entry and its raw value (as 16 hex digits) via printk().
 * The argument must be an lvalue because its address is taken.
 */
#define pte_ERROR(e) \
	printk("%s:%d: bad pte %p(%016lx).\n", __FILE__, __LINE__, &(e), pte_val(e))
#define pmd_ERROR(e) \
	printk("%s:%d: bad pmd %p(%016lx).\n", __FILE__, __LINE__, &(e), pmd_val(e))
#define pud_ERROR(e) \
	printk("%s:%d: bad pud %p(%016lx).\n", __FILE__, __LINE__, &(e), pud_val(e))
#define pgd_ERROR(e) \
	printk("%s:%d: bad pgd %p(%016lx).\n", __FILE__, __LINE__, &(e), pgd_val(e))
69
/* An entry is "none" when its raw value is zero. */
#define pgd_none(x)	(!pgd_val(x))
#define pud_none(x)	(!pud_val(x))
72
73static inline void set_pte(pte_t *dst, pte_t val)
74{
Jeremy Fitzhardingec8e53932008-01-30 13:32:57 +010075 *dst = val;
Linus Torvalds1da177e2005-04-16 15:20:36 -070076}
77#define set_pte_at(mm,addr,ptep,pteval) set_pte(ptep,pteval)
78
79static inline void set_pmd(pmd_t *dst, pmd_t val)
80{
Ingo Molnar7a2389b2008-01-30 13:32:42 +010081 *dst = val;
Linus Torvalds1da177e2005-04-16 15:20:36 -070082}
83
84static inline void set_pud(pud_t *dst, pud_t val)
85{
Ingo Molnar7a2389b2008-01-30 13:32:42 +010086 *dst = val;
Linus Torvalds1da177e2005-04-16 15:20:36 -070087}
88
Adrian Bunk9c0aa0f2005-09-12 18:49:24 +020089static inline void pud_clear (pud_t *pud)
Linus Torvalds1da177e2005-04-16 15:20:36 -070090{
91 set_pud(pud, __pud(0));
92}
93
94static inline void set_pgd(pgd_t *dst, pgd_t val)
95{
Ingo Molnar7a2389b2008-01-30 13:32:42 +010096 *dst = val;
Linus Torvalds1da177e2005-04-16 15:20:36 -070097}
98
Adrian Bunk9c0aa0f2005-09-12 18:49:24 +020099static inline void pgd_clear (pgd_t * pgd)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100{
101 set_pgd(pgd, __pgd(0));
102}
103
/*
 * Swap the raw value of *xp with 0 using xchg() and return the previous
 * contents as a pte_t.  The mm and addr arguments are ignored.
 */
#define ptep_get_and_clear(mm, addr, xp)	__pte(xchg(&(xp)->pte, 0))
Zachary Amsden61e06032005-09-03 15:55:06 -0700105
Tim Schmielau8c65b4a2005-11-07 00:59:43 -0800106struct mm_struct;
107
Zachary Amsden61e06032005-09-03 15:55:06 -0700108static inline pte_t ptep_get_and_clear_full(struct mm_struct *mm, unsigned long addr, pte_t *ptep, int full)
109{
110 pte_t pte;
111 if (full) {
112 pte = *ptep;
113 *ptep = __pte(0);
114 } else {
115 pte = ptep_get_and_clear(mm, addr, ptep);
116 }
117 return pte;
118}
119
/* Two ptes are the same when their raw values are equal. */
#define pte_same(a, b)	((a).pte == (b).pte)

/* Everything in the pte outside PHYSICAL_PAGE_MASK, as a pgprot_t. */
#define pte_pgprot(a)	(__pgprot((a).pte & ~PHYSICAL_PAGE_MASK))
123
Vivek Goyal9d291e72007-05-02 19:27:06 +0200124#endif /* !__ASSEMBLY__ */
125
/*
 * Byte size covered by one entry at each level, and the mask that rounds
 * an address down to that boundary.  _AC() keeps the constants usable
 * from assembly as well as C.
 */
#define PMD_SIZE	(_AC(1,UL) << PMD_SHIFT)
#define PMD_MASK	(~(PMD_SIZE-1))
#define PUD_SIZE	(_AC(1,UL) << PUD_SHIFT)
#define PUD_MASK	(~(PUD_SIZE-1))
#define PGDIR_SIZE	(_AC(1,UL) << PGDIR_SHIFT)
#define PGDIR_MASK	(~(PGDIR_SIZE-1))
132
Linus Torvalds1da177e2005-04-16 15:20:36 -0700133
/*
 * Fixed address-space layout constants.
 *
 * MAXMEM is 2^46 - 1.  VMALLOC_END is the last byte of the vmalloc range
 * and VMEMMAP_START is the byte immediately after it.  MODULES_LEN is the
 * size of the [MODULES_VADDR, MODULES_END) range.
 */
#define MAXMEM		_AC(0x3fffffffffff, UL)
#define VMALLOC_START	_AC(0xffffc20000000000, UL)
#define VMALLOC_END	_AC(0xffffe1ffffffffff, UL)
#define VMEMMAP_START	_AC(0xffffe20000000000, UL)
#define MODULES_VADDR	_AC(0xffffffff88000000, UL)
#define MODULES_END	_AC(0xfffffffffff00000, UL)
#define MODULES_LEN	(MODULES_END - MODULES_VADDR)
141
Vivek Goyal9d291e72007-05-02 19:27:06 +0200142#ifndef __ASSEMBLY__
143
Jan Beulicheab724e2006-12-07 02:14:09 +0100144static inline unsigned long pgd_bad(pgd_t pgd)
145{
146 return pgd_val(pgd) & ~(PTE_MASK | _KERNPG_TABLE | _PAGE_USER);
147}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700148
149static inline unsigned long pud_bad(pud_t pud)
150{
Jan Beulicheab724e2006-12-07 02:14:09 +0100151 return pud_val(pud) & ~(PTE_MASK | _KERNPG_TABLE | _PAGE_USER);
152}
153
154static inline unsigned long pmd_bad(pmd_t pmd)
155{
156 return pmd_val(pmd) & ~(PTE_MASK | _KERNPG_TABLE | _PAGE_USER);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700157}
158
/* A pte is "none" when its raw value is zero. */
#define pte_none(x)	(!pte_val(x))
/* Present means either _PAGE_PRESENT or _PAGE_PROTNONE is set. */
#define pte_present(x)	(pte_val(x) & (_PAGE_PRESENT | _PAGE_PROTNONE))
/* Write an all-zero pte into *xp through set_pte_at(). */
#define pte_clear(mm, addr, xp)	do { set_pte_at(mm, addr, xp, __pte(0)); } while (0)
162
/*
 * Convert a page count to whole megabytes.  One MB is 2^20 bytes and one
 * page is 2^PAGE_SHIFT bytes, so dividing by 2^(20 - PAGE_SHIFT) is the
 * exact conversion (rounded down).  Requires PAGE_SHIFT <= 20.
 */
#define pages_to_mb(x)	((x) >> (20-PAGE_SHIFT))
#define pte_page(x)	pfn_to_page(pte_pfn(x))
/* Page frame number: the pte masked by __PHYSICAL_MASK, shifted down. */
#define pte_pfn(x)	((pte_val(x) & __PHYSICAL_MASK) >> PAGE_SHIFT)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700166
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167struct vm_area_struct;
168
Linus Torvalds1da177e2005-04-16 15:20:36 -0700169static inline int ptep_test_and_clear_young(struct vm_area_struct *vma, unsigned long addr, pte_t *ptep)
170{
171 if (!pte_young(*ptep))
172 return 0;
Akinobu Mita3d1712c2006-03-24 03:15:11 -0800173 return test_and_clear_bit(_PAGE_BIT_ACCESSED, &ptep->pte);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700174}
175
176static inline void ptep_set_wrprotect(struct mm_struct *mm, unsigned long addr, pte_t *ptep)
177{
Akinobu Mita3d1712c2006-03-24 03:15:11 -0800178 clear_bit(_PAGE_BIT_RW, &ptep->pte);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700179}
180
/*
 * Macro to mark a page protection value as "uncacheable": returns prot
 * with both _PAGE_PCD and _PAGE_PWT set.
 */
#define pgprot_noncached(prot)	(__pgprot(pgprot_val(prot) | _PAGE_PCD | _PAGE_PWT))
185
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186
/*
 * Conversion functions: convert a page and protection to a page entry,
 * and a page entry and page directory to the page they refer to.
 */

/*
 * Level 4 access.
 *
 * NOTE(review): pgd_page() shifts the raw entry without masking, unlike
 * pgd_page_vaddr(); it presumably relies on no bits above the physical
 * address being set in a PGD entry - confirm.
 */
#define pgd_page_vaddr(pgd)	((unsigned long) __va((unsigned long)pgd_val(pgd) & PTE_MASK))
#define pgd_page(pgd)		(pfn_to_page(pgd_val(pgd) >> PAGE_SHIFT))
#define pgd_index(address)	(((address) >> PGDIR_SHIFT) & (PTRS_PER_PGD-1))
#define pgd_offset(mm, addr)	((mm)->pgd + pgd_index(addr))
#define pgd_offset_k(address)	(init_level4_pgt + pgd_index(address))
#define pgd_present(pgd)	(pgd_val(pgd) & _PAGE_PRESENT)
#define mk_kernel_pgd(address)	((pgd_t){ (address) | _KERNPG_TABLE })
202
/* PUD - Level3 access */
/* to find an entry in a page-table-directory. */
#define pud_page_vaddr(pud)	((unsigned long) __va(pud_val(pud) & PHYSICAL_PAGE_MASK))
#define pud_page(pud)		(pfn_to_page(pud_val(pud) >> PAGE_SHIFT))
#define pud_index(address)	(((address) >> PUD_SHIFT) & (PTRS_PER_PUD-1))
/* Index into the PUD table that the PGD entry *pgd points at. */
#define pud_offset(pgd, address)	((pud_t *) pgd_page_vaddr(*(pgd)) + pud_index(address))
#define pud_present(pud)	(pud_val(pud) & _PAGE_PRESENT)
210
/* PMD - Level 2 access */
#define pmd_page_vaddr(pmd)	((unsigned long) __va(pmd_val(pmd) & PTE_MASK))
#define pmd_page(pmd)		(pfn_to_page(pmd_val(pmd) >> PAGE_SHIFT))

#define pmd_index(address)	(((address) >> PMD_SHIFT) & (PTRS_PER_PMD-1))
/* Index into the PMD table that the PUD entry *dir points at. */
#define pmd_offset(dir, address)	((pmd_t *) pud_page_vaddr(*(dir)) + \
					 pmd_index(address))
#define pmd_none(x)	(!pmd_val(x))
#define pmd_present(x)	(pmd_val(x) & _PAGE_PRESENT)
#define pmd_clear(xp)	do { set_pmd(xp, __pmd(0)); } while (0)
/*
 * Build a PMD entry from a page frame number and protection bits.  The pfn
 * is widened to unsigned long before shifting so that a 32-bit argument
 * cannot overflow for frames at or above 4 GiB.
 */
#define pfn_pmd(nr, prot)	(__pmd(((unsigned long)(nr) << PAGE_SHIFT) | pgprot_val(prot)))
#define pmd_pfn(x)	((pmd_val(x) & __PHYSICAL_MASK) >> PAGE_SHIFT)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223
/*
 * File-offset ptes: the page offset is stored shifted up by PAGE_SHIFT
 * with _PAGE_FILE set, and recovered by masking with PHYSICAL_PAGE_MASK.
 * The offset is widened to unsigned long before shifting so a narrower
 * argument cannot overflow.
 */
#define pte_to_pgoff(pte)	((pte_val(pte) & PHYSICAL_PAGE_MASK) >> PAGE_SHIFT)
#define pgoff_to_pte(off)	((pte_t) { .pte = ((unsigned long)(off) << PAGE_SHIFT) | _PAGE_FILE })
#define PTE_FILE_MAX_BITS	__PHYSICAL_MASK_SHIFT
227
/* PTE - Level 1 access. */

/* page, protection -> pte */
#define mk_pte(page, pgprot)	pfn_pte(page_to_pfn(page), (pgprot))

#define pte_index(address) \
	(((address) >> PAGE_SHIFT) & (PTRS_PER_PTE - 1))
/* Index into the pte table that the PMD entry *dir points at. */
#define pte_offset_kernel(dir, address)	((pte_t *) pmd_page_vaddr(*(dir)) + \
					 pte_index(address))
237
/* x86-64 always has all page tables mapped. */
#define pte_offset_map(dir, address)		pte_offset_kernel(dir, address)
#define pte_offset_map_nested(dir, address)	pte_offset_kernel(dir, address)
/*
 * Nothing to undo.  The argument is still evaluated as a void expression so
 * the macros are usable wherever an expression is expected and callers do
 * not get "unused variable" warnings.
 */
#define pte_unmap(pte)		((void)(pte))	/* NOP */
#define pte_unmap_nested(pte)	((void)(pte))	/* NOP */
243
/* No-op here: expands to an empty statement and ignores its arguments. */
#define update_mmu_cache(vma, address, pte)	do { } while (0)
245
/* We only update the dirty/accessed state if we set
 * the dirty bit by hand in the kernel, since the hardware
 * will do the accessed bit for us, and we don't want to
 * race with other CPU's that might be updating the dirty
 * bit at the same time.
 *
 * Evaluates to nonzero when *__ptep differs from __entry, whether or not
 * the entry was actually written.  The write and TLB flush happen only
 * when the entry differs AND __dirty is nonzero.  __dirty is parenthesized
 * so that compound expressions such as "a || b" are tested as a whole.
 */
#define __HAVE_ARCH_PTEP_SET_ACCESS_FLAGS
#define ptep_set_access_flags(__vma, __address, __ptep, __entry, __dirty) \
({									  \
	int __changed = !pte_same(*(__ptep), __entry);			  \
	if (__changed && (__dirty)) {					  \
		set_pte(__ptep, __entry);				  \
		flush_tlb_page(__vma, __address);			  \
	}								  \
	__changed;							  \
})
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261
/*
 * Encode and de-code a swap entry.
 *
 * Layout of swp_entry_t.val as used by these macros: the type occupies the
 * six bits starting at bit 1, the offset starts at bit 8.  Converting to
 * and from a pte copies the raw value unchanged.
 */
#define __swp_type(x)			(((x).val >> 1) & 0x3f)
#define __swp_offset(x)			((x).val >> 8)
#define __swp_entry(type, offset)	((swp_entry_t) { ((type) << 1) | ((offset) << 8) })
#define __pte_to_swp_entry(pte)		((swp_entry_t) { pte_val(pte) })
#define __swp_entry_to_pte(x)		((pte_t) { .pte = (x).val })
Linus Torvalds1da177e2005-04-16 15:20:36 -0700268
Jan Beulich8c914cb2006-03-25 16:29:40 +0100269extern spinlock_t pgd_lock;
Christoph Lameter2bff7382007-05-02 19:27:10 +0200270extern struct list_head pgd_list;
Jan Beulich8c914cb2006-03-25 16:29:40 +0100271
Linus Torvalds1da177e2005-04-16 15:20:36 -0700272extern int kern_addr_valid(unsigned long addr);
273
Andi Kleen19d36cc2007-07-22 11:12:31 +0200274pte_t *lookup_address(unsigned long addr);
275
/* I/O remapping needs no special handling here: same as remap_pfn_range(). */
#define io_remap_pfn_range(vma, vaddr, pfn, size, prot)	\
	remap_pfn_range(vma, vaddr, pfn, size, prot)
278
/* Feature flags announcing arch-specific unmapped-area lookup. */
#define HAVE_ARCH_UNMAPPED_AREA
#define HAVE_ARCH_UNMAPPED_AREA_TOPDOWN

/* Both hooks are empty statements here. */
#define pgtable_cache_init()	do { } while (0)
#define check_pgt_cache()	do { } while (0)

/* AGP mappings use the uncached kernel protection. */
#define PAGE_AGP	PAGE_KERNEL_NOCACHE
#define HAVE_PAGE_AGP	1
287
/*
 * fs/proc/kcore.c
 *
 * kc_vaddr_to_offset() keeps only the bits inside __VIRTUAL_MASK.
 * kc_offset_to_vaddr() is the inverse: when the top bit of the masked
 * range (bit __VIRTUAL_MASK_SHIFT - 1) is set, all bits above the mask are
 * set again; otherwise the offset is returned unchanged.
 */
#define kc_vaddr_to_offset(v)	((v) & __VIRTUAL_MASK)
#define kc_offset_to_vaddr(o) \
	(((o) & (1UL << (__VIRTUAL_MASK_SHIFT-1))) ? ((o) | (~__VIRTUAL_MASK)) : (o))
292
/*
 * Announce the helpers this header implements itself.  These are defined
 * before <asm-generic/pgtable.h> is included.
 */
#define __HAVE_ARCH_PTEP_TEST_AND_CLEAR_YOUNG
#define __HAVE_ARCH_PTEP_GET_AND_CLEAR
#define __HAVE_ARCH_PTEP_GET_AND_CLEAR_FULL
#define __HAVE_ARCH_PTEP_SET_WRPROTECT
#define __HAVE_ARCH_PTE_SAME
298#include <asm-generic/pgtable.h>
Vivek Goyal9d291e72007-05-02 19:27:06 +0200299#endif /* !__ASSEMBLY__ */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700300
301#endif /* _X86_64_PGTABLE_H */