/*
 * Copyright IBM Corp. 2006
 * Author(s): Heiko Carstens <heiko.carstens@de.ibm.com>
 */

#include <linux/bootmem.h>
#include <linux/pfn.h>
#include <linux/mm.h>
#include <linux/module.h>
#include <linux/list.h>
#include <linux/hugetlb.h>
#include <linux/slab.h>
#include <asm/pgalloc.h>
#include <asm/pgtable.h>
#include <asm/setup.h>
#include <asm/tlbflush.h>
#include <asm/sections.h>

static DEFINE_MUTEX(vmem_mutex);

struct memory_segment {
	struct list_head list;
	unsigned long start;
	unsigned long size;
};

static LIST_HEAD(mem_segs);

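/*
 * Allocate pages for page tables: from the buddy allocator once the
 * slab allocator is up, from bootmem during early boot. Marked __ref
 * because the bootmem call is an __init function; that path is only
 * taken before slab_is_available() returns true.
 */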
static void __ref *vmem_alloc_pages(unsigned int order)
{
	if (slab_is_available())
		return (void *)__get_free_pages(GFP_KERNEL, order);
	return alloc_bootmem_pages((1 << order) * PAGE_SIZE);
}

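/*
 * On 64 bit the pud and pmd levels are backed by region-third and
 * segment tables of four pages each, hence the order-2 allocations
 * and the PAGE_SIZE * 4 clears below. On 31 bit the upper levels are
 * folded and NULL is returned.
 */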
static inline pud_t *vmem_pud_alloc(void)
{
	pud_t *pud = NULL;

#ifdef CONFIG_64BIT
	pud = vmem_alloc_pages(2);
	if (!pud)
		return NULL;
	clear_table((unsigned long *) pud, _REGION3_ENTRY_EMPTY, PAGE_SIZE * 4);
#endif
	return pud;
}

static inline pmd_t *vmem_pmd_alloc(void)
{
	pmd_t *pmd = NULL;

#ifdef CONFIG_64BIT
	pmd = vmem_alloc_pages(2);
	if (!pmd)
		return NULL;
	clear_table((unsigned long *) pmd, _SEGMENT_ENTRY_EMPTY, PAGE_SIZE * 4);
#endif
	return pmd;
}

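/*
 * Page tables come from the per-mm page table allocator once the slab
 * is up, from bootmem before that. Either way the new table is filled
 * with invalid (empty) entries.
 */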
static pte_t __ref *vmem_pte_alloc(unsigned long address)
{
	pte_t *pte;

	if (slab_is_available())
		pte = (pte_t *) page_table_alloc(&init_mm, address);
	else
		pte = alloc_bootmem(PTRS_PER_PTE * sizeof(pte_t));
	if (!pte)
		return NULL;
	clear_table((unsigned long *) pte, _PAGE_TYPE_EMPTY,
		    PTRS_PER_PTE * sizeof(pte_t));
	return pte;
}

/*
 * Add a physical memory range to the 1:1 mapping.
 */
static int vmem_add_mem(unsigned long start, unsigned long size, int ro)
{
	unsigned long end = start + size;
	unsigned long address = start;
	pgd_t *pg_dir;
	pud_t *pu_dir;
	pmd_t *pm_dir;
	pte_t *pt_dir;
	pte_t pte;
	int ret = -ENOMEM;

	while (address < end) {
		pte = mk_pte_phys(address, __pgprot(ro ? _PAGE_RO : 0));
		pg_dir = pgd_offset_k(address);
		if (pgd_none(*pg_dir)) {
			pu_dir = vmem_pud_alloc();
			if (!pu_dir)
				goto out;
			pgd_populate(&init_mm, pg_dir, pu_dir);
		}
		pu_dir = pud_offset(pg_dir, address);
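		/*
		 * Map a PUD_SIZE (2 GB) chunk with a single large
		 * region-third entry if the machine has EDAT2 and
		 * alignment and remaining size allow it. Not done with
		 * DEBUG_PAGEALLOC, which needs 4 KB mappings so that
		 * individual pages can be invalidated.
		 */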
#if defined(CONFIG_64BIT) && !defined(CONFIG_DEBUG_PAGEALLOC)
		if (MACHINE_HAS_EDAT2 && pud_none(*pu_dir) && address &&
		    !(address & ~PUD_MASK) && (address + PUD_SIZE <= end)) {
			pte_val(pte) |= _REGION3_ENTRY_LARGE;
			pte_val(pte) |= _REGION_ENTRY_TYPE_R3;
			pud_val(*pu_dir) = pte_val(pte);
			address += PUD_SIZE;
			continue;
		}
#endif
		if (pud_none(*pu_dir)) {
			pm_dir = vmem_pmd_alloc();
			if (!pm_dir)
				goto out;
			pud_populate(&init_mm, pu_dir, pm_dir);
		}
		pm_dir = pmd_offset(pu_dir, address);
#if defined(CONFIG_64BIT) && !defined(CONFIG_DEBUG_PAGEALLOC)
		if (MACHINE_HAS_EDAT1 && pmd_none(*pm_dir) && address &&
		    !(address & ~PMD_MASK) && (address + PMD_SIZE <= end)) {
			pte_val(pte) |= _SEGMENT_ENTRY_LARGE;
			pmd_val(*pm_dir) = pte_val(pte);
			address += PMD_SIZE;
			continue;
		}
#endif
		if (pmd_none(*pm_dir)) {
			pt_dir = vmem_pte_alloc(address);
			if (!pt_dir)
				goto out;
			pmd_populate(&init_mm, pm_dir, pt_dir);
		}

		pt_dir = pte_offset_kernel(pm_dir, address);
		*pt_dir = pte;
		address += PAGE_SIZE;
	}
	ret = 0;
out:
	flush_tlb_kernel_range(start, end);
	return ret;
}

/*
 * Remove a physical memory range from the 1:1 mapping.
 * Currently only invalidates page table entries.
 */
static void vmem_remove_range(unsigned long start, unsigned long size)
{
	unsigned long end = start + size;
	unsigned long address = start;
	pgd_t *pg_dir;
	pud_t *pu_dir;
	pmd_t *pm_dir;
	pte_t *pt_dir;
	pte_t pte;

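	/*
	 * Walk the range and invalidate whatever is mapped: large pud
	 * and pmd entries are cleared in one step, everything else pte
	 * by pte. The page tables themselves are not freed.
	 */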
	pte_val(pte) = _PAGE_TYPE_EMPTY;
	while (address < end) {
		pg_dir = pgd_offset_k(address);
		if (pgd_none(*pg_dir)) {
			address += PGDIR_SIZE;
			continue;
		}
		pu_dir = pud_offset(pg_dir, address);
		if (pud_none(*pu_dir)) {
			address += PUD_SIZE;
			continue;
		}
		if (pud_large(*pu_dir)) {
			pud_clear(pu_dir);
			address += PUD_SIZE;
			continue;
		}
		pm_dir = pmd_offset(pu_dir, address);
		if (pmd_none(*pm_dir)) {
			address += PMD_SIZE;
			continue;
		}
		if (pmd_large(*pm_dir)) {
			pmd_clear(pm_dir);
			address += PMD_SIZE;
			continue;
		}
		pt_dir = pte_offset_kernel(pm_dir, address);
		*pt_dir = pte;
		address += PAGE_SIZE;
	}
	flush_tlb_kernel_range(start, end);
}

/*
 * Add a backed mem_map array to the virtual mem_map array.
 */
int __meminit vmemmap_populate(struct page *start, unsigned long nr, int node)
{
	unsigned long address, start_addr, end_addr;
	pgd_t *pg_dir;
	pud_t *pu_dir;
	pmd_t *pm_dir;
	pte_t *pt_dir;
	pte_t pte;
	int ret = -ENOMEM;

	start_addr = (unsigned long) start;
	end_addr = (unsigned long) (start + nr);

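	/*
	 * Walk the affected part of the virtual mem_map in 4 KB steps,
	 * creating missing table levels with the same helpers as the
	 * 1:1 mapping.
	 */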
	for (address = start_addr; address < end_addr; address += PAGE_SIZE) {
		pg_dir = pgd_offset_k(address);
		if (pgd_none(*pg_dir)) {
			pu_dir = vmem_pud_alloc();
			if (!pu_dir)
				goto out;
			pgd_populate(&init_mm, pg_dir, pu_dir);
		}

		pu_dir = pud_offset(pg_dir, address);
		if (pud_none(*pu_dir)) {
			pm_dir = vmem_pmd_alloc();
			if (!pm_dir)
				goto out;
			pud_populate(&init_mm, pu_dir, pm_dir);
		}

		pm_dir = pmd_offset(pu_dir, address);
		if (pmd_none(*pm_dir)) {
			pt_dir = vmem_pte_alloc(address);
			if (!pt_dir)
				goto out;
			pmd_populate(&init_mm, pm_dir, pt_dir);
		}

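		/* Back not yet mapped mem_map pages with real memory. */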
		pt_dir = pte_offset_kernel(pm_dir, address);
		if (pte_none(*pt_dir)) {
			unsigned long new_page;

			new_page = __pa(vmem_alloc_pages(0));
			if (!new_page)
				goto out;
			pte = pfn_pte(new_page >> PAGE_SHIFT, PAGE_KERNEL);
			*pt_dir = pte;
		}
	}
	memset(start, 0, nr * sizeof(struct page));
	ret = 0;
out:
	flush_tlb_kernel_range(start_addr, end_addr);
	return ret;
}

/*
 * Add memory segment to the segment list if it doesn't overlap with
 * an already present segment.
 */
static int insert_memory_segment(struct memory_segment *seg)
{
	struct memory_segment *tmp;

	if (seg->start + seg->size > VMEM_MAX_PHYS ||
	    seg->start + seg->size < seg->start)
		return -ERANGE;

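	/*
	 * Two segments overlap unless one of them ends at or before
	 * the start of the other.
	 */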
	list_for_each_entry(tmp, &mem_segs, list) {
		if (seg->start >= tmp->start + tmp->size)
			continue;
		if (seg->start + seg->size <= tmp->start)
			continue;
		return -ENOSPC;
	}
	list_add(&seg->list, &mem_segs);
	return 0;
}

/*
 * Remove memory segment from the segment list.
 */
static void remove_memory_segment(struct memory_segment *seg)
{
	list_del(&seg->list);
}

static void __remove_shared_memory(struct memory_segment *seg)
{
	remove_memory_segment(seg);
	vmem_remove_range(seg->start, seg->size);
}

int vmem_remove_mapping(unsigned long start, unsigned long size)
{
	struct memory_segment *seg;
	int ret;

	mutex_lock(&vmem_mutex);

	ret = -ENOENT;
	list_for_each_entry(seg, &mem_segs, list) {
		if (seg->start == start && seg->size == size)
			break;
	}

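	/*
	 * If the loop ran off the end of the list, seg does not point
	 * at a real segment; the re-check below catches that case.
	 */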
	if (seg->start != start || seg->size != size)
		goto out;

	ret = 0;
	__remove_shared_memory(seg);
	kfree(seg);
out:
	mutex_unlock(&vmem_mutex);
	return ret;
}

int vmem_add_mapping(unsigned long start, unsigned long size)
{
	struct memory_segment *seg;
	int ret;

	mutex_lock(&vmem_mutex);
	ret = -ENOMEM;
	seg = kzalloc(sizeof(*seg), GFP_KERNEL);
	if (!seg)
		goto out;
	seg->start = start;
	seg->size = size;

	ret = insert_memory_segment(seg);
	if (ret)
		goto out_free;

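	/* Create the 1:1 mapping; undo the bookkeeping if that fails. */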
	ret = vmem_add_mem(start, size, 0);
	if (ret)
		goto out_remove;
	goto out;

out_remove:
	__remove_shared_memory(seg);
out_free:
	kfree(seg);
out:
	mutex_unlock(&vmem_mutex);
	return ret;
}

/*
 * Map the whole physical memory into virtual memory (identity mapping).
 * Enough space is reserved in the vmalloc area for the vmemmap so that
 * additional memory segments can be hotplugged later.
 */
void __init vmem_map_init(void)
{
	unsigned long ro_start, ro_end;
	unsigned long start, end;
	int i;

	ro_start = PFN_ALIGN((unsigned long)&_stext);
	ro_end = (unsigned long)&_eshared & PAGE_MASK;
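	/*
	 * Everything between _stext and _eshared is mapped read-only;
	 * each memory chunk is split around that range as needed.
	 */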
	for (i = 0; i < MEMORY_CHUNKS && memory_chunk[i].size > 0; i++) {
		if (memory_chunk[i].type == CHUNK_CRASHK ||
		    memory_chunk[i].type == CHUNK_OLDMEM)
			continue;
		start = memory_chunk[i].addr;
		end = memory_chunk[i].addr + memory_chunk[i].size;
		if (start >= ro_end || end <= ro_start)
			vmem_add_mem(start, end - start, 0);
		else if (start >= ro_start && end <= ro_end)
			vmem_add_mem(start, end - start, 1);
		else if (start >= ro_start) {
			vmem_add_mem(start, ro_end - start, 1);
			vmem_add_mem(ro_end, end - ro_end, 0);
		} else if (end < ro_end) {
			vmem_add_mem(start, ro_start - start, 0);
			vmem_add_mem(ro_start, end - ro_start, 1);
		} else {
			vmem_add_mem(start, ro_start - start, 0);
			vmem_add_mem(ro_start, ro_end - ro_start, 1);
			vmem_add_mem(ro_end, end - ro_end, 0);
		}
	}
}

/*
 * Convert memory chunk array to a memory segment list so there is a single
 * list that contains both r/w memory and shared memory segments.
 */
static int __init vmem_convert_memory_chunk(void)
{
	struct memory_segment *seg;
	int i;

	mutex_lock(&vmem_mutex);
	for (i = 0; i < MEMORY_CHUNKS; i++) {
		if (!memory_chunk[i].size)
			continue;
		if (memory_chunk[i].type == CHUNK_CRASHK ||
		    memory_chunk[i].type == CHUNK_OLDMEM)
			continue;
		seg = kzalloc(sizeof(*seg), GFP_KERNEL);
		if (!seg)
			panic("Out of memory...\n");
		seg->start = memory_chunk[i].addr;
		seg->size = memory_chunk[i].size;
		insert_memory_segment(seg);
	}
	mutex_unlock(&vmem_mutex);
	return 0;
}

core_initcall(vmem_convert_memory_chunk);