Commit | Line | Data |
---|---|---|
f4eb07c1 | 1 | /* |
f4eb07c1 HC |
2 | * Copyright IBM Corp. 2006 |
3 | * Author(s): Heiko Carstens <heiko.carstens@de.ibm.com> | |
4 | */ | |
5 | ||
6 | #include <linux/bootmem.h> | |
7 | #include <linux/pfn.h> | |
8 | #include <linux/mm.h> | |
9 | #include <linux/module.h> | |
10 | #include <linux/list.h> | |
53492b1d | 11 | #include <linux/hugetlb.h> |
5a0e3ad6 | 12 | #include <linux/slab.h> |
50be6345 | 13 | #include <linux/memblock.h> |
f4eb07c1 HC |
14 | #include <asm/pgalloc.h> |
15 | #include <asm/pgtable.h> | |
16 | #include <asm/setup.h> | |
17 | #include <asm/tlbflush.h> | |
53492b1d | 18 | #include <asm/sections.h> |
f4eb07c1 | 19 | |
f4eb07c1 HC |
20 | static DEFINE_MUTEX(vmem_mutex); |
21 | ||
22 | struct memory_segment { | |
23 | struct list_head list; | |
24 | unsigned long start; | |
25 | unsigned long size; | |
26 | }; | |
27 | ||
28 | static LIST_HEAD(mem_segs); | |
29 | ||
67060d9c HC |
30 | static void __ref *vmem_alloc_pages(unsigned int order) |
31 | { | |
32 | if (slab_is_available()) | |
33 | return (void *)__get_free_pages(GFP_KERNEL, order); | |
34 | return alloc_bootmem_pages((1 << order) * PAGE_SIZE); | |
35 | } | |
36 | ||
37 | static inline pud_t *vmem_pud_alloc(void) | |
5a216a20 MS |
38 | { |
39 | pud_t *pud = NULL; | |
40 | ||
67060d9c | 41 | pud = vmem_alloc_pages(2); |
5a216a20 MS |
42 | if (!pud) |
43 | return NULL; | |
8fc63658 | 44 | clear_table((unsigned long *) pud, _REGION3_ENTRY_EMPTY, PAGE_SIZE * 4); |
5a216a20 MS |
45 | return pud; |
46 | } | |
190a1d72 | 47 | |
67060d9c | 48 | static inline pmd_t *vmem_pmd_alloc(void) |
f4eb07c1 | 49 | { |
3610cce8 | 50 | pmd_t *pmd = NULL; |
f4eb07c1 | 51 | |
67060d9c | 52 | pmd = vmem_alloc_pages(2); |
f4eb07c1 HC |
53 | if (!pmd) |
54 | return NULL; | |
8fc63658 | 55 | clear_table((unsigned long *) pmd, _SEGMENT_ENTRY_EMPTY, PAGE_SIZE * 4); |
f4eb07c1 HC |
56 | return pmd; |
57 | } | |
58 | ||
e5992f2e | 59 | static pte_t __ref *vmem_pte_alloc(unsigned long address) |
f4eb07c1 | 60 | { |
146e4b3c | 61 | pte_t *pte; |
f4eb07c1 | 62 | |
146e4b3c | 63 | if (slab_is_available()) |
527e30b4 | 64 | pte = (pte_t *) page_table_alloc(&init_mm); |
146e4b3c | 65 | else |
50be6345 PH |
66 | pte = alloc_bootmem_align(PTRS_PER_PTE * sizeof(pte_t), |
67 | PTRS_PER_PTE * sizeof(pte_t)); | |
f4eb07c1 HC |
68 | if (!pte) |
69 | return NULL; | |
e5098611 | 70 | clear_table((unsigned long *) pte, _PAGE_INVALID, |
6af7eea2 | 71 | PTRS_PER_PTE * sizeof(pte_t)); |
f4eb07c1 HC |
72 | return pte; |
73 | } | |
74 | ||
75 | /* | |
76 | * Add a physical memory range to the 1:1 mapping. | |
77 | */ | |
17f34580 | 78 | static int vmem_add_mem(unsigned long start, unsigned long size, int ro) |
f4eb07c1 | 79 | { |
378b1e7a HC |
80 | unsigned long end = start + size; |
81 | unsigned long address = start; | |
f4eb07c1 | 82 | pgd_t *pg_dir; |
190a1d72 | 83 | pud_t *pu_dir; |
f4eb07c1 HC |
84 | pmd_t *pm_dir; |
85 | pte_t *pt_dir; | |
f4eb07c1 HC |
86 | int ret = -ENOMEM; |
87 | ||
378b1e7a | 88 | while (address < end) { |
f4eb07c1 HC |
89 | pg_dir = pgd_offset_k(address); |
90 | if (pgd_none(*pg_dir)) { | |
190a1d72 MS |
91 | pu_dir = vmem_pud_alloc(); |
92 | if (!pu_dir) | |
93 | goto out; | |
b2fa47e6 | 94 | pgd_populate(&init_mm, pg_dir, pu_dir); |
190a1d72 | 95 | } |
190a1d72 | 96 | pu_dir = pud_offset(pg_dir, address); |
18da2369 | 97 | if (MACHINE_HAS_EDAT2 && pud_none(*pu_dir) && address && |
10917b83 CB |
98 | !(address & ~PUD_MASK) && (address + PUD_SIZE <= end) && |
99 | !debug_pagealloc_enabled()) { | |
abf09bed MS |
100 | pud_val(*pu_dir) = __pa(address) | |
101 | _REGION_ENTRY_TYPE_R3 | _REGION3_ENTRY_LARGE | | |
e5098611 | 102 | (ro ? _REGION_ENTRY_PROTECT : 0); |
18da2369 HC |
103 | address += PUD_SIZE; |
104 | continue; | |
105 | } | |
190a1d72 | 106 | if (pud_none(*pu_dir)) { |
f4eb07c1 HC |
107 | pm_dir = vmem_pmd_alloc(); |
108 | if (!pm_dir) | |
109 | goto out; | |
b2fa47e6 | 110 | pud_populate(&init_mm, pu_dir, pm_dir); |
f4eb07c1 | 111 | } |
190a1d72 | 112 | pm_dir = pmd_offset(pu_dir, address); |
fc7e48aa | 113 | if (MACHINE_HAS_EDAT1 && pmd_none(*pm_dir) && address && |
10917b83 CB |
114 | !(address & ~PMD_MASK) && (address + PMD_SIZE <= end) && |
115 | !debug_pagealloc_enabled()) { | |
abf09bed MS |
116 | pmd_val(*pm_dir) = __pa(address) | |
117 | _SEGMENT_ENTRY | _SEGMENT_ENTRY_LARGE | | |
0944fe3f | 118 | _SEGMENT_ENTRY_YOUNG | |
e5098611 | 119 | (ro ? _SEGMENT_ENTRY_PROTECT : 0); |
378b1e7a | 120 | address += PMD_SIZE; |
53492b1d GS |
121 | continue; |
122 | } | |
f4eb07c1 | 123 | if (pmd_none(*pm_dir)) { |
e5992f2e | 124 | pt_dir = vmem_pte_alloc(address); |
f4eb07c1 HC |
125 | if (!pt_dir) |
126 | goto out; | |
b2fa47e6 | 127 | pmd_populate(&init_mm, pm_dir, pt_dir); |
f4eb07c1 HC |
128 | } |
129 | ||
130 | pt_dir = pte_offset_kernel(pm_dir, address); | |
e5098611 MS |
131 | pte_val(*pt_dir) = __pa(address) | |
132 | pgprot_val(ro ? PAGE_KERNEL_RO : PAGE_KERNEL); | |
378b1e7a | 133 | address += PAGE_SIZE; |
f4eb07c1 HC |
134 | } |
135 | ret = 0; | |
136 | out: | |
f4eb07c1 HC |
137 | return ret; |
138 | } | |
139 | ||
140 | /* | |
141 | * Remove a physical memory range from the 1:1 mapping. | |
142 | * Currently only invalidates page table entries. | |
143 | */ | |
144 | static void vmem_remove_range(unsigned long start, unsigned long size) | |
145 | { | |
378b1e7a HC |
146 | unsigned long end = start + size; |
147 | unsigned long address = start; | |
f4eb07c1 | 148 | pgd_t *pg_dir; |
190a1d72 | 149 | pud_t *pu_dir; |
f4eb07c1 HC |
150 | pmd_t *pm_dir; |
151 | pte_t *pt_dir; | |
152 | pte_t pte; | |
153 | ||
e5098611 | 154 | pte_val(pte) = _PAGE_INVALID; |
378b1e7a | 155 | while (address < end) { |
f4eb07c1 | 156 | pg_dir = pgd_offset_k(address); |
fc7e48aa HC |
157 | if (pgd_none(*pg_dir)) { |
158 | address += PGDIR_SIZE; | |
159 | continue; | |
160 | } | |
190a1d72 | 161 | pu_dir = pud_offset(pg_dir, address); |
fc7e48aa HC |
162 | if (pud_none(*pu_dir)) { |
163 | address += PUD_SIZE; | |
f4eb07c1 | 164 | continue; |
fc7e48aa | 165 | } |
18da2369 HC |
166 | if (pud_large(*pu_dir)) { |
167 | pud_clear(pu_dir); | |
168 | address += PUD_SIZE; | |
169 | continue; | |
170 | } | |
190a1d72 | 171 | pm_dir = pmd_offset(pu_dir, address); |
fc7e48aa HC |
172 | if (pmd_none(*pm_dir)) { |
173 | address += PMD_SIZE; | |
f4eb07c1 | 174 | continue; |
fc7e48aa | 175 | } |
378b1e7a | 176 | if (pmd_large(*pm_dir)) { |
b2fa47e6 | 177 | pmd_clear(pm_dir); |
378b1e7a | 178 | address += PMD_SIZE; |
53492b1d GS |
179 | continue; |
180 | } | |
f4eb07c1 | 181 | pt_dir = pte_offset_kernel(pm_dir, address); |
c1821c2e | 182 | *pt_dir = pte; |
378b1e7a | 183 | address += PAGE_SIZE; |
f4eb07c1 | 184 | } |
378b1e7a | 185 | flush_tlb_kernel_range(start, end); |
f4eb07c1 HC |
186 | } |
187 | ||
188 | /* | |
189 | * Add a backed mem_map array to the virtual mem_map array. | |
190 | */ | |
0aad818b | 191 | int __meminit vmemmap_populate(unsigned long start, unsigned long end, int node) |
f4eb07c1 | 192 | { |
0aad818b | 193 | unsigned long address = start; |
f4eb07c1 | 194 | pgd_t *pg_dir; |
190a1d72 | 195 | pud_t *pu_dir; |
f4eb07c1 HC |
196 | pmd_t *pm_dir; |
197 | pte_t *pt_dir; | |
f4eb07c1 HC |
198 | int ret = -ENOMEM; |
199 | ||
0aad818b | 200 | for (address = start; address < end;) { |
f4eb07c1 HC |
201 | pg_dir = pgd_offset_k(address); |
202 | if (pgd_none(*pg_dir)) { | |
190a1d72 MS |
203 | pu_dir = vmem_pud_alloc(); |
204 | if (!pu_dir) | |
205 | goto out; | |
b2fa47e6 | 206 | pgd_populate(&init_mm, pg_dir, pu_dir); |
190a1d72 MS |
207 | } |
208 | ||
209 | pu_dir = pud_offset(pg_dir, address); | |
210 | if (pud_none(*pu_dir)) { | |
f4eb07c1 HC |
211 | pm_dir = vmem_pmd_alloc(); |
212 | if (!pm_dir) | |
213 | goto out; | |
b2fa47e6 | 214 | pud_populate(&init_mm, pu_dir, pm_dir); |
f4eb07c1 HC |
215 | } |
216 | ||
190a1d72 | 217 | pm_dir = pmd_offset(pu_dir, address); |
f4eb07c1 | 218 | if (pmd_none(*pm_dir)) { |
f7817968 HC |
219 | /* Use 1MB frames for vmemmap if available. We always |
220 | * use large frames even if they are only partially | |
221 | * used. | |
222 | * Otherwise we would have also page tables since | |
223 | * vmemmap_populate gets called for each section | |
224 | * separately. */ | |
225 | if (MACHINE_HAS_EDAT1) { | |
226 | void *new_page; | |
227 | ||
228 | new_page = vmemmap_alloc_block(PMD_SIZE, node); | |
229 | if (!new_page) | |
230 | goto out; | |
abf09bed | 231 | pmd_val(*pm_dir) = __pa(new_page) | |
6a5c1482 | 232 | _SEGMENT_ENTRY | _SEGMENT_ENTRY_LARGE; |
f7817968 HC |
233 | address = (address + PMD_SIZE) & PMD_MASK; |
234 | continue; | |
235 | } | |
e5992f2e | 236 | pt_dir = vmem_pte_alloc(address); |
f4eb07c1 HC |
237 | if (!pt_dir) |
238 | goto out; | |
b2fa47e6 | 239 | pmd_populate(&init_mm, pm_dir, pt_dir); |
f7817968 HC |
240 | } else if (pmd_large(*pm_dir)) { |
241 | address = (address + PMD_SIZE) & PMD_MASK; | |
242 | continue; | |
f4eb07c1 HC |
243 | } |
244 | ||
245 | pt_dir = pte_offset_kernel(pm_dir, address); | |
246 | if (pte_none(*pt_dir)) { | |
70c9d296 | 247 | void *new_page; |
f4eb07c1 | 248 | |
70c9d296 | 249 | new_page = vmemmap_alloc_block(PAGE_SIZE, node); |
f4eb07c1 HC |
250 | if (!new_page) |
251 | goto out; | |
e5098611 MS |
252 | pte_val(*pt_dir) = |
253 | __pa(new_page) | pgprot_val(PAGE_KERNEL); | |
f4eb07c1 | 254 | } |
f7817968 | 255 | address += PAGE_SIZE; |
f4eb07c1 HC |
256 | } |
257 | ret = 0; | |
258 | out: | |
f4eb07c1 HC |
259 | return ret; |
260 | } | |
261 | ||
/*
 * No-op: this implementation does not release anything for the range
 * [start, end).
 */
void vmemmap_free(unsigned long start, unsigned long end)
{
}
265 | ||
f4eb07c1 HC |
266 | /* |
267 | * Add memory segment to the segment list if it doesn't overlap with | |
268 | * an already present segment. | |
269 | */ | |
270 | static int insert_memory_segment(struct memory_segment *seg) | |
271 | { | |
272 | struct memory_segment *tmp; | |
273 | ||
ee0ddadd | 274 | if (seg->start + seg->size > VMEM_MAX_PHYS || |
f4eb07c1 HC |
275 | seg->start + seg->size < seg->start) |
276 | return -ERANGE; | |
277 | ||
278 | list_for_each_entry(tmp, &mem_segs, list) { | |
279 | if (seg->start >= tmp->start + tmp->size) | |
280 | continue; | |
281 | if (seg->start + seg->size <= tmp->start) | |
282 | continue; | |
283 | return -ENOSPC; | |
284 | } | |
285 | list_add(&seg->list, &mem_segs); | |
286 | return 0; | |
287 | } | |
288 | ||
289 | /* | |
290 | * Remove memory segment from the segment list. | |
291 | */ | |
292 | static void remove_memory_segment(struct memory_segment *seg) | |
293 | { | |
294 | list_del(&seg->list); | |
295 | } | |
296 | ||
297 | static void __remove_shared_memory(struct memory_segment *seg) | |
298 | { | |
299 | remove_memory_segment(seg); | |
300 | vmem_remove_range(seg->start, seg->size); | |
301 | } | |
302 | ||
17f34580 | 303 | int vmem_remove_mapping(unsigned long start, unsigned long size) |
f4eb07c1 HC |
304 | { |
305 | struct memory_segment *seg; | |
306 | int ret; | |
307 | ||
308 | mutex_lock(&vmem_mutex); | |
309 | ||
310 | ret = -ENOENT; | |
311 | list_for_each_entry(seg, &mem_segs, list) { | |
312 | if (seg->start == start && seg->size == size) | |
313 | break; | |
314 | } | |
315 | ||
316 | if (seg->start != start || seg->size != size) | |
317 | goto out; | |
318 | ||
319 | ret = 0; | |
320 | __remove_shared_memory(seg); | |
321 | kfree(seg); | |
322 | out: | |
323 | mutex_unlock(&vmem_mutex); | |
324 | return ret; | |
325 | } | |
326 | ||
17f34580 | 327 | int vmem_add_mapping(unsigned long start, unsigned long size) |
f4eb07c1 HC |
328 | { |
329 | struct memory_segment *seg; | |
f4eb07c1 HC |
330 | int ret; |
331 | ||
332 | mutex_lock(&vmem_mutex); | |
333 | ret = -ENOMEM; | |
334 | seg = kzalloc(sizeof(*seg), GFP_KERNEL); | |
335 | if (!seg) | |
336 | goto out; | |
337 | seg->start = start; | |
338 | seg->size = size; | |
339 | ||
340 | ret = insert_memory_segment(seg); | |
341 | if (ret) | |
342 | goto out_free; | |
343 | ||
53492b1d | 344 | ret = vmem_add_mem(start, size, 0); |
f4eb07c1 HC |
345 | if (ret) |
346 | goto out_remove; | |
f4eb07c1 HC |
347 | goto out; |
348 | ||
349 | out_remove: | |
350 | __remove_shared_memory(seg); | |
351 | out_free: | |
352 | kfree(seg); | |
353 | out: | |
354 | mutex_unlock(&vmem_mutex); | |
355 | return ret; | |
356 | } | |
357 | ||
358 | /* | |
359 | * map whole physical memory to virtual memory (identity mapping) | |
5fd9c6e2 CB |
360 | * we reserve enough space in the vmalloc area for vmemmap to hotplug |
361 | * additional memory segments. | |
f4eb07c1 HC |
362 | */ |
363 | void __init vmem_map_init(void) | |
364 | { | |
53492b1d | 365 | unsigned long ro_start, ro_end; |
50be6345 PH |
366 | struct memblock_region *reg; |
367 | phys_addr_t start, end; | |
f4eb07c1 | 368 | |
8fe234d3 HC |
369 | ro_start = PFN_ALIGN((unsigned long)&_stext); |
370 | ro_end = (unsigned long)&_eshared & PAGE_MASK; | |
50be6345 PH |
371 | for_each_memblock(memory, reg) { |
372 | start = reg->base; | |
373 | end = reg->base + reg->size - 1; | |
53492b1d GS |
374 | if (start >= ro_end || end <= ro_start) |
375 | vmem_add_mem(start, end - start, 0); | |
376 | else if (start >= ro_start && end <= ro_end) | |
377 | vmem_add_mem(start, end - start, 1); | |
378 | else if (start >= ro_start) { | |
379 | vmem_add_mem(start, ro_end - start, 1); | |
380 | vmem_add_mem(ro_end, end - ro_end, 0); | |
381 | } else if (end < ro_end) { | |
382 | vmem_add_mem(start, ro_start - start, 0); | |
383 | vmem_add_mem(ro_start, end - ro_start, 1); | |
384 | } else { | |
385 | vmem_add_mem(start, ro_start - start, 0); | |
386 | vmem_add_mem(ro_start, ro_end - ro_start, 1); | |
387 | vmem_add_mem(ro_end, end - ro_end, 0); | |
388 | } | |
389 | } | |
f4eb07c1 HC |
390 | } |
391 | ||
392 | /* | |
50be6345 PH |
393 | * Convert memblock.memory to a memory segment list so there is a single |
394 | * list that contains all memory segments. | |
f4eb07c1 HC |
395 | */ |
396 | static int __init vmem_convert_memory_chunk(void) | |
397 | { | |
50be6345 | 398 | struct memblock_region *reg; |
f4eb07c1 | 399 | struct memory_segment *seg; |
f4eb07c1 HC |
400 | |
401 | mutex_lock(&vmem_mutex); | |
50be6345 | 402 | for_each_memblock(memory, reg) { |
f4eb07c1 HC |
403 | seg = kzalloc(sizeof(*seg), GFP_KERNEL); |
404 | if (!seg) | |
405 | panic("Out of memory...\n"); | |
50be6345 PH |
406 | seg->start = reg->base; |
407 | seg->size = reg->size; | |
f4eb07c1 HC |
408 | insert_memory_segment(seg); |
409 | } | |
410 | mutex_unlock(&vmem_mutex); | |
411 | return 0; | |
412 | } | |
413 | ||
414 | core_initcall(vmem_convert_memory_chunk); |