blob: 52715a71aede013ecc3151338986e8417b134be0 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
4 * for more details.
5 *
6 * Copyright (C) 1998-2003 Hewlett-Packard Co
7 * David Mosberger-Tang <davidm@hpl.hp.com>
8 * Stephane Eranian <eranian@hpl.hp.com>
9 * Copyright (C) 2000, Rohit Seth <rohit.seth@intel.com>
10 * Copyright (C) 1999 VA Linux Systems
11 * Copyright (C) 1999 Walt Drummond <drummond@valinux.com>
12 * Copyright (C) 2003 Silicon Graphics, Inc. All rights reserved.
13 *
14 * Routines used by ia64 machines with contiguous (or virtually contiguous)
15 * memory.
16 */
Linus Torvalds1da177e2005-04-16 15:20:36 -070017#include <linux/bootmem.h>
18#include <linux/efi.h>
Tejun Heo98e4ae82011-12-08 10:22:08 -080019#include <linux/memblock.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070020#include <linux/mm.h>
Prarit Bhargava99a19cf2007-08-22 14:34:38 -040021#include <linux/nmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070022#include <linux/swap.h>
23
24#include <asm/meminit.h>
25#include <asm/pgalloc.h>
26#include <asm/pgtable.h>
27#include <asm/sections.h>
28#include <asm/mca.h>
29
30#ifdef CONFIG_VIRTUAL_MEM_MAP
Bob Piccoe44e41d2006-06-28 12:55:43 -040031static unsigned long max_gap;
Linus Torvalds1da177e2005-04-16 15:20:36 -070032#endif
33
Linus Torvalds1da177e2005-04-16 15:20:36 -070034/* physical address where the bootmem map is located */
35unsigned long bootmap_start;
36
37/**
Linus Torvalds1da177e2005-04-16 15:20:36 -070038 * find_bootmap_location - callback to find a memory area for the bootmap
39 * @start: start of region
40 * @end: end of region
41 * @arg: unused callback data
42 *
43 * Find a place to put the bootmap and return its starting address in
44 * bootmap_start. This address must be page-aligned.
45 */
Chen, Kenneth Wdae28062006-03-22 16:54:15 -080046static int __init
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -070047find_bootmap_location (u64 start, u64 end, void *arg)
Linus Torvalds1da177e2005-04-16 15:20:36 -070048{
Matthew Wilcoxe088a4a2009-05-22 13:49:49 -070049 u64 needed = *(unsigned long *)arg;
50 u64 range_start, range_end, free_start;
Linus Torvalds1da177e2005-04-16 15:20:36 -070051 int i;
52
53#if IGNORE_PFN0
54 if (start == PAGE_OFFSET) {
55 start += PAGE_SIZE;
56 if (start >= end)
57 return 0;
58 }
59#endif
60
61 free_start = PAGE_OFFSET;
62
63 for (i = 0; i < num_rsvd_regions; i++) {
64 range_start = max(start, free_start);
65 range_end = min(end, rsvd_region[i].start & PAGE_MASK);
66
67 free_start = PAGE_ALIGN(rsvd_region[i].end);
68
69 if (range_end <= range_start)
70 continue; /* skip over empty range */
71
72 if (range_end - range_start >= needed) {
73 bootmap_start = __pa(range_start);
74 return -1; /* done */
75 }
76
77 /* nothing more available in this segment */
78 if (range_end == end)
79 return 0;
80 }
81 return 0;
82}
83
Tony Luck4b9ddc72007-11-06 15:14:45 -080084#ifdef CONFIG_SMP
85static void *cpu_data;
86/**
87 * per_cpu_init - setup per-cpu variables
88 *
89 * Allocate and setup per-cpu data areas.
90 */
Paul Gortmakerccce9bb2013-06-17 15:51:20 -040091void *per_cpu_init(void)
Tony Luck4b9ddc72007-11-06 15:14:45 -080092{
Tejun Heo36886472009-10-02 13:28:56 +090093 static bool first_time = true;
94 void *cpu0_data = __cpu0_per_cpu;
95 unsigned int cpu;
96
97 if (!first_time)
98 goto skip;
99 first_time = false;
Tony Luck4b9ddc72007-11-06 15:14:45 -0800100
101 /*
Tejun Heo525947622009-10-02 13:28:56 +0900102 * get_free_pages() cannot be used before cpu_init() done.
103 * BSP allocates PERCPU_PAGE_SIZE bytes for all possible CPUs
104 * to avoid that AP calls get_zeroed_page().
Tony Luck4b9ddc72007-11-06 15:14:45 -0800105 */
Tejun Heo525947622009-10-02 13:28:56 +0900106 for_each_possible_cpu(cpu) {
Tejun Heo36886472009-10-02 13:28:56 +0900107 void *src = cpu == 0 ? cpu0_data : __phys_per_cpu_start;
Tony Luck10617bb2008-08-12 10:34:20 -0700108
Tejun Heo36886472009-10-02 13:28:56 +0900109 memcpy(cpu_data, src, __per_cpu_end - __per_cpu_start);
110 __per_cpu_offset[cpu] = (char *)cpu_data - __per_cpu_start;
111 per_cpu(local_per_cpu_offset, cpu) = __per_cpu_offset[cpu];
Tony Luck10617bb2008-08-12 10:34:20 -0700112
Tejun Heo36886472009-10-02 13:28:56 +0900113 /*
114 * percpu area for cpu0 is moved from the __init area
115 * which is setup by head.S and used till this point.
116 * Update ar.k3. This move is ensures that percpu
117 * area for cpu0 is on the correct node and its
118 * virtual address isn't insanely far from other
119 * percpu areas which is important for congruent
120 * percpu allocator.
121 */
122 if (cpu == 0)
123 ia64_set_kr(IA64_KR_PER_CPU_DATA, __pa(cpu_data) -
124 (unsigned long)__per_cpu_start);
Tony Luck10617bb2008-08-12 10:34:20 -0700125
Tejun Heo36886472009-10-02 13:28:56 +0900126 cpu_data += PERCPU_PAGE_SIZE;
Tony Luck4b9ddc72007-11-06 15:14:45 -0800127 }
Tejun Heo36886472009-10-02 13:28:56 +0900128skip:
Tony Luck4b9ddc72007-11-06 15:14:45 -0800129 return __per_cpu_start + __per_cpu_offset[smp_processor_id()];
130}
131
132static inline void
133alloc_per_cpu_data(void)
134{
Tejun Heo525947622009-10-02 13:28:56 +0900135 cpu_data = __alloc_bootmem(PERCPU_PAGE_SIZE * num_possible_cpus(),
Tony Luck4b9ddc72007-11-06 15:14:45 -0800136 PERCPU_PAGE_SIZE, __pa(MAX_DMA_ADDRESS));
137}
Tejun Heo525947622009-10-02 13:28:56 +0900138
139/**
140 * setup_per_cpu_areas - setup percpu areas
141 *
142 * Arch code has already allocated and initialized percpu areas. All
143 * this function has to do is to teach the determined layout to the
144 * dynamic percpu allocator, which happens to be more complex than
145 * creating whole new ones using helpers.
146 */
147void __init
148setup_per_cpu_areas(void)
149{
150 struct pcpu_alloc_info *ai;
151 struct pcpu_group_info *gi;
152 unsigned int cpu;
153 ssize_t static_size, reserved_size, dyn_size;
154 int rc;
155
156 ai = pcpu_alloc_alloc_info(1, num_possible_cpus());
157 if (!ai)
158 panic("failed to allocate pcpu_alloc_info");
159 gi = &ai->groups[0];
160
161 /* units are assigned consecutively to possible cpus */
162 for_each_possible_cpu(cpu)
163 gi->cpu_map[gi->nr_units++] = cpu;
164
165 /* set parameters */
166 static_size = __per_cpu_end - __per_cpu_start;
167 reserved_size = PERCPU_MODULE_RESERVE;
168 dyn_size = PERCPU_PAGE_SIZE - static_size - reserved_size;
169 if (dyn_size < 0)
170 panic("percpu area overflow static=%zd reserved=%zd\n",
171 static_size, reserved_size);
172
173 ai->static_size = static_size;
174 ai->reserved_size = reserved_size;
175 ai->dyn_size = dyn_size;
176 ai->unit_size = PERCPU_PAGE_SIZE;
177 ai->atom_size = PAGE_SIZE;
178 ai->alloc_size = PERCPU_PAGE_SIZE;
179
180 rc = pcpu_setup_first_chunk(ai, __per_cpu_start + __per_cpu_offset[0]);
181 if (rc)
182 panic("failed to setup percpu area (err=%d)", rc);
183
184 pcpu_free_alloc_info(ai);
185}
Tony Luck4b9ddc72007-11-06 15:14:45 -0800186#else
187#define alloc_per_cpu_data() do { } while (0)
188#endif /* CONFIG_SMP */
189
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190/**
191 * find_memory - setup memory map
192 *
193 * Walk the EFI memory map and find usable memory for the system, taking
194 * into account reserved areas.
195 */
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800196void __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197find_memory (void)
198{
199 unsigned long bootmap_size;
200
201 reserve_memory();
202
203 /* first find highest page frame number */
Zou Nan haia3f5c332007-03-20 13:41:57 -0700204 min_low_pfn = ~0UL;
205 max_low_pfn = 0;
206 efi_memmap_walk(find_max_min_low_pfn, NULL);
207 max_pfn = max_low_pfn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700208 /* how many bytes to cover all the pages */
209 bootmap_size = bootmem_bootmap_pages(max_pfn) << PAGE_SHIFT;
210
211 /* look for a location to hold the bootmap */
212 bootmap_start = ~0UL;
213 efi_memmap_walk(find_bootmap_location, &bootmap_size);
214 if (bootmap_start == ~0UL)
215 panic("Cannot find %ld bytes for bootmap\n", bootmap_size);
216
Zou Nan haia3f5c332007-03-20 13:41:57 -0700217 bootmap_size = init_bootmem_node(NODE_DATA(0),
218 (bootmap_start >> PAGE_SHIFT), 0, max_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700219
220 /* Free all available memory, then mark bootmem-map as being in use. */
221 efi_memmap_walk(filter_rsvd_memory, free_bootmem);
Bernhard Walle72a7fe32008-02-07 00:15:17 -0800222 reserve_bootmem(bootmap_start, bootmap_size, BOOTMEM_DEFAULT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223
224 find_initrd();
Horms45a98fc2006-12-12 17:49:03 +0900225
Tony Luck4b9ddc72007-11-06 15:14:45 -0800226 alloc_per_cpu_data();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700227}
228
Linus Torvalds1da177e2005-04-16 15:20:36 -0700229/*
230 * Set up the page tables.
231 */
232
Chen, Kenneth Wdae28062006-03-22 16:54:15 -0800233void __init
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234paging_init (void)
235{
236 unsigned long max_dma;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700237 unsigned long max_zone_pfns[MAX_NR_ZONES];
Linus Torvalds1da177e2005-04-16 15:20:36 -0700238
Mel Gorman6391af12006-10-11 01:20:39 -0700239 memset(max_zone_pfns, 0, sizeof(max_zone_pfns));
Christoph Lameter09ae1f52007-02-10 01:43:11 -0800240#ifdef CONFIG_ZONE_DMA
241 max_dma = virt_to_phys((void *) MAX_DMA_ADDRESS) >> PAGE_SHIFT;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700242 max_zone_pfns[ZONE_DMA] = max_dma;
Christoph Lameter09ae1f52007-02-10 01:43:11 -0800243#endif
Mel Gorman05e0caa2006-09-27 01:49:54 -0700244 max_zone_pfns[ZONE_NORMAL] = max_low_pfn;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700245
246#ifdef CONFIG_VIRTUAL_MEM_MAP
Zoltan Menyhart98075d22008-04-11 15:21:35 -0700247 efi_memmap_walk(filter_memory, register_active_ranges);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700248 efi_memmap_walk(find_largest_hole, (u64 *)&max_gap);
249 if (max_gap < LARGE_GAP) {
250 vmem_map = (struct page *) 0;
Mel Gorman05e0caa2006-09-27 01:49:54 -0700251 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700252 } else {
253 unsigned long map_size;
254
255 /* allocate virtual_mem_map */
256
Bob Picco921eea12006-06-28 12:54:55 -0400257 map_size = PAGE_ALIGN(ALIGN(max_low_pfn, MAX_ORDER_NR_PAGES) *
258 sizeof(struct page));
Tejun Heo126b3fc2009-10-02 13:28:55 +0900259 VMALLOC_END -= map_size;
260 vmem_map = (struct page *) VMALLOC_END;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700261 efi_memmap_walk(create_mem_map_page_table, NULL);
262
Mel Gorman05e0caa2006-09-27 01:49:54 -0700263 /*
264 * alloc_node_mem_map makes an adjustment for mem_map
265 * which isn't compatible with vmem_map.
266 */
267 NODE_DATA(0)->node_mem_map = vmem_map +
268 find_min_pfn_with_active_regions();
269 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700270
271 printk("Virtual mem_map starts at 0x%p\n", mem_map);
272 }
273#else /* !CONFIG_VIRTUAL_MEM_MAP */
Tejun Heo98e4ae82011-12-08 10:22:08 -0800274 memblock_add_node(0, PFN_PHYS(max_low_pfn), 0);
Mel Gorman05e0caa2006-09-27 01:49:54 -0700275 free_area_init_nodes(max_zone_pfns);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276#endif /* !CONFIG_VIRTUAL_MEM_MAP */
277 zero_page_memmap_ptr = virt_to_page(ia64_imva(empty_zero_page));
278}