]> bbs.cooldavid.org Git - net-next-2.6.git/blame - arch/x86/kernel/setup_percpu.c
percpu: give more latitude to arch specific first chunk initialization
[net-next-2.6.git] / arch / x86 / kernel / setup_percpu.c
CommitLineData
4fe29a85
GOC
1#include <linux/kernel.h>
2#include <linux/module.h>
3#include <linux/init.h>
4#include <linux/bootmem.h>
5#include <linux/percpu.h>
1ecd2765 6#include <linux/kexec.h>
17b4cceb 7#include <linux/crash_dump.h>
8a87dd9a
JSR
8#include <linux/smp.h>
9#include <linux/topology.h>
4fe29a85
GOC
10#include <asm/sections.h>
11#include <asm/processor.h>
12#include <asm/setup.h>
0fc0906e 13#include <asm/mpspec.h>
76eb4131 14#include <asm/apicdef.h>
1ecd2765 15#include <asm/highmem.h>
1a51e3a0 16#include <asm/proto.h>
06879033 17#include <asm/cpumask.h>
34019be1 18#include <asm/cpu.h>
60a5317f 19#include <asm/stackprotector.h>
76eb4131 20
c90aa894
MT
/*
 * DBG() - debug trace helper for the per-cpu setup code.
 *
 * Expands to a KERN_DEBUG printk() when CONFIG_DEBUG_PER_CPU_MAPS is set
 * and to nothing otherwise, so its arguments are not even compiled in
 * non-debug builds.
 */
#ifndef CONFIG_DEBUG_PER_CPU_MAPS
# define DBG(x...)
#else
# define DBG(x...) printk(KERN_DEBUG x)
#endif
26
ea927906
BG
27DEFINE_PER_CPU(int, cpu_number);
28EXPORT_PER_CPU_SYMBOL(cpu_number);
ea927906 29
1688401a
BG
30#ifdef CONFIG_X86_64
31#define BOOT_PERCPU_OFFSET ((unsigned long)__per_cpu_load)
32#else
33#define BOOT_PERCPU_OFFSET 0
34#endif
35
36DEFINE_PER_CPU(unsigned long, this_cpu_off) = BOOT_PERCPU_OFFSET;
37EXPORT_PER_CPU_SYMBOL(this_cpu_off);
38
9939ddaf 39unsigned long __per_cpu_offset[NR_CPUS] __read_mostly = {
34019be1 40 [0 ... NR_CPUS-1] = BOOT_PERCPU_OFFSET,
9939ddaf 41};
9939ddaf 42EXPORT_SYMBOL(__per_cpu_offset);
4fe29a85 43
8d408b4b
TH
44static struct page **pcpu4k_pages __initdata;
45static int pcpu4k_nr_static_pages __initdata;
46
47static struct page * __init pcpu4k_get_page(unsigned int cpu, int pageno)
48{
49 if (pageno < pcpu4k_nr_static_pages)
50 return pcpu4k_pages[cpu * pcpu4k_nr_static_pages + pageno];
51 return NULL;
52}
53
458a3e64
TH
54static void __init pcpu4k_populate_pte(unsigned long addr)
55{
56 populate_extra_pte(addr);
57}
58
b2d2f431
BG
/*
 * setup_percpu_segment - install the per-cpu segment descriptor for @cpu
 * @cpu: cpu whose GDT is updated
 *
 * On CONFIG_X86_32 this packs a descriptor whose base is the cpu's
 * per-cpu offset and writes it into the GDT_ENTRY_PERCPU slot of that
 * cpu's GDT.  On other configurations it does nothing.
 */
static inline void setup_percpu_segment(int cpu)
{
#ifdef CONFIG_X86_32
	struct desc_struct percpu_desc;
	unsigned long base = per_cpu_offset(cpu);

	/* limit 0xFFFFF, type 0x2 | DESCTYPE_S, flags 0x8 */
	pack_descriptor(&percpu_desc, base, 0xFFFFF, 0x2 | DESCTYPE_S, 0x8);
	percpu_desc.s = 1;

	write_gdt_entry(get_cpu_gdt_table(cpu), GDT_ENTRY_PERCPU,
			&percpu_desc, DESCTYPE_S);
#endif
}
71
4fe29a85
GOC
72/*
73 * Great future plan:
74 * Declare PDA itself and support (irqstack,tss,pgd) as per cpu data.
75 * Always point %gs to its beginning
76 */
77void __init setup_per_cpu_areas(void)
78{
11124411
TH
79 ssize_t size = __per_cpu_end - __per_cpu_start;
80 unsigned int nr_cpu_pages = DIV_ROUND_UP(size, PAGE_SIZE);
81 static struct page **pages;
82 size_t pages_size;
83 unsigned int cpu, i, j;
84 unsigned long delta;
85 size_t pcpu_unit_size;
a1681965 86
ab14398a 87 pr_info("NR_CPUS:%d nr_cpumask_bits:%d nr_cpu_ids:%d nr_node_ids:%d\n",
a1681965 88 NR_CPUS, nr_cpumask_bits, nr_cpu_ids, nr_node_ids);
11124411 89 pr_info("PERCPU: Allocating %zd bytes for static per cpu data\n", size);
a1681965 90
11124411
TH
91 pages_size = nr_cpu_pages * num_possible_cpus() * sizeof(pages[0]);
92 pages = alloc_bootmem(pages_size);
b447a468 93
11124411 94 j = 0;
3461b0af 95 for_each_possible_cpu(cpu) {
11124411
TH
96 void *ptr;
97
98 for (i = 0; i < nr_cpu_pages; i++) {
4fe29a85 99#ifndef CONFIG_NEED_MULTIPLE_NODES
11124411 100 ptr = alloc_bootmem_pages(PAGE_SIZE);
4fe29a85 101#else
11124411
TH
102 int node = early_cpu_to_node(cpu);
103
104 if (!node_online(node) || !NODE_DATA(node)) {
105 ptr = alloc_bootmem_pages(PAGE_SIZE);
106 pr_info("cpu %d has no node %d or node-local "
107 "memory\n", cpu, node);
108 pr_debug("per cpu data for cpu%d at %016lx\n",
109 cpu, __pa(ptr));
110 } else {
111 ptr = alloc_bootmem_pages_node(NODE_DATA(node),
112 PAGE_SIZE);
113 pr_debug("per cpu data for cpu%d on node%d "
114 "at %016lx\n", cpu, node, __pa(ptr));
115 }
4fe29a85 116#endif
11124411
TH
117 memcpy(ptr, __per_cpu_load + i * PAGE_SIZE, PAGE_SIZE);
118 pages[j++] = virt_to_page(ptr);
119 }
120 }
121
8d408b4b
TH
122 pcpu4k_pages = pages;
123 pcpu4k_nr_static_pages = nr_cpu_pages;
124 pcpu_unit_size = pcpu_setup_first_chunk(pcpu4k_get_page, size, 0, 0,
125 NULL, pcpu4k_populate_pte);
1a51e3a0 126
11124411
TH
127 free_bootmem(__pa(pages), pages_size);
128
129 delta = (unsigned long)pcpu_base_addr - (unsigned long)__per_cpu_start;
130 for_each_possible_cpu(cpu) {
131 per_cpu_offset(cpu) = delta + cpu * pcpu_unit_size;
26f80bd6 132 per_cpu(this_cpu_off, cpu) = per_cpu_offset(cpu);
ea927906 133 per_cpu(cpu_number, cpu) = cpu;
b2d2f431 134 setup_percpu_segment(cpu);
60a5317f 135 setup_stack_canary_segment(cpu);
0d77e7f0 136 /*
cf3997f5
TH
137 * Copy data used in early init routines from the
138 * initial arrays to the per cpu data areas. These
139 * arrays then become expendable and the *_early_ptr's
140 * are zeroed indicating that the static arrays are
141 * gone.
0d77e7f0 142 */
ec70de8b 143#ifdef CONFIG_X86_LOCAL_APIC
0d77e7f0 144 per_cpu(x86_cpu_to_apicid, cpu) =
cf3997f5 145 early_per_cpu_map(x86_cpu_to_apicid, cpu);
0d77e7f0 146 per_cpu(x86_bios_cpu_apicid, cpu) =
cf3997f5 147 early_per_cpu_map(x86_bios_cpu_apicid, cpu);
ec70de8b 148#endif
1a51e3a0 149#ifdef CONFIG_X86_64
26f80bd6 150 per_cpu(irq_stack_ptr, cpu) =
cf3997f5
TH
151 per_cpu(irq_stack_union.irq_stack, cpu) +
152 IRQ_STACK_SIZE - 64;
6470aff6
BG
153#ifdef CONFIG_NUMA
154 per_cpu(x86_cpu_to_node_map, cpu) =
cf3997f5 155 early_per_cpu_map(x86_cpu_to_node_map, cpu);
2697fbd5 156#endif
6470aff6 157#endif
1a51e3a0 158 /*
34019be1 159 * Up to this point, the boot CPU has been using .data.init
2697fbd5 160 * area. Reload any changed state for the boot CPU.
1a51e3a0 161 */
34019be1 162 if (cpu == boot_cpu_id)
552be871 163 switch_to_new_gdt(cpu);
c90aa894
MT
164
165 DBG("PERCPU: cpu %4d %p\n", cpu, ptr);
4fe29a85
GOC
166 }
167
0d77e7f0 168 /* indicate the early static arrays will soon be gone */
22f25138 169#ifdef CONFIG_X86_LOCAL_APIC
0d77e7f0
BG
170 early_per_cpu_ptr(x86_cpu_to_apicid) = NULL;
171 early_per_cpu_ptr(x86_bios_cpu_apicid) = NULL;
22f25138 172#endif
6470aff6 173#if defined(CONFIG_X86_64) && defined(CONFIG_NUMA)
0d77e7f0
BG
174 early_per_cpu_ptr(x86_cpu_to_node_map) = NULL;
175#endif
9f0e8d04 176
9f248bde
MT
177 /* Setup node to cpumask map */
178 setup_node_to_cpumask_map();
c2d1cec1
MT
179
180 /* Setup cpu initialized, callin, callout masks */
181 setup_cpu_local_masks();
4fe29a85 182}