blob: 0856ad444f90d8baf232af5903b3f7fb46143474 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/arch/x86-64/kernel/setup.c
3 *
4 * Copyright (C) 1995 Linus Torvalds
5 *
6 * Nov 2001 Dave Jones <davej@suse.de>
7 * Forked from i386 setup code.
8 *
9 * $Id$
10 */
11
12/*
13 * This file handles the architecture-dependent parts of initialization
14 */
15
16#include <linux/errno.h>
17#include <linux/sched.h>
18#include <linux/kernel.h>
19#include <linux/mm.h>
20#include <linux/stddef.h>
21#include <linux/unistd.h>
22#include <linux/ptrace.h>
23#include <linux/slab.h>
24#include <linux/user.h>
25#include <linux/a.out.h>
26#include <linux/tty.h>
27#include <linux/ioport.h>
28#include <linux/delay.h>
29#include <linux/config.h>
30#include <linux/init.h>
31#include <linux/initrd.h>
32#include <linux/highmem.h>
33#include <linux/bootmem.h>
34#include <linux/module.h>
35#include <asm/processor.h>
36#include <linux/console.h>
37#include <linux/seq_file.h>
Vivek Goyalaac04b32006-01-09 20:51:47 -080038#include <linux/crash_dump.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070039#include <linux/root_dev.h>
40#include <linux/pci.h>
41#include <linux/acpi.h>
42#include <linux/kallsyms.h>
43#include <linux/edd.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070044#include <linux/mmzone.h>
Eric W. Biederman5f5609d2005-06-25 14:58:04 -070045#include <linux/kexec.h>
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -080046#include <linux/cpufreq.h>
Andi Kleene9928672006-01-11 22:43:33 +010047#include <linux/dmi.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010048#include <linux/dma-mapping.h>
Andi Kleen681558f2006-03-25 16:29:46 +010049#include <linux/ctype.h>
Matt Tolentinobbfceef2005-06-23 00:08:07 -070050
Linus Torvalds1da177e2005-04-16 15:20:36 -070051#include <asm/mtrr.h>
52#include <asm/uaccess.h>
53#include <asm/system.h>
54#include <asm/io.h>
55#include <asm/smp.h>
56#include <asm/msr.h>
57#include <asm/desc.h>
58#include <video/edid.h>
59#include <asm/e820.h>
60#include <asm/dma.h>
61#include <asm/mpspec.h>
62#include <asm/mmu_context.h>
63#include <asm/bootsetup.h>
64#include <asm/proto.h>
65#include <asm/setup.h>
66#include <asm/mach_apic.h>
67#include <asm/numa.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010068#include <asm/swiotlb.h>
Andi Kleen2bc04142005-11-05 17:25:53 +010069#include <asm/sections.h>
Muli Ben-Yehuda17a941d2006-01-11 22:44:42 +010070#include <asm/gart-mapping.h>
Andi Kleenf2d3efe2006-03-25 16:30:22 +010071#include <asm/dmi.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070072
73/*
74 * Machine setup..
75 */
76
Ravikiran G Thirumalai6c231b72005-09-06 15:17:45 -070077struct cpuinfo_x86 boot_cpu_data __read_mostly;
Linus Torvalds1da177e2005-04-16 15:20:36 -070078
79unsigned long mmu_cr4_features;
80
81int acpi_disabled;
82EXPORT_SYMBOL(acpi_disabled);
Len Brown888ba6c2005-08-24 12:07:20 -040083#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -070084extern int __initdata acpi_ht;
85extern acpi_interrupt_flags acpi_sci_flags;
86int __initdata acpi_force = 0;
87#endif
88
89int acpi_numa __initdata;
90
Linus Torvalds1da177e2005-04-16 15:20:36 -070091/* Boot loader ID as an integer, for the benefit of proc_dointvec */
92int bootloader_type;
93
94unsigned long saved_video_mode;
95
Andi Kleenf2d3efe2006-03-25 16:30:22 +010096/*
97 * Early DMI memory
98 */
99int dmi_alloc_index;
100char dmi_alloc_data[DMI_MAX_DATA];
101
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102/*
103 * Setup options
104 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700105struct screen_info screen_info;
106struct sys_desc_table_struct {
107 unsigned short length;
108 unsigned char table[0];
109};
110
111struct edid_info edid_info;
112struct e820map e820;
113
114extern int root_mountflags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700115
116char command_line[COMMAND_LINE_SIZE];
117
118struct resource standard_io_resources[] = {
119 { .name = "dma1", .start = 0x00, .end = 0x1f,
120 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
121 { .name = "pic1", .start = 0x20, .end = 0x21,
122 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
123 { .name = "timer0", .start = 0x40, .end = 0x43,
124 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
125 { .name = "timer1", .start = 0x50, .end = 0x53,
126 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
127 { .name = "keyboard", .start = 0x60, .end = 0x6f,
128 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
129 { .name = "dma page reg", .start = 0x80, .end = 0x8f,
130 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
131 { .name = "pic2", .start = 0xa0, .end = 0xa1,
132 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
133 { .name = "dma2", .start = 0xc0, .end = 0xdf,
134 .flags = IORESOURCE_BUSY | IORESOURCE_IO },
135 { .name = "fpu", .start = 0xf0, .end = 0xff,
136 .flags = IORESOURCE_BUSY | IORESOURCE_IO }
137};
138
139#define STANDARD_IO_RESOURCES \
140 (sizeof standard_io_resources / sizeof standard_io_resources[0])
141
142#define IORESOURCE_RAM (IORESOURCE_BUSY | IORESOURCE_MEM)
143
144struct resource data_resource = {
145 .name = "Kernel data",
146 .start = 0,
147 .end = 0,
148 .flags = IORESOURCE_RAM,
149};
150struct resource code_resource = {
151 .name = "Kernel code",
152 .start = 0,
153 .end = 0,
154 .flags = IORESOURCE_RAM,
155};
156
157#define IORESOURCE_ROM (IORESOURCE_BUSY | IORESOURCE_READONLY | IORESOURCE_MEM)
158
159static struct resource system_rom_resource = {
160 .name = "System ROM",
161 .start = 0xf0000,
162 .end = 0xfffff,
163 .flags = IORESOURCE_ROM,
164};
165
166static struct resource extension_rom_resource = {
167 .name = "Extension ROM",
168 .start = 0xe0000,
169 .end = 0xeffff,
170 .flags = IORESOURCE_ROM,
171};
172
173static struct resource adapter_rom_resources[] = {
174 { .name = "Adapter ROM", .start = 0xc8000, .end = 0,
175 .flags = IORESOURCE_ROM },
176 { .name = "Adapter ROM", .start = 0, .end = 0,
177 .flags = IORESOURCE_ROM },
178 { .name = "Adapter ROM", .start = 0, .end = 0,
179 .flags = IORESOURCE_ROM },
180 { .name = "Adapter ROM", .start = 0, .end = 0,
181 .flags = IORESOURCE_ROM },
182 { .name = "Adapter ROM", .start = 0, .end = 0,
183 .flags = IORESOURCE_ROM },
184 { .name = "Adapter ROM", .start = 0, .end = 0,
185 .flags = IORESOURCE_ROM }
186};
187
188#define ADAPTER_ROM_RESOURCES \
189 (sizeof adapter_rom_resources / sizeof adapter_rom_resources[0])
190
191static struct resource video_rom_resource = {
192 .name = "Video ROM",
193 .start = 0xc0000,
194 .end = 0xc7fff,
195 .flags = IORESOURCE_ROM,
196};
197
198static struct resource video_ram_resource = {
199 .name = "Video RAM area",
200 .start = 0xa0000,
201 .end = 0xbffff,
202 .flags = IORESOURCE_RAM,
203};
204
205#define romsignature(x) (*(unsigned short *)(x) == 0xaa55)
206
/*
 * Checksum a ROM image: add up 'length' bytes starting at 'rom' modulo 256.
 * Returns 1 when the sum is zero (which includes length == 0), else 0.
 */
static int __init romchecksum(unsigned char *rom, unsigned long length)
{
	unsigned char total = 0;
	unsigned long idx;

	for (idx = 0; idx < length; idx++)
		total += rom[idx];

	return total == 0;
}
215
216static void __init probe_roms(void)
217{
218 unsigned long start, length, upper;
219 unsigned char *rom;
220 int i;
221
222 /* video rom */
223 upper = adapter_rom_resources[0].start;
224 for (start = video_rom_resource.start; start < upper; start += 2048) {
225 rom = isa_bus_to_virt(start);
226 if (!romsignature(rom))
227 continue;
228
229 video_rom_resource.start = start;
230
231 /* 0 < length <= 0x7f * 512, historically */
232 length = rom[2] * 512;
233
234 /* if checksum okay, trust length byte */
235 if (length && romchecksum(rom, length))
236 video_rom_resource.end = start + length - 1;
237
238 request_resource(&iomem_resource, &video_rom_resource);
239 break;
240 }
241
242 start = (video_rom_resource.end + 1 + 2047) & ~2047UL;
243 if (start < upper)
244 start = upper;
245
246 /* system rom */
247 request_resource(&iomem_resource, &system_rom_resource);
248 upper = system_rom_resource.start;
249
250 /* check for extension rom (ignore length byte!) */
251 rom = isa_bus_to_virt(extension_rom_resource.start);
252 if (romsignature(rom)) {
253 length = extension_rom_resource.end - extension_rom_resource.start + 1;
254 if (romchecksum(rom, length)) {
255 request_resource(&iomem_resource, &extension_rom_resource);
256 upper = extension_rom_resource.start;
257 }
258 }
259
260 /* check for adapter roms on 2k boundaries */
261 for (i = 0; i < ADAPTER_ROM_RESOURCES && start < upper; start += 2048) {
262 rom = isa_bus_to_virt(start);
263 if (!romsignature(rom))
264 continue;
265
266 /* 0 < length <= 0x7f * 512, historically */
267 length = rom[2] * 512;
268
269 /* but accept any length that fits if checksum okay */
270 if (!length || start + length > upper || !romchecksum(rom, length))
271 continue;
272
273 adapter_rom_resources[i].start = start;
274 adapter_rom_resources[i].end = start + length - 1;
275 request_resource(&iomem_resource, &adapter_rom_resources[i]);
276
277 start = adapter_rom_resources[i++].end & ~2047UL;
278 }
279}
280
/*
 * Check for full argument with no trailing characters.
 *
 * p:   position in the command line to test (NUL-terminated string)
 * arg: option text to look for
 *
 * Returns non-zero when the text at p starts with arg and the match is
 * followed by the end of the string or by whitespace, 0 otherwise.
 */
static int fullarg(const char *p, const char *arg)
{
	size_t l = strlen(arg);

	/*
	 * strncmp() stops at p's terminating NUL, so a command line that is
	 * shorter than arg is never read past its end; memcmp() gives no
	 * such guarantee.
	 */
	if (strncmp(p, arg, l) != 0)
		return 0;

	/* the cast keeps a negative char value out of isspace() */
	return p[l] == '\0' || isspace((unsigned char)p[l]);
}
287
/*
 * Copy the boot command line (COMMAND_LINE) into command_line[] one
 * character at a time and act on the options that have to be known early.
 *
 * Options are only examined when the previously copied character was a
 * space; c starts out as ' ' so that the first word is examined as well.
 * At most COMMAND_LINE_SIZE - 1 characters are copied and the result is
 * NUL-terminated.  On return *cmdline_p points at command_line.
 *
 * NOTE: several "else if" branches below attach to a different "if"
 * depending on which CONFIG_ options are enabled; keep the statement
 * order intact when editing.
 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288static __init void parse_cmdline_early (char ** cmdline_p)
289{
290 char c = ' ', *to = command_line, *from = COMMAND_LINE;
291 int len = 0;
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800292 int userdef = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294 for (;;) {
/* only look for options at the start of a word */
295 if (c != ' ')
296 goto next_char;
297
298#ifdef CONFIG_SMP
299 /*
300 * If the BIOS enumerates physical processors before logical,
301 * maxcpus=N at enumeration-time can be used to disable HT.
302 */
303 else if (!memcmp(from, "maxcpus=", 8)) {
304 extern unsigned int maxcpus;
305
306 maxcpus = simple_strtoul(from + 8, NULL, 0);
307 }
308#endif
Len Brown888ba6c2005-08-24 12:07:20 -0400309#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700310 /* "acpi=off" disables both ACPI table parsing and interpreter init */
Andi Kleen681558f2006-03-25 16:29:46 +0100311 if (fullarg(from,"acpi=off"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700312 disable_acpi();
313
Andi Kleen681558f2006-03-25 16:29:46 +0100314 if (fullarg(from, "acpi=force")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700315 /* add later when we do DMI horrors: */
316 acpi_force = 1;
317 acpi_disabled = 0;
318 }
319
320 /* acpi=ht just means: do ACPI MADT parsing
321 at bootup, but don't enable the full ACPI interpreter */
Andi Kleen681558f2006-03-25 16:29:46 +0100322 if (fullarg(from, "acpi=ht")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700323 if (!acpi_force)
324 disable_acpi();
325 acpi_ht = 1;
326 }
Andi Kleen681558f2006-03-25 16:29:46 +0100327 else if (fullarg(from, "pci=noacpi"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700328 acpi_disable_pci();
Andi Kleen681558f2006-03-25 16:29:46 +0100329 else if (fullarg(from, "acpi=noirq"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700330 acpi_noirq_set();
331
Andi Kleen681558f2006-03-25 16:29:46 +0100332 else if (fullarg(from, "acpi_sci=edge"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700333 acpi_sci_flags.trigger = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100334 else if (fullarg(from, "acpi_sci=level"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335 acpi_sci_flags.trigger = 3;
Andi Kleen681558f2006-03-25 16:29:46 +0100336 else if (fullarg(from, "acpi_sci=high"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 acpi_sci_flags.polarity = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100338 else if (fullarg(from, "acpi_sci=low"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700339 acpi_sci_flags.polarity = 3;
340
341 /* acpi=strict disables out-of-spec workarounds */
Andi Kleen681558f2006-03-25 16:29:46 +0100342 else if (fullarg(from, "acpi=strict")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700343 acpi_strict = 1;
344 }
Andi Kleen22999242005-04-16 15:25:17 -0700345#ifdef CONFIG_X86_IO_APIC
Andi Kleen681558f2006-03-25 16:29:46 +0100346 else if (fullarg(from, "acpi_skip_timer_override"))
Andi Kleen22999242005-04-16 15:25:17 -0700347 acpi_skip_timer_override = 1;
348#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -0700349#endif
350
Andi Kleen681558f2006-03-25 16:29:46 +0100351 if (fullarg(from, "disable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200352 disable_timer_pin_1 = 1;
Andi Kleen681558f2006-03-25 16:29:46 +0100353 if (fullarg(from, "enable_timer_pin_1"))
Chuck Ebbert66759a02005-09-12 18:49:25 +0200354 disable_timer_pin_1 = -1;
355
Andi Kleen681558f2006-03-25 16:29:46 +0100356 if (fullarg(from, "nolapic") || fullarg(from, "disableapic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700357 disable_apic = 1;
358
Andi Kleen681558f2006-03-25 16:29:46 +0100359 if (fullarg(from, "noapic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700360 skip_ioapic_setup = 1;
361
Andi Kleen681558f2006-03-25 16:29:46 +0100362 if (fullarg(from,"apic")) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700363 skip_ioapic_setup = 0;
364 ioapic_force = 1;
365 }
366
/* parse_memopt() is handed &from and may advance it */
367 if (!memcmp(from, "mem=", 4))
368 parse_memopt(from+4, &from);
369
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800370 if (!memcmp(from, "memmap=", 7)) {
371 /* exactmap option is for user defined memory */
372 if (!memcmp(from+7, "exactmap", 8)) {
373#ifdef CONFIG_CRASH_DUMP
374 /* If we are doing a crash dump, we
375 * still need to know the real mem
376 * size before original memory map is
377 * reset.
378 */
379 saved_max_pfn = e820_end_of_ram();
380#endif
/* skip "memmap=" (7) plus "exactmap" (8), then empty the e820 map */
381 from += 8+7;
382 end_pfn_map = 0;
383 e820.nr_map = 0;
384 userdef = 1;
385 }
386 else {
387 parse_memmapopt(from+7, &from);
388 userdef = 1;
389 }
390 }
391
Matt Tolentino2b976902005-06-23 00:08:06 -0700392#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700393 if (!memcmp(from, "numa=", 5))
394 numa_setup(from+5);
395#endif
396
Linus Torvalds1da177e2005-04-16 15:20:36 -0700397 if (!memcmp(from,"iommu=",6)) {
398 iommu_setup(from+6);
399 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700400
Andi Kleen681558f2006-03-25 16:29:46 +0100401 if (fullarg(from,"oops=panic"))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700402 panic_on_oops = 1;
403
404 if (!memcmp(from, "noexec=", 7))
405 nonx_setup(from + 7);
406
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700407#ifdef CONFIG_KEXEC
408 /* crashkernel=size@addr specifies the location to reserve for
409 * a crash kernel. By reserving this memory we guarantee
410 * that linux never sets it up as a DMA target.
411 * Useful for holding code to do something appropriate
412 * after a kernel panic.
413 */
414 else if (!memcmp(from, "crashkernel=", 12)) {
415 unsigned long size, base;
416 size = memparse(from+12, &from);
417 if (*from == '@') {
418 base = memparse(from+1, &from);
419 /* FIXME: Do I want a sanity check
420 * to validate the memory range?
421 */
422 crashk_res.start = base;
423 crashk_res.end = base + size - 1;
424 }
425 }
426#endif
427
Vivek Goyalaac04b32006-01-09 20:51:47 -0800428#ifdef CONFIG_PROC_VMCORE
429 /* elfcorehdr= specifies the location of elf core header
430 * stored by the crashed kernel. This option will be passed
431 * by kexec loader to the capture kernel.
432 */
433 else if(!memcmp(from, "elfcorehdr=", 11))
434 elfcorehdr_addr = memparse(from+11, &from);
435#endif
Andi Kleene2c03882006-02-26 04:18:46 +0100436
Brian Magnusond5176122006-02-27 04:02:04 +0100437#ifdef CONFIG_HOTPLUG_CPU
Andi Kleene2c03882006-02-26 04:18:46 +0100438 else if (!memcmp(from, "additional_cpus=", 16))
439 setup_additional_cpus(from+16);
440#endif
441
/* copy one character; stop at the NUL or when command_line[] is full */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700442 next_char:
443 c = *(from++);
444 if (!c)
445 break;
446 if (COMMAND_LINE_SIZE <= ++len)
447 break;
448 *(to++) = c;
449 }
akpm@osdl.org69cda7b2006-01-09 20:51:46 -0800450 if (userdef) {
451 printk(KERN_INFO "user-defined physical RAM map:\n");
452 e820_print_map("user");
453 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 *to = '\0';
455 *cmdline_p = command_line;
456}
457
Matt Tolentino2b976902005-06-23 00:08:06 -0700458#ifndef CONFIG_NUMA
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700459static void __init
460contig_initmem_init(unsigned long start_pfn, unsigned long end_pfn)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700461{
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700462 unsigned long bootmap_size, bootmap;
463
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700464 bootmap_size = bootmem_bootmap_pages(end_pfn)<<PAGE_SHIFT;
465 bootmap = find_e820_area(0, end_pfn<<PAGE_SHIFT, bootmap_size);
466 if (bootmap == -1L)
467 panic("Cannot find bootmem map of size %ld\n",bootmap_size);
468 bootmap_size = init_bootmem(bootmap >> PAGE_SHIFT, end_pfn);
469 e820_bootmem_free(NODE_DATA(0), 0, end_pfn << PAGE_SHIFT);
470 reserve_bootmem(bootmap, bootmap_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700471}
472#endif
473
474/* Use inline assembly to define this because the nops are defined
475 as inline assembly strings in the include files and we cannot
476 get them easily into strings. */
477asm("\t.data\nk8nops: "
478 K8_NOP1 K8_NOP2 K8_NOP3 K8_NOP4 K8_NOP5 K8_NOP6
479 K8_NOP7 K8_NOP8);
480
481extern unsigned char k8nops[];
482static unsigned char *k8_nops[ASM_NOP_MAX+1] = {
483 NULL,
484 k8nops,
485 k8nops + 1,
486 k8nops + 1 + 2,
487 k8nops + 1 + 2 + 3,
488 k8nops + 1 + 2 + 3 + 4,
489 k8nops + 1 + 2 + 3 + 4 + 5,
490 k8nops + 1 + 2 + 3 + 4 + 5 + 6,
491 k8nops + 1 + 2 + 3 + 4 + 5 + 6 + 7,
492};
493
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100494extern char __vsyscall_0;
495
Linus Torvalds1da177e2005-04-16 15:20:36 -0700496/* Replace instructions with better alternatives for this CPU type.
497
498 This runs before SMP is initialized to avoid SMP problems with
499 self modifying code. This implies that assymetric systems where
500 APs have less capabilities than the boot processor are not handled.
501 In this case boot with "noreplacement". */
502void apply_alternatives(void *start, void *end)
503{
504 struct alt_instr *a;
505 int diff, i, k;
506 for (a = start; (void *)a < end; a++) {
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100507 u8 *instr;
508
Linus Torvalds1da177e2005-04-16 15:20:36 -0700509 if (!boot_cpu_has(a->cpuid))
510 continue;
511
512 BUG_ON(a->replacementlen > a->instrlen);
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100513 instr = a->instr;
514 /* vsyscall code is not mapped yet. resolve it manually. */
515 if (instr >= (u8 *)VSYSCALL_START && instr < (u8*)VSYSCALL_END)
516 instr = __va(instr - (u8*)VSYSCALL_START + (u8*)__pa_symbol(&__vsyscall_0));
517 __inline_memcpy(instr, a->replacement, a->replacementlen);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700518 diff = a->instrlen - a->replacementlen;
519
520 /* Pad the rest with nops */
521 for (i = a->replacementlen; diff > 0; diff -= k, i += k) {
522 k = diff;
523 if (k > ASM_NOP_MAX)
524 k = ASM_NOP_MAX;
Andi Kleen7f6c5b02006-01-11 22:45:21 +0100525 __inline_memcpy(instr + i, k8_nops[k], k);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700526 }
527 }
528}
529
530static int no_replacement __initdata = 0;
531
532void __init alternative_instructions(void)
533{
534 extern struct alt_instr __alt_instructions[], __alt_instructions_end[];
535 if (no_replacement)
536 return;
537 apply_alternatives(__alt_instructions, __alt_instructions_end);
538}
539
540static int __init noreplacement_setup(char *s)
541{
542 no_replacement = 1;
OGAWA Hirofumi9b410462006-03-31 02:30:33 -0800543 return 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544}
545
546__setup("noreplacement", noreplacement_setup);
547
#if defined(CONFIG_EDD) || defined(CONFIG_EDD_MODULE)
struct edd edd;
#ifdef CONFIG_EDD_MODULE
EXPORT_SYMBOL(edd);
#endif
/**
 * copy_edd() - Copy the BIOS EDD information
 *              from boot_params into a safe place.
 *
 * Fills the global edd structure: the two entry counts plus the MBR
 * signature and EDD info arrays.
 */
static inline void copy_edd(void)
{
	edd.mbr_signature_nr = EDD_MBR_SIG_NR;
	edd.edd_info_nr = EDD_NR;

	memcpy(edd.mbr_signature, EDD_MBR_SIGNATURE, sizeof(edd.mbr_signature));
	memcpy(edd.edd_info, EDD_BUF, sizeof(edd.edd_info));
}
#else
/* EDD support is not configured: nothing to copy. */
static inline void copy_edd(void)
{
}
#endif
570
571#define EBDA_ADDR_POINTER 0x40E
572static void __init reserve_ebda_region(void)
573{
574 unsigned int addr;
575 /**
576 * there is a real-mode segmented pointer pointing to the
577 * 4K EBDA area at 0x40E
578 */
579 addr = *(unsigned short *)phys_to_virt(EBDA_ADDR_POINTER);
580 addr <<= 4;
581 if (addr)
582 reserve_bootmem_generic(addr, PAGE_SIZE);
583}
584
/*
 * Architecture-specific boot-time setup.
 *
 * In order: copies the boot parameters into kernel variables, builds the
 * memory map, parses the early command line options, maps memory, sets up
 * the boot memory allocator and reserves the regions that must not be
 * handed out (page tables, kernel image, page 0, EBDA, SMP trampoline,
 * initrd, crash kernel), initialises paging, reads the ACPI / MP tables
 * and finally registers the standard memory and I/O port resources.
 *
 * cmdline_p: set to point at the kernel's copy of the command line
 *            (done by parse_cmdline_early()).
 *
 * The order of the calls matters; keep it intact when editing.
 */
585void __init setup_arch(char **cmdline_p)
586{
Linus Torvalds1da177e2005-04-16 15:20:36 -0700587 unsigned long kernel_end;
588
/* copy values handed over in the boot parameters into kernel variables */
589 ROOT_DEV = old_decode_dev(ORIG_ROOT_DEV);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700590 screen_info = SCREEN_INFO;
591 edid_info = EDID_INFO;
592 saved_video_mode = SAVED_VIDEO_MODE;
593 bootloader_type = LOADER_TYPE;
594
595#ifdef CONFIG_BLK_DEV_RAM
596 rd_image_start = RAMDISK_FLAGS & RAMDISK_IMAGE_START_MASK;
597 rd_prompt = ((RAMDISK_FLAGS & RAMDISK_PROMPT_FLAG) != 0);
598 rd_doload = ((RAMDISK_FLAGS & RAMDISK_LOAD_FLAG) != 0);
599#endif
600 setup_memory_region();
601 copy_edd();
602
603 if (!MOUNT_ROOT_RDONLY)
604 root_mountflags &= ~MS_RDONLY;
605 init_mm.start_code = (unsigned long) &_text;
606 init_mm.end_code = (unsigned long) &_etext;
607 init_mm.end_data = (unsigned long) &_edata;
608 init_mm.brk = (unsigned long) &_end;
609
/* "Kernel code" covers _text.._etext, "Kernel data" covers _etext.._edata */
610 code_resource.start = virt_to_phys(&_text);
611 code_resource.end = virt_to_phys(&_etext)-1;
612 data_resource.start = virt_to_phys(&_etext);
613 data_resource.end = virt_to_phys(&_edata)-1;
614
615 parse_cmdline_early(cmdline_p);
616
617 early_identify_cpu(&boot_cpu_data);
618
619 /*
620 * partially used pages are not usable - thus
621 * we are rounding upwards:
622 */
623 end_pfn = e820_end_of_ram();
Andi Kleen1f502492006-03-25 16:29:58 +0100624 num_physpages = end_pfn; /* for pfn_valid */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700625
626 check_efer();
627
628 init_memory_mapping(0, (end_pfn_map << PAGE_SHIFT));
629
Andi Kleenf2d3efe2006-03-25 16:30:22 +0100630 dmi_scan_machine();
631
Siddha, Suresh Bf6c2e332005-11-05 17:25:53 +0100632 zap_low_mappings(0);
633
Len Brown888ba6c2005-08-24 12:07:20 -0400634#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700635 /*
636 * Initialize the ACPI boot-time table parser (gets the RSDP and SDT).
637 * Call this early for SRAT node setup.
638 */
639 acpi_boot_table_init();
640#endif
641
642#ifdef CONFIG_ACPI_NUMA
643 /*
644 * Parse SRAT to discover nodes.
645 */
646 acpi_numa_init();
647#endif
648
Matt Tolentino2b976902005-06-23 00:08:06 -0700649#ifdef CONFIG_NUMA
Linus Torvalds1da177e2005-04-16 15:20:36 -0700650 numa_initmem_init(0, end_pfn);
651#else
Matt Tolentinobbfceef2005-06-23 00:08:07 -0700652 contig_initmem_init(0, end_pfn);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700653#endif
654
655 /* Reserve direct mapping */
656 reserve_bootmem_generic(table_start << PAGE_SHIFT,
657 (table_end - table_start) << PAGE_SHIFT);
658
659 /* reserve kernel */
660 kernel_end = round_up(__pa_symbol(&_end),PAGE_SIZE);
661 reserve_bootmem_generic(HIGH_MEMORY, kernel_end - HIGH_MEMORY);
662
663 /*
664 * reserve physical page 0 - it's a special BIOS page on many boxes,
665 * enabling clean reboots, SMP operation, laptop functions.
666 */
667 reserve_bootmem_generic(0, PAGE_SIZE);
668
669 /* reserve ebda region */
670 reserve_ebda_region();
671
672#ifdef CONFIG_SMP
673 /*
674 * But first pinch a few for the stack/trampoline stuff
675 * FIXME: Don't need the extra page at 4K, but need to fix
676 * trampoline before removing it. (see the GDT stuff)
677 */
678 reserve_bootmem_generic(PAGE_SIZE, PAGE_SIZE);
679
680 /* Reserve SMP trampoline */
681 reserve_bootmem_generic(SMP_TRAMPOLINE_BASE, PAGE_SIZE);
682#endif
683
684#ifdef CONFIG_ACPI_SLEEP
685 /*
686 * Reserve low memory region for sleep support.
687 */
688 acpi_reserve_bootmem();
689#endif
690#ifdef CONFIG_X86_LOCAL_APIC
691 /*
692 * Find and reserve possible boot-time SMP configuration:
693 */
694 find_smp_config();
695#endif
696#ifdef CONFIG_BLK_DEV_INITRD
/* keep the initrd only if it lies completely below the end of RAM */
697 if (LOADER_TYPE && INITRD_START) {
698 if (INITRD_START + INITRD_SIZE <= (end_pfn << PAGE_SHIFT)) {
699 reserve_bootmem_generic(INITRD_START, INITRD_SIZE);
700 initrd_start =
701 INITRD_START ? INITRD_START + PAGE_OFFSET : 0;
702 initrd_end = initrd_start+INITRD_SIZE;
703 }
704 else {
705 printk(KERN_ERR "initrd extends beyond end of memory "
706 "(0x%08lx > 0x%08lx)\ndisabling initrd\n",
707 (unsigned long)(INITRD_START + INITRD_SIZE),
708 (unsigned long)(end_pfn << PAGE_SHIFT));
709 initrd_start = 0;
710 }
711 }
712#endif
Eric W. Biederman5f5609d2005-06-25 14:58:04 -0700713#ifdef CONFIG_KEXEC
/* crashk_res is filled in from "crashkernel=" by parse_cmdline_early() */
714 if (crashk_res.start != crashk_res.end) {
715 reserve_bootmem(crashk_res.start,
716 crashk_res.end - crashk_res.start + 1);
717 }
718#endif
Eric W. Biederman0d317fb2005-08-06 13:47:36 -0600719
Linus Torvalds1da177e2005-04-16 15:20:36 -0700720 paging_init();
721
722 check_ioapic();
723
Ashok Raj51f62e12006-03-25 16:29:28 +0100724 /*
725 * set this early, so we dont allocate cpu0
726 * if MADT list doesnt list BSP first
727 * mpparse.c/MP_processor_info() allocates logical cpu numbers.
728 */
729 cpu_set(0, cpu_present_map);
Len Brown888ba6c2005-08-24 12:07:20 -0400730#ifdef CONFIG_ACPI
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731 /*
732 * Read APIC and some other early information from ACPI tables.
733 */
734 acpi_boot_init();
735#endif
736
Ravikiran Thirumalai05b3cbd2006-01-11 22:45:36 +0100737 init_cpu_to_node();
738
Linus Torvalds1da177e2005-04-16 15:20:36 -0700739#ifdef CONFIG_X86_LOCAL_APIC
740 /*
741 * get boot-time SMP configuration:
742 */
743 if (smp_found_config)
744 get_smp_config();
745 init_apic_mappings();
746#endif
747
748 /*
749 * Request address space for all standard RAM and ROM resources
750 * and also for regions reported as reserved by the e820.
751 */
752 probe_roms();
753 e820_reserve_resources();
754
755 request_resource(&iomem_resource, &video_ram_resource);
756
757 {
758 unsigned i;
759 /* request I/O space for devices used on all i[345]86 PCs */
760 for (i = 0; i < STANDARD_IO_RESOURCES; i++)
761 request_resource(&ioport_resource, &standard_io_resources[i]);
762 }
763
Andi Kleena1e97782005-04-16 15:25:12 -0700764 e820_setup_gap();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700765
766#ifdef CONFIG_GART_IOMMU
Jon Mason5b7b6442006-02-03 21:51:59 +0100767 iommu_hole_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700768#endif
769
770#ifdef CONFIG_VT
/* choose the console driver: VGA if configured, else the dummy console */
771#if defined(CONFIG_VGA_CONSOLE)
772 conswitchp = &vga_con;
773#elif defined(CONFIG_DUMMY_CONSOLE)
774 conswitchp = &dummy_con;
775#endif
776#endif
777}
778
Ashok Raje6982c62005-06-25 14:54:58 -0700779static int __cpuinit get_model_name(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700780{
781 unsigned int *v;
782
Andi Kleenebfcaa92005-04-16 15:25:18 -0700783 if (c->extended_cpuid_level < 0x80000004)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700784 return 0;
785
786 v = (unsigned int *) c->x86_model_id;
787 cpuid(0x80000002, &v[0], &v[1], &v[2], &v[3]);
788 cpuid(0x80000003, &v[4], &v[5], &v[6], &v[7]);
789 cpuid(0x80000004, &v[8], &v[9], &v[10], &v[11]);
790 c->x86_model_id[48] = 0;
791 return 1;
792}
793
794
Ashok Raje6982c62005-06-25 14:54:58 -0700795static void __cpuinit display_cacheinfo(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796{
797 unsigned int n, dummy, eax, ebx, ecx, edx;
798
Andi Kleenebfcaa92005-04-16 15:25:18 -0700799 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800
801 if (n >= 0x80000005) {
802 cpuid(0x80000005, &dummy, &ebx, &ecx, &edx);
803 printk(KERN_INFO "CPU: L1 I Cache: %dK (%d bytes/line), D cache %dK (%d bytes/line)\n",
804 edx>>24, edx&0xFF, ecx>>24, ecx&0xFF);
805 c->x86_cache_size=(ecx>>24)+(edx>>24);
806 /* On K8 L1 TLB is inclusive, so don't count it */
807 c->x86_tlbsize = 0;
808 }
809
810 if (n >= 0x80000006) {
811 cpuid(0x80000006, &dummy, &ebx, &ecx, &edx);
812 ecx = cpuid_ecx(0x80000006);
813 c->x86_cache_size = ecx >> 16;
814 c->x86_tlbsize += ((ebx >> 16) & 0xfff) + (ebx & 0xfff);
815
816 printk(KERN_INFO "CPU: L2 Cache: %dK (%d bytes/line)\n",
817 c->x86_cache_size, ecx & 0xFF);
818 }
819
820 if (n >= 0x80000007)
821 cpuid(0x80000007, &dummy, &dummy, &dummy, &c->x86_power);
822 if (n >= 0x80000008) {
823 cpuid(0x80000008, &eax, &dummy, &dummy, &dummy);
824 c->x86_virt_bits = (eax >> 8) & 0xff;
825 c->x86_phys_bits = eax & 0xff;
826 }
827}
828
#ifdef CONFIG_NUMA
/*
 * Find an online node for a CPU whose own node cannot be used.
 *
 * apicid_to_node[] is searched downwards from apicid - 1 to 0 first and
 * then upwards from apicid + 1 to MAX_LOCAL_APIC - 1; the first entry
 * that names an online node wins.  Falls back to the first online node.
 */
static int nearby_node(int apicid)
{
	int id, node;

	id = apicid;
	while (--id >= 0) {
		node = apicid_to_node[id];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
	}

	for (id = apicid + 1; id < MAX_LOCAL_APIC; id++) {
		node = apicid_to_node[id];
		if (node != NUMA_NO_NODE && node_online(node))
			return node;
	}

	return first_node(node_online_map); /* Shouldn't happen */
}
#endif
846
Andi Kleen63518642005-04-16 15:25:16 -0700847/*
848 * On a AMD dual core setup the lower bits of the APIC id distingush the cores.
849 * Assumes number of cores is a power of two.
850 */
851static void __init amd_detect_cmp(struct cpuinfo_x86 *c)
852{
853#ifdef CONFIG_SMP
Andi Kleen29422832005-05-16 21:53:26 -0700854 int cpu = smp_processor_id();
Andi Kleenb41e2932005-05-20 14:27:55 -0700855 unsigned bits;
Andi Kleen3f098c22005-09-12 18:49:24 +0200856#ifdef CONFIG_NUMA
857 int node = 0;
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100858 unsigned apicid = hard_smp_processor_id();
Andi Kleen3f098c22005-09-12 18:49:24 +0200859#endif
Andi Kleenb41e2932005-05-20 14:27:55 -0700860
861 bits = 0;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100862 while ((1 << bits) < c->x86_max_cores)
Andi Kleenb41e2932005-05-20 14:27:55 -0700863 bits++;
864
865 /* Low order bits define the core id (index of core in socket) */
866 cpu_core_id[cpu] = phys_proc_id[cpu] & ((1 << bits)-1);
867 /* Convert the APIC ID into the socket ID */
Ravikiran G Thirumalai60c1bc82006-03-25 16:30:04 +0100868 phys_proc_id[cpu] = phys_pkg_id(bits);
Andi Kleen63518642005-04-16 15:25:16 -0700869
870#ifdef CONFIG_NUMA
Andi Kleen3f098c22005-09-12 18:49:24 +0200871 node = phys_proc_id[cpu];
872 if (apicid_to_node[apicid] != NUMA_NO_NODE)
873 node = apicid_to_node[apicid];
874 if (!node_online(node)) {
875 /* Two possibilities here:
876 - The CPU is missing memory and no node was created.
877 In that case try picking one from a nearby CPU
878 - The APIC IDs differ from the HyperTransport node IDs
879 which the K8 northbridge parsing fills in.
880 Assume they are all increased by a constant offset,
881 but in the same order as the HT nodeids.
882 If that doesn't result in a usable node fall back to the
883 path for the previous case. */
884 int ht_nodeid = apicid - (phys_proc_id[0] << bits);
885 if (ht_nodeid >= 0 &&
886 apicid_to_node[ht_nodeid] != NUMA_NO_NODE)
887 node = apicid_to_node[ht_nodeid];
888 /* Pick a nearby node */
889 if (!node_online(node))
890 node = nearby_node(apicid);
891 }
Andi Kleen69d81fc2005-11-05 17:25:53 +0100892 numa_set_node(cpu, node);
Andi Kleena1586082005-05-16 21:53:21 -0700893
Andi Kleen77d910f2006-03-25 16:29:34 +0100894 printk(KERN_INFO "CPU %d/%x(%d) -> Node %d -> Core %d\n",
895 cpu, apicid, c->x86_max_cores, node, cpu_core_id[cpu]);
Andi Kleen3f098c22005-09-12 18:49:24 +0200896#endif
Andi Kleen63518642005-04-16 15:25:16 -0700897#endif
898}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700899
900static int __init init_amd(struct cpuinfo_x86 *c)
901{
902 int r;
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100903 unsigned level;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700904
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700905#ifdef CONFIG_SMP
906 unsigned long value;
907
Andi Kleen7d318d72005-09-29 22:05:55 +0200908 /*
909 * Disable TLB flush filter by setting HWCR.FFDIS on K8
910 * bit 6 of msr C001_0015
911 *
912 * Errata 63 for SH-B3 steppings
913 * Errata 122 for all steppings (F+ have it disabled by default)
914 */
915 if (c->x86 == 15) {
916 rdmsrl(MSR_K8_HWCR, value);
917 value |= 1 << 6;
918 wrmsrl(MSR_K8_HWCR, value);
919 }
Linus Torvaldsbc5e8fd2005-09-17 15:41:04 -0700920#endif
921
Linus Torvalds1da177e2005-04-16 15:20:36 -0700922 /* Bit 31 in normal CPUID used for nonstandard 3DNow ID;
923 3DNow is IDd by bit 31 in extended CPUID (1*32+31) anyway */
924 clear_bit(0*32+31, &c->x86_capability);
925
Andi Kleen7bcd3f32006-02-03 21:51:02 +0100926 /* On C+ stepping K8 rep microcode works well for copy/memset */
927 level = cpuid_eax(1);
928 if (c->x86 == 15 && ((level >= 0x0f48 && level < 0x0f50) || level >= 0x0f58))
929 set_bit(X86_FEATURE_REP_GOOD, &c->x86_capability);
930
Linus Torvalds1da177e2005-04-16 15:20:36 -0700931 r = get_model_name(c);
932 if (!r) {
933 switch (c->x86) {
934 case 15:
935 /* Should distinguish Models here, but this is only
936 a fallback anyways. */
937 strcpy(c->x86_model_id, "Hammer");
938 break;
939 }
940 }
941 display_cacheinfo(c);
942
Andi Kleen130951c2006-01-11 22:42:02 +0100943 /* c->x86_power is 8000_0007 edx. Bit 8 is constant TSC */
944 if (c->x86_power & (1<<8))
945 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
946
Andi Kleenebfcaa92005-04-16 15:25:18 -0700947 if (c->extended_cpuid_level >= 0x80000008) {
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100948 c->x86_max_cores = (cpuid_ecx(0x80000008) & 0xff) + 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700949
Andi Kleen63518642005-04-16 15:25:16 -0700950 amd_detect_cmp(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700951 }
952
953 return r;
954}
955
Ashok Raje6982c62005-06-25 14:54:58 -0700956static void __cpuinit detect_ht(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700957{
958#ifdef CONFIG_SMP
959 u32 eax, ebx, ecx, edx;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100960 int index_msb, core_bits;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700961 int cpu = smp_processor_id();
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100962
963 cpuid(1, &eax, &ebx, &ecx, &edx);
964
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100965
Andi Kleen63518642005-04-16 15:25:16 -0700966 if (!cpu_has(c, X86_FEATURE_HT) || cpu_has(c, X86_FEATURE_CMP_LEGACY))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700967 return;
968
Linus Torvalds1da177e2005-04-16 15:20:36 -0700969 smp_num_siblings = (ebx & 0xff0000) >> 16;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100970
Linus Torvalds1da177e2005-04-16 15:20:36 -0700971 if (smp_num_siblings == 1) {
972 printk(KERN_INFO "CPU: Hyper-Threading is disabled\n");
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100973 } else if (smp_num_siblings > 1 ) {
974
Linus Torvalds1da177e2005-04-16 15:20:36 -0700975 if (smp_num_siblings > NR_CPUS) {
976 printk(KERN_WARNING "CPU: Unsupported number of the siblings %d", smp_num_siblings);
977 smp_num_siblings = 1;
978 return;
979 }
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100980
981 index_msb = get_count_order(smp_num_siblings);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700982 phys_proc_id[cpu] = phys_pkg_id(index_msb);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100983
Linus Torvalds1da177e2005-04-16 15:20:36 -0700984 printk(KERN_INFO "CPU: Physical Processor ID: %d\n",
985 phys_proc_id[cpu]);
Andi Kleen3dd9d512005-04-16 15:25:15 -0700986
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100987 smp_num_siblings = smp_num_siblings / c->x86_max_cores;
Andi Kleen3dd9d512005-04-16 15:25:15 -0700988
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100989 index_msb = get_count_order(smp_num_siblings) ;
Andi Kleen3dd9d512005-04-16 15:25:15 -0700990
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100991 core_bits = get_count_order(c->x86_max_cores);
Andi Kleen3dd9d512005-04-16 15:25:15 -0700992
Siddha, Suresh B94605ef2005-11-05 17:25:54 +0100993 cpu_core_id[cpu] = phys_pkg_id(index_msb) &
994 ((1 << core_bits) - 1);
995
996 if (c->x86_max_cores > 1)
Andi Kleen3dd9d512005-04-16 15:25:15 -0700997 printk(KERN_INFO "CPU: Processor Core ID: %d\n",
998 cpu_core_id[cpu]);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700999 }
1000#endif
1001}
1002
Andi Kleen3dd9d512005-04-16 15:25:15 -07001003/*
1004 * find out the number of processor cores on the die
1005 */
Ashok Raje6982c62005-06-25 14:54:58 -07001006static int __cpuinit intel_num_cpu_cores(struct cpuinfo_x86 *c)
Andi Kleen3dd9d512005-04-16 15:25:15 -07001007{
1008 unsigned int eax;
1009
1010 if (c->cpuid_level < 4)
1011 return 1;
1012
1013 __asm__("cpuid"
1014 : "=a" (eax)
1015 : "0" (4), "c" (0)
1016 : "bx", "dx");
1017
1018 if (eax & 0x1f)
1019 return ((eax >> 26) + 1);
1020 else
1021 return 1;
1022}
1023
/*
 * Bind the current CPU to a NUMA node (CONFIG_NUMA builds only).
 *
 * The node is looked up in apicid_to_node[] by the hardware APIC id;
 * when no node is recorded there, node 0 is used.
 */
static void srat_detect_node(void)
{
#ifdef CONFIG_NUMA
	int this_cpu = smp_processor_id();
	unsigned nid;

	/* Don't do the funky fallback heuristics the AMD version employs
	   for now. */
	nid = apicid_to_node[hard_smp_processor_id()];
	if (nid == NUMA_NO_NODE)
		nid = 0;

	numa_set_node(this_cpu, nid);

	/* Only report the mapping when acpi_numa is positive */
	if (acpi_numa > 0)
		printk(KERN_INFO "CPU %d -> Node %d\n", this_cpu, nid);
#endif
}
1041
Ashok Raje6982c62005-06-25 14:54:58 -07001042static void __cpuinit init_intel(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001043{
1044 /* Cache sizes */
1045 unsigned n;
1046
1047 init_intel_cacheinfo(c);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001048 n = c->extended_cpuid_level;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001049 if (n >= 0x80000008) {
1050 unsigned eax = cpuid_eax(0x80000008);
1051 c->x86_virt_bits = (eax >> 8) & 0xff;
1052 c->x86_phys_bits = eax & 0xff;
Shaohua Liaf9c1422005-11-05 17:25:54 +01001053 /* CPUID workaround for Intel 0F34 CPU */
1054 if (c->x86_vendor == X86_VENDOR_INTEL &&
1055 c->x86 == 0xF && c->x86_model == 0x3 &&
1056 c->x86_mask == 0x4)
1057 c->x86_phys_bits = 36;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001058 }
1059
1060 if (c->x86 == 15)
1061 c->x86_cache_alignment = c->x86_clflush_size * 2;
Andi Kleen39b3a792006-01-11 22:42:45 +01001062 if ((c->x86 == 0xf && c->x86_model >= 0x03) ||
1063 (c->x86 == 0x6 && c->x86_model >= 0x0e))
Andi Kleenc29601e2005-04-16 15:25:05 -07001064 set_bit(X86_FEATURE_CONSTANT_TSC, &c->x86_capability);
Andi Kleenc818a182006-01-11 22:45:24 +01001065 set_bit(X86_FEATURE_SYNC_RDTSC, &c->x86_capability);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001066 c->x86_max_cores = intel_num_cpu_cores(c);
Andi Kleendf0cc262005-09-12 18:49:24 +02001067
1068 srat_detect_node();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069}
1070
Adrian Bunk672289e2005-09-10 00:27:21 -07001071static void __cpuinit get_cpu_vendor(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001072{
1073 char *v = c->x86_vendor_id;
1074
1075 if (!strcmp(v, "AuthenticAMD"))
1076 c->x86_vendor = X86_VENDOR_AMD;
1077 else if (!strcmp(v, "GenuineIntel"))
1078 c->x86_vendor = X86_VENDOR_INTEL;
1079 else
1080 c->x86_vendor = X86_VENDOR_UNKNOWN;
1081}
1082
/*
 * Table entry holding up to 16 model names for one vendor/family pair.
 * NOTE(review): no user of this structure is visible in this part of the
 * file; the field meanings below are inferred from their names - confirm.
 */
struct cpu_model_info {
	int vendor;		/* presumably an X86_VENDOR_* value */
	int family;		/* presumably the CPU family (c->x86) */
	char *model_names[16];	/* presumably indexed by model number */
};
1088
1089/* Do some early cpuid on the boot CPU to get some parameter that are
1090 needed before check_bugs. Everything advanced is in identify_cpu
1091 below. */
Ashok Raje6982c62005-06-25 14:54:58 -07001092void __cpuinit early_identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001093{
1094 u32 tfms;
1095
1096 c->loops_per_jiffy = loops_per_jiffy;
1097 c->x86_cache_size = -1;
1098 c->x86_vendor = X86_VENDOR_UNKNOWN;
1099 c->x86_model = c->x86_mask = 0; /* So far unknown... */
1100 c->x86_vendor_id[0] = '\0'; /* Unset */
1101 c->x86_model_id[0] = '\0'; /* Unset */
1102 c->x86_clflush_size = 64;
1103 c->x86_cache_alignment = c->x86_clflush_size;
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001104 c->x86_max_cores = 1;
Andi Kleenebfcaa92005-04-16 15:25:18 -07001105 c->extended_cpuid_level = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001106 memset(&c->x86_capability, 0, sizeof c->x86_capability);
1107
1108 /* Get vendor name */
1109 cpuid(0x00000000, (unsigned int *)&c->cpuid_level,
1110 (unsigned int *)&c->x86_vendor_id[0],
1111 (unsigned int *)&c->x86_vendor_id[8],
1112 (unsigned int *)&c->x86_vendor_id[4]);
1113
1114 get_cpu_vendor(c);
1115
1116 /* Initialize the standard set of capabilities */
1117 /* Note that the vendor-specific code below might override */
1118
1119 /* Intel-defined flags: level 0x00000001 */
1120 if (c->cpuid_level >= 0x00000001) {
1121 __u32 misc;
1122 cpuid(0x00000001, &tfms, &misc, &c->x86_capability[4],
1123 &c->x86_capability[0]);
1124 c->x86 = (tfms >> 8) & 0xf;
1125 c->x86_model = (tfms >> 4) & 0xf;
1126 c->x86_mask = tfms & 0xf;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001127 if (c->x86 == 0xf)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001128 c->x86 += (tfms >> 20) & 0xff;
Suresh Siddhaf5f786d2005-11-05 17:25:53 +01001129 if (c->x86 >= 0x6)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001130 c->x86_model += ((tfms >> 16) & 0xF) << 4;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001131 if (c->x86_capability[0] & (1<<19))
1132 c->x86_clflush_size = ((misc >> 8) & 0xff) * 8;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001133 } else {
1134 /* Have CPUID level 0 only - unheard of */
1135 c->x86 = 4;
1136 }
Andi Kleena1586082005-05-16 21:53:21 -07001137
1138#ifdef CONFIG_SMP
Andi Kleenb41e2932005-05-20 14:27:55 -07001139 phys_proc_id[smp_processor_id()] = (cpuid_ebx(1) >> 24) & 0xff;
Andi Kleena1586082005-05-16 21:53:21 -07001140#endif
Linus Torvalds1da177e2005-04-16 15:20:36 -07001141}
1142
1143/*
1144 * This does the hard work of actually picking apart the CPU stuff...
1145 */
Ashok Raje6982c62005-06-25 14:54:58 -07001146void __cpuinit identify_cpu(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001147{
1148 int i;
1149 u32 xlvl;
1150
1151 early_identify_cpu(c);
1152
1153 /* AMD-defined flags: level 0x80000001 */
1154 xlvl = cpuid_eax(0x80000000);
Andi Kleenebfcaa92005-04-16 15:25:18 -07001155 c->extended_cpuid_level = xlvl;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001156 if ((xlvl & 0xffff0000) == 0x80000000) {
1157 if (xlvl >= 0x80000001) {
1158 c->x86_capability[1] = cpuid_edx(0x80000001);
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001159 c->x86_capability[6] = cpuid_ecx(0x80000001);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160 }
1161 if (xlvl >= 0x80000004)
1162 get_model_name(c); /* Default name */
1163 }
1164
1165 /* Transmeta-defined flags: level 0x80860001 */
1166 xlvl = cpuid_eax(0x80860000);
1167 if ((xlvl & 0xffff0000) == 0x80860000) {
1168 /* Don't set x86_cpuid_level here for now to not confuse. */
1169 if (xlvl >= 0x80860001)
1170 c->x86_capability[2] = cpuid_edx(0x80860001);
1171 }
1172
Siddha, Suresh B1e9f28f2006-03-27 01:15:22 -08001173 c->apicid = phys_pkg_id(0);
1174
Linus Torvalds1da177e2005-04-16 15:20:36 -07001175 /*
1176 * Vendor-specific initialization. In this section we
1177 * canonicalize the feature flags, meaning if there are
1178 * features a certain CPU supports which CPUID doesn't
1179 * tell us, CPUID claiming incorrect flags, or other bugs,
1180 * we handle them here.
1181 *
1182 * At the end of this section, c->x86_capability better
1183 * indicate the features this CPU genuinely supports!
1184 */
1185 switch (c->x86_vendor) {
1186 case X86_VENDOR_AMD:
1187 init_amd(c);
1188 break;
1189
1190 case X86_VENDOR_INTEL:
1191 init_intel(c);
1192 break;
1193
1194 case X86_VENDOR_UNKNOWN:
1195 default:
1196 display_cacheinfo(c);
1197 break;
1198 }
1199
1200 select_idle_routine(c);
1201 detect_ht(c);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001202
1203 /*
1204 * On SMP, boot_cpu_data holds the common feature set between
1205 * all CPUs; so make sure that we indicate which features are
1206 * common between the CPUs. The first time this routine gets
1207 * executed, c == &boot_cpu_data.
1208 */
1209 if (c != &boot_cpu_data) {
1210 /* AND the already accumulated flags with these */
1211 for (i = 0 ; i < NCAPINTS ; i++)
1212 boot_cpu_data.x86_capability[i] &= c->x86_capability[i];
1213 }
1214
1215#ifdef CONFIG_X86_MCE
1216 mcheck_init(c);
1217#endif
Shaohua Li3b520b22005-07-07 17:56:38 -07001218 if (c == &boot_cpu_data)
1219 mtrr_bp_init();
1220 else
1221 mtrr_ap_init();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001222#ifdef CONFIG_NUMA
Andi Kleen3019e8e2005-07-28 21:15:28 -07001223 numa_add_cpu(smp_processor_id());
Linus Torvalds1da177e2005-04-16 15:20:36 -07001224#endif
1225}
1226
1227
Ashok Raje6982c62005-06-25 14:54:58 -07001228void __cpuinit print_cpu_info(struct cpuinfo_x86 *c)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001229{
1230 if (c->x86_model_id[0])
1231 printk("%s", c->x86_model_id);
1232
1233 if (c->x86_mask || c->cpuid_level >= 0)
1234 printk(" stepping %02x\n", c->x86_mask);
1235 else
1236 printk("\n");
1237}
1238
1239/*
1240 * Get CPU information for use by the procfs.
1241 */
1242
1243static int show_cpuinfo(struct seq_file *m, void *v)
1244{
1245 struct cpuinfo_x86 *c = v;
1246
1247 /*
1248 * These flag bits must match the definitions in <asm/cpufeature.h>.
1249 * NULL means this bit is undefined or reserved; either way it doesn't
1250 * have meaning as far as Linux is concerned. Note that it's important
1251 * to realize there is a difference between this table and CPUID -- if
1252 * applications want to get the raw CPUID data, they should access
1253 * /dev/cpu/<cpu_nr>/cpuid instead.
1254 */
1255 static char *x86_cap_flags[] = {
1256 /* Intel-defined */
1257 "fpu", "vme", "de", "pse", "tsc", "msr", "pae", "mce",
1258 "cx8", "apic", NULL, "sep", "mtrr", "pge", "mca", "cmov",
1259 "pat", "pse36", "pn", "clflush", NULL, "dts", "acpi", "mmx",
1260 "fxsr", "sse", "sse2", "ss", "ht", "tm", "ia64", NULL,
1261
1262 /* AMD-defined */
Zwane Mwaikambo3c3b73b2005-05-01 08:58:51 -07001263 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001264 NULL, NULL, NULL, "syscall", NULL, NULL, NULL, NULL,
1265 NULL, NULL, NULL, NULL, "nx", NULL, "mmxext", NULL,
Andi Kleen3f98bc42006-01-11 22:42:51 +01001266 NULL, "fxsr_opt", "rdtscp", NULL, NULL, "lm", "3dnowext", "3dnow",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001267
1268 /* Transmeta-defined */
1269 "recovery", "longrun", NULL, "lrti", NULL, NULL, NULL, NULL,
1270 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1271 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1272 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1273
1274 /* Other (Linux-defined) */
Andi Kleen622dcaf2005-05-16 21:53:26 -07001275 "cxmmx", NULL, "cyrix_arr", "centaur_mcr", NULL,
Andi Kleenc29601e2005-04-16 15:25:05 -07001276 "constant_tsc", NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001277 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1278 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1279 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1280
1281 /* Intel-defined (#2) */
Andi Kleen9d95dd82006-03-25 16:31:22 +01001282 "pni", NULL, NULL, "monitor", "ds_cpl", "vmx", "smx", "est",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001283 "tm2", NULL, "cid", NULL, NULL, "cx16", "xtpr", NULL,
1284 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1285 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1286
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001287 /* VIA/Cyrix/Centaur-defined */
1288 NULL, NULL, "rng", "rng_en", NULL, NULL, "ace", "ace_en",
1289 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1290 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1291 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1292
Linus Torvalds1da177e2005-04-16 15:20:36 -07001293 /* AMD-defined (#2) */
Andi Kleen3f98bc42006-01-11 22:42:51 +01001294 "lahf_lm", "cmp_legacy", "svm", NULL, "cr8_legacy", NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001295 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
1296 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
H. Peter Anvin5b7abc62005-05-01 08:58:49 -07001297 NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001298 };
1299 static char *x86_power_flags[] = {
1300 "ts", /* temperature sensor */
1301 "fid", /* frequency id control */
1302 "vid", /* voltage id control */
1303 "ttp", /* thermal trip */
1304 "tm",
Andi Kleen3f98bc42006-01-11 22:42:51 +01001305 "stc",
1306 NULL,
Andi Kleen39b3a792006-01-11 22:42:45 +01001307 /* nothing */ /* constant_tsc - moved to flags */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001308 };
1309
1310
1311#ifdef CONFIG_SMP
1312 if (!cpu_online(c-cpu_data))
1313 return 0;
1314#endif
1315
1316 seq_printf(m,"processor\t: %u\n"
1317 "vendor_id\t: %s\n"
1318 "cpu family\t: %d\n"
1319 "model\t\t: %d\n"
1320 "model name\t: %s\n",
1321 (unsigned)(c-cpu_data),
1322 c->x86_vendor_id[0] ? c->x86_vendor_id : "unknown",
1323 c->x86,
1324 (int)c->x86_model,
1325 c->x86_model_id[0] ? c->x86_model_id : "unknown");
1326
1327 if (c->x86_mask || c->cpuid_level >= 0)
1328 seq_printf(m, "stepping\t: %d\n", c->x86_mask);
1329 else
1330 seq_printf(m, "stepping\t: unknown\n");
1331
1332 if (cpu_has(c,X86_FEATURE_TSC)) {
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001333 unsigned int freq = cpufreq_quick_get((unsigned)(c-cpu_data));
1334 if (!freq)
1335 freq = cpu_khz;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001336 seq_printf(m, "cpu MHz\t\t: %u.%03u\n",
Venkatesh Pallipadi95235ca2005-12-02 10:43:20 -08001337 freq / 1000, (freq % 1000));
Linus Torvalds1da177e2005-04-16 15:20:36 -07001338 }
1339
1340 /* Cache size */
1341 if (c->x86_cache_size >= 0)
1342 seq_printf(m, "cache size\t: %d KB\n", c->x86_cache_size);
1343
1344#ifdef CONFIG_SMP
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001345 if (smp_num_siblings * c->x86_max_cores > 1) {
Andi Kleendb468682005-04-16 15:24:51 -07001346 int cpu = c - cpu_data;
1347 seq_printf(m, "physical id\t: %d\n", phys_proc_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001348 seq_printf(m, "siblings\t: %d\n", cpus_weight(cpu_core_map[cpu]));
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001349 seq_printf(m, "core id\t\t: %d\n", cpu_core_id[cpu]);
Siddha, Suresh B94605ef2005-11-05 17:25:54 +01001350 seq_printf(m, "cpu cores\t: %d\n", c->booted_cores);
Andi Kleendb468682005-04-16 15:24:51 -07001351 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001352#endif
1353
1354 seq_printf(m,
1355 "fpu\t\t: yes\n"
1356 "fpu_exception\t: yes\n"
1357 "cpuid level\t: %d\n"
1358 "wp\t\t: yes\n"
1359 "flags\t\t:",
1360 c->cpuid_level);
1361
1362 {
1363 int i;
1364 for ( i = 0 ; i < 32*NCAPINTS ; i++ )
Akinobu Mita3d1712c2006-03-24 03:15:11 -08001365 if (cpu_has(c, i) && x86_cap_flags[i] != NULL)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001366 seq_printf(m, " %s", x86_cap_flags[i]);
1367 }
1368
1369 seq_printf(m, "\nbogomips\t: %lu.%02lu\n",
1370 c->loops_per_jiffy/(500000/HZ),
1371 (c->loops_per_jiffy/(5000/HZ)) % 100);
1372
1373 if (c->x86_tlbsize > 0)
1374 seq_printf(m, "TLB size\t: %d 4K pages\n", c->x86_tlbsize);
1375 seq_printf(m, "clflush size\t: %d\n", c->x86_clflush_size);
1376 seq_printf(m, "cache_alignment\t: %d\n", c->x86_cache_alignment);
1377
1378 seq_printf(m, "address sizes\t: %u bits physical, %u bits virtual\n",
1379 c->x86_phys_bits, c->x86_virt_bits);
1380
1381 seq_printf(m, "power management:");
1382 {
1383 unsigned i;
1384 for (i = 0; i < 32; i++)
1385 if (c->x86_power & (1 << i)) {
Andi Kleen3f98bc42006-01-11 22:42:51 +01001386 if (i < ARRAY_SIZE(x86_power_flags) &&
1387 x86_power_flags[i])
1388 seq_printf(m, "%s%s",
1389 x86_power_flags[i][0]?" ":"",
1390 x86_power_flags[i]);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001391 else
1392 seq_printf(m, " [%d]", i);
1393 }
1394 }
Andi Kleen3dd9d512005-04-16 15:25:15 -07001395
Siddha, Suresh Bd31ddaa2005-04-16 15:25:20 -07001396 seq_printf(m, "\n\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -07001397
Linus Torvalds1da177e2005-04-16 15:20:36 -07001398 return 0;
1399}
1400
1401static void *c_start(struct seq_file *m, loff_t *pos)
1402{
1403 return *pos < NR_CPUS ? cpu_data + *pos : NULL;
1404}
1405
1406static void *c_next(struct seq_file *m, void *v, loff_t *pos)
1407{
1408 ++*pos;
1409 return c_start(m, pos);
1410}
1411
/* seq_file ->stop: nothing to do. */
static void c_stop(struct seq_file *m, void *v)
{
	/* intentionally empty */
}
1415
1416struct seq_operations cpuinfo_op = {
1417 .start =c_start,
1418 .next = c_next,
1419 .stop = c_stop,
1420 .show = show_cpuinfo,
1421};
Andi Kleene9928672006-01-11 22:43:33 +01001422