2 * This file is subject to the terms and conditions of the GNU General Public
3 * License. See the file "COPYING" in the main directory of this archive
6 * Copyright (C) 1999,2001-2004 Silicon Graphics, Inc. All rights reserved.
9 #include <linux/config.h>
10 #include <linux/module.h>
11 #include <linux/init.h>
12 #include <linux/delay.h>
13 #include <linux/kernel.h>
14 #include <linux/kdev_t.h>
15 #include <linux/string.h>
16 #include <linux/tty.h>
17 #include <linux/console.h>
18 #include <linux/timex.h>
19 #include <linux/sched.h>
20 #include <linux/ioport.h>
22 #include <linux/serial.h>
23 #include <linux/irq.h>
24 #include <linux/bootmem.h>
25 #include <linux/mmzone.h>
26 #include <linux/interrupt.h>
27 #include <linux/acpi.h>
28 #include <linux/compiler.h>
29 #include <linux/sched.h>
30 #include <linux/root_dev.h>
31 #include <linux/nodemask.h>
36 #include <asm/machvec.h>
37 #include <asm/system.h>
38 #include <asm/processor.h>
39 #include <asm/sn/arch.h>
40 #include <asm/sn/addrs.h>
41 #include <asm/sn/pda.h>
42 #include <asm/sn/nodepda.h>
43 #include <asm/sn/sn_cpuid.h>
44 #include <asm/sn/simulator.h>
45 #include <asm/sn/leds.h>
46 #include <asm/sn/bte.h>
47 #include <asm/sn/shub_mmr.h>
48 #include <asm/sn/clksupport.h>
49 #include <asm/sn/sn_sal.h>
50 #include <asm/sn/geo.h>
51 #include "xtalk/xwidgetdev.h"
52 #include "xtalk/hubdev.h"
53 #include <asm/sn/klconfig.h>
56 DEFINE_PER_CPU(struct pda_s, pda_percpu);
58 #define MAX_PHYS_MEMORY (1UL << 49) /* 512 TB (2^49 bytes) */
60 lboard_t *root_lboard[MAX_COMPACT_NODES];
62 extern void bte_init_node(nodepda_t *, cnodeid_t);
64 extern void sn_timer_init(void);
65 extern unsigned long last_time_offset;
66 extern void (*ia64_mark_idle) (int);
67 extern void snidle(int);
68 extern unsigned char acpi_kbd_controller_present;
70 unsigned long sn_rtc_cycles_per_second;
71 EXPORT_SYMBOL(sn_rtc_cycles_per_second);
73 DEFINE_PER_CPU(struct sn_hub_info_s, __sn_hub_info);
74 EXPORT_PER_CPU_SYMBOL(__sn_hub_info);
76 partid_t sn_partid = -1;
77 EXPORT_SYMBOL(sn_partid);
78 char sn_system_serial_number_string[128];
79 EXPORT_SYMBOL(sn_system_serial_number_string);
80 u64 sn_partition_serial_number;
81 EXPORT_SYMBOL(sn_partition_serial_number);
83 EXPORT_SYMBOL(sn_partition_id);
85 EXPORT_SYMBOL(sn_system_size);
86 u8 sn_sharing_domain_size;
87 EXPORT_SYMBOL(sn_sharing_domain_size);
89 EXPORT_SYMBOL(sn_coherency_id);
91 EXPORT_SYMBOL(sn_region_size);
93 short physical_node_map[MAX_PHYSNODE_ID];
95 EXPORT_SYMBOL(physical_node_map);
99 static void sn_init_pdas(char **);
100 static void scan_for_ionodes(void);
102 static nodepda_t *nodepdaindr[MAX_COMPACT_NODES];
105 * The format of "screen_info" is strange, and due to early i386-setup
106 * code. This is just enough to make the console code think we're on a
109 struct screen_info sn_screen_info = {
112 .orig_video_mode = 3,
113 .orig_video_cols = 80,
114 .orig_video_ega_bx = 3,
115 .orig_video_lines = 25,
116 .orig_video_isVGA = 1,
117 .orig_video_points = 16
121 * This is here so we can use the CMOS detection in ide-probe.c to
122 * determine what drives are present. In theory, we don't need this
123 * as the auto-detection could be done via ide-probe.c:do_probe() but
124 * in practice that would be much slower, which is painful when
125 * running in the simulator. Note that passing zeroes in DRIVE_INFO
126 * is sufficient (the IDE driver will autodetect the drive geometry).
128 #ifdef CONFIG_IA64_GENERIC
129 extern char drive_info[4 * 16];
131 char drive_info[4 * 16];
135 * Get nasid of current cpu early in boot before nodepda is initialized
142 if (ia64_sn_get_sapic_info(get_sapicid(), &nasid, NULL, NULL))
148 * This routine can only be used during init, since
149 * smp_boot_data is an init data structure.
150 * We have to use smp_boot_data.cpu_phys_id to find
151 * the physical id of the processor because the normal
152 * cpu_physical_id() relies on data structures that
153 * may not be initialized yet.
/*
 * pxm_to_nasid - translate a proximity domain number into a NASID.
 *
 * Looks up the node id for @pxm in pxm_to_nid_map, then walks the
 * num_node_memblks entries of node_memblk and returns NASID_GET() of the
 * start_paddr of the first entry that belongs to that node.
 *
 * NOTE(review): the value returned when no entry matches is not visible in
 * this listing - confirm before relying on it.
 * NOTE(review): the comment preceding this function talks about
 * smp_boot_data and cpu physical ids, neither of which appears in the
 * visible body; it may describe a different routine - confirm.
 */
156 static int __init pxm_to_nasid(int pxm)
161 nid = pxm_to_nid_map[pxm];
162 for (i = 0; i < num_node_memblks; i++) {
163 if (node_memblk[i].nid == nid) {
164 return NASID_GET(node_memblk[i].start_paddr);
171 * early_sn_setup - early setup routine for SN platforms
173 * Sets up an initial console to aid debugging. Intended primarily
174 * for bringup. See start_kernel() in init/main.c.
177 void __init early_sn_setup(void)
179 efi_system_table_t *efi_systab;
180 efi_config_table_t *config_tables;
181 struct ia64_sal_systab *sal_systab;
182 struct ia64_sal_desc_entry_point *ep;
187 * Parse enough of the SAL tables to locate the SAL entry point. Since console
188 * IO on SN2 is done via SAL calls, early_printk won't work without this.
190 * This code duplicates some of the ACPI table parsing that is in efi.c & sal.c.
191 * Any changes to those files may have to be made here as well.
193 efi_systab = (efi_system_table_t *) __va(ia64_boot_param->efi_systab);
194 config_tables = __va(efi_systab->tables);
195 for (i = 0; i < efi_systab->nr_tables; i++) {
196 if (efi_guidcmp(config_tables[i].guid, SAL_SYSTEM_TABLE_GUID) ==
198 sal_systab = __va(config_tables[i].table);
199 p = (char *)(sal_systab + 1);
200 for (j = 0; j < sal_systab->entry_count; j++) {
201 if (*p == SAL_DESC_ENTRY_POINT) {
202 ep = (struct ia64_sal_desc_entry_point
204 ia64_sal_handler_init(__va
209 p += SAL_DESC_SIZE(*p);
213 /* Uh-oh, SAL not available?? */
214 printk(KERN_ERR "failed to find SAL entry point\n");
217 extern int platform_intr_list[];
218 extern nasid_t master_nasid;
219 static int shub_1_1_found __initdata;
224 * Set flag for enabling shub specific wars
/*
 * is_shub_1_1 - inspect the hub revision of the node identified by @nasid.
 *
 * Reads SH1_SHUB_ID for that node through REMOTE_HUB_L() and isolates the
 * revision field with SH1_SHUB_ID_REVISION_MASK / SH1_SHUB_ID_REVISION_SHFT.
 *
 * NOTE(review): the expression that turns rev into the int return value is
 * not visible in this listing.
 */
227 static inline int __init is_shub_1_1(int nasid)
234 id = REMOTE_HUB_L(nasid, SH1_SHUB_ID);
235 rev = (id & SH1_SHUB_ID_REVISION_MASK) >> SH1_SHUB_ID_REVISION_SHFT;
/*
 * sn_check_for_wars - record which hub workarounds (wars) are required.
 *
 * Walks every online node, converts the cnode to a nasid and asks
 * is_shub_1_1() about it; a positive answer sets shub_1_1_found in the
 * sn_hub_info of the calling CPU.
 *
 * NOTE(review): sn_cpu_init() assigns sn_hub_info->shub_1_1_found from the
 * file-static shub_1_1_found, and nothing visible in this listing ever
 * writes that static. The store below therefore looks like it is
 * overwritten right away and never reaches other CPUs; presumably the
 * static variable was meant to be set here - confirm.
 */
239 static void __init sn_check_for_wars(void)
246 for_each_online_node(cnode) {
247 if (is_shub_1_1(cnodeid_to_nasid(cnode)))
248 sn_hub_info->shub_1_1_found = 1;
254 * sn_setup - SN platform setup routine
255 * @cmdline_p: kernel command line
257 * Handles platform setup for SN machines. This includes determining
258 * the RTC frequency (via a SAL call), initializing secondary CPUs, and
259 * setting up per-node data areas. The console is also initialized here.
261 void __init sn_setup(char **cmdline_p)
263 long status, ticks_per_sec, drift;
265 int major = sn_sal_rev_major(), minor = sn_sal_rev_minor();
266 extern void sn_cpu_init(void);
269 * If the generic code has enabled vga console support - let's
270 * get rid of it again. This is a kludge for the fact that ACPI
271 * currently has no way of informing us if legacy VGA is available
274 #if defined(CONFIG_VT) && defined(CONFIG_VGA_CONSOLE)
275 if (conswitchp == &vga_con) {
276 printk(KERN_DEBUG "SGI: Disabling VGA console\n");
277 #ifdef CONFIG_DUMMY_CONSOLE
278 conswitchp = &dummy_con;
281 #endif /* CONFIG_DUMMY_CONSOLE */
283 #endif /* def(CONFIG_VT) && def(CONFIG_VGA_CONSOLE) */
285 MAX_DMA_ADDRESS = PAGE_OFFSET + MAX_PHYS_MEMORY;
287 memset(physical_node_map, -1, sizeof(physical_node_map));
288 for (pxm = 0; pxm < MAX_PXM_DOMAINS; pxm++)
289 if (pxm_to_nid_map[pxm] != -1)
290 physical_node_map[pxm_to_nasid(pxm)] =
294 * Old PROMs do not provide an ACPI FADT. Disable legacy keyboard
295 * support here so we don't have to listen to failed keyboard probe
298 if ((major < 2 || (major == 2 && minor <= 9)) &&
299 acpi_kbd_controller_present) {
300 printk(KERN_INFO "Disabling legacy keyboard support as prom "
301 "is too old and doesn't provide FADT\n");
302 acpi_kbd_controller_present = 0;
305 printk("SGI SAL version %x.%02x\n", major, minor);
308 * Confirm the SAL we're running on is recent enough...
310 if ((major < SN_SAL_MIN_MAJOR) || (major == SN_SAL_MIN_MAJOR &&
311 minor < SN_SAL_MIN_MINOR)) {
312 printk(KERN_ERR "This kernel needs SGI SAL version >= "
313 "%x.%02x\n", SN_SAL_MIN_MAJOR, SN_SAL_MIN_MINOR);
314 panic("PROM version too old\n");
317 master_nasid = boot_get_nasid();
320 ia64_sal_freq_base(SAL_FREQ_BASE_REALTIME_CLOCK, &ticks_per_sec,
322 if (status != 0 || ticks_per_sec < 100000) {
324 "unable to determine platform RTC clock frequency, guessing.\n");
325 /* PROM gives wrong value for clock freq. so guess */
326 sn_rtc_cycles_per_second = 1000000000000UL / 30000UL;
328 sn_rtc_cycles_per_second = ticks_per_sec;
330 platform_intr_list[ACPI_INTERRUPT_CPEI] = IA64_CPE_VECTOR;
333 * we set the default root device to /dev/hda
334 * to make simulation easy
336 ROOT_DEV = Root_HDA1;
339 * Create the PDAs and NODEPDAs for all the cpus.
341 sn_init_pdas(cmdline_p);
343 ia64_mark_idle = &snidle;
346 * For the bootcpu, we do this here. All other cpus will make the
347 * call as part of cpu_init in slave cpu initialization.
354 screen_info = sn_screen_info;
359 * set pm_power_off to a SAL call to allow
360 * sn machines to power off. The SAL call can be replaced
361 * by an ACPI interface call when ACPI is fully implemented
364 pm_power_off = ia64_sn_power_down;
368 * sn_init_pdas - setup node data areas
370 * One time setup for Node Data Area. Called by sn_setup().
372 static void __init sn_init_pdas(char **cmdline_p)
376 memset(pda->cnodeid_to_nasid_table, -1,
377 sizeof(pda->cnodeid_to_nasid_table));
378 for_each_online_node(cnode)
379 pda->cnodeid_to_nasid_table[cnode] =
380 pxm_to_nasid(nid_to_pxm_map[cnode]);
382 numionodes = num_online_nodes();
386 * Allocate & initialize the nodepda for each node.
388 for_each_online_node(cnode) {
390 alloc_bootmem_node(NODE_DATA(cnode), sizeof(nodepda_t));
391 memset(nodepdaindr[cnode], 0, sizeof(nodepda_t));
392 memset(nodepdaindr[cnode]->phys_cpuid, -1,
393 sizeof(nodepdaindr[cnode]->phys_cpuid));
397 * Allocate & initialize nodepda for TIOs. For now, put them on node 0.
399 for (cnode = num_online_nodes(); cnode < numionodes; cnode++) {
401 alloc_bootmem_node(NODE_DATA(0), sizeof(nodepda_t));
402 memset(nodepdaindr[cnode], 0, sizeof(nodepda_t));
406 * Now copy the array of nodepda pointers to each nodepda.
408 for (cnode = 0; cnode < numionodes; cnode++)
409 memcpy(nodepdaindr[cnode]->pernode_pdaindr, nodepdaindr,
410 sizeof(nodepdaindr));
413 * Set up IO related platform-dependent nodepda fields.
414 * The following routine actually sets up the hubinfo struct
417 for_each_online_node(cnode) {
418 bte_init_node(nodepdaindr[cnode], cnode);
422 * Initialize the per node hubdev. This includes IO Nodes and
423 * headless/memless nodes.
425 for (cnode = 0; cnode < numionodes; cnode++) {
426 hubdev_init_node(nodepdaindr[cnode], cnode);
431 * sn_cpu_init - initialize per-cpu data areas
432 * @cpuid: cpuid of the caller
434 * Called during cpu initialization on each cpu as it starts.
435 * Currently, initializes the per-cpu data area for SNIA.
436 * Also sets up a few fields in the nodepda. Also known as
437 * platform_cpu_init() by the ia64 machvec code.
/*
 * sn_cpu_init - per-CPU platform setup.
 *
 * Takes no arguments: the logical cpu id comes from smp_processor_id() and
 * the physical id from get_sapicid() further down.
 * NOTE(review): the header comment preceding this function still carries a
 * cpuid parameter tag that does not match this signature.
 *
 * Steps visible in this listing:
 *   - clear (part of) this CPU's pda and call ia64_sn_get_sn_info() to fill
 *     the hub info fields and the sn_* globals;
 *   - record this CPU's nasid/slice/subnode in every allocated nodepda;
 *   - point pda->p_nodepda at the nodepda of the CPU's own node and set the
 *     LED and heartbeat fields;
 *   - copy cnodeid_to_nasid_table from pdacpu(0) (the guarding condition is
 *     not visible here);
 *   - set up the PIO write status and SHUB 1.x workaround addresses.
 */
439 void __init sn_cpu_init(void)
/* Function-static, so the workaround check is performed only once. */
448 static int wars_have_been_checked;
/*
 * NOTE(review): pda is dereferenced with -> throughout this file, so
 * sizeof(pda) is presumably the size of a pointer, not of struct pda_s, and
 * only the first few bytes are cleared. Before widening this to the whole
 * structure, confirm that nothing filled in earlier (sn_init_pdas() writes
 * pda->cnodeid_to_nasid_table) would be wiped on the boot CPU.
 */
450 memset(pda, 0, sizeof(pda));
451 if (ia64_sn_get_sn_info(0, &sn_hub_info->shub2, &sn_hub_info->nasid_bitmask, &sn_hub_info->nasid_shift,
452 &sn_system_size, &sn_sharing_domain_size, &sn_partition_id,
453 &sn_coherency_id, &sn_region_size))
455 sn_hub_info->as_shift = sn_hub_info->nasid_shift - 2;
458 * The boot cpu makes this call again after platform initialization is
/* No nodepda allocated yet (the action taken is not visible in this listing). */
461 if (nodepdaindr[0] == NULL)
464 cpuid = smp_processor_id();
465 cpuphyid = get_sapicid();
467 if (ia64_sn_get_sapic_info(cpuphyid, &nasid, &subnode, &slice))
/*
 * Publish this CPU's location in every nodepda that exists.
 * NOTE(review): nodepdaindr is declared with MAX_COMPACT_NODES entries while
 * this loop is bounded by MAX_NUMNODES - confirm the two limits agree.
 */
470 for (i=0; i < MAX_NUMNODES; i++) {
471 if (nodepdaindr[i]) {
472 nodepdaindr[i]->phys_cpuid[cpuid].nasid = nasid;
473 nodepdaindr[i]->phys_cpuid[cpuid].slice = slice;
474 nodepdaindr[i]->phys_cpuid[cpuid].subnode = subnode;
478 cnode = nasid_to_cnodeid(nasid);
480 pda->p_nodepda = nodepdaindr[cnode];
482 (typeof(pda->led_address)) (LED0 + (slice << LED_CPU_SHIFT));
483 pda->led_state = LED_ALWAYS_SET;
484 pda->hb_count = HZ / 2;
489 memcpy(pda->cnodeid_to_nasid_table,
490 pdacpu(0)->cnodeid_to_nasid_table,
491 sizeof(pda->cnodeid_to_nasid_table));
496 * Only needs to be done once, on BSP.
497 * Has to be done after loop above, because it uses pda.cnodeid_to_nasid_table[i].
498 * Has to be done before assignment below.
500 if (!wars_have_been_checked) {
502 wars_have_been_checked = 1;
/*
 * NOTE(review): the right-hand side is the file-static shub_1_1_found, which
 * no code visible in this listing ever sets, whereas sn_check_for_wars()
 * stores its result in sn_hub_info->shub_1_1_found. As written this
 * assignment appears to discard that result - confirm.
 */
504 sn_hub_info->shub_1_1_found = shub_1_1_found;
507 * Set up addresses of PIO/MEM write status registers.
/* Both tables are indexed by slice; the SH1 table has zero in slots 1 and 3. */
510 u64 pio1[] = {SH1_PIO_WRITE_STATUS_0, 0, SH1_PIO_WRITE_STATUS_1, 0};
511 u64 pio2[] = {SH2_PIO_WRITE_STATUS_0, SH2_PIO_WRITE_STATUS_1,
512 SH2_PIO_WRITE_STATUS_2, SH2_PIO_WRITE_STATUS_3};
514 pio = is_shub1() ? pio1 : pio2;
515 pda->pio_write_status_addr = (volatile unsigned long *) LOCAL_MMR_ADDR(pio[slice]);
516 pda->pio_write_status_val = is_shub1() ? SH_PIO_WRITE_STATUS_PENDING_WRITE_COUNT_MASK : 0;
520 * WAR addresses for SHUB 1.x.
/* Post-increment: the body runs only for the first CPU counted on this node. */
522 if (local_node_data->active_cpu_count++ == 0 && is_shub1()) {
/*
 * Argument is the next node number, wrapping from the last online node
 * (num_online_nodes() - 1) back to node 0.
 */
525 cnodeid_to_nasid(numa_node_id() ==
526 num_online_nodes() - 1 ? 0 : numa_node_id() + 1);
527 pda->pio_shub_war_cam_addr =
528 (volatile unsigned long *)GLOBAL_MMR_ADDR(nasid,
534 * Scan klconfig for ionodes. Add the nasids to the
535 * physical_node_map and the pda and increment numionodes.
/*
 * scan_for_ionodes - walk the klconfig data in three passes.
 *
 * Pass 1 records the root lboard of every node already present in
 * physical_node_map. Passes 2 and 3 search those lboard lists for
 * KLTYPE_SNIA and KLTYPE_TIO boards respectively; each board found is
 * entered at index numionodes in pda->cnodeid_to_nasid_table,
 * physical_node_map and root_lboard.
 *
 * All three passes step nasid by 2, so only even NASIDs are examined.
 * NOTE(review): the statement that advances numionodes is not visible in
 * this listing.
 */
538 static void __init scan_for_ionodes(void)
543 /* Setup ionodes with memory */
544 for (nasid = 0; nasid < MAX_PHYSNODE_ID; nasid += 2) {
545 char *klgraph_header;
/* -1 is the fill value sn_setup() gives physical_node_map: no such node. */
548 if (physical_node_map[nasid] == -1)
/*
 * NOTE(review): __va() presumably adds a fixed offset to the physical
 * address, so a zero address returned for this nasid would not produce a
 * NULL pointer and the check below may never fire - confirm.
 */
552 klgraph_header = __va(ia64_sn_get_klconfig_addr(nasid));
553 if (!klgraph_header) {
554 if (IS_RUNNING_ON_SIMULATOR())
556 BUG(); /* All nodes must have klconfig tables! */
558 cnodeid = nasid_to_cnodeid(nasid);
559 root_lboard[cnodeid] = (lboard_t *)
560 NODE_OFFSET_TO_LBOARD((nasid),
562 *) (klgraph_header))->
566 /* Scan headless/memless IO Nodes. */
567 for (nasid = 0; nasid < MAX_PHYSNODE_ID; nasid += 2) {
568 /* if there's no nasid, don't try to read the klconfig on the node */
569 if (physical_node_map[nasid] == -1)
571 brd = find_lboard_any((lboard_t *)
572 root_lboard[nasid_to_cnodeid(nasid)],
575 brd = KLCF_NEXT_ANY(brd); /* Skip this node's lboard */
580 brd = find_lboard_any(brd, KLTYPE_SNIA);
/* Register the board found as compact node number numionodes. */
583 pda->cnodeid_to_nasid_table[numionodes] =
585 physical_node_map[brd->brd_nasid] = numionodes;
586 root_lboard[numionodes] = brd;
/* Step past this board, then look for the next one of the same type. */
588 brd = KLCF_NEXT_ANY(brd);
592 brd = find_lboard_any(brd, KLTYPE_SNIA);
596 /* Scan for TIO nodes. */
597 for (nasid = 0; nasid < MAX_PHYSNODE_ID; nasid += 2) {
598 /* if there's no nasid, don't try to read the klconfig on the node */
599 if (physical_node_map[nasid] == -1)
601 brd = find_lboard_any((lboard_t *)
602 root_lboard[nasid_to_cnodeid(nasid)],
/* Same bookkeeping as the previous pass, this time for KLTYPE_TIO boards. */
605 pda->cnodeid_to_nasid_table[numionodes] =
607 physical_node_map[brd->brd_nasid] = numionodes;
608 root_lboard[numionodes] = brd;
610 brd = KLCF_NEXT_ANY(brd);
614 brd = find_lboard_any(brd, KLTYPE_TIO);
621 nasid_slice_to_cpuid(int nasid, int slice)
625 for (cpu=0; cpu < NR_CPUS; cpu++)
626 if (nodepda->phys_cpuid[cpu].nasid == nasid && nodepda->phys_cpuid[cpu].slice == slice)