Loading...
1// SPDX-License-Identifier: GPL-2.0-or-later
2/*
3 * Common boot and setup code for both 32-bit and 64-bit.
4 * Extracted from arch/powerpc/kernel/setup_64.c.
5 *
6 * Copyright (C) 2001 PPC64 Team, IBM Corp
7 */
8
9#undef DEBUG
10
11#include <linux/export.h>
12#include <linux/panic_notifier.h>
13#include <linux/string.h>
14#include <linux/sched.h>
15#include <linux/init.h>
16#include <linux/kernel.h>
17#include <linux/reboot.h>
18#include <linux/delay.h>
19#include <linux/initrd.h>
20#include <linux/platform_device.h>
21#include <linux/printk.h>
22#include <linux/seq_file.h>
23#include <linux/ioport.h>
24#include <linux/console.h>
25#include <linux/screen_info.h>
26#include <linux/root_dev.h>
27#include <linux/cpu.h>
28#include <linux/unistd.h>
29#include <linux/seq_buf.h>
30#include <linux/serial.h>
31#include <linux/serial_8250.h>
32#include <linux/percpu.h>
33#include <linux/memblock.h>
34#include <linux/of_irq.h>
35#include <linux/of_fdt.h>
36#include <linux/of_platform.h>
37#include <linux/hugetlb.h>
38#include <linux/pgtable.h>
39#include <asm/io.h>
40#include <asm/paca.h>
41#include <asm/processor.h>
42#include <asm/vdso_datapage.h>
43#include <asm/smp.h>
44#include <asm/elf.h>
45#include <asm/machdep.h>
46#include <asm/time.h>
47#include <asm/cputable.h>
48#include <asm/sections.h>
49#include <asm/firmware.h>
50#include <asm/btext.h>
51#include <asm/nvram.h>
52#include <asm/setup.h>
53#include <asm/rtas.h>
54#include <asm/iommu.h>
55#include <asm/serial.h>
56#include <asm/cache.h>
57#include <asm/page.h>
58#include <asm/mmu.h>
59#include <asm/xmon.h>
60#include <asm/cputhreads.h>
61#include <mm/mmu_decl.h>
62#include <asm/archrandom.h>
63#include <asm/fadump.h>
64#include <asm/udbg.h>
65#include <asm/hugetlb.h>
66#include <asm/livepatch.h>
67#include <asm/mmu_context.h>
68#include <asm/cpu_has_feature.h>
69#include <asm/kasan.h>
70#include <asm/mce.h>
71
72#include "setup.h"
73
74#ifdef DEBUG
75#define DBG(fmt...) udbg_printf(fmt)
76#else
77#define DBG(fmt...)
78#endif
79
80/* The main machine-dep calls structure
81 */
82struct machdep_calls ppc_md;
83EXPORT_SYMBOL(ppc_md);
84struct machdep_calls *machine_id;
85EXPORT_SYMBOL(machine_id);
86
87int boot_cpuid = -1;
88EXPORT_SYMBOL_GPL(boot_cpuid);
89
90/*
91 * These are used in binfmt_elf.c to put aux entries on the stack
92 * for each elf executable being started.
93 */
94int dcache_bsize;
95int icache_bsize;
96
97/*
98 * This still seems to be needed... -- paulus
99 */
100struct screen_info screen_info = {
101 .orig_x = 0,
102 .orig_y = 25,
103 .orig_video_cols = 80,
104 .orig_video_lines = 25,
105 .orig_video_isVGA = 1,
106 .orig_video_points = 16
107};
108#if defined(CONFIG_FB_VGA16_MODULE)
109EXPORT_SYMBOL(screen_info);
110#endif
111
112/* Variables required to store legacy IO irq routing */
113int of_i8042_kbd_irq;
114EXPORT_SYMBOL_GPL(of_i8042_kbd_irq);
115int of_i8042_aux_irq;
116EXPORT_SYMBOL_GPL(of_i8042_aux_irq);
117
118#ifdef __DO_IRQ_CANON
119/* XXX should go elsewhere eventually */
120int ppc_do_canonicalize_irqs;
121EXPORT_SYMBOL(ppc_do_canonicalize_irqs);
122#endif
123
124#ifdef CONFIG_CRASH_CORE
125/* This keeps a track of which one is the crashing cpu. */
126int crashing_cpu = -1;
127#endif
128
129/* also used by kexec */
130void machine_shutdown(void)
131{
132 /*
133 * if fadump is active, cleanup the fadump registration before we
134 * shutdown.
135 */
136 fadump_cleanup();
137
138 if (ppc_md.machine_shutdown)
139 ppc_md.machine_shutdown();
140}
141
142static void machine_hang(void)
143{
144 pr_emerg("System Halted, OK to turn off power\n");
145 local_irq_disable();
146 while (1)
147 ;
148}
149
150void machine_restart(char *cmd)
151{
152 machine_shutdown();
153 if (ppc_md.restart)
154 ppc_md.restart(cmd);
155
156 smp_send_stop();
157
158 do_kernel_restart(cmd);
159 mdelay(1000);
160
161 machine_hang();
162}
163
164void machine_power_off(void)
165{
166 machine_shutdown();
167 do_kernel_power_off();
168 smp_send_stop();
169 machine_hang();
170}
171/* Used by the G5 thermal driver */
172EXPORT_SYMBOL_GPL(machine_power_off);
173
174void (*pm_power_off)(void);
175EXPORT_SYMBOL_GPL(pm_power_off);
176
177size_t __must_check arch_get_random_seed_longs(unsigned long *v, size_t max_longs)
178{
179 if (max_longs && ppc_md.get_random_seed && ppc_md.get_random_seed(v))
180 return 1;
181 return 0;
182}
183EXPORT_SYMBOL(arch_get_random_seed_longs);
184
185void machine_halt(void)
186{
187 machine_shutdown();
188 if (ppc_md.halt)
189 ppc_md.halt();
190
191 smp_send_stop();
192 machine_hang();
193}
194
195#ifdef CONFIG_SMP
196DEFINE_PER_CPU(unsigned int, cpu_pvr);
197#endif
198
199static void show_cpuinfo_summary(struct seq_file *m)
200{
201 struct device_node *root;
202 const char *model = NULL;
203 unsigned long bogosum = 0;
204 int i;
205
206 if (IS_ENABLED(CONFIG_SMP) && IS_ENABLED(CONFIG_PPC32)) {
207 for_each_online_cpu(i)
208 bogosum += loops_per_jiffy;
209 seq_printf(m, "total bogomips\t: %lu.%02lu\n",
210 bogosum / (500000 / HZ), bogosum / (5000 / HZ) % 100);
211 }
212 seq_printf(m, "timebase\t: %lu\n", ppc_tb_freq);
213 if (ppc_md.name)
214 seq_printf(m, "platform\t: %s\n", ppc_md.name);
215 root = of_find_node_by_path("/");
216 if (root)
217 model = of_get_property(root, "model", NULL);
218 if (model)
219 seq_printf(m, "model\t\t: %s\n", model);
220 of_node_put(root);
221
222 if (ppc_md.show_cpuinfo != NULL)
223 ppc_md.show_cpuinfo(m);
224
225 /* Display the amount of memory */
226 if (IS_ENABLED(CONFIG_PPC32))
227 seq_printf(m, "Memory\t\t: %d MB\n",
228 (unsigned int)(total_memory / (1024 * 1024)));
229}
230
231static int show_cpuinfo(struct seq_file *m, void *v)
232{
233 unsigned long cpu_id = (unsigned long)v - 1;
234 unsigned int pvr;
235 unsigned long proc_freq;
236 unsigned short maj;
237 unsigned short min;
238
239#ifdef CONFIG_SMP
240 pvr = per_cpu(cpu_pvr, cpu_id);
241#else
242 pvr = mfspr(SPRN_PVR);
243#endif
244 maj = (pvr >> 8) & 0xFF;
245 min = pvr & 0xFF;
246
247 seq_printf(m, "processor\t: %lu\ncpu\t\t: ", cpu_id);
248
249 if (cur_cpu_spec->pvr_mask && cur_cpu_spec->cpu_name)
250 seq_puts(m, cur_cpu_spec->cpu_name);
251 else
252 seq_printf(m, "unknown (%08x)", pvr);
253
254 if (cpu_has_feature(CPU_FTR_ALTIVEC))
255 seq_puts(m, ", altivec supported");
256
257 seq_putc(m, '\n');
258
259#ifdef CONFIG_TAU
260 if (cpu_has_feature(CPU_FTR_TAU)) {
261 if (IS_ENABLED(CONFIG_TAU_AVERAGE)) {
262 /* more straightforward, but potentially misleading */
263 seq_printf(m, "temperature \t: %u C (uncalibrated)\n",
264 cpu_temp(cpu_id));
265 } else {
266 /* show the actual temp sensor range */
267 u32 temp;
268 temp = cpu_temp_both(cpu_id);
269 seq_printf(m, "temperature \t: %u-%u C (uncalibrated)\n",
270 temp & 0xff, temp >> 16);
271 }
272 }
273#endif /* CONFIG_TAU */
274
275 /*
276 * Platforms that have variable clock rates, should implement
277 * the method ppc_md.get_proc_freq() that reports the clock
278 * rate of a given cpu. The rest can use ppc_proc_freq to
279 * report the clock rate that is same across all cpus.
280 */
281 if (ppc_md.get_proc_freq)
282 proc_freq = ppc_md.get_proc_freq(cpu_id);
283 else
284 proc_freq = ppc_proc_freq;
285
286 if (proc_freq)
287 seq_printf(m, "clock\t\t: %lu.%06luMHz\n",
288 proc_freq / 1000000, proc_freq % 1000000);
289
290 /* If we are a Freescale core do a simple check so
291 * we don't have to keep adding cases in the future */
292 if (PVR_VER(pvr) & 0x8000) {
293 switch (PVR_VER(pvr)) {
294 case 0x8000: /* 7441/7450/7451, Voyager */
295 case 0x8001: /* 7445/7455, Apollo 6 */
296 case 0x8002: /* 7447/7457, Apollo 7 */
297 case 0x8003: /* 7447A, Apollo 7 PM */
298 case 0x8004: /* 7448, Apollo 8 */
299 case 0x800c: /* 7410, Nitro */
300 maj = ((pvr >> 8) & 0xF);
301 min = PVR_MIN(pvr);
302 break;
303 default: /* e500/book-e */
304 maj = PVR_MAJ(pvr);
305 min = PVR_MIN(pvr);
306 break;
307 }
308 } else {
309 switch (PVR_VER(pvr)) {
310 case 0x1008: /* 740P/750P ?? */
311 maj = ((pvr >> 8) & 0xFF) - 1;
312 min = pvr & 0xFF;
313 break;
314 case 0x004e: /* POWER9 bits 12-15 give chip type */
315 case 0x0080: /* POWER10 bit 12 gives SMT8/4 */
316 maj = (pvr >> 8) & 0x0F;
317 min = pvr & 0xFF;
318 break;
319 default:
320 maj = (pvr >> 8) & 0xFF;
321 min = pvr & 0xFF;
322 break;
323 }
324 }
325
326 seq_printf(m, "revision\t: %hd.%hd (pvr %04x %04x)\n",
327 maj, min, PVR_VER(pvr), PVR_REV(pvr));
328
329 if (IS_ENABLED(CONFIG_PPC32))
330 seq_printf(m, "bogomips\t: %lu.%02lu\n", loops_per_jiffy / (500000 / HZ),
331 (loops_per_jiffy / (5000 / HZ)) % 100);
332
333 seq_putc(m, '\n');
334
335 /* If this is the last cpu, print the summary */
336 if (cpumask_next(cpu_id, cpu_online_mask) >= nr_cpu_ids)
337 show_cpuinfo_summary(m);
338
339 return 0;
340}
341
342static void *c_start(struct seq_file *m, loff_t *pos)
343{
344 if (*pos == 0) /* just in case, cpu 0 is not the first */
345 *pos = cpumask_first(cpu_online_mask);
346 else
347 *pos = cpumask_next(*pos - 1, cpu_online_mask);
348 if ((*pos) < nr_cpu_ids)
349 return (void *)(unsigned long)(*pos + 1);
350 return NULL;
351}
352
353static void *c_next(struct seq_file *m, void *v, loff_t *pos)
354{
355 (*pos)++;
356 return c_start(m, pos);
357}
358
359static void c_stop(struct seq_file *m, void *v)
360{
361}
362
363const struct seq_operations cpuinfo_op = {
364 .start = c_start,
365 .next = c_next,
366 .stop = c_stop,
367 .show = show_cpuinfo,
368};
369
370void __init check_for_initrd(void)
371{
372#ifdef CONFIG_BLK_DEV_INITRD
373 DBG(" -> check_for_initrd() initrd_start=0x%lx initrd_end=0x%lx\n",
374 initrd_start, initrd_end);
375
376 /* If we were passed an initrd, set the ROOT_DEV properly if the values
377 * look sensible. If not, clear initrd reference.
378 */
379 if (is_kernel_addr(initrd_start) && is_kernel_addr(initrd_end) &&
380 initrd_end > initrd_start)
381 ROOT_DEV = Root_RAM0;
382 else
383 initrd_start = initrd_end = 0;
384
385 if (initrd_start)
386 pr_info("Found initrd at 0x%lx:0x%lx\n", initrd_start, initrd_end);
387
388 DBG(" <- check_for_initrd()\n");
389#endif /* CONFIG_BLK_DEV_INITRD */
390}
391
392#ifdef CONFIG_SMP
393
394int threads_per_core, threads_per_subcore, threads_shift __read_mostly;
395cpumask_t threads_core_mask __read_mostly;
396EXPORT_SYMBOL_GPL(threads_per_core);
397EXPORT_SYMBOL_GPL(threads_per_subcore);
398EXPORT_SYMBOL_GPL(threads_shift);
399EXPORT_SYMBOL_GPL(threads_core_mask);
400
401static void __init cpu_init_thread_core_maps(int tpc)
402{
403 int i;
404
405 threads_per_core = tpc;
406 threads_per_subcore = tpc;
407 cpumask_clear(&threads_core_mask);
408
409 /* This implementation only supports power of 2 number of threads
410 * for simplicity and performance
411 */
412 threads_shift = ilog2(tpc);
413 BUG_ON(tpc != (1 << threads_shift));
414
415 for (i = 0; i < tpc; i++)
416 cpumask_set_cpu(i, &threads_core_mask);
417
418 printk(KERN_INFO "CPU maps initialized for %d thread%s per core\n",
419 tpc, tpc > 1 ? "s" : "");
420 printk(KERN_DEBUG " (thread shift is %d)\n", threads_shift);
421}
422
423
424u32 *cpu_to_phys_id = NULL;
425
426/**
427 * setup_cpu_maps - initialize the following cpu maps:
428 * cpu_possible_mask
429 * cpu_present_mask
430 *
431 * Having the possible map set up early allows us to restrict allocations
432 * of things like irqstacks to nr_cpu_ids rather than NR_CPUS.
433 *
434 * We do not initialize the online map here; cpus set their own bits in
435 * cpu_online_mask as they come up.
436 *
437 * This function is valid only for Open Firmware systems. finish_device_tree
438 * must be called before using this.
439 *
440 * While we're here, we may as well set the "physical" cpu ids in the paca.
441 *
442 * NOTE: This must match the parsing done in early_init_dt_scan_cpus.
443 */
444void __init smp_setup_cpu_maps(void)
445{
446 struct device_node *dn;
447 int cpu = 0;
448 int nthreads = 1;
449
450 DBG("smp_setup_cpu_maps()\n");
451
452 cpu_to_phys_id = memblock_alloc(nr_cpu_ids * sizeof(u32),
453 __alignof__(u32));
454 if (!cpu_to_phys_id)
455 panic("%s: Failed to allocate %zu bytes align=0x%zx\n",
456 __func__, nr_cpu_ids * sizeof(u32), __alignof__(u32));
457
458 for_each_node_by_type(dn, "cpu") {
459 const __be32 *intserv;
460 __be32 cpu_be;
461 int j, len;
462
463 DBG(" * %pOF...\n", dn);
464
465 intserv = of_get_property(dn, "ibm,ppc-interrupt-server#s",
466 &len);
467 if (intserv) {
468 DBG(" ibm,ppc-interrupt-server#s -> %lu threads\n",
469 (len / sizeof(int)));
470 } else {
471 DBG(" no ibm,ppc-interrupt-server#s -> 1 thread\n");
472 intserv = of_get_property(dn, "reg", &len);
473 if (!intserv) {
474 cpu_be = cpu_to_be32(cpu);
475 /* XXX: what is this? uninitialized?? */
476 intserv = &cpu_be; /* assume logical == phys */
477 len = 4;
478 }
479 }
480
481 nthreads = len / sizeof(int);
482
483 for (j = 0; j < nthreads && cpu < nr_cpu_ids; j++) {
484 bool avail;
485
486 DBG(" thread %d -> cpu %d (hard id %d)\n",
487 j, cpu, be32_to_cpu(intserv[j]));
488
489 avail = of_device_is_available(dn);
490 if (!avail)
491 avail = !of_property_match_string(dn,
492 "enable-method", "spin-table");
493
494 set_cpu_present(cpu, avail);
495 set_cpu_possible(cpu, true);
496 cpu_to_phys_id[cpu] = be32_to_cpu(intserv[j]);
497 cpu++;
498 }
499
500 if (cpu >= nr_cpu_ids) {
501 of_node_put(dn);
502 break;
503 }
504 }
505
506 /* If no SMT supported, nthreads is forced to 1 */
507 if (!cpu_has_feature(CPU_FTR_SMT)) {
508 DBG(" SMT disabled ! nthreads forced to 1\n");
509 nthreads = 1;
510 }
511
512#ifdef CONFIG_PPC64
513 /*
514 * On pSeries LPAR, we need to know how many cpus
515 * could possibly be added to this partition.
516 */
517 if (firmware_has_feature(FW_FEATURE_LPAR) &&
518 (dn = of_find_node_by_path("/rtas"))) {
519 int num_addr_cell, num_size_cell, maxcpus;
520 const __be32 *ireg;
521
522 num_addr_cell = of_n_addr_cells(dn);
523 num_size_cell = of_n_size_cells(dn);
524
525 ireg = of_get_property(dn, "ibm,lrdr-capacity", NULL);
526
527 if (!ireg)
528 goto out;
529
530 maxcpus = be32_to_cpup(ireg + num_addr_cell + num_size_cell);
531
532 /* Double maxcpus for processors which have SMT capability */
533 if (cpu_has_feature(CPU_FTR_SMT))
534 maxcpus *= nthreads;
535
536 if (maxcpus > nr_cpu_ids) {
537 printk(KERN_WARNING
538 "Partition configured for %d cpus, "
539 "operating system maximum is %u.\n",
540 maxcpus, nr_cpu_ids);
541 maxcpus = nr_cpu_ids;
542 } else
543 printk(KERN_INFO "Partition configured for %d cpus.\n",
544 maxcpus);
545
546 for (cpu = 0; cpu < maxcpus; cpu++)
547 set_cpu_possible(cpu, true);
548 out:
549 of_node_put(dn);
550 }
551 vdso_data->processorCount = num_present_cpus();
552#endif /* CONFIG_PPC64 */
553
554 /* Initialize CPU <=> thread mapping/
555 *
556 * WARNING: We assume that the number of threads is the same for
557 * every CPU in the system. If that is not the case, then some code
558 * here will have to be reworked
559 */
560 cpu_init_thread_core_maps(nthreads);
561
562 /* Now that possible cpus are set, set nr_cpu_ids for later use */
563 setup_nr_cpu_ids();
564
565 free_unused_pacas();
566}
567#endif /* CONFIG_SMP */
568
569#ifdef CONFIG_PCSPKR_PLATFORM
570static __init int add_pcspkr(void)
571{
572 struct device_node *np;
573 struct platform_device *pd;
574 int ret;
575
576 np = of_find_compatible_node(NULL, NULL, "pnpPNP,100");
577 of_node_put(np);
578 if (!np)
579 return -ENODEV;
580
581 pd = platform_device_alloc("pcspkr", -1);
582 if (!pd)
583 return -ENOMEM;
584
585 ret = platform_device_add(pd);
586 if (ret)
587 platform_device_put(pd);
588
589 return ret;
590}
591device_initcall(add_pcspkr);
592#endif /* CONFIG_PCSPKR_PLATFORM */
593
594static char ppc_hw_desc_buf[128] __initdata;
595
596struct seq_buf ppc_hw_desc __initdata = {
597 .buffer = ppc_hw_desc_buf,
598 .size = sizeof(ppc_hw_desc_buf),
599 .len = 0,
600 .readpos = 0,
601};
602
603static __init void probe_machine(void)
604{
605 extern struct machdep_calls __machine_desc_start;
606 extern struct machdep_calls __machine_desc_end;
607 unsigned int i;
608
609 /*
610 * Iterate all ppc_md structures until we find the proper
611 * one for the current machine type
612 */
613 DBG("Probing machine type ...\n");
614
615 /*
616 * Check ppc_md is empty, if not we have a bug, ie, we setup an
617 * entry before probe_machine() which will be overwritten
618 */
619 for (i = 0; i < (sizeof(ppc_md) / sizeof(void *)); i++) {
620 if (((void **)&ppc_md)[i]) {
621 printk(KERN_ERR "Entry %d in ppc_md non empty before"
622 " machine probe !\n", i);
623 }
624 }
625
626 for (machine_id = &__machine_desc_start;
627 machine_id < &__machine_desc_end;
628 machine_id++) {
629 DBG(" %s ...", machine_id->name);
630 memcpy(&ppc_md, machine_id, sizeof(struct machdep_calls));
631 if (ppc_md.probe()) {
632 DBG(" match !\n");
633 break;
634 }
635 DBG("\n");
636 }
637 /* What can we do if we didn't find ? */
638 if (machine_id >= &__machine_desc_end) {
639 pr_err("No suitable machine description found !\n");
640 for (;;);
641 }
642
643 // Append the machine name to other info we've gathered
644 seq_buf_puts(&ppc_hw_desc, ppc_md.name);
645
646 // Set the generic hardware description shown in oopses
647 dump_stack_set_arch_desc(ppc_hw_desc.buffer);
648
649 pr_info("Hardware name: %s\n", ppc_hw_desc.buffer);
650}
651
652/* Match a class of boards, not a specific device configuration. */
653int check_legacy_ioport(unsigned long base_port)
654{
655 struct device_node *parent, *np = NULL;
656 int ret = -ENODEV;
657
658 switch(base_port) {
659 case I8042_DATA_REG:
660 if (!(np = of_find_compatible_node(NULL, NULL, "pnpPNP,303")))
661 np = of_find_compatible_node(NULL, NULL, "pnpPNP,f03");
662 if (np) {
663 parent = of_get_parent(np);
664
665 of_i8042_kbd_irq = irq_of_parse_and_map(parent, 0);
666 if (!of_i8042_kbd_irq)
667 of_i8042_kbd_irq = 1;
668
669 of_i8042_aux_irq = irq_of_parse_and_map(parent, 1);
670 if (!of_i8042_aux_irq)
671 of_i8042_aux_irq = 12;
672
673 of_node_put(np);
674 np = parent;
675 break;
676 }
677 np = of_find_node_by_type(NULL, "8042");
678 /* Pegasos has no device_type on its 8042 node, look for the
679 * name instead */
680 if (!np)
681 np = of_find_node_by_name(NULL, "8042");
682 if (np) {
683 of_i8042_kbd_irq = 1;
684 of_i8042_aux_irq = 12;
685 }
686 break;
687 case FDC_BASE: /* FDC1 */
688 np = of_find_node_by_type(NULL, "fdc");
689 break;
690 default:
691 /* ipmi is supposed to fail here */
692 break;
693 }
694 if (!np)
695 return ret;
696 parent = of_get_parent(np);
697 if (parent) {
698 if (of_node_is_type(parent, "isa"))
699 ret = 0;
700 of_node_put(parent);
701 }
702 of_node_put(np);
703 return ret;
704}
705EXPORT_SYMBOL(check_legacy_ioport);
706
707/*
708 * Panic notifiers setup
709 *
710 * We have 3 notifiers for powerpc, each one from a different "nature":
711 *
712 * - ppc_panic_fadump_handler() is a hypervisor notifier, which hard-disables
713 * IRQs and deal with the Firmware-Assisted dump, when it is configured;
714 * should run early in the panic path.
715 *
716 * - dump_kernel_offset() is an informative notifier, just showing the KASLR
717 * offset if we have RANDOMIZE_BASE set.
718 *
719 * - ppc_panic_platform_handler() is a low-level handler that's registered
720 * only if the platform wishes to perform final actions in the panic path,
721 * hence it should run late and might not even return. Currently, only
722 * pseries and ps3 platforms register callbacks.
723 */
724static int ppc_panic_fadump_handler(struct notifier_block *this,
725 unsigned long event, void *ptr)
726{
727 /*
728 * panic does a local_irq_disable, but we really
729 * want interrupts to be hard disabled.
730 */
731 hard_irq_disable();
732
733 /*
734 * If firmware-assisted dump has been registered then trigger
735 * its callback and let the firmware handles everything else.
736 */
737 crash_fadump(NULL, ptr);
738
739 return NOTIFY_DONE;
740}
741
742static int dump_kernel_offset(struct notifier_block *self, unsigned long v,
743 void *p)
744{
745 pr_emerg("Kernel Offset: 0x%lx from 0x%lx\n",
746 kaslr_offset(), KERNELBASE);
747
748 return NOTIFY_DONE;
749}
750
751static int ppc_panic_platform_handler(struct notifier_block *this,
752 unsigned long event, void *ptr)
753{
754 /*
755 * This handler is only registered if we have a panic callback
756 * on ppc_md, hence NULL check is not needed.
757 * Also, it may not return, so it runs really late on panic path.
758 */
759 ppc_md.panic(ptr);
760
761 return NOTIFY_DONE;
762}
763
764static struct notifier_block ppc_fadump_block = {
765 .notifier_call = ppc_panic_fadump_handler,
766 .priority = INT_MAX, /* run early, to notify the firmware ASAP */
767};
768
769static struct notifier_block kernel_offset_notifier = {
770 .notifier_call = dump_kernel_offset,
771};
772
773static struct notifier_block ppc_panic_block = {
774 .notifier_call = ppc_panic_platform_handler,
775 .priority = INT_MIN, /* may not return; must be done last */
776};
777
778void __init setup_panic(void)
779{
780 /* Hard-disables IRQs + deal with FW-assisted dump (fadump) */
781 atomic_notifier_chain_register(&panic_notifier_list,
782 &ppc_fadump_block);
783
784 if (IS_ENABLED(CONFIG_RANDOMIZE_BASE) && kaslr_offset() > 0)
785 atomic_notifier_chain_register(&panic_notifier_list,
786 &kernel_offset_notifier);
787
788 /* Low-level platform-specific routines that should run on panic */
789 if (ppc_md.panic)
790 atomic_notifier_chain_register(&panic_notifier_list,
791 &ppc_panic_block);
792}
793
794#ifdef CONFIG_CHECK_CACHE_COHERENCY
795/*
796 * For platforms that have configurable cache-coherency. This function
797 * checks that the cache coherency setting of the kernel matches the setting
798 * left by the firmware, as indicated in the device tree. Since a mismatch
799 * will eventually result in DMA failures, we print * and error and call
800 * BUG() in that case.
801 */
802
803#define KERNEL_COHERENCY (!IS_ENABLED(CONFIG_NOT_COHERENT_CACHE))
804
805static int __init check_cache_coherency(void)
806{
807 struct device_node *np;
808 const void *prop;
809 bool devtree_coherency;
810
811 np = of_find_node_by_path("/");
812 prop = of_get_property(np, "coherency-off", NULL);
813 of_node_put(np);
814
815 devtree_coherency = prop ? false : true;
816
817 if (devtree_coherency != KERNEL_COHERENCY) {
818 printk(KERN_ERR
819 "kernel coherency:%s != device tree_coherency:%s\n",
820 KERNEL_COHERENCY ? "on" : "off",
821 devtree_coherency ? "on" : "off");
822 BUG();
823 }
824
825 return 0;
826}
827
828late_initcall(check_cache_coherency);
829#endif /* CONFIG_CHECK_CACHE_COHERENCY */
830
831void ppc_printk_progress(char *s, unsigned short hex)
832{
833 pr_info("%s\n", s);
834}
835
836static __init void print_system_info(void)
837{
838 pr_info("-----------------------------------------------------\n");
839 pr_info("phys_mem_size = 0x%llx\n",
840 (unsigned long long)memblock_phys_mem_size());
841
842 pr_info("dcache_bsize = 0x%x\n", dcache_bsize);
843 pr_info("icache_bsize = 0x%x\n", icache_bsize);
844
845 pr_info("cpu_features = 0x%016lx\n", cur_cpu_spec->cpu_features);
846 pr_info(" possible = 0x%016lx\n",
847 (unsigned long)CPU_FTRS_POSSIBLE);
848 pr_info(" always = 0x%016lx\n",
849 (unsigned long)CPU_FTRS_ALWAYS);
850 pr_info("cpu_user_features = 0x%08x 0x%08x\n",
851 cur_cpu_spec->cpu_user_features,
852 cur_cpu_spec->cpu_user_features2);
853 pr_info("mmu_features = 0x%08x\n", cur_cpu_spec->mmu_features);
854#ifdef CONFIG_PPC64
855 pr_info("firmware_features = 0x%016lx\n", powerpc_firmware_features);
856#ifdef CONFIG_PPC_BOOK3S
857 pr_info("vmalloc start = 0x%lx\n", KERN_VIRT_START);
858 pr_info("IO start = 0x%lx\n", KERN_IO_START);
859 pr_info("vmemmap start = 0x%lx\n", (unsigned long)vmemmap);
860#endif
861#endif
862
863 if (!early_radix_enabled())
864 print_system_hash_info();
865
866 if (PHYSICAL_START > 0)
867 pr_info("physical_start = 0x%llx\n",
868 (unsigned long long)PHYSICAL_START);
869 pr_info("-----------------------------------------------------\n");
870}
871
872#ifdef CONFIG_SMP
873static void __init smp_setup_pacas(void)
874{
875 int cpu;
876
877 for_each_possible_cpu(cpu) {
878 if (cpu == smp_processor_id())
879 continue;
880 allocate_paca(cpu);
881 set_hard_smp_processor_id(cpu, cpu_to_phys_id[cpu]);
882 }
883
884 memblock_free(cpu_to_phys_id, nr_cpu_ids * sizeof(u32));
885 cpu_to_phys_id = NULL;
886}
887#endif
888
889/*
890 * Called into from start_kernel this initializes memblock, which is used
891 * to manage page allocation until mem_init is called.
892 */
893void __init setup_arch(char **cmdline_p)
894{
895 kasan_init();
896
897 *cmdline_p = boot_command_line;
898
899 /* Set a half-reasonable default so udelay does something sensible */
900 loops_per_jiffy = 500000000 / HZ;
901
902 /* Unflatten the device-tree passed by prom_init or kexec */
903 unflatten_device_tree();
904
905 /*
906 * Initialize cache line/block info from device-tree (on ppc64) or
907 * just cputable (on ppc32).
908 */
909 initialize_cache_info();
910
911 /* Initialize RTAS if available. */
912 rtas_initialize();
913
914 /* Check if we have an initrd provided via the device-tree. */
915 check_for_initrd();
916
917 /* Probe the machine type, establish ppc_md. */
918 probe_machine();
919
920 /* Setup panic notifier if requested by the platform. */
921 setup_panic();
922
923 /*
924 * Configure ppc_md.power_save (ppc32 only, 64-bit machines do
925 * it from their respective probe() function.
926 */
927 setup_power_save();
928
929 /* Discover standard serial ports. */
930 find_legacy_serial_ports();
931
932 /* Register early console with the printk subsystem. */
933 register_early_udbg_console();
934
935 /* Setup the various CPU maps based on the device-tree. */
936 smp_setup_cpu_maps();
937
938 /* Initialize xmon. */
939 xmon_setup();
940
941 /* Check the SMT related command line arguments (ppc64). */
942 check_smt_enabled();
943
944 /* Parse memory topology */
945 mem_topology_setup();
946
947 /*
948 * Release secondary cpus out of their spinloops at 0x60 now that
949 * we can map physical -> logical CPU ids.
950 *
951 * Freescale Book3e parts spin in a loop provided by firmware,
952 * so smp_release_cpus() does nothing for them.
953 */
954#ifdef CONFIG_SMP
955 smp_setup_pacas();
956
957 /* On BookE, setup per-core TLB data structures. */
958 setup_tlb_core_data();
959#endif
960
961 /* Print various info about the machine that has been gathered so far. */
962 print_system_info();
963
964 klp_init_thread_info(&init_task);
965
966 setup_initial_init_mm(_stext, _etext, _edata, _end);
967
968 mm_iommu_init(&init_mm);
969 irqstack_early_init();
970 exc_lvl_early_init();
971 emergency_stack_init();
972
973 mce_init();
974 smp_release_cpus();
975
976 initmem_init();
977
978 /*
979 * Reserve large chunks of memory for use by CMA for KVM and hugetlb. These must
980 * be called after initmem_init(), so that pageblock_order is initialised.
981 */
982 kvm_cma_reserve();
983 gigantic_hugetlb_cma_reserve();
984
985 early_memtest(min_low_pfn << PAGE_SHIFT, max_low_pfn << PAGE_SHIFT);
986
987 if (ppc_md.setup_arch)
988 ppc_md.setup_arch();
989
990 setup_barrier_nospec();
991 setup_spectre_v2();
992
993 paging_init();
994
995 /* Initialize the MMU context management stuff. */
996 mmu_context_init();
997
998 /* Interrupt code needs to be 64K-aligned. */
999 if (IS_ENABLED(CONFIG_PPC64) && (unsigned long)_stext & 0xffff)
1000 panic("Kernelbase not 64K-aligned (0x%lx)!\n",
1001 (unsigned long)_stext);
1002}
1/*
2 * Common boot and setup code for both 32-bit and 64-bit.
3 * Extracted from arch/powerpc/kernel/setup_64.c.
4 *
5 * Copyright (C) 2001 PPC64 Team, IBM Corp
6 *
7 * This program is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU General Public License
9 * as published by the Free Software Foundation; either version
10 * 2 of the License, or (at your option) any later version.
11 */
12
13#undef DEBUG
14
15#include <linux/export.h>
16#include <linux/string.h>
17#include <linux/sched.h>
18#include <linux/init.h>
19#include <linux/kernel.h>
20#include <linux/reboot.h>
21#include <linux/delay.h>
22#include <linux/initrd.h>
23#include <linux/platform_device.h>
24#include <linux/seq_file.h>
25#include <linux/ioport.h>
26#include <linux/console.h>
27#include <linux/screen_info.h>
28#include <linux/root_dev.h>
29#include <linux/notifier.h>
30#include <linux/cpu.h>
31#include <linux/unistd.h>
32#include <linux/serial.h>
33#include <linux/serial_8250.h>
34#include <linux/percpu.h>
35#include <linux/memblock.h>
36#include <linux/of_platform.h>
37#include <linux/hugetlb.h>
38#include <asm/debugfs.h>
39#include <asm/io.h>
40#include <asm/paca.h>
41#include <asm/prom.h>
42#include <asm/processor.h>
43#include <asm/vdso_datapage.h>
44#include <asm/pgtable.h>
45#include <asm/smp.h>
46#include <asm/elf.h>
47#include <asm/machdep.h>
48#include <asm/time.h>
49#include <asm/cputable.h>
50#include <asm/sections.h>
51#include <asm/firmware.h>
52#include <asm/btext.h>
53#include <asm/nvram.h>
54#include <asm/setup.h>
55#include <asm/rtas.h>
56#include <asm/iommu.h>
57#include <asm/serial.h>
58#include <asm/cache.h>
59#include <asm/page.h>
60#include <asm/mmu.h>
61#include <asm/xmon.h>
62#include <asm/cputhreads.h>
63#include <mm/mmu_decl.h>
64#include <asm/fadump.h>
65#include <asm/udbg.h>
66#include <asm/hugetlb.h>
67#include <asm/livepatch.h>
68#include <asm/mmu_context.h>
69#include <asm/cpu_has_feature.h>
70
71#include "setup.h"
72
73#ifdef DEBUG
74#include <asm/udbg.h>
75#define DBG(fmt...) udbg_printf(fmt)
76#else
77#define DBG(fmt...)
78#endif
79
80/* The main machine-dep calls structure
81 */
82struct machdep_calls ppc_md;
83EXPORT_SYMBOL(ppc_md);
84struct machdep_calls *machine_id;
85EXPORT_SYMBOL(machine_id);
86
87int boot_cpuid = -1;
88EXPORT_SYMBOL_GPL(boot_cpuid);
89
90/*
91 * These are used in binfmt_elf.c to put aux entries on the stack
92 * for each elf executable being started.
93 */
94int dcache_bsize;
95int icache_bsize;
96int ucache_bsize;
97
98
99unsigned long klimit = (unsigned long) _end;
100
101/*
102 * This still seems to be needed... -- paulus
103 */
104struct screen_info screen_info = {
105 .orig_x = 0,
106 .orig_y = 25,
107 .orig_video_cols = 80,
108 .orig_video_lines = 25,
109 .orig_video_isVGA = 1,
110 .orig_video_points = 16
111};
112#if defined(CONFIG_FB_VGA16_MODULE)
113EXPORT_SYMBOL(screen_info);
114#endif
115
116/* Variables required to store legacy IO irq routing */
117int of_i8042_kbd_irq;
118EXPORT_SYMBOL_GPL(of_i8042_kbd_irq);
119int of_i8042_aux_irq;
120EXPORT_SYMBOL_GPL(of_i8042_aux_irq);
121
122#ifdef __DO_IRQ_CANON
123/* XXX should go elsewhere eventually */
124int ppc_do_canonicalize_irqs;
125EXPORT_SYMBOL(ppc_do_canonicalize_irqs);
126#endif
127
128#ifdef CONFIG_CRASH_CORE
129/* This keeps a track of which one is the crashing cpu. */
130int crashing_cpu = -1;
131#endif
132
133/* also used by kexec */
134void machine_shutdown(void)
135{
136#ifdef CONFIG_FA_DUMP
137 /*
138 * if fadump is active, cleanup the fadump registration before we
139 * shutdown.
140 */
141 fadump_cleanup();
142#endif
143
144 if (ppc_md.machine_shutdown)
145 ppc_md.machine_shutdown();
146}
147
148static void machine_hang(void)
149{
150 pr_emerg("System Halted, OK to turn off power\n");
151 local_irq_disable();
152 while (1)
153 ;
154}
155
156void machine_restart(char *cmd)
157{
158 machine_shutdown();
159 if (ppc_md.restart)
160 ppc_md.restart(cmd);
161
162 smp_send_stop();
163
164 do_kernel_restart(cmd);
165 mdelay(1000);
166
167 machine_hang();
168}
169
170void machine_power_off(void)
171{
172 machine_shutdown();
173 if (pm_power_off)
174 pm_power_off();
175
176 smp_send_stop();
177 machine_hang();
178}
179/* Used by the G5 thermal driver */
180EXPORT_SYMBOL_GPL(machine_power_off);
181
182void (*pm_power_off)(void);
183EXPORT_SYMBOL_GPL(pm_power_off);
184
185void machine_halt(void)
186{
187 machine_shutdown();
188 if (ppc_md.halt)
189 ppc_md.halt();
190
191 smp_send_stop();
192 machine_hang();
193}
194
195
196#ifdef CONFIG_TAU
197extern u32 cpu_temp(unsigned long cpu);
198extern u32 cpu_temp_both(unsigned long cpu);
199#endif /* CONFIG_TAU */
200
201#ifdef CONFIG_SMP
202DEFINE_PER_CPU(unsigned int, cpu_pvr);
203#endif
204
205static void show_cpuinfo_summary(struct seq_file *m)
206{
207 struct device_node *root;
208 const char *model = NULL;
209#if defined(CONFIG_SMP) && defined(CONFIG_PPC32)
210 unsigned long bogosum = 0;
211 int i;
212 for_each_online_cpu(i)
213 bogosum += loops_per_jiffy;
214 seq_printf(m, "total bogomips\t: %lu.%02lu\n",
215 bogosum/(500000/HZ), bogosum/(5000/HZ) % 100);
216#endif /* CONFIG_SMP && CONFIG_PPC32 */
217 seq_printf(m, "timebase\t: %lu\n", ppc_tb_freq);
218 if (ppc_md.name)
219 seq_printf(m, "platform\t: %s\n", ppc_md.name);
220 root = of_find_node_by_path("/");
221 if (root)
222 model = of_get_property(root, "model", NULL);
223 if (model)
224 seq_printf(m, "model\t\t: %s\n", model);
225 of_node_put(root);
226
227 if (ppc_md.show_cpuinfo != NULL)
228 ppc_md.show_cpuinfo(m);
229
230#ifdef CONFIG_PPC32
231 /* Display the amount of memory */
232 seq_printf(m, "Memory\t\t: %d MB\n",
233 (unsigned int)(total_memory / (1024 * 1024)));
234#endif
235}
236
237static int show_cpuinfo(struct seq_file *m, void *v)
238{
239 unsigned long cpu_id = (unsigned long)v - 1;
240 unsigned int pvr;
241 unsigned long proc_freq;
242 unsigned short maj;
243 unsigned short min;
244
245#ifdef CONFIG_SMP
246 pvr = per_cpu(cpu_pvr, cpu_id);
247#else
248 pvr = mfspr(SPRN_PVR);
249#endif
250 maj = (pvr >> 8) & 0xFF;
251 min = pvr & 0xFF;
252
253 seq_printf(m, "processor\t: %lu\n", cpu_id);
254 seq_printf(m, "cpu\t\t: ");
255
256 if (cur_cpu_spec->pvr_mask && cur_cpu_spec->cpu_name)
257 seq_printf(m, "%s", cur_cpu_spec->cpu_name);
258 else
259 seq_printf(m, "unknown (%08x)", pvr);
260
261#ifdef CONFIG_ALTIVEC
262 if (cpu_has_feature(CPU_FTR_ALTIVEC))
263 seq_printf(m, ", altivec supported");
264#endif /* CONFIG_ALTIVEC */
265
266 seq_printf(m, "\n");
267
268#ifdef CONFIG_TAU
269 if (cur_cpu_spec->cpu_features & CPU_FTR_TAU) {
270#ifdef CONFIG_TAU_AVERAGE
271 /* more straightforward, but potentially misleading */
272 seq_printf(m, "temperature \t: %u C (uncalibrated)\n",
273 cpu_temp(cpu_id));
274#else
275 /* show the actual temp sensor range */
276 u32 temp;
277 temp = cpu_temp_both(cpu_id);
278 seq_printf(m, "temperature \t: %u-%u C (uncalibrated)\n",
279 temp & 0xff, temp >> 16);
280#endif
281 }
282#endif /* CONFIG_TAU */
283
284 /*
285 * Platforms that have variable clock rates, should implement
286 * the method ppc_md.get_proc_freq() that reports the clock
287 * rate of a given cpu. The rest can use ppc_proc_freq to
288 * report the clock rate that is same across all cpus.
289 */
290 if (ppc_md.get_proc_freq)
291 proc_freq = ppc_md.get_proc_freq(cpu_id);
292 else
293 proc_freq = ppc_proc_freq;
294
295 if (proc_freq)
296 seq_printf(m, "clock\t\t: %lu.%06luMHz\n",
297 proc_freq / 1000000, proc_freq % 1000000);
298
299 if (ppc_md.show_percpuinfo != NULL)
300 ppc_md.show_percpuinfo(m, cpu_id);
301
302 /* If we are a Freescale core do a simple check so
303 * we dont have to keep adding cases in the future */
304 if (PVR_VER(pvr) & 0x8000) {
305 switch (PVR_VER(pvr)) {
306 case 0x8000: /* 7441/7450/7451, Voyager */
307 case 0x8001: /* 7445/7455, Apollo 6 */
308 case 0x8002: /* 7447/7457, Apollo 7 */
309 case 0x8003: /* 7447A, Apollo 7 PM */
310 case 0x8004: /* 7448, Apollo 8 */
311 case 0x800c: /* 7410, Nitro */
312 maj = ((pvr >> 8) & 0xF);
313 min = PVR_MIN(pvr);
314 break;
315 default: /* e500/book-e */
316 maj = PVR_MAJ(pvr);
317 min = PVR_MIN(pvr);
318 break;
319 }
320 } else {
321 switch (PVR_VER(pvr)) {
322 case 0x0020: /* 403 family */
323 maj = PVR_MAJ(pvr) + 1;
324 min = PVR_MIN(pvr);
325 break;
326 case 0x1008: /* 740P/750P ?? */
327 maj = ((pvr >> 8) & 0xFF) - 1;
328 min = pvr & 0xFF;
329 break;
330 case 0x004e: /* POWER9 bits 12-15 give chip type */
331 maj = (pvr >> 8) & 0x0F;
332 min = pvr & 0xFF;
333 break;
334 default:
335 maj = (pvr >> 8) & 0xFF;
336 min = pvr & 0xFF;
337 break;
338 }
339 }
340
341 seq_printf(m, "revision\t: %hd.%hd (pvr %04x %04x)\n",
342 maj, min, PVR_VER(pvr), PVR_REV(pvr));
343
344#ifdef CONFIG_PPC32
345 seq_printf(m, "bogomips\t: %lu.%02lu\n",
346 loops_per_jiffy / (500000/HZ),
347 (loops_per_jiffy / (5000/HZ)) % 100);
348#endif
349 seq_printf(m, "\n");
350
351 /* If this is the last cpu, print the summary */
352 if (cpumask_next(cpu_id, cpu_online_mask) >= nr_cpu_ids)
353 show_cpuinfo_summary(m);
354
355 return 0;
356}
357
358static void *c_start(struct seq_file *m, loff_t *pos)
359{
360 if (*pos == 0) /* just in case, cpu 0 is not the first */
361 *pos = cpumask_first(cpu_online_mask);
362 else
363 *pos = cpumask_next(*pos - 1, cpu_online_mask);
364 if ((*pos) < nr_cpu_ids)
365 return (void *)(unsigned long)(*pos + 1);
366 return NULL;
367}
368
369static void *c_next(struct seq_file *m, void *v, loff_t *pos)
370{
371 (*pos)++;
372 return c_start(m, pos);
373}
374
375static void c_stop(struct seq_file *m, void *v)
376{
377}
378
379const struct seq_operations cpuinfo_op = {
380 .start = c_start,
381 .next = c_next,
382 .stop = c_stop,
383 .show = show_cpuinfo,
384};
385
386void __init check_for_initrd(void)
387{
388#ifdef CONFIG_BLK_DEV_INITRD
389 DBG(" -> check_for_initrd() initrd_start=0x%lx initrd_end=0x%lx\n",
390 initrd_start, initrd_end);
391
392 /* If we were passed an initrd, set the ROOT_DEV properly if the values
393 * look sensible. If not, clear initrd reference.
394 */
395 if (is_kernel_addr(initrd_start) && is_kernel_addr(initrd_end) &&
396 initrd_end > initrd_start)
397 ROOT_DEV = Root_RAM0;
398 else
399 initrd_start = initrd_end = 0;
400
401 if (initrd_start)
402 pr_info("Found initrd at 0x%lx:0x%lx\n", initrd_start, initrd_end);
403
404 DBG(" <- check_for_initrd()\n");
405#endif /* CONFIG_BLK_DEV_INITRD */
406}
407
408#ifdef CONFIG_SMP
409
410int threads_per_core, threads_per_subcore, threads_shift;
411cpumask_t threads_core_mask;
412EXPORT_SYMBOL_GPL(threads_per_core);
413EXPORT_SYMBOL_GPL(threads_per_subcore);
414EXPORT_SYMBOL_GPL(threads_shift);
415EXPORT_SYMBOL_GPL(threads_core_mask);
416
417static void __init cpu_init_thread_core_maps(int tpc)
418{
419 int i;
420
421 threads_per_core = tpc;
422 threads_per_subcore = tpc;
423 cpumask_clear(&threads_core_mask);
424
425 /* This implementation only supports power of 2 number of threads
426 * for simplicity and performance
427 */
428 threads_shift = ilog2(tpc);
429 BUG_ON(tpc != (1 << threads_shift));
430
431 for (i = 0; i < tpc; i++)
432 cpumask_set_cpu(i, &threads_core_mask);
433
434 printk(KERN_INFO "CPU maps initialized for %d thread%s per core\n",
435 tpc, tpc > 1 ? "s" : "");
436 printk(KERN_DEBUG " (thread shift is %d)\n", threads_shift);
437}
438
439
440u32 *cpu_to_phys_id = NULL;
441
442/**
443 * setup_cpu_maps - initialize the following cpu maps:
444 * cpu_possible_mask
445 * cpu_present_mask
446 *
447 * Having the possible map set up early allows us to restrict allocations
448 * of things like irqstacks to nr_cpu_ids rather than NR_CPUS.
449 *
450 * We do not initialize the online map here; cpus set their own bits in
451 * cpu_online_mask as they come up.
452 *
453 * This function is valid only for Open Firmware systems. finish_device_tree
454 * must be called before using this.
455 *
456 * While we're here, we may as well set the "physical" cpu ids in the paca.
457 *
458 * NOTE: This must match the parsing done in early_init_dt_scan_cpus.
459 */
460void __init smp_setup_cpu_maps(void)
461{
462 struct device_node *dn;
463 int cpu = 0;
464 int nthreads = 1;
465
466 DBG("smp_setup_cpu_maps()\n");
467
468 cpu_to_phys_id = __va(memblock_alloc(nr_cpu_ids * sizeof(u32),
469 __alignof__(u32)));
470 memset(cpu_to_phys_id, 0, nr_cpu_ids * sizeof(u32));
471
472 for_each_node_by_type(dn, "cpu") {
473 const __be32 *intserv;
474 __be32 cpu_be;
475 int j, len;
476
477 DBG(" * %pOF...\n", dn);
478
479 intserv = of_get_property(dn, "ibm,ppc-interrupt-server#s",
480 &len);
481 if (intserv) {
482 DBG(" ibm,ppc-interrupt-server#s -> %d threads\n",
483 nthreads);
484 } else {
485 DBG(" no ibm,ppc-interrupt-server#s -> 1 thread\n");
486 intserv = of_get_property(dn, "reg", &len);
487 if (!intserv) {
488 cpu_be = cpu_to_be32(cpu);
489 /* XXX: what is this? uninitialized?? */
490 intserv = &cpu_be; /* assume logical == phys */
491 len = 4;
492 }
493 }
494
495 nthreads = len / sizeof(int);
496
497 for (j = 0; j < nthreads && cpu < nr_cpu_ids; j++) {
498 bool avail;
499
500 DBG(" thread %d -> cpu %d (hard id %d)\n",
501 j, cpu, be32_to_cpu(intserv[j]));
502
503 avail = of_device_is_available(dn);
504 if (!avail)
505 avail = !of_property_match_string(dn,
506 "enable-method", "spin-table");
507
508 set_cpu_present(cpu, avail);
509 set_cpu_possible(cpu, true);
510 cpu_to_phys_id[cpu] = be32_to_cpu(intserv[j]);
511 cpu++;
512 }
513
514 if (cpu >= nr_cpu_ids) {
515 of_node_put(dn);
516 break;
517 }
518 }
519
520 /* If no SMT supported, nthreads is forced to 1 */
521 if (!cpu_has_feature(CPU_FTR_SMT)) {
522 DBG(" SMT disabled ! nthreads forced to 1\n");
523 nthreads = 1;
524 }
525
526#ifdef CONFIG_PPC64
527 /*
528 * On pSeries LPAR, we need to know how many cpus
529 * could possibly be added to this partition.
530 */
531 if (firmware_has_feature(FW_FEATURE_LPAR) &&
532 (dn = of_find_node_by_path("/rtas"))) {
533 int num_addr_cell, num_size_cell, maxcpus;
534 const __be32 *ireg;
535
536 num_addr_cell = of_n_addr_cells(dn);
537 num_size_cell = of_n_size_cells(dn);
538
539 ireg = of_get_property(dn, "ibm,lrdr-capacity", NULL);
540
541 if (!ireg)
542 goto out;
543
544 maxcpus = be32_to_cpup(ireg + num_addr_cell + num_size_cell);
545
546 /* Double maxcpus for processors which have SMT capability */
547 if (cpu_has_feature(CPU_FTR_SMT))
548 maxcpus *= nthreads;
549
550 if (maxcpus > nr_cpu_ids) {
551 printk(KERN_WARNING
552 "Partition configured for %d cpus, "
553 "operating system maximum is %u.\n",
554 maxcpus, nr_cpu_ids);
555 maxcpus = nr_cpu_ids;
556 } else
557 printk(KERN_INFO "Partition configured for %d cpus.\n",
558 maxcpus);
559
560 for (cpu = 0; cpu < maxcpus; cpu++)
561 set_cpu_possible(cpu, true);
562 out:
563 of_node_put(dn);
564 }
565 vdso_data->processorCount = num_present_cpus();
566#endif /* CONFIG_PPC64 */
567
568 /* Initialize CPU <=> thread mapping/
569 *
570 * WARNING: We assume that the number of threads is the same for
571 * every CPU in the system. If that is not the case, then some code
572 * here will have to be reworked
573 */
574 cpu_init_thread_core_maps(nthreads);
575
576 /* Now that possible cpus are set, set nr_cpu_ids for later use */
577 setup_nr_cpu_ids();
578
579 free_unused_pacas();
580}
581#endif /* CONFIG_SMP */
582
583#ifdef CONFIG_PCSPKR_PLATFORM
584static __init int add_pcspkr(void)
585{
586 struct device_node *np;
587 struct platform_device *pd;
588 int ret;
589
590 np = of_find_compatible_node(NULL, NULL, "pnpPNP,100");
591 of_node_put(np);
592 if (!np)
593 return -ENODEV;
594
595 pd = platform_device_alloc("pcspkr", -1);
596 if (!pd)
597 return -ENOMEM;
598
599 ret = platform_device_add(pd);
600 if (ret)
601 platform_device_put(pd);
602
603 return ret;
604}
605device_initcall(add_pcspkr);
606#endif /* CONFIG_PCSPKR_PLATFORM */
607
608void probe_machine(void)
609{
610 extern struct machdep_calls __machine_desc_start;
611 extern struct machdep_calls __machine_desc_end;
612 unsigned int i;
613
614 /*
615 * Iterate all ppc_md structures until we find the proper
616 * one for the current machine type
617 */
618 DBG("Probing machine type ...\n");
619
620 /*
621 * Check ppc_md is empty, if not we have a bug, ie, we setup an
622 * entry before probe_machine() which will be overwritten
623 */
624 for (i = 0; i < (sizeof(ppc_md) / sizeof(void *)); i++) {
625 if (((void **)&ppc_md)[i]) {
626 printk(KERN_ERR "Entry %d in ppc_md non empty before"
627 " machine probe !\n", i);
628 }
629 }
630
631 for (machine_id = &__machine_desc_start;
632 machine_id < &__machine_desc_end;
633 machine_id++) {
634 DBG(" %s ...", machine_id->name);
635 memcpy(&ppc_md, machine_id, sizeof(struct machdep_calls));
636 if (ppc_md.probe()) {
637 DBG(" match !\n");
638 break;
639 }
640 DBG("\n");
641 }
642 /* What can we do if we didn't find ? */
643 if (machine_id >= &__machine_desc_end) {
644 DBG("No suitable machine found !\n");
645 for (;;);
646 }
647
648 printk(KERN_INFO "Using %s machine description\n", ppc_md.name);
649}
650
651/* Match a class of boards, not a specific device configuration. */
652int check_legacy_ioport(unsigned long base_port)
653{
654 struct device_node *parent, *np = NULL;
655 int ret = -ENODEV;
656
657 switch(base_port) {
658 case I8042_DATA_REG:
659 if (!(np = of_find_compatible_node(NULL, NULL, "pnpPNP,303")))
660 np = of_find_compatible_node(NULL, NULL, "pnpPNP,f03");
661 if (np) {
662 parent = of_get_parent(np);
663
664 of_i8042_kbd_irq = irq_of_parse_and_map(parent, 0);
665 if (!of_i8042_kbd_irq)
666 of_i8042_kbd_irq = 1;
667
668 of_i8042_aux_irq = irq_of_parse_and_map(parent, 1);
669 if (!of_i8042_aux_irq)
670 of_i8042_aux_irq = 12;
671
672 of_node_put(np);
673 np = parent;
674 break;
675 }
676 np = of_find_node_by_type(NULL, "8042");
677 /* Pegasos has no device_type on its 8042 node, look for the
678 * name instead */
679 if (!np)
680 np = of_find_node_by_name(NULL, "8042");
681 if (np) {
682 of_i8042_kbd_irq = 1;
683 of_i8042_aux_irq = 12;
684 }
685 break;
686 case FDC_BASE: /* FDC1 */
687 np = of_find_node_by_type(NULL, "fdc");
688 break;
689 default:
690 /* ipmi is supposed to fail here */
691 break;
692 }
693 if (!np)
694 return ret;
695 parent = of_get_parent(np);
696 if (parent) {
697 if (strcmp(parent->type, "isa") == 0)
698 ret = 0;
699 of_node_put(parent);
700 }
701 of_node_put(np);
702 return ret;
703}
704EXPORT_SYMBOL(check_legacy_ioport);
705
706static int ppc_panic_event(struct notifier_block *this,
707 unsigned long event, void *ptr)
708{
709 /*
710 * If firmware-assisted dump has been registered then trigger
711 * firmware-assisted dump and let firmware handle everything else.
712 */
713 crash_fadump(NULL, ptr);
714 ppc_md.panic(ptr); /* May not return */
715 return NOTIFY_DONE;
716}
717
718static struct notifier_block ppc_panic_block = {
719 .notifier_call = ppc_panic_event,
720 .priority = INT_MIN /* may not return; must be done last */
721};
722
723void __init setup_panic(void)
724{
725 if (!ppc_md.panic)
726 return;
727 atomic_notifier_chain_register(&panic_notifier_list, &ppc_panic_block);
728}
729
730#ifdef CONFIG_CHECK_CACHE_COHERENCY
731/*
732 * For platforms that have configurable cache-coherency. This function
733 * checks that the cache coherency setting of the kernel matches the setting
734 * left by the firmware, as indicated in the device tree. Since a mismatch
735 * will eventually result in DMA failures, we print * and error and call
736 * BUG() in that case.
737 */
738
739#ifdef CONFIG_NOT_COHERENT_CACHE
740#define KERNEL_COHERENCY 0
741#else
742#define KERNEL_COHERENCY 1
743#endif
744
745static int __init check_cache_coherency(void)
746{
747 struct device_node *np;
748 const void *prop;
749 int devtree_coherency;
750
751 np = of_find_node_by_path("/");
752 prop = of_get_property(np, "coherency-off", NULL);
753 of_node_put(np);
754
755 devtree_coherency = prop ? 0 : 1;
756
757 if (devtree_coherency != KERNEL_COHERENCY) {
758 printk(KERN_ERR
759 "kernel coherency:%s != device tree_coherency:%s\n",
760 KERNEL_COHERENCY ? "on" : "off",
761 devtree_coherency ? "on" : "off");
762 BUG();
763 }
764
765 return 0;
766}
767
768late_initcall(check_cache_coherency);
769#endif /* CONFIG_CHECK_CACHE_COHERENCY */
770
771#ifdef CONFIG_DEBUG_FS
772struct dentry *powerpc_debugfs_root;
773EXPORT_SYMBOL(powerpc_debugfs_root);
774
775static int powerpc_debugfs_init(void)
776{
777 powerpc_debugfs_root = debugfs_create_dir("powerpc", NULL);
778
779 return powerpc_debugfs_root == NULL;
780}
781arch_initcall(powerpc_debugfs_init);
782#endif
783
784void ppc_printk_progress(char *s, unsigned short hex)
785{
786 pr_info("%s\n", s);
787}
788
789void arch_setup_pdev_archdata(struct platform_device *pdev)
790{
791 pdev->archdata.dma_mask = DMA_BIT_MASK(32);
792 pdev->dev.dma_mask = &pdev->archdata.dma_mask;
793 set_dma_ops(&pdev->dev, &dma_nommu_ops);
794}
795
796static __init void print_system_info(void)
797{
798 pr_info("-----------------------------------------------------\n");
799#ifdef CONFIG_PPC_BOOK3S_64
800 pr_info("ppc64_pft_size = 0x%llx\n", ppc64_pft_size);
801#endif
802#ifdef CONFIG_PPC_STD_MMU_32
803 pr_info("Hash_size = 0x%lx\n", Hash_size);
804#endif
805 pr_info("phys_mem_size = 0x%llx\n",
806 (unsigned long long)memblock_phys_mem_size());
807
808 pr_info("dcache_bsize = 0x%x\n", dcache_bsize);
809 pr_info("icache_bsize = 0x%x\n", icache_bsize);
810 if (ucache_bsize != 0)
811 pr_info("ucache_bsize = 0x%x\n", ucache_bsize);
812
813 pr_info("cpu_features = 0x%016lx\n", cur_cpu_spec->cpu_features);
814 pr_info(" possible = 0x%016lx\n",
815 (unsigned long)CPU_FTRS_POSSIBLE);
816 pr_info(" always = 0x%016lx\n",
817 (unsigned long)CPU_FTRS_ALWAYS);
818 pr_info("cpu_user_features = 0x%08x 0x%08x\n",
819 cur_cpu_spec->cpu_user_features,
820 cur_cpu_spec->cpu_user_features2);
821 pr_info("mmu_features = 0x%08x\n", cur_cpu_spec->mmu_features);
822#ifdef CONFIG_PPC64
823 pr_info("firmware_features = 0x%016lx\n", powerpc_firmware_features);
824#endif
825
826#ifdef CONFIG_PPC_BOOK3S_64
827 if (htab_address)
828 pr_info("htab_address = 0x%p\n", htab_address);
829 if (htab_hash_mask)
830 pr_info("htab_hash_mask = 0x%lx\n", htab_hash_mask);
831#endif
832#ifdef CONFIG_PPC_STD_MMU_32
833 if (Hash)
834 pr_info("Hash = 0x%p\n", Hash);
835 if (Hash_mask)
836 pr_info("Hash_mask = 0x%lx\n", Hash_mask);
837#endif
838
839 if (PHYSICAL_START > 0)
840 pr_info("physical_start = 0x%llx\n",
841 (unsigned long long)PHYSICAL_START);
842 pr_info("-----------------------------------------------------\n");
843}
844
845#ifdef CONFIG_SMP
846static void smp_setup_pacas(void)
847{
848 int cpu;
849
850 for_each_possible_cpu(cpu) {
851 if (cpu == smp_processor_id())
852 continue;
853 allocate_paca(cpu);
854 set_hard_smp_processor_id(cpu, cpu_to_phys_id[cpu]);
855 }
856
857 memblock_free(__pa(cpu_to_phys_id), nr_cpu_ids * sizeof(u32));
858 cpu_to_phys_id = NULL;
859}
860#endif
861
862/*
863 * Called into from start_kernel this initializes memblock, which is used
864 * to manage page allocation until mem_init is called.
865 */
866void __init setup_arch(char **cmdline_p)
867{
868 *cmdline_p = boot_command_line;
869
870 /* Set a half-reasonable default so udelay does something sensible */
871 loops_per_jiffy = 500000000 / HZ;
872
873 /* Unflatten the device-tree passed by prom_init or kexec */
874 unflatten_device_tree();
875
876 /*
877 * Initialize cache line/block info from device-tree (on ppc64) or
878 * just cputable (on ppc32).
879 */
880 initialize_cache_info();
881
882 /* Initialize RTAS if available. */
883 rtas_initialize();
884
885 /* Check if we have an initrd provided via the device-tree. */
886 check_for_initrd();
887
888 /* Probe the machine type, establish ppc_md. */
889 probe_machine();
890
891 /* Setup panic notifier if requested by the platform. */
892 setup_panic();
893
894 /*
895 * Configure ppc_md.power_save (ppc32 only, 64-bit machines do
896 * it from their respective probe() function.
897 */
898 setup_power_save();
899
900 /* Discover standard serial ports. */
901 find_legacy_serial_ports();
902
903 /* Register early console with the printk subsystem. */
904 register_early_udbg_console();
905
906 /* Setup the various CPU maps based on the device-tree. */
907 smp_setup_cpu_maps();
908
909 /* Initialize xmon. */
910 xmon_setup();
911
912 /* Check the SMT related command line arguments (ppc64). */
913 check_smt_enabled();
914
915 /* Parse memory topology */
916 mem_topology_setup();
917
918 /*
919 * Release secondary cpus out of their spinloops at 0x60 now that
920 * we can map physical -> logical CPU ids.
921 *
922 * Freescale Book3e parts spin in a loop provided by firmware,
923 * so smp_release_cpus() does nothing for them.
924 */
925#ifdef CONFIG_SMP
926 smp_setup_pacas();
927
928 /* On BookE, setup per-core TLB data structures. */
929 setup_tlb_core_data();
930
931 smp_release_cpus();
932#endif
933
934 /* Print various info about the machine that has been gathered so far. */
935 print_system_info();
936
937 /* Reserve large chunks of memory for use by CMA for KVM. */
938 kvm_cma_reserve();
939
940 klp_init_thread_info(&init_thread_info);
941
942 init_mm.start_code = (unsigned long)_stext;
943 init_mm.end_code = (unsigned long) _etext;
944 init_mm.end_data = (unsigned long) _edata;
945 init_mm.brk = klimit;
946
947#ifdef CONFIG_PPC_MM_SLICES
948#ifdef CONFIG_PPC64
949 if (!radix_enabled())
950 init_mm.context.slb_addr_limit = DEFAULT_MAP_WINDOW_USER64;
951#elif defined(CONFIG_PPC_8xx)
952 init_mm.context.slb_addr_limit = DEFAULT_MAP_WINDOW;
953#else
954#error "context.addr_limit not initialized."
955#endif
956#endif
957
958#ifdef CONFIG_SPAPR_TCE_IOMMU
959 mm_iommu_init(&init_mm);
960#endif
961 irqstack_early_init();
962 exc_lvl_early_init();
963 emergency_stack_init();
964
965 initmem_init();
966
967#ifdef CONFIG_DUMMY_CONSOLE
968 conswitchp = &dummy_con;
969#endif
970 if (ppc_md.setup_arch)
971 ppc_md.setup_arch();
972
973 paging_init();
974
975 /* Initialize the MMU context management stuff. */
976 mmu_context_init();
977
978#ifdef CONFIG_PPC64
979 /* Interrupt code needs to be 64K-aligned. */
980 if ((unsigned long)_stext & 0xffff)
981 panic("Kernelbase not 64K-aligned (0x%lx)!\n",
982 (unsigned long)_stext);
983#endif
984}