Loading...
1// SPDX-License-Identifier: GPL-2.0-or-later
2/*
3 * Procedures for interfacing to Open Firmware.
4 *
5 * Paul Mackerras August 1996.
6 * Copyright (C) 1996-2005 Paul Mackerras.
7 *
8 * Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner.
9 * {engebret|bergner}@us.ibm.com
10 */
11
12#undef DEBUG_PROM
13
14/* we cannot use FORTIFY as it brings in new symbols */
15#define __NO_FORTIFY
16
17#include <stdarg.h>
18#include <linux/kernel.h>
19#include <linux/string.h>
20#include <linux/init.h>
21#include <linux/threads.h>
22#include <linux/spinlock.h>
23#include <linux/types.h>
24#include <linux/pci.h>
25#include <linux/proc_fs.h>
26#include <linux/delay.h>
27#include <linux/initrd.h>
28#include <linux/bitops.h>
29#include <linux/pgtable.h>
30#include <asm/prom.h>
31#include <asm/rtas.h>
32#include <asm/page.h>
33#include <asm/processor.h>
34#include <asm/irq.h>
35#include <asm/io.h>
36#include <asm/smp.h>
37#include <asm/mmu.h>
38#include <asm/iommu.h>
39#include <asm/btext.h>
40#include <asm/sections.h>
41#include <asm/machdep.h>
42#include <asm/asm-prototypes.h>
43#include <asm/ultravisor-api.h>
44
45#include <linux/linux_logo.h>
46
/* All of prom_init bss lives here */
#define __prombss __section(.bss.prominit)

/*
 * Eventually bump that one up
 */
#define DEVTREE_CHUNK_SIZE	0x100000	/* 1 MiB */

/*
 * This is the size of the local memory reserve map that gets copied
 * into the boot params passed to the kernel. That size is totally
 * flexible as the kernel just reads the list until it encounters an
 * entry with size 0, so it can be changed without breaking binary
 * compatibility
 *
 * It is used as the number of entries of mem_reserve_map[].
 */
#define MEM_RESERVE_MAP_SIZE	8
63
64/*
65 * prom_init() is called very early on, before the kernel text
66 * and data have been mapped to KERNELBASE. At this point the code
67 * is running at whatever address it has been loaded at.
68 * On ppc32 we compile with -mrelocatable, which means that references
69 * to extern and static variables get relocated automatically.
70 * ppc64 objects are always relocatable, we just need to relocate the
71 * TOC.
72 *
73 * Because OF may have mapped I/O devices into the area starting at
74 * KERNELBASE, particularly on CHRP machines, we can't safely call
75 * OF once the kernel has been mapped to KERNELBASE. Therefore all
76 * OF calls must be done within prom_init().
77 *
78 * ADDR is used in calls to call_prom. The 4th and following
79 * arguments to call_prom should be 32-bit values.
80 * On ppc64, 64 bit values are truncated to 32 bits (and
81 * fortunately don't get interpreted as two arguments).
82 */
/* Whole expansion is parenthesized so it stays one operand in any expression. */
#define ADDR(x)		((u32)(unsigned long)(x))
84
/*
 * OF_WORKAROUNDS is a bitmask of OF_WA_* flags. It is the constant 0 on
 * ppc64 (so every workaround test folds away) and a prombss variable
 * otherwise.
 */
#ifdef CONFIG_PPC64
#define OF_WORKAROUNDS	0
#else
#define OF_WORKAROUNDS	of_workarounds
static int of_workarounds __prombss;
#endif

#define OF_WA_CLAIM	1	/* do phys/virt claim separately, then map */
#define OF_WA_LONGTRAIL	2	/* work around longtrail bugs */

/* Report file and line through prom_printf(), then trap. */
#define PROM_BUG() do {						\
	prom_printf("kernel BUG at %s line 0x%x!\n",		\
		    __FILE__, __LINE__);			\
	__builtin_trap();					\
} while (0)

/* prom_debug() is prom_printf() when DEBUG_PROM is defined, else a no-op. */
#ifdef DEBUG_PROM
#define prom_debug(x...)	prom_printf(x)
#else
#define prom_debug(x...)	do { } while (0)
#endif
106
107
/* Type call_prom()/call_prom_ret() fetch each variadic argument as. */
typedef u32 prom_arg_t;

/*
 * Argument block handed to enter_prom(). call_prom() fills every field in
 * big-endian form: the address of the service name, the number of input
 * and return cells, then the input cells immediately followed by the
 * return cells in args[].
 */
struct prom_args {
        __be32 service;
        __be32 nargs;
        __be32 nret;
        __be32 args[10];
};

/* Handles kept for the duration of prom_init (see the "prom" variable). */
struct prom_t {
	ihandle root;
	phandle chosen;
	int cpu;
	ihandle stdout;		/* output handle used by prom_print()/prom_printf() */
	ihandle mmumap;		/* target of the "claim"/"map" methods in prom_claim() */
	ihandle memory;		/* target of the "claim"/"release" methods in prom_claim() */
};

/* One entry of mem_reserve_map[]; both fields are stored big-endian. */
struct mem_map_entry {
	__be64	base;
	__be64	size;
};

/* Big-endian 32-bit cell (element type of regbuf[]). */
typedef __be32 cell_t;
132
extern void __start(unsigned long r3, unsigned long r4, unsigned long r5,
		    unsigned long r6, unsigned long r7, unsigned long r8,
		    unsigned long r9);

/*
 * enter_prom() transfers control to the firmware entry point with @args.
 * On ppc64 it is provided elsewhere; otherwise @entry is simply called as
 * a C function taking the argument block.
 */
#ifdef CONFIG_PPC64
extern int enter_prom(struct prom_args *args, unsigned long entry);
#else
static inline int enter_prom(struct prom_args *args, unsigned long entry)
{
	return ((int (*)(struct prom_args *))entry)(args);
}
#endif

extern void copy_and_flush(unsigned long dest, unsigned long src,
			   unsigned long size, unsigned long offset);
148
/* prom structure */
static struct prom_t __prombss prom;

/* Firmware entry point passed to enter_prom() by call_prom()/call_prom_ret() */
static unsigned long __prombss prom_entry;

static char __prombss of_stdout_device[256];
static char __prombss prom_scratch[256];

static unsigned long __prombss dt_header_start;
static unsigned long __prombss dt_struct_start, dt_struct_end;
static unsigned long __prombss dt_string_start, dt_string_end;

static unsigned long __prombss prom_initrd_start, prom_initrd_end;

#ifdef CONFIG_PPC64
/* Set by early_cmdline_parse() from "iommu=force" / "iommu=off" */
static int __prombss prom_iommu_force_on;
static int __prombss prom_iommu_off;
static unsigned long __prombss prom_tce_alloc_start;
static unsigned long __prombss prom_tce_alloc_end;
#endif

#ifdef CONFIG_PPC_PSERIES
/* Set by early_cmdline_parse() from the kernel command line */
static bool __prombss prom_radix_disable;
static bool __prombss prom_radix_gtse_disable;
static bool __prombss prom_xive_disable;
#endif

#ifdef CONFIG_PPC_SVM
/* Set by early_cmdline_parse() from "svm=" */
static bool __prombss prom_svm_enable;
#endif

/* Result of parsing the platform-support property (see prom_parse_*_model()) */
struct platform_support {
	bool hash_mmu;
	bool radix_mmu;
	bool radix_gtse;
	bool xive;
};

/* Platform codes are now obsolete in the kernel. Now only used within this
 * file and ultimately gone too. Feel free to change them if you need, they
 * are not shared with anything outside of this file anymore
 */
#define PLATFORM_PSERIES	0x0100
#define PLATFORM_PSERIES_LPAR	0x0101
#define PLATFORM_LPAR		0x0001
#define PLATFORM_POWERMAC	0x0400
#define PLATFORM_GENERIC	0x0500

/* One of the PLATFORM_* codes above; prom_panic() tests it for PLATFORM_POWERMAC */
static int __prombss of_platform;

/* Kernel command line as assembled by early_cmdline_parse() */
static char __prombss prom_cmd_line[COMMAND_LINE_SIZE];

/* Value of "mem=" as parsed by early_cmdline_parse() */
static unsigned long __prombss prom_memory_limit;

static unsigned long __prombss alloc_top;
static unsigned long __prombss alloc_top_high;
static unsigned long __prombss alloc_bottom;
static unsigned long __prombss rmo_top;
static unsigned long __prombss ram_top;

static struct mem_map_entry __prombss mem_reserve_map[MEM_RESERVE_MAP_SIZE];
static int __prombss mem_reserve_cnt;

static cell_t __prombss regbuf[1024];

static bool __prombss rtas_has_query_cpu_stopped;
215
216
/*
 * Error results ... some OF calls will return "-1" on error, some
 * will return 0, some will return either. To simplify, here are
 * macros to use with any ihandle or phandle return value to check if
 * it is valid
 *
 * Note that both *_VALID() macros evaluate their argument twice.
 */

#define PROM_ERROR		(-1u)
#define PHANDLE_VALID(p)	((p) != 0 && (p) != PROM_ERROR)
#define IHANDLE_VALID(i)	((i) != 0 && (i) != PROM_ERROR)
227
228/* Copied from lib/string.c and lib/kstrtox.c */
229
/*
 * Compare two NUL-terminated strings, treating each byte as unsigned.
 * Returns 0 if they are equal, -1 if @cs orders before @ct and 1 otherwise.
 */
static int __init prom_strcmp(const char *cs, const char *ct)
{
	const unsigned char *a = (const unsigned char *)cs;
	const unsigned char *b = (const unsigned char *)ct;

	for (;; a++, b++) {
		if (*a != *b)
			return (*a < *b) ? -1 : 1;
		/* both bytes are equal here, so one NUL means both ended */
		if (*a == '\0')
			return 0;
	}
}
244
/*
 * Copy the NUL-terminated string @src, terminator included, to @dest.
 * No bound is applied; the caller must provide enough room.
 * Returns @dest.
 */
static char __init *prom_strcpy(char *dest, const char *src)
{
	char *out = dest;

	for (;;) {
		char c = *src++;

		*out++ = c;
		if (c == '\0')
			break;
	}
	return dest;
}
253
/*
 * Compare at most @count bytes of two strings, stopping early at a NUL.
 * Bytes are compared as unsigned values.
 * Returns 0 if no difference was found, -1 or 1 otherwise.
 */
static int __init prom_strncmp(const char *cs, const char *ct, size_t count)
{
	size_t i;

	for (i = 0; i < count; i++) {
		unsigned char a = cs[i];
		unsigned char b = ct[i];

		if (a != b)
			return (a < b) ? -1 : 1;
		if (a == '\0')
			break;
	}
	return 0;
}
269
/* Return the number of bytes in @s before its terminating NUL. */
static size_t __init prom_strlen(const char *s)
{
	size_t len = 0;

	while (s[len] != '\0')
		len++;
	return len;
}
278
/*
 * Compare @count bytes of two memory areas.
 * Returns 0 if they match, otherwise the difference between the first
 * pair of differing bytes (taken as unsigned chars, @cs minus @ct).
 */
static int __init prom_memcmp(const void *cs, const void *ct, size_t count)
{
	const unsigned char *a = cs;
	const unsigned char *b = ct;
	size_t i;

	for (i = 0; i < count; i++) {
		int diff = a[i] - b[i];

		if (diff != 0)
			return diff;
	}
	return 0;
}
289
290static char __init *prom_strstr(const char *s1, const char *s2)
291{
292 size_t l1, l2;
293
294 l2 = prom_strlen(s2);
295 if (!l2)
296 return (char *)s1;
297 l1 = prom_strlen(s1);
298 while (l1 >= l2) {
299 l1--;
300 if (!prom_memcmp(s1, s2, l2))
301 return (char *)s1;
302 s1++;
303 }
304 return NULL;
305}
306
307static size_t __init prom_strlcat(char *dest, const char *src, size_t count)
308{
309 size_t dsize = prom_strlen(dest);
310 size_t len = prom_strlen(src);
311 size_t res = dsize + len;
312
313 /* This would be a bug */
314 if (dsize >= count)
315 return count;
316
317 dest += dsize;
318 count -= dsize;
319 if (len >= count)
320 len = count-1;
321 memcpy(dest, src, len);
322 dest[len] = 0;
323 return res;
324
325}
326
327#ifdef CONFIG_PPC_PSERIES
/*
 * Parse a boolean from the start of @s.
 *
 * A leading 'y', 'Y' or '1' means true and 'n', 'N' or '0' means false.
 * A leading 'o'/'O' is decided by the second character: 'n'/'N' is true
 * ("on"), 'f'/'F' is false ("off"). Only those one or two characters are
 * looked at.
 *
 * Returns 0 and stores the value in @res on success. Returns -EINVAL,
 * leaving @res untouched, when @s is NULL or not recognised.
 */
static int __init prom_strtobool(const char *s, bool *res)
{
	char first;

	if (!s)
		return -EINVAL;

	first = s[0];
	if (first == 'y' || first == 'Y' || first == '1') {
		*res = true;
		return 0;
	}
	if (first == 'n' || first == 'N' || first == '0') {
		*res = false;
		return 0;
	}
	if (first == 'o' || first == 'O') {
		char second = s[1];

		if (second == 'n' || second == 'N') {
			*res = true;
			return 0;
		}
		if (second == 'f' || second == 'F') {
			*res = false;
			return 0;
		}
	}

	return -EINVAL;
}
364#endif
365
366/* This is the one and *ONLY* place where we actually call open
367 * firmware.
368 */
369
370static int __init call_prom(const char *service, int nargs, int nret, ...)
371{
372 int i;
373 struct prom_args args;
374 va_list list;
375
376 args.service = cpu_to_be32(ADDR(service));
377 args.nargs = cpu_to_be32(nargs);
378 args.nret = cpu_to_be32(nret);
379
380 va_start(list, nret);
381 for (i = 0; i < nargs; i++)
382 args.args[i] = cpu_to_be32(va_arg(list, prom_arg_t));
383 va_end(list);
384
385 for (i = 0; i < nret; i++)
386 args.args[nargs+i] = 0;
387
388 if (enter_prom(&args, prom_entry) < 0)
389 return PROM_ERROR;
390
391 return (nret > 0) ? be32_to_cpu(args.args[nargs]) : 0;
392}
393
394static int __init call_prom_ret(const char *service, int nargs, int nret,
395 prom_arg_t *rets, ...)
396{
397 int i;
398 struct prom_args args;
399 va_list list;
400
401 args.service = cpu_to_be32(ADDR(service));
402 args.nargs = cpu_to_be32(nargs);
403 args.nret = cpu_to_be32(nret);
404
405 va_start(list, rets);
406 for (i = 0; i < nargs; i++)
407 args.args[i] = cpu_to_be32(va_arg(list, prom_arg_t));
408 va_end(list);
409
410 for (i = 0; i < nret; i++)
411 args.args[nargs+i] = 0;
412
413 if (enter_prom(&args, prom_entry) < 0)
414 return PROM_ERROR;
415
416 if (rets != NULL)
417 for (i = 1; i < nret; ++i)
418 rets[i-1] = be32_to_cpu(args.args[nargs+i]);
419
420 return (nret > 0) ? be32_to_cpu(args.args[nargs]) : 0;
421}
422
423
424static void __init prom_print(const char *msg)
425{
426 const char *p, *q;
427
428 if (prom.stdout == 0)
429 return;
430
431 for (p = msg; *p != 0; p = q) {
432 for (q = p; *q != 0 && *q != '\n'; ++q)
433 ;
434 if (q > p)
435 call_prom("write", 3, 1, prom.stdout, p, q - p);
436 if (*q == 0)
437 break;
438 ++q;
439 call_prom("write", 3, 1, prom.stdout, ADDR("\r\n"), 2);
440 }
441}
442
443
/*
 * Both prom_print_hex & prom_print_dec take an unsigned long as input so that
 * we do not need __udivdi3 or __umoddi3 on 32-bit.
 */
448static void __init prom_print_hex(unsigned long val)
449{
450 int i, nibbles = sizeof(val)*2;
451 char buf[sizeof(val)*2+1];
452
453 for (i = nibbles-1; i >= 0; i--) {
454 buf[i] = (val & 0xf) + '0';
455 if (buf[i] > '9')
456 buf[i] += ('a'-'0'-10);
457 val >>= 4;
458 }
459 buf[nibbles] = '\0';
460 call_prom("write", 3, 1, prom.stdout, buf, nibbles);
461}
462
463/* max number of decimal digits in an unsigned long */
464#define UL_DIGITS 21
465static void __init prom_print_dec(unsigned long val)
466{
467 int i, size;
468 char buf[UL_DIGITS+1];
469
470 for (i = UL_DIGITS-1; i >= 0; i--) {
471 buf[i] = (val % 10) + '0';
472 val = val/10;
473 if (val == 0)
474 break;
475 }
476 /* shift stuff down */
477 size = UL_DIGITS - i;
478 call_prom("write", 3, 1, prom.stdout, buf+i, size);
479}
480
481__printf(1, 2)
482static void __init prom_printf(const char *format, ...)
483{
484 const char *p, *q, *s;
485 va_list args;
486 unsigned long v;
487 long vs;
488 int n = 0;
489
490 va_start(args, format);
491 for (p = format; *p != 0; p = q) {
492 for (q = p; *q != 0 && *q != '\n' && *q != '%'; ++q)
493 ;
494 if (q > p)
495 call_prom("write", 3, 1, prom.stdout, p, q - p);
496 if (*q == 0)
497 break;
498 if (*q == '\n') {
499 ++q;
500 call_prom("write", 3, 1, prom.stdout,
501 ADDR("\r\n"), 2);
502 continue;
503 }
504 ++q;
505 if (*q == 0)
506 break;
507 while (*q == 'l') {
508 ++q;
509 ++n;
510 }
511 switch (*q) {
512 case 's':
513 ++q;
514 s = va_arg(args, const char *);
515 prom_print(s);
516 break;
517 case 'x':
518 ++q;
519 switch (n) {
520 case 0:
521 v = va_arg(args, unsigned int);
522 break;
523 case 1:
524 v = va_arg(args, unsigned long);
525 break;
526 case 2:
527 default:
528 v = va_arg(args, unsigned long long);
529 break;
530 }
531 prom_print_hex(v);
532 break;
533 case 'u':
534 ++q;
535 switch (n) {
536 case 0:
537 v = va_arg(args, unsigned int);
538 break;
539 case 1:
540 v = va_arg(args, unsigned long);
541 break;
542 case 2:
543 default:
544 v = va_arg(args, unsigned long long);
545 break;
546 }
547 prom_print_dec(v);
548 break;
549 case 'd':
550 ++q;
551 switch (n) {
552 case 0:
553 vs = va_arg(args, int);
554 break;
555 case 1:
556 vs = va_arg(args, long);
557 break;
558 case 2:
559 default:
560 vs = va_arg(args, long long);
561 break;
562 }
563 if (vs < 0) {
564 prom_print("-");
565 vs = -vs;
566 }
567 prom_print_dec(vs);
568 break;
569 }
570 }
571 va_end(args);
572}
573
574
575static unsigned int __init prom_claim(unsigned long virt, unsigned long size,
576 unsigned long align)
577{
578
579 if (align == 0 && (OF_WORKAROUNDS & OF_WA_CLAIM)) {
580 /*
581 * Old OF requires we claim physical and virtual separately
582 * and then map explicitly (assuming virtual mode)
583 */
584 int ret;
585 prom_arg_t result;
586
587 ret = call_prom_ret("call-method", 5, 2, &result,
588 ADDR("claim"), prom.memory,
589 align, size, virt);
590 if (ret != 0 || result == -1)
591 return -1;
592 ret = call_prom_ret("call-method", 5, 2, &result,
593 ADDR("claim"), prom.mmumap,
594 align, size, virt);
595 if (ret != 0) {
596 call_prom("call-method", 4, 1, ADDR("release"),
597 prom.memory, size, virt);
598 return -1;
599 }
600 /* the 0x12 is M (coherence) + PP == read/write */
601 call_prom("call-method", 6, 1,
602 ADDR("map"), prom.mmumap, 0x12, size, virt, virt);
603 return virt;
604 }
605 return call_prom("claim", 3, 1, (prom_arg_t)virt, (prom_arg_t)size,
606 (prom_arg_t)align);
607}
608
609static void __init __attribute__((noreturn)) prom_panic(const char *reason)
610{
611 prom_print(reason);
612 /* Do not call exit because it clears the screen on pmac
613 * it also causes some sort of double-fault on early pmacs */
614 if (of_platform == PLATFORM_POWERMAC)
615 asm("trap\n");
616
617 /* ToDo: should put up an SRC here on pSeries */
618 call_prom("exit", 0, 0);
619
620 for (;;) /* should never get here */
621 ;
622}
623
624
625static int __init prom_next_node(phandle *nodep)
626{
627 phandle node;
628
629 if ((node = *nodep) != 0
630 && (*nodep = call_prom("child", 1, 1, node)) != 0)
631 return 1;
632 if ((*nodep = call_prom("peer", 1, 1, node)) != 0)
633 return 1;
634 for (;;) {
635 if ((node = call_prom("parent", 1, 1, node)) == 0)
636 return 0;
637 if ((*nodep = call_prom("peer", 1, 1, node)) != 0)
638 return 1;
639 }
640}
641
642static inline int __init prom_getprop(phandle node, const char *pname,
643 void *value, size_t valuelen)
644{
645 return call_prom("getprop", 4, 1, node, ADDR(pname),
646 (u32)(unsigned long) value, (u32) valuelen);
647}
648
649static inline int __init prom_getproplen(phandle node, const char *pname)
650{
651 return call_prom("getproplen", 2, 1, node, ADDR(pname));
652}
653
/*
 * Append the string @q followed by one space at *@str and advance *@str
 * past what was written. No terminating NUL is stored and no bound is
 * checked; the caller owns the buffer size.
 *
 * Marked __init like the rest of this file's helpers: the only caller in
 * view, prom_setprop(), is __init itself.
 */
static void __init add_string(char **str, const char *q)
{
	char *p = *str;

	while (*q)
		*p++ = *q++;
	*p++ = ' ';
	*str = p;
}
663
/*
 * Format @x as lowercase hexadecimal without leading zeros (at least one
 * digit) and return a pointer to the NUL-terminated text.
 *
 * The text lives in a static buffer that the next call overwrites, so it
 * must be consumed before tohex() is called again.
 *
 * The function has to be __init because it reads the __initconst digit
 * table; referencing init data from regular text is a section mismatch.
 */
static char __init *tohex(unsigned int x)
{
	static const char digits[] __initconst = "0123456789abcdef";
	static char result[9] __prombss;
	int i;

	result[8] = 0;
	i = 8;
	/* fill from the right; the do/while guarantees one digit for x == 0 */
	do {
		--i;
		result[i] = digits[x & 0xf];
		x >>= 4;
	} while (x != 0 && i > 0);
	return &result[i];
}
679
680static int __init prom_setprop(phandle node, const char *nodename,
681 const char *pname, void *value, size_t valuelen)
682{
683 char cmd[256], *p;
684
685 if (!(OF_WORKAROUNDS & OF_WA_LONGTRAIL))
686 return call_prom("setprop", 4, 1, node, ADDR(pname),
687 (u32)(unsigned long) value, (u32) valuelen);
688
689 /* gah... setprop doesn't work on longtrail, have to use interpret */
690 p = cmd;
691 add_string(&p, "dev");
692 add_string(&p, nodename);
693 add_string(&p, tohex((u32)(unsigned long) value));
694 add_string(&p, tohex(valuelen));
695 add_string(&p, tohex(ADDR(pname)));
696 add_string(&p, tohex(prom_strlen(pname)));
697 add_string(&p, "property");
698 *p = 0;
699 return call_prom("interpret", 1, 1, (u32)(unsigned long) cmd);
700}
701
/*
 * We can't use the standard versions because of relocation headaches.
 *
 * These are plain ASCII range checks. Being macros, they evaluate their
 * argument more than once, so never pass an expression with side effects.
 */
#define isxdigit(c)	(('0' <= (c) && (c) <= '9') \
			 || ('a' <= (c) && (c) <= 'f') \
			 || ('A' <= (c) && (c) <= 'F'))

#define isdigit(c)	('0' <= (c) && (c) <= '9')
#define islower(c)	('a' <= (c) && (c) <= 'z')
#define toupper(c)	(islower(c) ? ((c) - 'a' + 'A') : (c))
710
/*
 * Convert the number at the start of @cp to an unsigned long.
 *
 * The base is taken from the prefix: "0x"/"0X" selects 16, a leading "0"
 * selects 8, anything else 10. Parsing stops at the first character that
 * is not a digit of that base. Overflow is not detected and there is no
 * sign handling.
 *
 * @endp: if not NULL, receives a pointer to the first unparsed character
 *
 * Returns the parsed value, or 0 if there were no digits.
 *
 * Marked __init like the rest of this file's helpers: the call chain in
 * view (prom_memparse() from early_cmdline_parse()) runs at init time only.
 */
static unsigned long __init prom_strtoul(const char *cp, const char **endp)
{
	unsigned long result = 0, base = 10, value;

	if (*cp == '0') {
		base = 8;
		cp++;
		if (toupper(*cp) == 'X') {
			cp++;
			base = 16;
		}
	}

	/* stop at the first character that is not a digit of the chosen base */
	while (isxdigit(*cp) &&
	       (value = isdigit(*cp) ? *cp - '0' : toupper(*cp) - 'A' + 10) < base) {
		result = result * base + value;
		cp++;
	}

	if (endp)
		*endp = cp;

	return result;
}
735
736static unsigned long prom_memparse(const char *ptr, const char **retptr)
737{
738 unsigned long ret = prom_strtoul(ptr, retptr);
739 int shift = 0;
740
741 /*
742 * We can't use a switch here because GCC *may* generate a
743 * jump table which won't work, because we're not running at
744 * the address we're linked at.
745 */
746 if ('G' == **retptr || 'g' == **retptr)
747 shift = 30;
748
749 if ('M' == **retptr || 'm' == **retptr)
750 shift = 20;
751
752 if ('K' == **retptr || 'k' == **retptr)
753 shift = 10;
754
755 if (shift) {
756 ret <<= shift;
757 (*retptr)++;
758 }
759
760 return ret;
761}
762
763/*
764 * Early parsing of the command line passed to the kernel, used for
765 * "mem=x" and the options that affect the iommu
766 */
767static void __init early_cmdline_parse(void)
768{
769 const char *opt;
770
771 char *p;
772 int l = 0;
773
774 prom_cmd_line[0] = 0;
775 p = prom_cmd_line;
776
777 if (!IS_ENABLED(CONFIG_CMDLINE_FORCE) && (long)prom.chosen > 0)
778 l = prom_getprop(prom.chosen, "bootargs", p, COMMAND_LINE_SIZE-1);
779
780 if (IS_ENABLED(CONFIG_CMDLINE_EXTEND) || l <= 0 || p[0] == '\0')
781 prom_strlcat(prom_cmd_line, " " CONFIG_CMDLINE,
782 sizeof(prom_cmd_line));
783
784 prom_printf("command line: %s\n", prom_cmd_line);
785
786#ifdef CONFIG_PPC64
787 opt = prom_strstr(prom_cmd_line, "iommu=");
788 if (opt) {
789 prom_printf("iommu opt is: %s\n", opt);
790 opt += 6;
791 while (*opt && *opt == ' ')
792 opt++;
793 if (!prom_strncmp(opt, "off", 3))
794 prom_iommu_off = 1;
795 else if (!prom_strncmp(opt, "force", 5))
796 prom_iommu_force_on = 1;
797 }
798#endif
799 opt = prom_strstr(prom_cmd_line, "mem=");
800 if (opt) {
801 opt += 4;
802 prom_memory_limit = prom_memparse(opt, (const char **)&opt);
803#ifdef CONFIG_PPC64
804 /* Align to 16 MB == size of ppc64 large page */
805 prom_memory_limit = ALIGN(prom_memory_limit, 0x1000000);
806#endif
807 }
808
809#ifdef CONFIG_PPC_PSERIES
810 prom_radix_disable = !IS_ENABLED(CONFIG_PPC_RADIX_MMU_DEFAULT);
811 opt = prom_strstr(prom_cmd_line, "disable_radix");
812 if (opt) {
813 opt += 13;
814 if (*opt && *opt == '=') {
815 bool val;
816
817 if (prom_strtobool(++opt, &val))
818 prom_radix_disable = false;
819 else
820 prom_radix_disable = val;
821 } else
822 prom_radix_disable = true;
823 }
824 if (prom_radix_disable)
825 prom_debug("Radix disabled from cmdline\n");
826
827 opt = prom_strstr(prom_cmd_line, "radix_hcall_invalidate=on");
828 if (opt) {
829 prom_radix_gtse_disable = true;
830 prom_debug("Radix GTSE disabled from cmdline\n");
831 }
832
833 opt = prom_strstr(prom_cmd_line, "xive=off");
834 if (opt) {
835 prom_xive_disable = true;
836 prom_debug("XIVE disabled from cmdline\n");
837 }
838#endif /* CONFIG_PPC_PSERIES */
839
840#ifdef CONFIG_PPC_SVM
841 opt = prom_strstr(prom_cmd_line, "svm=");
842 if (opt) {
843 bool val;
844
845 opt += sizeof("svm=") - 1;
846 if (!prom_strtobool(opt, &val))
847 prom_svm_enable = val;
848 }
849#endif /* CONFIG_PPC_SVM */
850}
851
852#ifdef CONFIG_PPC_PSERIES
853/*
854 * The architecture vector has an array of PVR mask/value pairs,
855 * followed by # option vectors - 1, followed by the option vectors.
856 *
857 * See prom.h for the definition of the bits specified in the
858 * architecture vector.
859 */
860
/* Firmware expects the value to be n - 1, where n is the # of vectors */
#define NUM_VECTORS(n)		((n) - 1)

/*
 * Firmware expects 1 + n - 2, where n is the length of the option vector in
 * bytes. The 1 accounts for the length byte itself, the - 2 .. ?
 */
#define VECTOR_LENGTH(n)	(1 + (n) - 2)

/*
 * Layouts of the individual option vectors. All of them are __packed, and
 * multi-byte fields are big-endian.
 */
struct option_vector1 {
	u8 byte1;
	u8 arch_versions;
	u8 arch_versions3;
} __packed;

struct option_vector2 {
	u8 byte1;
	__be16 reserved;
	__be32 real_base;
	__be32 real_size;
	__be32 virt_base;
	__be32 virt_size;
	__be32 load_base;
	__be32 min_rma;
	__be32 min_load;
	u8 min_rma_percent;
	u8 max_pft_size;
} __packed;

struct option_vector3 {
	u8 byte1;
	u8 byte2;
} __packed;

struct option_vector4 {
	u8 byte1;
	u8 min_vp_cap;
} __packed;

struct option_vector5 {
	u8 byte1;
	u8 byte2;
	u8 byte3;
	u8 cmo;
	u8 associativity;
	u8 bin_opts;
	u8 micro_checkpoint;
	u8 reserved0;
	__be32 max_cpus;
	__be16 papr_level;
	__be16 reserved1;
	u8 platform_facilities;
	u8 reserved2;
	__be16 reserved3;
	u8 subprocessors;
	u8 byte22;
	u8 intarch;
	u8 mmu;
	u8 hash_ext;
	u8 radix_ext;
} __packed;

struct option_vector6 {
	u8 reserved;
	u8 secondary_pteg;
	u8 os_name;
} __packed;

/*
 * The complete architecture vector: the PVR mask/value pairs, the vector
 * count, then each option vector preceded by its one-byte length field.
 *
 * NOTE(review): the pvrs members are declared u32 although the template
 * initializes them with cpu_to_be32() values.
 */
struct ibm_arch_vec {
	struct { u32 mask, val; } pvrs[14];

	u8 num_vectors;

	u8 vec1_len;
	struct option_vector1 vec1;

	u8 vec2_len;
	struct option_vector2 vec2;

	u8 vec3_len;
	struct option_vector3 vec3;

	u8 vec4_len;
	struct option_vector4 vec4;

	u8 vec5_len;
	struct option_vector5 vec5;

	u8 vec6_len;
	struct option_vector6 vec6;
} __packed;
952
/*
 * Read-only template of the architecture vector.
 * prom_check_platform_support() copies it into ibm_architecture_vec with
 * memcpy() before use.
 */
static const struct ibm_arch_vec ibm_architecture_vec_template __initconst = {
	.pvrs = {
		{
			.mask = cpu_to_be32(0xfffe0000), /* POWER5/POWER5+ */
			.val  = cpu_to_be32(0x003a0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER6 */
			.val  = cpu_to_be32(0x003e0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER7 */
			.val  = cpu_to_be32(0x003f0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER8E */
			.val  = cpu_to_be32(0x004b0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER8NVL */
			.val  = cpu_to_be32(0x004c0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER8 */
			.val  = cpu_to_be32(0x004d0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER9 */
			.val  = cpu_to_be32(0x004e0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER10 */
			.val  = cpu_to_be32(0x00800000),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 3.1-compliant */
			.val  = cpu_to_be32(0x0f000006),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 3.00-compliant */
			.val  = cpu_to_be32(0x0f000005),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 2.07-compliant */
			.val  = cpu_to_be32(0x0f000004),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 2.06-compliant */
			.val  = cpu_to_be32(0x0f000003),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 2.05-compliant */
			.val  = cpu_to_be32(0x0f000002),
		},
		{
			.mask = cpu_to_be32(0xfffffffe), /* all 2.04-compliant and earlier */
			.val  = cpu_to_be32(0x0f000001),
		},
	},

	.num_vectors = NUM_VECTORS(6),

	.vec1_len = VECTOR_LENGTH(sizeof(struct option_vector1)),
	.vec1 = {
		.byte1 = 0,
		.arch_versions = OV1_PPC_2_00 | OV1_PPC_2_01 | OV1_PPC_2_02 | OV1_PPC_2_03 |
				 OV1_PPC_2_04 | OV1_PPC_2_05 | OV1_PPC_2_06 | OV1_PPC_2_07,
		.arch_versions3 = OV1_PPC_3_00 | OV1_PPC_3_1,
	},

	.vec2_len = VECTOR_LENGTH(sizeof(struct option_vector2)),
	/* option vector 2: Open Firmware options supported */
	.vec2 = {
		.byte1 = OV2_REAL_MODE,
		.reserved = 0,
		.real_base = cpu_to_be32(0xffffffff),
		.real_size = cpu_to_be32(0xffffffff),
		.virt_base = cpu_to_be32(0xffffffff),
		.virt_size = cpu_to_be32(0xffffffff),
		.load_base = cpu_to_be32(0xffffffff),
		.min_rma = cpu_to_be32(512),		/* 512MB min RMA */
		.min_load = cpu_to_be32(0xffffffff),	/* full client load */
		.min_rma_percent = 0,	/* min RMA percentage of total RAM */
		.max_pft_size = 48,	/* max log_2(hash table size) */
	},

	.vec3_len = VECTOR_LENGTH(sizeof(struct option_vector3)),
	/* option vector 3: processor options supported */
	.vec3 = {
		.byte1 = 0,			/* don't ignore, don't halt */
		.byte2 = OV3_FP | OV3_VMX | OV3_DFP,
	},

	.vec4_len = VECTOR_LENGTH(sizeof(struct option_vector4)),
	/* option vector 4: IBM PAPR implementation */
	.vec4 = {
		.byte1 = 0,			/* don't halt */
		.min_vp_cap = OV4_MIN_ENT_CAP,	/* minimum VP entitled capacity */
	},

	.vec5_len = VECTOR_LENGTH(sizeof(struct option_vector5)),
	/* option vector 5: PAPR/OF options */
	.vec5 = {
		.byte1 = 0,				/* don't ignore, don't halt */
		.byte2 = OV5_FEAT(OV5_LPAR) | OV5_FEAT(OV5_SPLPAR) | OV5_FEAT(OV5_LARGE_PAGES) |
		OV5_FEAT(OV5_DRCONF_MEMORY) | OV5_FEAT(OV5_DONATE_DEDICATE_CPU) |
#ifdef CONFIG_PCI_MSI
		/* PCIe/MSI support.  Without MSI full PCIe is not supported */
		OV5_FEAT(OV5_MSI),
#else
		0,
#endif
		.byte3 = 0,
		.cmo =
#ifdef CONFIG_PPC_SMLPAR
		OV5_FEAT(OV5_CMO) | OV5_FEAT(OV5_XCMO),
#else
		0,
#endif
		.associativity = OV5_FEAT(OV5_TYPE1_AFFINITY) | OV5_FEAT(OV5_PRRN),
		.bin_opts = OV5_FEAT(OV5_RESIZE_HPT) | OV5_FEAT(OV5_HP_EVT),
		.micro_checkpoint = 0,
		.reserved0 = 0,
		.max_cpus = cpu_to_be32(NR_CPUS),	/* number of cores supported */
		.papr_level = 0,
		.reserved1 = 0,
		.platform_facilities = OV5_FEAT(OV5_PFO_HW_RNG) | OV5_FEAT(OV5_PFO_HW_ENCR) | OV5_FEAT(OV5_PFO_HW_842),
		.reserved2 = 0,
		.reserved3 = 0,
		.subprocessors = 1,
		.byte22 = OV5_FEAT(OV5_DRMEM_V2) | OV5_FEAT(OV5_DRC_INFO),
		.intarch = 0,
		.mmu = 0,
		.hash_ext = 0,
		.radix_ext = 0,
	},

	/* option vector 6: IBM PAPR hints */
	.vec6_len = VECTOR_LENGTH(sizeof(struct option_vector6)),
	.vec6 = {
		.reserved = 0,
		.secondary_pteg = 0,
		.os_name = OV6_LINUX,
	},
};

/* Writable working copy of the template above */
static struct ibm_arch_vec __prombss ibm_architecture_vec  ____cacheline_aligned;
1100
/*
 * Old method - ELF header with PT_NOTE sections only works on BE
 *
 * The image is a 32-bit big-endian ELF header followed by two PT_NOTE
 * program headers, which point (by offset and size) at the "PowerPC" and
 * "IBM,RPA-Client-Config" notes stored right behind them.
 */
#ifdef __BIG_ENDIAN__
static const struct fake_elf {
	Elf32_Ehdr	elfhdr;
	Elf32_Phdr	phdr[2];
	struct chrpnote {
		u32	namesz;
		u32	descsz;
		u32	type;
		char	name[8];	/* "PowerPC" */
		struct chrpdesc {
			u32	real_mode;
			u32	real_base;
			u32	real_size;
			u32	virt_base;
			u32	virt_size;
			u32	load_base;
		} chrpdesc;
	} chrpnote;
	struct rpanote {
		u32	namesz;
		u32	descsz;
		u32	type;
		char	name[24];	/* "IBM,RPA-Client-Config" */
		struct rpadesc {
			u32	lpar_affinity;
			u32	min_rmo_size;
			u32	min_rmo_percent;
			u32	max_pft_size;
			u32	splpar;
			u32	min_load;
			u32	new_mem_def;
			u32	ignore_me;
		} rpadesc;
	} rpanote;
} fake_elf __initconst = {
	.elfhdr = {
		.e_ident = { 0x7f, 'E', 'L', 'F',
			     ELFCLASS32, ELFDATA2MSB, EV_CURRENT },
		.e_type = ET_EXEC,	/* yeah right */
		.e_machine = EM_PPC,
		.e_version = EV_CURRENT,
		.e_phoff = offsetof(struct fake_elf, phdr),
		.e_phentsize = sizeof(Elf32_Phdr),
		.e_phnum = 2
	},
	.phdr = {
		[0] = {
			.p_type = PT_NOTE,
			.p_offset = offsetof(struct fake_elf, chrpnote),
			.p_filesz = sizeof(struct chrpnote)
		}, [1] = {
			.p_type = PT_NOTE,
			.p_offset = offsetof(struct fake_elf, rpanote),
			.p_filesz = sizeof(struct rpanote)
		}
	},
	.chrpnote = {
		.namesz = sizeof("PowerPC"),
		.descsz = sizeof(struct chrpdesc),
		.type = 0x1275,
		.name = "PowerPC",
		.chrpdesc = {
			.real_mode = ~0U,	/* ~0 means "don't care" */
			.real_base = ~0U,
			.real_size = ~0U,
			.virt_base = ~0U,
			.virt_size = ~0U,
			.load_base = ~0U
		},
	},
	.rpanote = {
		.namesz = sizeof("IBM,RPA-Client-Config"),
		.descsz = sizeof(struct rpadesc),
		.type = 0x12759999,
		.name = "IBM,RPA-Client-Config",
		.rpadesc = {
			.lpar_affinity = 0,
			.min_rmo_size = 64,	/* in megabytes */
			.min_rmo_percent = 0,
			.max_pft_size = 48,	/* 2^48 bytes max PFT size */
			.splpar = 1,
			.min_load = ~0U,
			.new_mem_def = 0
		}
	}
};
#endif /* __BIG_ENDIAN__ */
1189
1190static int __init prom_count_smt_threads(void)
1191{
1192 phandle node;
1193 char type[64];
1194 unsigned int plen;
1195
1196 /* Pick up th first CPU node we can find */
1197 for (node = 0; prom_next_node(&node); ) {
1198 type[0] = 0;
1199 prom_getprop(node, "device_type", type, sizeof(type));
1200
1201 if (prom_strcmp(type, "cpu"))
1202 continue;
1203 /*
1204 * There is an entry for each smt thread, each entry being
1205 * 4 bytes long. All cpus should have the same number of
1206 * smt threads, so return after finding the first.
1207 */
1208 plen = prom_getproplen(node, "ibm,ppc-interrupt-server#s");
1209 if (plen == PROM_ERROR)
1210 break;
1211 plen >>= 2;
1212 prom_debug("Found %lu smt threads per core\n", (unsigned long)plen);
1213
1214 /* Sanity check */
1215 if (plen < 1 || plen > 64) {
1216 prom_printf("Threads per core %lu out of bounds, assuming 1\n",
1217 (unsigned long)plen);
1218 return 1;
1219 }
1220 return plen;
1221 }
1222 prom_debug("No threads found, assuming 1 per core\n");
1223
1224 return 1;
1225
1226}
1227
1228static void __init prom_parse_mmu_model(u8 val,
1229 struct platform_support *support)
1230{
1231 switch (val) {
1232 case OV5_FEAT(OV5_MMU_DYNAMIC):
1233 case OV5_FEAT(OV5_MMU_EITHER): /* Either Available */
1234 prom_debug("MMU - either supported\n");
1235 support->radix_mmu = !prom_radix_disable;
1236 support->hash_mmu = true;
1237 break;
1238 case OV5_FEAT(OV5_MMU_RADIX): /* Only Radix */
1239 prom_debug("MMU - radix only\n");
1240 if (prom_radix_disable) {
1241 /*
1242 * If we __have__ to do radix, we're better off ignoring
1243 * the command line rather than not booting.
1244 */
1245 prom_printf("WARNING: Ignoring cmdline option disable_radix\n");
1246 }
1247 support->radix_mmu = true;
1248 break;
1249 case OV5_FEAT(OV5_MMU_HASH):
1250 prom_debug("MMU - hash only\n");
1251 support->hash_mmu = true;
1252 break;
1253 default:
1254 prom_debug("Unknown mmu support option: 0x%x\n", val);
1255 break;
1256 }
1257}
1258
1259static void __init prom_parse_xive_model(u8 val,
1260 struct platform_support *support)
1261{
1262 switch (val) {
1263 case OV5_FEAT(OV5_XIVE_EITHER): /* Either Available */
1264 prom_debug("XIVE - either mode supported\n");
1265 support->xive = !prom_xive_disable;
1266 break;
1267 case OV5_FEAT(OV5_XIVE_EXPLOIT): /* Only Exploitation mode */
1268 prom_debug("XIVE - exploitation mode supported\n");
1269 if (prom_xive_disable) {
1270 /*
1271 * If we __have__ to do XIVE, we're better off ignoring
1272 * the command line rather than not booting.
1273 */
1274 prom_printf("WARNING: Ignoring cmdline option xive=off\n");
1275 }
1276 support->xive = true;
1277 break;
1278 case OV5_FEAT(OV5_XIVE_LEGACY): /* Only Legacy mode */
1279 prom_debug("XIVE - legacy mode supported\n");
1280 break;
1281 default:
1282 prom_debug("Unknown xive support option: 0x%x\n", val);
1283 break;
1284 }
1285}
1286
1287static void __init prom_parse_platform_support(u8 index, u8 val,
1288 struct platform_support *support)
1289{
1290 switch (index) {
1291 case OV5_INDX(OV5_MMU_SUPPORT): /* MMU Model */
1292 prom_parse_mmu_model(val & OV5_FEAT(OV5_MMU_SUPPORT), support);
1293 break;
1294 case OV5_INDX(OV5_RADIX_GTSE): /* Radix Extensions */
1295 if (val & OV5_FEAT(OV5_RADIX_GTSE))
1296 support->radix_gtse = !prom_radix_gtse_disable;
1297 break;
1298 case OV5_INDX(OV5_XIVE_SUPPORT): /* Interrupt mode */
1299 prom_parse_xive_model(val & OV5_FEAT(OV5_XIVE_SUPPORT),
1300 support);
1301 break;
1302 }
1303}
1304
1305static void __init prom_check_platform_support(void)
1306{
1307 struct platform_support supported = {
1308 .hash_mmu = false,
1309 .radix_mmu = false,
1310 .radix_gtse = false,
1311 .xive = false
1312 };
1313 int prop_len = prom_getproplen(prom.chosen,
1314 "ibm,arch-vec-5-platform-support");
1315
1316 /*
1317 * First copy the architecture vec template
1318 *
1319 * use memcpy() instead of *vec = *vec_template so that GCC replaces it
1320 * by __memcpy() when KASAN is active
1321 */
1322 memcpy(&ibm_architecture_vec, &ibm_architecture_vec_template,
1323 sizeof(ibm_architecture_vec));
1324
1325 if (prop_len > 1) {
1326 int i;
1327 u8 vec[8];
1328 prom_debug("Found ibm,arch-vec-5-platform-support, len: %d\n",
1329 prop_len);
1330 if (prop_len > sizeof(vec))
1331 prom_printf("WARNING: ibm,arch-vec-5-platform-support longer than expected (len: %d)\n",
1332 prop_len);
1333 prom_getprop(prom.chosen, "ibm,arch-vec-5-platform-support",
1334 &vec, sizeof(vec));
1335 for (i = 0; i < sizeof(vec); i += 2) {
1336 prom_debug("%d: index = 0x%x val = 0x%x\n", i / 2
1337 , vec[i]
1338 , vec[i + 1]);
1339 prom_parse_platform_support(vec[i], vec[i + 1],
1340 &supported);
1341 }
1342 }
1343
1344 if (supported.radix_mmu && IS_ENABLED(CONFIG_PPC_RADIX_MMU)) {
1345 /* Radix preferred - Check if GTSE is also supported */
1346 prom_debug("Asking for radix\n");
1347 ibm_architecture_vec.vec5.mmu = OV5_FEAT(OV5_MMU_RADIX);
1348 if (supported.radix_gtse)
1349 ibm_architecture_vec.vec5.radix_ext =
1350 OV5_FEAT(OV5_RADIX_GTSE);
1351 else
1352 prom_debug("Radix GTSE isn't supported\n");
1353 } else if (supported.hash_mmu) {
1354 /* Default to hash mmu (if we can) */
1355 prom_debug("Asking for hash\n");
1356 ibm_architecture_vec.vec5.mmu = OV5_FEAT(OV5_MMU_HASH);
1357 } else {
1358 /* We're probably on a legacy hypervisor */
1359 prom_debug("Assuming legacy hash support\n");
1360 }
1361
1362 if (supported.xive) {
1363 prom_debug("Asking for XIVE\n");
1364 ibm_architecture_vec.vec5.intarch = OV5_FEAT(OV5_XIVE_EXPLOIT);
1365 }
1366}
1367
1368static void __init prom_send_capabilities(void)
1369{
1370 ihandle root;
1371 prom_arg_t ret;
1372 u32 cores;
1373
1374 /* Check ibm,arch-vec-5-platform-support and fixup vec5 if required */
1375 prom_check_platform_support();
1376
1377 root = call_prom("open", 1, 1, ADDR("/"));
1378 if (root != 0) {
1379 /* We need to tell the FW about the number of cores we support.
1380 *
1381 * To do that, we count the number of threads on the first core
1382 * (we assume this is the same for all cores) and use it to
1383 * divide NR_CPUS.
1384 */
1385
1386 cores = DIV_ROUND_UP(NR_CPUS, prom_count_smt_threads());
1387 prom_printf("Max number of cores passed to firmware: %u (NR_CPUS = %d)\n",
1388 cores, NR_CPUS);
1389
1390 ibm_architecture_vec.vec5.max_cpus = cpu_to_be32(cores);
1391
1392 /* try calling the ibm,client-architecture-support method */
1393 prom_printf("Calling ibm,client-architecture-support...");
1394 if (call_prom_ret("call-method", 3, 2, &ret,
1395 ADDR("ibm,client-architecture-support"),
1396 root,
1397 ADDR(&ibm_architecture_vec)) == 0) {
1398 /* the call exists... */
1399 if (ret)
1400 prom_printf("\nWARNING: ibm,client-architecture"
1401 "-support call FAILED!\n");
1402 call_prom("close", 1, 0, root);
1403 prom_printf(" done\n");
1404 return;
1405 }
1406 call_prom("close", 1, 0, root);
1407 prom_printf(" not implemented\n");
1408 }
1409
1410#ifdef __BIG_ENDIAN__
1411 {
1412 ihandle elfloader;
1413
1414 /* no ibm,client-architecture-support call, try the old way */
1415 elfloader = call_prom("open", 1, 1,
1416 ADDR("/packages/elf-loader"));
1417 if (elfloader == 0) {
1418 prom_printf("couldn't open /packages/elf-loader\n");
1419 return;
1420 }
1421 call_prom("call-method", 3, 1, ADDR("process-elf-header"),
1422 elfloader, ADDR(&fake_elf));
1423 call_prom("close", 1, 0, elfloader);
1424 }
1425#endif /* __BIG_ENDIAN__ */
1426}
1427#endif /* CONFIG_PPC_PSERIES */
1428
1429/*
1430 * Memory allocation strategy... our layout is normally:
1431 *
1432 * at 14Mb or more we have vmlinux, then a gap and initrd. In some
1433 * rare cases, initrd might end up being before the kernel though.
1434 * We assume this won't override the final kernel at 0, we have no
1435 * provision to handle that in this version, but it should hopefully
1436 * never happen.
1437 *
1438 * alloc_top is set to the top of RMO, eventually shrink down if the
1439 * TCEs overlap
1440 *
1441 * alloc_bottom is set to the top of kernel/initrd
1442 *
1443 * from there, allocations are done this way : rtas is allocated
1444 * topmost, and the device-tree is allocated from the bottom. We try
1445 * to grow the device-tree allocation as we progress. If we can't,
1446 * then we fail, we don't currently have a facility to restart
1447 * elsewhere, but that shouldn't be necessary.
1448 *
1449 * Note that calls to reserve_mem have to be done explicitly, memory
1450 * allocated with either alloc_up or alloc_down isn't automatically
1451 * reserved.
1452 */
1453
1454
1455/*
1456 * Allocates memory in the RMO upward from the kernel/initrd
1457 *
1458 * When align is 0, this is a special case, it means to allocate in place
1459 * at the current location of alloc_bottom or fail (that is basically
1460 * extending the previous allocation). Used for the device-tree flattening
1461 */
1462static unsigned long __init alloc_up(unsigned long size, unsigned long align)
1463{
1464 unsigned long base = alloc_bottom;
1465 unsigned long addr = 0;
1466
1467 if (align)
1468 base = ALIGN(base, align);
1469 prom_debug("%s(%lx, %lx)\n", __func__, size, align);
1470 if (ram_top == 0)
1471 prom_panic("alloc_up() called with mem not initialized\n");
1472
1473 if (align)
1474 base = ALIGN(alloc_bottom, align);
1475 else
1476 base = alloc_bottom;
1477
1478 for(; (base + size) <= alloc_top;
1479 base = ALIGN(base + 0x100000, align)) {
1480 prom_debug(" trying: 0x%lx\n\r", base);
1481 addr = (unsigned long)prom_claim(base, size, 0);
1482 if (addr != PROM_ERROR && addr != 0)
1483 break;
1484 addr = 0;
1485 if (align == 0)
1486 break;
1487 }
1488 if (addr == 0)
1489 return 0;
1490 alloc_bottom = addr + size;
1491
1492 prom_debug(" -> %lx\n", addr);
1493 prom_debug(" alloc_bottom : %lx\n", alloc_bottom);
1494 prom_debug(" alloc_top : %lx\n", alloc_top);
1495 prom_debug(" alloc_top_hi : %lx\n", alloc_top_high);
1496 prom_debug(" rmo_top : %lx\n", rmo_top);
1497 prom_debug(" ram_top : %lx\n", ram_top);
1498
1499 return addr;
1500}
1501
1502/*
1503 * Allocates memory downward, either from top of RMO, or if highmem
1504 * is set, from the top of RAM. Note that this one doesn't handle
1505 * failures. It does claim memory if highmem is not set.
1506 */
1507static unsigned long __init alloc_down(unsigned long size, unsigned long align,
1508 int highmem)
1509{
1510 unsigned long base, addr = 0;
1511
1512 prom_debug("%s(%lx, %lx, %s)\n", __func__, size, align,
1513 highmem ? "(high)" : "(low)");
1514 if (ram_top == 0)
1515 prom_panic("alloc_down() called with mem not initialized\n");
1516
1517 if (highmem) {
1518 /* Carve out storage for the TCE table. */
1519 addr = ALIGN_DOWN(alloc_top_high - size, align);
1520 if (addr <= alloc_bottom)
1521 return 0;
1522 /* Will we bump into the RMO ? If yes, check out that we
1523 * didn't overlap existing allocations there, if we did,
1524 * we are dead, we must be the first in town !
1525 */
1526 if (addr < rmo_top) {
1527 /* Good, we are first */
1528 if (alloc_top == rmo_top)
1529 alloc_top = rmo_top = addr;
1530 else
1531 return 0;
1532 }
1533 alloc_top_high = addr;
1534 goto bail;
1535 }
1536
1537 base = ALIGN_DOWN(alloc_top - size, align);
1538 for (; base > alloc_bottom;
1539 base = ALIGN_DOWN(base - 0x100000, align)) {
1540 prom_debug(" trying: 0x%lx\n\r", base);
1541 addr = (unsigned long)prom_claim(base, size, 0);
1542 if (addr != PROM_ERROR && addr != 0)
1543 break;
1544 addr = 0;
1545 }
1546 if (addr == 0)
1547 return 0;
1548 alloc_top = addr;
1549
1550 bail:
1551 prom_debug(" -> %lx\n", addr);
1552 prom_debug(" alloc_bottom : %lx\n", alloc_bottom);
1553 prom_debug(" alloc_top : %lx\n", alloc_top);
1554 prom_debug(" alloc_top_hi : %lx\n", alloc_top_high);
1555 prom_debug(" rmo_top : %lx\n", rmo_top);
1556 prom_debug(" ram_top : %lx\n", ram_top);
1557
1558 return addr;
1559}
1560
1561/*
1562 * Parse a "reg" cell
1563 */
1564static unsigned long __init prom_next_cell(int s, cell_t **cellp)
1565{
1566 cell_t *p = *cellp;
1567 unsigned long r = 0;
1568
1569 /* Ignore more than 2 cells */
1570 while (s > sizeof(unsigned long) / 4) {
1571 p++;
1572 s--;
1573 }
1574 r = be32_to_cpu(*p++);
1575#ifdef CONFIG_PPC64
1576 if (s > 1) {
1577 r <<= 32;
1578 r |= be32_to_cpu(*(p++));
1579 }
1580#endif
1581 *cellp = p;
1582 return r;
1583}
1584
1585/*
1586 * Very dumb function for adding to the memory reserve list, but
1587 * we don't need anything smarter at this point
1588 *
1589 * XXX Eventually check for collisions. They should NEVER happen.
1590 * If problems seem to show up, it would be a good start to track
1591 * them down.
1592 */
1593static void __init reserve_mem(u64 base, u64 size)
1594{
1595 u64 top = base + size;
1596 unsigned long cnt = mem_reserve_cnt;
1597
1598 if (size == 0)
1599 return;
1600
1601 /* We need to always keep one empty entry so that we
1602 * have our terminator with "size" set to 0 since we are
1603 * dumb and just copy this entire array to the boot params
1604 */
1605 base = ALIGN_DOWN(base, PAGE_SIZE);
1606 top = ALIGN(top, PAGE_SIZE);
1607 size = top - base;
1608
1609 if (cnt >= (MEM_RESERVE_MAP_SIZE - 1))
1610 prom_panic("Memory reserve map exhausted !\n");
1611 mem_reserve_map[cnt].base = cpu_to_be64(base);
1612 mem_reserve_map[cnt].size = cpu_to_be64(size);
1613 mem_reserve_cnt = cnt + 1;
1614}
1615
1616/*
1617 * Initialize memory allocation mechanism, parse "memory" nodes and
1618 * obtain that way the top of memory and RMO to setup out local allocator
1619 */
1620static void __init prom_init_mem(void)
1621{
1622 phandle node;
1623 char type[64];
1624 unsigned int plen;
1625 cell_t *p, *endp;
1626 __be32 val;
1627 u32 rac, rsc;
1628
1629 /*
1630 * We iterate the memory nodes to find
1631 * 1) top of RMO (first node)
1632 * 2) top of memory
1633 */
1634 val = cpu_to_be32(2);
1635 prom_getprop(prom.root, "#address-cells", &val, sizeof(val));
1636 rac = be32_to_cpu(val);
1637 val = cpu_to_be32(1);
1638 prom_getprop(prom.root, "#size-cells", &val, sizeof(rsc));
1639 rsc = be32_to_cpu(val);
1640 prom_debug("root_addr_cells: %x\n", rac);
1641 prom_debug("root_size_cells: %x\n", rsc);
1642
1643 prom_debug("scanning memory:\n");
1644
1645 for (node = 0; prom_next_node(&node); ) {
1646 type[0] = 0;
1647 prom_getprop(node, "device_type", type, sizeof(type));
1648
1649 if (type[0] == 0) {
1650 /*
1651 * CHRP Longtrail machines have no device_type
1652 * on the memory node, so check the name instead...
1653 */
1654 prom_getprop(node, "name", type, sizeof(type));
1655 }
1656 if (prom_strcmp(type, "memory"))
1657 continue;
1658
1659 plen = prom_getprop(node, "reg", regbuf, sizeof(regbuf));
1660 if (plen > sizeof(regbuf)) {
1661 prom_printf("memory node too large for buffer !\n");
1662 plen = sizeof(regbuf);
1663 }
1664 p = regbuf;
1665 endp = p + (plen / sizeof(cell_t));
1666
1667#ifdef DEBUG_PROM
1668 memset(prom_scratch, 0, sizeof(prom_scratch));
1669 call_prom("package-to-path", 3, 1, node, prom_scratch,
1670 sizeof(prom_scratch) - 1);
1671 prom_debug(" node %s :\n", prom_scratch);
1672#endif /* DEBUG_PROM */
1673
1674 while ((endp - p) >= (rac + rsc)) {
1675 unsigned long base, size;
1676
1677 base = prom_next_cell(rac, &p);
1678 size = prom_next_cell(rsc, &p);
1679
1680 if (size == 0)
1681 continue;
1682 prom_debug(" %lx %lx\n", base, size);
1683 if (base == 0 && (of_platform & PLATFORM_LPAR))
1684 rmo_top = size;
1685 if ((base + size) > ram_top)
1686 ram_top = base + size;
1687 }
1688 }
1689
1690 alloc_bottom = PAGE_ALIGN((unsigned long)&_end + 0x4000);
1691
1692 /*
1693 * If prom_memory_limit is set we reduce the upper limits *except* for
1694 * alloc_top_high. This must be the real top of RAM so we can put
1695 * TCE's up there.
1696 */
1697
1698 alloc_top_high = ram_top;
1699
1700 if (prom_memory_limit) {
1701 if (prom_memory_limit <= alloc_bottom) {
1702 prom_printf("Ignoring mem=%lx <= alloc_bottom.\n",
1703 prom_memory_limit);
1704 prom_memory_limit = 0;
1705 } else if (prom_memory_limit >= ram_top) {
1706 prom_printf("Ignoring mem=%lx >= ram_top.\n",
1707 prom_memory_limit);
1708 prom_memory_limit = 0;
1709 } else {
1710 ram_top = prom_memory_limit;
1711 rmo_top = min(rmo_top, prom_memory_limit);
1712 }
1713 }
1714
1715 /*
1716 * Setup our top alloc point, that is top of RMO or top of
1717 * segment 0 when running non-LPAR.
1718 * Some RS64 machines have buggy firmware where claims up at
1719 * 1GB fail. Cap at 768MB as a workaround.
1720 * Since 768MB is plenty of room, and we need to cap to something
1721 * reasonable on 32-bit, cap at 768MB on all machines.
1722 */
1723 if (!rmo_top)
1724 rmo_top = ram_top;
1725 rmo_top = min(0x30000000ul, rmo_top);
1726 alloc_top = rmo_top;
1727 alloc_top_high = ram_top;
1728
1729 /*
1730 * Check if we have an initrd after the kernel but still inside
1731 * the RMO. If we do move our bottom point to after it.
1732 */
1733 if (prom_initrd_start &&
1734 prom_initrd_start < rmo_top &&
1735 prom_initrd_end > alloc_bottom)
1736 alloc_bottom = PAGE_ALIGN(prom_initrd_end);
1737
1738 prom_printf("memory layout at init:\n");
1739 prom_printf(" memory_limit : %lx (16 MB aligned)\n",
1740 prom_memory_limit);
1741 prom_printf(" alloc_bottom : %lx\n", alloc_bottom);
1742 prom_printf(" alloc_top : %lx\n", alloc_top);
1743 prom_printf(" alloc_top_hi : %lx\n", alloc_top_high);
1744 prom_printf(" rmo_top : %lx\n", rmo_top);
1745 prom_printf(" ram_top : %lx\n", ram_top);
1746}
1747
1748static void __init prom_close_stdin(void)
1749{
1750 __be32 val;
1751 ihandle stdin;
1752
1753 if (prom_getprop(prom.chosen, "stdin", &val, sizeof(val)) > 0) {
1754 stdin = be32_to_cpu(val);
1755 call_prom("close", 1, 0, stdin);
1756 }
1757}
1758
1759#ifdef CONFIG_PPC_SVM
1760static int prom_rtas_hcall(uint64_t args)
1761{
1762 register uint64_t arg1 asm("r3") = H_RTAS;
1763 register uint64_t arg2 asm("r4") = args;
1764
1765 asm volatile("sc 1\n" : "=r" (arg1) :
1766 "r" (arg1),
1767 "r" (arg2) :);
1768 return arg1;
1769}
1770
1771static struct rtas_args __prombss os_term_args;
1772
1773static void __init prom_rtas_os_term(char *str)
1774{
1775 phandle rtas_node;
1776 __be32 val;
1777 u32 token;
1778
1779 prom_debug("%s: start...\n", __func__);
1780 rtas_node = call_prom("finddevice", 1, 1, ADDR("/rtas"));
1781 prom_debug("rtas_node: %x\n", rtas_node);
1782 if (!PHANDLE_VALID(rtas_node))
1783 return;
1784
1785 val = 0;
1786 prom_getprop(rtas_node, "ibm,os-term", &val, sizeof(val));
1787 token = be32_to_cpu(val);
1788 prom_debug("ibm,os-term: %x\n", token);
1789 if (token == 0)
1790 prom_panic("Could not get token for ibm,os-term\n");
1791 os_term_args.token = cpu_to_be32(token);
1792 os_term_args.nargs = cpu_to_be32(1);
1793 os_term_args.nret = cpu_to_be32(1);
1794 os_term_args.args[0] = cpu_to_be32(__pa(str));
1795 prom_rtas_hcall((uint64_t)&os_term_args);
1796}
1797#endif /* CONFIG_PPC_SVM */
1798
1799/*
1800 * Allocate room for and instantiate RTAS
1801 */
1802static void __init prom_instantiate_rtas(void)
1803{
1804 phandle rtas_node;
1805 ihandle rtas_inst;
1806 u32 base, entry = 0;
1807 __be32 val;
1808 u32 size = 0;
1809
1810 prom_debug("prom_instantiate_rtas: start...\n");
1811
1812 rtas_node = call_prom("finddevice", 1, 1, ADDR("/rtas"));
1813 prom_debug("rtas_node: %x\n", rtas_node);
1814 if (!PHANDLE_VALID(rtas_node))
1815 return;
1816
1817 val = 0;
1818 prom_getprop(rtas_node, "rtas-size", &val, sizeof(size));
1819 size = be32_to_cpu(val);
1820 if (size == 0)
1821 return;
1822
1823 base = alloc_down(size, PAGE_SIZE, 0);
1824 if (base == 0)
1825 prom_panic("Could not allocate memory for RTAS\n");
1826
1827 rtas_inst = call_prom("open", 1, 1, ADDR("/rtas"));
1828 if (!IHANDLE_VALID(rtas_inst)) {
1829 prom_printf("opening rtas package failed (%x)\n", rtas_inst);
1830 return;
1831 }
1832
1833 prom_printf("instantiating rtas at 0x%x...", base);
1834
1835 if (call_prom_ret("call-method", 3, 2, &entry,
1836 ADDR("instantiate-rtas"),
1837 rtas_inst, base) != 0
1838 || entry == 0) {
1839 prom_printf(" failed\n");
1840 return;
1841 }
1842 prom_printf(" done\n");
1843
1844 reserve_mem(base, size);
1845
1846 val = cpu_to_be32(base);
1847 prom_setprop(rtas_node, "/rtas", "linux,rtas-base",
1848 &val, sizeof(val));
1849 val = cpu_to_be32(entry);
1850 prom_setprop(rtas_node, "/rtas", "linux,rtas-entry",
1851 &val, sizeof(val));
1852
1853 /* Check if it supports "query-cpu-stopped-state" */
1854 if (prom_getprop(rtas_node, "query-cpu-stopped-state",
1855 &val, sizeof(val)) != PROM_ERROR)
1856 rtas_has_query_cpu_stopped = true;
1857
1858 prom_debug("rtas base = 0x%x\n", base);
1859 prom_debug("rtas entry = 0x%x\n", entry);
1860 prom_debug("rtas size = 0x%x\n", size);
1861
1862 prom_debug("prom_instantiate_rtas: end...\n");
1863}
1864
1865#ifdef CONFIG_PPC64
1866/*
1867 * Allocate room for and instantiate Stored Measurement Log (SML)
1868 */
1869static void __init prom_instantiate_sml(void)
1870{
1871 phandle ibmvtpm_node;
1872 ihandle ibmvtpm_inst;
1873 u32 entry = 0, size = 0, succ = 0;
1874 u64 base;
1875 __be32 val;
1876
1877 prom_debug("prom_instantiate_sml: start...\n");
1878
1879 ibmvtpm_node = call_prom("finddevice", 1, 1, ADDR("/vdevice/vtpm"));
1880 prom_debug("ibmvtpm_node: %x\n", ibmvtpm_node);
1881 if (!PHANDLE_VALID(ibmvtpm_node))
1882 return;
1883
1884 ibmvtpm_inst = call_prom("open", 1, 1, ADDR("/vdevice/vtpm"));
1885 if (!IHANDLE_VALID(ibmvtpm_inst)) {
1886 prom_printf("opening vtpm package failed (%x)\n", ibmvtpm_inst);
1887 return;
1888 }
1889
1890 if (prom_getprop(ibmvtpm_node, "ibm,sml-efi-reformat-supported",
1891 &val, sizeof(val)) != PROM_ERROR) {
1892 if (call_prom_ret("call-method", 2, 2, &succ,
1893 ADDR("reformat-sml-to-efi-alignment"),
1894 ibmvtpm_inst) != 0 || succ == 0) {
1895 prom_printf("Reformat SML to EFI alignment failed\n");
1896 return;
1897 }
1898
1899 if (call_prom_ret("call-method", 2, 2, &size,
1900 ADDR("sml-get-allocated-size"),
1901 ibmvtpm_inst) != 0 || size == 0) {
1902 prom_printf("SML get allocated size failed\n");
1903 return;
1904 }
1905 } else {
1906 if (call_prom_ret("call-method", 2, 2, &size,
1907 ADDR("sml-get-handover-size"),
1908 ibmvtpm_inst) != 0 || size == 0) {
1909 prom_printf("SML get handover size failed\n");
1910 return;
1911 }
1912 }
1913
1914 base = alloc_down(size, PAGE_SIZE, 0);
1915 if (base == 0)
1916 prom_panic("Could not allocate memory for sml\n");
1917
1918 prom_printf("instantiating sml at 0x%llx...", base);
1919
1920 memset((void *)base, 0, size);
1921
1922 if (call_prom_ret("call-method", 4, 2, &entry,
1923 ADDR("sml-handover"),
1924 ibmvtpm_inst, size, base) != 0 || entry == 0) {
1925 prom_printf("SML handover failed\n");
1926 return;
1927 }
1928 prom_printf(" done\n");
1929
1930 reserve_mem(base, size);
1931
1932 prom_setprop(ibmvtpm_node, "/vdevice/vtpm", "linux,sml-base",
1933 &base, sizeof(base));
1934 prom_setprop(ibmvtpm_node, "/vdevice/vtpm", "linux,sml-size",
1935 &size, sizeof(size));
1936
1937 prom_debug("sml base = 0x%llx\n", base);
1938 prom_debug("sml size = 0x%x\n", size);
1939
1940 prom_debug("prom_instantiate_sml: end...\n");
1941}
1942
1943/*
1944 * Allocate room for and initialize TCE tables
1945 */
1946#ifdef __BIG_ENDIAN__
1947static void __init prom_initialize_tce_table(void)
1948{
1949 phandle node;
1950 ihandle phb_node;
1951 char compatible[64], type[64], model[64];
1952 char *path = prom_scratch;
1953 u64 base, align;
1954 u32 minalign, minsize;
1955 u64 tce_entry, *tce_entryp;
1956 u64 local_alloc_top, local_alloc_bottom;
1957 u64 i;
1958
1959 if (prom_iommu_off)
1960 return;
1961
1962 prom_debug("starting prom_initialize_tce_table\n");
1963
1964 /* Cache current top of allocs so we reserve a single block */
1965 local_alloc_top = alloc_top_high;
1966 local_alloc_bottom = local_alloc_top;
1967
1968 /* Search all nodes looking for PHBs. */
1969 for (node = 0; prom_next_node(&node); ) {
1970 compatible[0] = 0;
1971 type[0] = 0;
1972 model[0] = 0;
1973 prom_getprop(node, "compatible",
1974 compatible, sizeof(compatible));
1975 prom_getprop(node, "device_type", type, sizeof(type));
1976 prom_getprop(node, "model", model, sizeof(model));
1977
1978 if ((type[0] == 0) || (prom_strstr(type, "pci") == NULL))
1979 continue;
1980
1981 /* Keep the old logic intact to avoid regression. */
1982 if (compatible[0] != 0) {
1983 if ((prom_strstr(compatible, "python") == NULL) &&
1984 (prom_strstr(compatible, "Speedwagon") == NULL) &&
1985 (prom_strstr(compatible, "Winnipeg") == NULL))
1986 continue;
1987 } else if (model[0] != 0) {
1988 if ((prom_strstr(model, "ython") == NULL) &&
1989 (prom_strstr(model, "peedwagon") == NULL) &&
1990 (prom_strstr(model, "innipeg") == NULL))
1991 continue;
1992 }
1993
1994 if (prom_getprop(node, "tce-table-minalign", &minalign,
1995 sizeof(minalign)) == PROM_ERROR)
1996 minalign = 0;
1997 if (prom_getprop(node, "tce-table-minsize", &minsize,
1998 sizeof(minsize)) == PROM_ERROR)
1999 minsize = 4UL << 20;
2000
2001 /*
2002 * Even though we read what OF wants, we just set the table
2003 * size to 4 MB. This is enough to map 2GB of PCI DMA space.
2004 * By doing this, we avoid the pitfalls of trying to DMA to
2005 * MMIO space and the DMA alias hole.
2006 */
2007 minsize = 4UL << 20;
2008
2009 /* Align to the greater of the align or size */
2010 align = max(minalign, minsize);
2011 base = alloc_down(minsize, align, 1);
2012 if (base == 0)
2013 prom_panic("ERROR, cannot find space for TCE table.\n");
2014 if (base < local_alloc_bottom)
2015 local_alloc_bottom = base;
2016
2017 /* It seems OF doesn't null-terminate the path :-( */
2018 memset(path, 0, sizeof(prom_scratch));
2019 /* Call OF to setup the TCE hardware */
2020 if (call_prom("package-to-path", 3, 1, node,
2021 path, sizeof(prom_scratch) - 1) == PROM_ERROR) {
2022 prom_printf("package-to-path failed\n");
2023 }
2024
2025 /* Save away the TCE table attributes for later use. */
2026 prom_setprop(node, path, "linux,tce-base", &base, sizeof(base));
2027 prom_setprop(node, path, "linux,tce-size", &minsize, sizeof(minsize));
2028
2029 prom_debug("TCE table: %s\n", path);
2030 prom_debug("\tnode = 0x%x\n", node);
2031 prom_debug("\tbase = 0x%llx\n", base);
2032 prom_debug("\tsize = 0x%x\n", minsize);
2033
2034 /* Initialize the table to have a one-to-one mapping
2035 * over the allocated size.
2036 */
2037 tce_entryp = (u64 *)base;
2038 for (i = 0; i < (minsize >> 3) ;tce_entryp++, i++) {
2039 tce_entry = (i << PAGE_SHIFT);
2040 tce_entry |= 0x3;
2041 *tce_entryp = tce_entry;
2042 }
2043
2044 prom_printf("opening PHB %s", path);
2045 phb_node = call_prom("open", 1, 1, path);
2046 if (phb_node == 0)
2047 prom_printf("... failed\n");
2048 else
2049 prom_printf("... done\n");
2050
2051 call_prom("call-method", 6, 0, ADDR("set-64-bit-addressing"),
2052 phb_node, -1, minsize,
2053 (u32) base, (u32) (base >> 32));
2054 call_prom("close", 1, 0, phb_node);
2055 }
2056
2057 reserve_mem(local_alloc_bottom, local_alloc_top - local_alloc_bottom);
2058
2059 /* These are only really needed if there is a memory limit in
2060 * effect, but we don't know so export them always. */
2061 prom_tce_alloc_start = local_alloc_bottom;
2062 prom_tce_alloc_end = local_alloc_top;
2063
2064 /* Flag the first invalid entry */
2065 prom_debug("ending prom_initialize_tce_table\n");
2066}
2067#endif /* __BIG_ENDIAN__ */
2068#endif /* CONFIG_PPC64 */
2069
2070/*
2071 * With CHRP SMP we need to use the OF to start the other processors.
2072 * We can't wait until smp_boot_cpus (the OF is trashed by then)
2073 * so we have to put the processors into a holding pattern controlled
2074 * by the kernel (not OF) before we destroy the OF.
2075 *
2076 * This uses a chunk of low memory, puts some holding pattern
2077 * code there and sends the other processors off to there until
2078 * smp_boot_cpus tells them to do something. The holding pattern
2079 * checks that address until its cpu # is there, when it is that
2080 * cpu jumps to __secondary_start(). smp_boot_cpus() takes care
2081 * of setting those values.
2082 *
2083 * We also use physical address 0x4 here to tell when a cpu
2084 * is in its holding pattern code.
2085 *
2086 * -- Cort
2087 */
/*
 * The __secondary_hold_* symbols are referenced through their copy in the
 * 0 - 0x100 address range, so keep only the low 8 bits of the address.
 */
#define LOW_ADDR(x)	(((unsigned long) &(x)) & 0xff)
2093
2094static void __init prom_hold_cpus(void)
2095{
2096 unsigned long i;
2097 phandle node;
2098 char type[64];
2099 unsigned long *spinloop
2100 = (void *) LOW_ADDR(__secondary_hold_spinloop);
2101 unsigned long *acknowledge
2102 = (void *) LOW_ADDR(__secondary_hold_acknowledge);
2103 unsigned long secondary_hold = LOW_ADDR(__secondary_hold);
2104
2105 /*
2106 * On pseries, if RTAS supports "query-cpu-stopped-state",
2107 * we skip this stage, the CPUs will be started by the
2108 * kernel using RTAS.
2109 */
2110 if ((of_platform == PLATFORM_PSERIES ||
2111 of_platform == PLATFORM_PSERIES_LPAR) &&
2112 rtas_has_query_cpu_stopped) {
2113 prom_printf("prom_hold_cpus: skipped\n");
2114 return;
2115 }
2116
2117 prom_debug("prom_hold_cpus: start...\n");
2118 prom_debug(" 1) spinloop = 0x%lx\n", (unsigned long)spinloop);
2119 prom_debug(" 1) *spinloop = 0x%lx\n", *spinloop);
2120 prom_debug(" 1) acknowledge = 0x%lx\n",
2121 (unsigned long)acknowledge);
2122 prom_debug(" 1) *acknowledge = 0x%lx\n", *acknowledge);
2123 prom_debug(" 1) secondary_hold = 0x%lx\n", secondary_hold);
2124
2125 /* Set the common spinloop variable, so all of the secondary cpus
2126 * will block when they are awakened from their OF spinloop.
2127 * This must occur for both SMP and non SMP kernels, since OF will
2128 * be trashed when we move the kernel.
2129 */
2130 *spinloop = 0;
2131
2132 /* look for cpus */
2133 for (node = 0; prom_next_node(&node); ) {
2134 unsigned int cpu_no;
2135 __be32 reg;
2136
2137 type[0] = 0;
2138 prom_getprop(node, "device_type", type, sizeof(type));
2139 if (prom_strcmp(type, "cpu") != 0)
2140 continue;
2141
2142 /* Skip non-configured cpus. */
2143 if (prom_getprop(node, "status", type, sizeof(type)) > 0)
2144 if (prom_strcmp(type, "okay") != 0)
2145 continue;
2146
2147 reg = cpu_to_be32(-1); /* make sparse happy */
2148 prom_getprop(node, "reg", ®, sizeof(reg));
2149 cpu_no = be32_to_cpu(reg);
2150
2151 prom_debug("cpu hw idx = %u\n", cpu_no);
2152
2153 /* Init the acknowledge var which will be reset by
2154 * the secondary cpu when it awakens from its OF
2155 * spinloop.
2156 */
2157 *acknowledge = (unsigned long)-1;
2158
2159 if (cpu_no != prom.cpu) {
2160 /* Primary Thread of non-boot cpu or any thread */
2161 prom_printf("starting cpu hw idx %u... ", cpu_no);
2162 call_prom("start-cpu", 3, 0, node,
2163 secondary_hold, cpu_no);
2164
2165 for (i = 0; (i < 100000000) &&
2166 (*acknowledge == ((unsigned long)-1)); i++ )
2167 mb();
2168
2169 if (*acknowledge == cpu_no)
2170 prom_printf("done\n");
2171 else
2172 prom_printf("failed: %lx\n", *acknowledge);
2173 }
2174#ifdef CONFIG_SMP
2175 else
2176 prom_printf("boot cpu hw idx %u\n", cpu_no);
2177#endif /* CONFIG_SMP */
2178 }
2179
2180 prom_debug("prom_hold_cpus: end...\n");
2181}
2182
2183
2184static void __init prom_init_client_services(unsigned long pp)
2185{
2186 /* Get a handle to the prom entry point before anything else */
2187 prom_entry = pp;
2188
2189 /* get a handle for the stdout device */
2190 prom.chosen = call_prom("finddevice", 1, 1, ADDR("/chosen"));
2191 if (!PHANDLE_VALID(prom.chosen))
2192 prom_panic("cannot find chosen"); /* msg won't be printed :( */
2193
2194 /* get device tree root */
2195 prom.root = call_prom("finddevice", 1, 1, ADDR("/"));
2196 if (!PHANDLE_VALID(prom.root))
2197 prom_panic("cannot find device tree root"); /* msg won't be printed :( */
2198
2199 prom.mmumap = 0;
2200}
2201
2202#ifdef CONFIG_PPC32
2203/*
2204 * For really old powermacs, we need to map things we claim.
2205 * For that, we need the ihandle of the mmu.
2206 * Also, on the longtrail, we need to work around other bugs.
2207 */
2208static void __init prom_find_mmu(void)
2209{
2210 phandle oprom;
2211 char version[64];
2212
2213 oprom = call_prom("finddevice", 1, 1, ADDR("/openprom"));
2214 if (!PHANDLE_VALID(oprom))
2215 return;
2216 if (prom_getprop(oprom, "model", version, sizeof(version)) <= 0)
2217 return;
2218 version[sizeof(version) - 1] = 0;
2219 /* XXX might need to add other versions here */
2220 if (prom_strcmp(version, "Open Firmware, 1.0.5") == 0)
2221 of_workarounds = OF_WA_CLAIM;
2222 else if (prom_strncmp(version, "FirmWorks,3.", 12) == 0) {
2223 of_workarounds = OF_WA_CLAIM | OF_WA_LONGTRAIL;
2224 call_prom("interpret", 1, 1, "dev /memory 0 to allow-reclaim");
2225 } else
2226 return;
2227 prom.memory = call_prom("open", 1, 1, ADDR("/memory"));
2228 prom_getprop(prom.chosen, "mmu", &prom.mmumap,
2229 sizeof(prom.mmumap));
2230 prom.mmumap = be32_to_cpu(prom.mmumap);
2231 if (!IHANDLE_VALID(prom.memory) || !IHANDLE_VALID(prom.mmumap))
2232 of_workarounds &= ~OF_WA_CLAIM; /* hmmm */
2233}
2234#else
2235#define prom_find_mmu()
2236#endif
2237
2238static void __init prom_init_stdout(void)
2239{
2240 char *path = of_stdout_device;
2241 char type[16];
2242 phandle stdout_node;
2243 __be32 val;
2244
2245 if (prom_getprop(prom.chosen, "stdout", &val, sizeof(val)) <= 0)
2246 prom_panic("cannot find stdout");
2247
2248 prom.stdout = be32_to_cpu(val);
2249
2250 /* Get the full OF pathname of the stdout device */
2251 memset(path, 0, 256);
2252 call_prom("instance-to-path", 3, 1, prom.stdout, path, 255);
2253 prom_printf("OF stdout device is: %s\n", of_stdout_device);
2254 prom_setprop(prom.chosen, "/chosen", "linux,stdout-path",
2255 path, prom_strlen(path) + 1);
2256
2257 /* instance-to-package fails on PA-Semi */
2258 stdout_node = call_prom("instance-to-package", 1, 1, prom.stdout);
2259 if (stdout_node != PROM_ERROR) {
2260 val = cpu_to_be32(stdout_node);
2261
2262 /* If it's a display, note it */
2263 memset(type, 0, sizeof(type));
2264 prom_getprop(stdout_node, "device_type", type, sizeof(type));
2265 if (prom_strcmp(type, "display") == 0)
2266 prom_setprop(stdout_node, path, "linux,boot-display", NULL, 0);
2267 }
2268}
2269
2270static int __init prom_find_machine_type(void)
2271{
2272 char compat[256];
2273 int len, i = 0;
2274#ifdef CONFIG_PPC64
2275 phandle rtas;
2276 int x;
2277#endif
2278
2279 /* Look for a PowerMac or a Cell */
2280 len = prom_getprop(prom.root, "compatible",
2281 compat, sizeof(compat)-1);
2282 if (len > 0) {
2283 compat[len] = 0;
2284 while (i < len) {
2285 char *p = &compat[i];
2286 int sl = prom_strlen(p);
2287 if (sl == 0)
2288 break;
2289 if (prom_strstr(p, "Power Macintosh") ||
2290 prom_strstr(p, "MacRISC"))
2291 return PLATFORM_POWERMAC;
2292#ifdef CONFIG_PPC64
2293 /* We must make sure we don't detect the IBM Cell
2294 * blades as pSeries due to some firmware issues,
2295 * so we do it here.
2296 */
2297 if (prom_strstr(p, "IBM,CBEA") ||
2298 prom_strstr(p, "IBM,CPBW-1.0"))
2299 return PLATFORM_GENERIC;
2300#endif /* CONFIG_PPC64 */
2301 i += sl + 1;
2302 }
2303 }
2304#ifdef CONFIG_PPC64
2305 /* Try to figure out if it's an IBM pSeries or any other
2306 * PAPR compliant platform. We assume it is if :
2307 * - /device_type is "chrp" (please, do NOT use that for future
2308 * non-IBM designs !
2309 * - it has /rtas
2310 */
2311 len = prom_getprop(prom.root, "device_type",
2312 compat, sizeof(compat)-1);
2313 if (len <= 0)
2314 return PLATFORM_GENERIC;
2315 if (prom_strcmp(compat, "chrp"))
2316 return PLATFORM_GENERIC;
2317
2318 /* Default to pSeries. We need to know if we are running LPAR */
2319 rtas = call_prom("finddevice", 1, 1, ADDR("/rtas"));
2320 if (!PHANDLE_VALID(rtas))
2321 return PLATFORM_GENERIC;
2322 x = prom_getproplen(rtas, "ibm,hypertas-functions");
2323 if (x != PROM_ERROR) {
2324 prom_debug("Hypertas detected, assuming LPAR !\n");
2325 return PLATFORM_PSERIES_LPAR;
2326 }
2327 return PLATFORM_PSERIES;
2328#else
2329 return PLATFORM_GENERIC;
2330#endif
2331}
2332
2333static int __init prom_set_color(ihandle ih, int i, int r, int g, int b)
2334{
2335 return call_prom("call-method", 6, 1, ADDR("color!"), ih, i, b, g, r);
2336}
2337
/*
 * If we have a display that we don't know how to drive,
 * we will want to try to execute OF's open method for it
 * later.  However, OF will probably fall over if we do that
 * after we've taken over the MMU.
 * So we check whether we will need to open the display,
 * and if so, open it now.
 */
2346static void __init prom_check_displays(void)
2347{
2348 char type[16], *path;
2349 phandle node;
2350 ihandle ih;
2351 int i;
2352
2353 static const unsigned char default_colors[] __initconst = {
2354 0x00, 0x00, 0x00,
2355 0x00, 0x00, 0xaa,
2356 0x00, 0xaa, 0x00,
2357 0x00, 0xaa, 0xaa,
2358 0xaa, 0x00, 0x00,
2359 0xaa, 0x00, 0xaa,
2360 0xaa, 0xaa, 0x00,
2361 0xaa, 0xaa, 0xaa,
2362 0x55, 0x55, 0x55,
2363 0x55, 0x55, 0xff,
2364 0x55, 0xff, 0x55,
2365 0x55, 0xff, 0xff,
2366 0xff, 0x55, 0x55,
2367 0xff, 0x55, 0xff,
2368 0xff, 0xff, 0x55,
2369 0xff, 0xff, 0xff
2370 };
2371 const unsigned char *clut;
2372
2373 prom_debug("Looking for displays\n");
2374 for (node = 0; prom_next_node(&node); ) {
2375 memset(type, 0, sizeof(type));
2376 prom_getprop(node, "device_type", type, sizeof(type));
2377 if (prom_strcmp(type, "display") != 0)
2378 continue;
2379
2380 /* It seems OF doesn't null-terminate the path :-( */
2381 path = prom_scratch;
2382 memset(path, 0, sizeof(prom_scratch));
2383
2384 /*
2385 * leave some room at the end of the path for appending extra
2386 * arguments
2387 */
2388 if (call_prom("package-to-path", 3, 1, node, path,
2389 sizeof(prom_scratch) - 10) == PROM_ERROR)
2390 continue;
2391 prom_printf("found display : %s, opening... ", path);
2392
2393 ih = call_prom("open", 1, 1, path);
2394 if (ih == 0) {
2395 prom_printf("failed\n");
2396 continue;
2397 }
2398
2399 /* Success */
2400 prom_printf("done\n");
2401 prom_setprop(node, path, "linux,opened", NULL, 0);
2402
2403 /* Setup a usable color table when the appropriate
2404 * method is available. Should update this to set-colors */
2405 clut = default_colors;
2406 for (i = 0; i < 16; i++, clut += 3)
2407 if (prom_set_color(ih, i, clut[0], clut[1],
2408 clut[2]) != 0)
2409 break;
2410
2411#ifdef CONFIG_LOGO_LINUX_CLUT224
2412 clut = PTRRELOC(logo_linux_clut224.clut);
2413 for (i = 0; i < logo_linux_clut224.clutsize; i++, clut += 3)
2414 if (prom_set_color(ih, i + 32, clut[0], clut[1],
2415 clut[2]) != 0)
2416 break;
2417#endif /* CONFIG_LOGO_LINUX_CLUT224 */
2418
2419#ifdef CONFIG_PPC_EARLY_DEBUG_BOOTX
2420 if (prom_getprop(node, "linux,boot-display", NULL, 0) !=
2421 PROM_ERROR) {
2422 u32 width, height, pitch, addr;
2423
2424 prom_printf("Setting btext !\n");
2425 prom_getprop(node, "width", &width, 4);
2426 prom_getprop(node, "height", &height, 4);
2427 prom_getprop(node, "linebytes", &pitch, 4);
2428 prom_getprop(node, "address", &addr, 4);
2429 prom_printf("W=%d H=%d LB=%d addr=0x%x\n",
2430 width, height, pitch, addr);
2431 btext_setup_display(width, height, 8, pitch, addr);
2432 btext_prepare_BAT();
2433 }
2434#endif /* CONFIG_PPC_EARLY_DEBUG_BOOTX */
2435 }
2436}
2437
2438
2439/* Return (relocated) pointer to this much memory: moves initrd if reqd. */
2440static void __init *make_room(unsigned long *mem_start, unsigned long *mem_end,
2441 unsigned long needed, unsigned long align)
2442{
2443 void *ret;
2444
2445 *mem_start = ALIGN(*mem_start, align);
2446 while ((*mem_start + needed) > *mem_end) {
2447 unsigned long room, chunk;
2448
2449 prom_debug("Chunk exhausted, claiming more at %lx...\n",
2450 alloc_bottom);
2451 room = alloc_top - alloc_bottom;
2452 if (room > DEVTREE_CHUNK_SIZE)
2453 room = DEVTREE_CHUNK_SIZE;
2454 if (room < PAGE_SIZE)
2455 prom_panic("No memory for flatten_device_tree "
2456 "(no room)\n");
2457 chunk = alloc_up(room, 0);
2458 if (chunk == 0)
2459 prom_panic("No memory for flatten_device_tree "
2460 "(claim failed)\n");
2461 *mem_end = chunk + room;
2462 }
2463
2464 ret = (void *)*mem_start;
2465 *mem_start += needed;
2466
2467 return ret;
2468}
2469
/*
 * Append one 32-bit big-endian cell holding @token to the structure being
 * built: four bytes, 4-byte aligned, are obtained from make_room().
 *
 * The temporary carries a macro-private name so that it cannot capture an
 * identifier used in the caller's @token, @mem_start or @mem_end expressions
 * (callers of this macro do have locals called "room").
 */
#define dt_push_token(token, mem_start, mem_end) do { 			\
		void *__dt_cell = make_room(mem_start, mem_end, 4, 4);	\
		*(__be32 *)__dt_cell = cpu_to_be32(token);		\
	} while(0)
2474
2475static unsigned long __init dt_find_string(char *str)
2476{
2477 char *s, *os;
2478
2479 s = os = (char *)dt_string_start;
2480 s += 4;
2481 while (s < (char *)dt_string_end) {
2482 if (prom_strcmp(s, str) == 0)
2483 return s - os;
2484 s += prom_strlen(s) + 1;
2485 }
2486 return 0;
2487}
2488
/*
 * The Open Firmware 1275 specification states that property names must be
 * 31 bytes or less, however not all firmwares obey this. Make it 64 bytes to
 * be safe.  This is the size, terminating NUL included, of the buffers that
 * receive a property name from "nextprop".
 */
#define MAX_PROPERTY_NAME 64
2494
2495static void __init scan_dt_build_strings(phandle node,
2496 unsigned long *mem_start,
2497 unsigned long *mem_end)
2498{
2499 char *prev_name, *namep, *sstart;
2500 unsigned long soff;
2501 phandle child;
2502
2503 sstart = (char *)dt_string_start;
2504
2505 /* get and store all property names */
2506 prev_name = "";
2507 for (;;) {
2508 /* 64 is max len of name including nul. */
2509 namep = make_room(mem_start, mem_end, MAX_PROPERTY_NAME, 1);
2510 if (call_prom("nextprop", 3, 1, node, prev_name, namep) != 1) {
2511 /* No more nodes: unwind alloc */
2512 *mem_start = (unsigned long)namep;
2513 break;
2514 }
2515
2516 /* skip "name" */
2517 if (prom_strcmp(namep, "name") == 0) {
2518 *mem_start = (unsigned long)namep;
2519 prev_name = "name";
2520 continue;
2521 }
2522 /* get/create string entry */
2523 soff = dt_find_string(namep);
2524 if (soff != 0) {
2525 *mem_start = (unsigned long)namep;
2526 namep = sstart + soff;
2527 } else {
2528 /* Trim off some if we can */
2529 *mem_start = (unsigned long)namep + prom_strlen(namep) + 1;
2530 dt_string_end = *mem_start;
2531 }
2532 prev_name = namep;
2533 }
2534
2535 /* do all our children */
2536 child = call_prom("child", 1, 1, node);
2537 while (child != 0) {
2538 scan_dt_build_strings(child, mem_start, mem_end);
2539 child = call_prom("peer", 1, 1, child);
2540 }
2541}
2542
/*
 * Emit the structure-block entry for @node and, recursively, for all of its
 * children, appending at *mem_start (space comes from make_room()).
 *
 * The output for one node is: OF_DT_BEGIN_NODE, the node's unit name, one
 * OF_DT_PROP record per property (the "name" property is skipped), a
 * synthesized "phandle" property holding @node if the firmware did not
 * supply one, the children, and finally OF_DT_END_NODE.
 *
 * Property names are looked up in the strings block with dt_find_string(),
 * so scan_dt_build_strings() must have filled that block beforehand.
 */
static void __init scan_dt_build_struct(phandle node, unsigned long *mem_start,
					unsigned long *mem_end)
{
	phandle child;
	char *namep, *prev_name, *sstart, *p, *ep, *lp, *path;
	unsigned long soff;
	unsigned char *valp;
	static char pname[MAX_PROPERTY_NAME] __prombss;
	int l, room, has_phandle = 0;

	dt_push_token(OF_DT_BEGIN_NODE, mem_start, mem_end);

	/*
	 * get the node's full name: it is written directly at *mem_start,
	 * using at most 255 bytes of whatever is left in the current chunk
	 */
	namep = (char *)*mem_start;
	room = *mem_end - *mem_start;
	if (room > 255)
		room = 255;
	l = call_prom("package-to-path", 3, 1, node, namep, room);
	if (l >= 0) {
		/* Didn't fit? Get more room. */
		if (l >= room) {
			/* only allocate when the chunk itself is too small */
			if (l >= *mem_end - *mem_start)
				namep = make_room(mem_start, mem_end, l+1, 1);
			call_prom("package-to-path", 3, 1, node, namep, l);
		}
		namep[l] = '\0';

		/* Fixup an Apple bug where they have bogus \0 chars in the
		 * middle of the path in some properties, and extract
		 * the unit name (everything after the last '/').
		 *
		 * lp is the write cursor: every '/' rewinds it to the start
		 * of the buffer, so only the last path component survives.
		 */
		for (lp = p = namep, ep = namep + l; p < ep; p++) {
			if (*p == '/')
				lp = namep;
			else if (*p != 0)
				*lp++ = *p;
		}
		*lp = 0;
		/* the name is followed by padding up to a 4-byte boundary */
		*mem_start = ALIGN((unsigned long)lp + 1, 4);
	}

	/* get it again for debugging: the full path is used in warnings */
	path = prom_scratch;
	memset(path, 0, sizeof(prom_scratch));
	call_prom("package-to-path", 3, 1, node, path, sizeof(prom_scratch) - 1);

	/* get and store all properties */
	prev_name = "";
	sstart = (char *)dt_string_start;
	for (;;) {
		if (call_prom("nextprop", 3, 1, node, prev_name,
			      pname) != 1)
			break;

		/* skip "name" */
		if (prom_strcmp(pname, "name") == 0) {
			prev_name = "name";
			continue;
		}

		/* find string offset */
		soff = dt_find_string(pname);
		if (soff == 0) {
			prom_printf("WARNING: Can't find string index for"
				    " <%s>, node %s\n", pname, path);
			/* gives up on the remaining properties of this node */
			break;
		}
		prev_name = sstart + soff;

		/* get length */
		l = call_prom("getproplen", 2, 1, node, pname);

		/* sanity checks */
		if (l == PROM_ERROR)
			continue;

		/* push property head: token, value length, name offset */
		dt_push_token(OF_DT_PROP, mem_start, mem_end);
		dt_push_token(l, mem_start, mem_end);
		dt_push_token(soff, mem_start, mem_end);

		/* push property content, then re-align for the next token */
		valp = make_room(mem_start, mem_end, l, 4);
		call_prom("getprop", 4, 1, node, pname, valp, l);
		*mem_start = ALIGN(*mem_start, 4);

		if (!prom_strcmp(pname, "phandle"))
			has_phandle = 1;
	}

	/* Add a "phandle" property if none already exist */
	if (!has_phandle) {
		soff = dt_find_string("phandle");
		if (soff == 0)
			prom_printf("WARNING: Can't find string index for <phandle> node %s\n", path);
		else {
			dt_push_token(OF_DT_PROP, mem_start, mem_end);
			dt_push_token(4, mem_start, mem_end);
			dt_push_token(soff, mem_start, mem_end);
			valp = make_room(mem_start, mem_end, 4, 4);
			/* the value is the firmware's own handle for the node */
			*(__be32 *)valp = cpu_to_be32(node);
		}
	}

	/* do all our children */
	child = call_prom("child", 1, 1, node);
	while (child != 0) {
		scan_dt_build_struct(child, mem_start, mem_end);
		child = call_prom("peer", 1, 1, child);
	}

	dt_push_token(OF_DT_END_NODE, mem_start, mem_end);
}
2656
/*
 * Build the flattened device tree from the live Open Firmware tree.
 *
 * The layout produced, in address order, is: the boot_param_header, the
 * memory reserve map, the strings block (page aligned) and the structure
 * block (page aligned).  The dt_header_start, dt_string_start/end and
 * dt_struct_start/end globals are set as a side effect, the header is filled
 * in, and mem_reserve_cnt is finally forced to MEM_RESERVE_MAP_SIZE.
 *
 * Calls prom_panic() if the initial chunk cannot be allocated or the root
 * node cannot be found.
 */
static void __init flatten_device_tree(void)
{
	phandle root;
	unsigned long mem_start, mem_end, room;
	struct boot_param_header *hdr;
	char *namep;
	u64 *rsvmap;

	/*
	 * Check how much room we have between alloc top & bottom (+/- a
	 * few pages), crop to 1MB, as this is our "chunk" size
	 */
	room = alloc_top - alloc_bottom - 0x4000;
	if (room > DEVTREE_CHUNK_SIZE)
		room = DEVTREE_CHUNK_SIZE;
	prom_debug("starting device tree allocs at %lx\n", alloc_bottom);

	/* Now try to claim that */
	mem_start = (unsigned long)alloc_up(room, PAGE_SIZE);
	if (mem_start == 0)
		prom_panic("Can't allocate initial device-tree chunk\n");
	mem_end = mem_start + room;

	/* Get root of tree */
	root = call_prom("peer", 1, 1, (phandle)0);
	if (root == (phandle)0)
		prom_panic ("couldn't get device tree root\n");

	/* Build header and make room for mem rsv map */
	mem_start = ALIGN(mem_start, 4);
	hdr = make_room(&mem_start, &mem_end,
			sizeof(struct boot_param_header), 4);
	dt_header_start = (unsigned long)hdr;
	rsvmap = make_room(&mem_start, &mem_end, sizeof(mem_reserve_map), 8);

	/* Start of strings */
	mem_start = PAGE_ALIGN(mem_start);
	dt_string_start = mem_start;
	/*
	 * NOTE(review): presumably this hole keeps every real string away
	 * from offset 0, which dt_find_string() returns for "not found".
	 */
	mem_start += 4; /* hole */

	/*
	 * Add "phandle" in there, we'll need it: 16 bytes are reserved and
	 * then trimmed back to the string's actual length
	 */
	namep = make_room(&mem_start, &mem_end, 16, 1);
	prom_strcpy(namep, "phandle");
	mem_start = (unsigned long)namep + prom_strlen(namep) + 1;

	/* Build string array */
	prom_printf("Building dt strings...\n");
	scan_dt_build_strings(root, &mem_start, &mem_end);
	dt_string_end = mem_start;

	/* Build structure */
	mem_start = PAGE_ALIGN(mem_start);
	dt_struct_start = mem_start;
	prom_printf("Building dt structure...\n");
	scan_dt_build_struct(root, &mem_start, &mem_end);
	dt_push_token(OF_DT_END, &mem_start, &mem_end);
	dt_struct_end = PAGE_ALIGN(mem_start);

	/* Finish header: all offsets are relative to the header itself */
	hdr->boot_cpuid_phys	= cpu_to_be32(prom.cpu);
	hdr->magic		= cpu_to_be32(OF_DT_HEADER);
	hdr->totalsize		= cpu_to_be32(dt_struct_end - dt_header_start);
	hdr->off_dt_struct	= cpu_to_be32(dt_struct_start - dt_header_start);
	hdr->off_dt_strings	= cpu_to_be32(dt_string_start - dt_header_start);
	hdr->dt_strings_size	= cpu_to_be32(dt_string_end - dt_string_start);
	hdr->off_mem_rsvmap	= cpu_to_be32(((unsigned long)rsvmap) - dt_header_start);
	hdr->version		= cpu_to_be32(OF_DT_VERSION);
	/* Version 16 is not backward compatible */
	hdr->last_comp_version	= cpu_to_be32(0x10);

	/* Copy the reserve map in */
	memcpy(rsvmap, mem_reserve_map, sizeof(mem_reserve_map));

#ifdef DEBUG_PROM
	{
		int i;
		prom_printf("reserved memory map:\n");
		for (i = 0; i < mem_reserve_cnt; i++)
			prom_printf("  %llx - %llx\n",
				    be64_to_cpu(mem_reserve_map[i].base),
				    be64_to_cpu(mem_reserve_map[i].size));
	}
#endif
	/* Bump mem_reserve_cnt to cause further reservations to fail
	 * since it's too late.
	 */
	mem_reserve_cnt = MEM_RESERVE_MAP_SIZE;

	prom_printf("Device tree strings 0x%lx -> 0x%lx\n",
		    dt_string_start, dt_string_end);
	prom_printf("Device tree struct  0x%lx -> 0x%lx\n",
		    dt_struct_start, dt_struct_end);
}
2750
2751#ifdef CONFIG_PPC_MAPLE
2752/* PIBS Version 1.05.0000 04/26/2005 has an incorrect /ht/isa/ranges property.
2753 * The values are bad, and it doesn't even have the right number of cells. */
2754static void __init fixup_device_tree_maple(void)
2755{
2756 phandle isa;
2757 u32 rloc = 0x01002000; /* IO space; PCI device = 4 */
2758 u32 isa_ranges[6];
2759 char *name;
2760
2761 name = "/ht@0/isa@4";
2762 isa = call_prom("finddevice", 1, 1, ADDR(name));
2763 if (!PHANDLE_VALID(isa)) {
2764 name = "/ht@0/isa@6";
2765 isa = call_prom("finddevice", 1, 1, ADDR(name));
2766 rloc = 0x01003000; /* IO space; PCI device = 6 */
2767 }
2768 if (!PHANDLE_VALID(isa))
2769 return;
2770
2771 if (prom_getproplen(isa, "ranges") != 12)
2772 return;
2773 if (prom_getprop(isa, "ranges", isa_ranges, sizeof(isa_ranges))
2774 == PROM_ERROR)
2775 return;
2776
2777 if (isa_ranges[0] != 0x1 ||
2778 isa_ranges[1] != 0xf4000000 ||
2779 isa_ranges[2] != 0x00010000)
2780 return;
2781
2782 prom_printf("Fixing up bogus ISA range on Maple/Apache...\n");
2783
2784 isa_ranges[0] = 0x1;
2785 isa_ranges[1] = 0x0;
2786 isa_ranges[2] = rloc;
2787 isa_ranges[3] = 0x0;
2788 isa_ranges[4] = 0x0;
2789 isa_ranges[5] = 0x00010000;
2790 prom_setprop(isa, name, "ranges",
2791 isa_ranges, sizeof(isa_ranges));
2792}
2793
2794#define CPC925_MC_START 0xf8000000
2795#define CPC925_MC_LENGTH 0x1000000
2796/* The values for memory-controller don't have right number of cells */
2797static void __init fixup_device_tree_maple_memory_controller(void)
2798{
2799 phandle mc;
2800 u32 mc_reg[4];
2801 char *name = "/hostbridge@f8000000";
2802 u32 ac, sc;
2803
2804 mc = call_prom("finddevice", 1, 1, ADDR(name));
2805 if (!PHANDLE_VALID(mc))
2806 return;
2807
2808 if (prom_getproplen(mc, "reg") != 8)
2809 return;
2810
2811 prom_getprop(prom.root, "#address-cells", &ac, sizeof(ac));
2812 prom_getprop(prom.root, "#size-cells", &sc, sizeof(sc));
2813 if ((ac != 2) || (sc != 2))
2814 return;
2815
2816 if (prom_getprop(mc, "reg", mc_reg, sizeof(mc_reg)) == PROM_ERROR)
2817 return;
2818
2819 if (mc_reg[0] != CPC925_MC_START || mc_reg[1] != CPC925_MC_LENGTH)
2820 return;
2821
2822 prom_printf("Fixing up bogus hostbridge on Maple...\n");
2823
2824 mc_reg[0] = 0x0;
2825 mc_reg[1] = CPC925_MC_START;
2826 mc_reg[2] = 0x0;
2827 mc_reg[3] = CPC925_MC_LENGTH;
2828 prom_setprop(mc, name, "reg", mc_reg, sizeof(mc_reg));
2829}
2830#else
/* Without CONFIG_PPC_MAPLE both Maple fixups expand to nothing. */
#define fixup_device_tree_maple()
#define fixup_device_tree_maple_memory_controller()
2833#endif
2834
2835#ifdef CONFIG_PPC_CHRP
2836/*
2837 * Pegasos and BriQ lacks the "ranges" property in the isa node
2838 * Pegasos needs decimal IRQ 14/15, not hexadecimal
2839 * Pegasos has the IDE configured in legacy mode, but advertised as native
2840 */
2841static void __init fixup_device_tree_chrp(void)
2842{
2843 phandle ph;
2844 u32 prop[6];
2845 u32 rloc = 0x01006000; /* IO space; PCI device = 12 */
2846 char *name;
2847 int rc;
2848
2849 name = "/pci@80000000/isa@c";
2850 ph = call_prom("finddevice", 1, 1, ADDR(name));
2851 if (!PHANDLE_VALID(ph)) {
2852 name = "/pci@ff500000/isa@6";
2853 ph = call_prom("finddevice", 1, 1, ADDR(name));
2854 rloc = 0x01003000; /* IO space; PCI device = 6 */
2855 }
2856 if (PHANDLE_VALID(ph)) {
2857 rc = prom_getproplen(ph, "ranges");
2858 if (rc == 0 || rc == PROM_ERROR) {
2859 prom_printf("Fixing up missing ISA range on Pegasos...\n");
2860
2861 prop[0] = 0x1;
2862 prop[1] = 0x0;
2863 prop[2] = rloc;
2864 prop[3] = 0x0;
2865 prop[4] = 0x0;
2866 prop[5] = 0x00010000;
2867 prom_setprop(ph, name, "ranges", prop, sizeof(prop));
2868 }
2869 }
2870
2871 name = "/pci@80000000/ide@C,1";
2872 ph = call_prom("finddevice", 1, 1, ADDR(name));
2873 if (PHANDLE_VALID(ph)) {
2874 prom_printf("Fixing up IDE interrupt on Pegasos...\n");
2875 prop[0] = 14;
2876 prop[1] = 0x0;
2877 prom_setprop(ph, name, "interrupts", prop, 2*sizeof(u32));
2878 prom_printf("Fixing up IDE class-code on Pegasos...\n");
2879 rc = prom_getprop(ph, "class-code", prop, sizeof(u32));
2880 if (rc == sizeof(u32)) {
2881 prop[0] &= ~0x5;
2882 prom_setprop(ph, name, "class-code", prop, sizeof(u32));
2883 }
2884 }
2885}
2886#else
/* Without CONFIG_PPC_CHRP the CHRP fixup expands to nothing. */
#define fixup_device_tree_chrp()
2888#endif
2889
2890#if defined(CONFIG_PPC64) && defined(CONFIG_PPC_PMAC)
2891static void __init fixup_device_tree_pmac(void)
2892{
2893 phandle u3, i2c, mpic;
2894 u32 u3_rev;
2895 u32 interrupts[2];
2896 u32 parent;
2897
2898 /* Some G5s have a missing interrupt definition, fix it up here */
2899 u3 = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000"));
2900 if (!PHANDLE_VALID(u3))
2901 return;
2902 i2c = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000/i2c@f8001000"));
2903 if (!PHANDLE_VALID(i2c))
2904 return;
2905 mpic = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000/mpic@f8040000"));
2906 if (!PHANDLE_VALID(mpic))
2907 return;
2908
2909 /* check if proper rev of u3 */
2910 if (prom_getprop(u3, "device-rev", &u3_rev, sizeof(u3_rev))
2911 == PROM_ERROR)
2912 return;
2913 if (u3_rev < 0x35 || u3_rev > 0x39)
2914 return;
2915 /* does it need fixup ? */
2916 if (prom_getproplen(i2c, "interrupts") > 0)
2917 return;
2918
2919 prom_printf("fixing up bogus interrupts for u3 i2c...\n");
2920
2921 /* interrupt on this revision of u3 is number 0 and level */
2922 interrupts[0] = 0;
2923 interrupts[1] = 1;
2924 prom_setprop(i2c, "/u3@0,f8000000/i2c@f8001000", "interrupts",
2925 &interrupts, sizeof(interrupts));
2926 parent = (u32)mpic;
2927 prom_setprop(i2c, "/u3@0,f8000000/i2c@f8001000", "interrupt-parent",
2928 &parent, sizeof(parent));
2929}
2930#else
/* Unless both CONFIG_PPC64 and CONFIG_PPC_PMAC are set, this fixup expands to nothing. */
#define fixup_device_tree_pmac()
2932#endif
2933
2934#ifdef CONFIG_PPC_EFIKA
2935/*
2936 * The MPC5200 FEC driver requires an phy-handle property to tell it how
2937 * to talk to the phy. If the phy-handle property is missing, then this
2938 * function is called to add the appropriate nodes and link it to the
2939 * ethernet node.
2940 */
/*
 * Make sure /builtin/ethernet can find its PHY: create a /builtin/mdio node
 * and a /builtin/mdio/ethernet-phy node when they are absent.  Both nodes
 * are created by handing a Forth script to the firmware's "interpret"
 * service; the second script also stores the new PHY's phandle in the
 * ethernet node's "phy-handle" property.
 */
static void __init fixup_device_tree_efika_add_phy(void)
{
	u32 node;
	char prop[64];
	int rv;

	/* Check if /builtin/ethernet exists - bail if it doesn't */
	node = call_prom("finddevice", 1, 1, ADDR("/builtin/ethernet"));
	if (!PHANDLE_VALID(node))
		return;

	/* Check if the phy-handle property exists - bail if it does */
	rv = prom_getprop(node, "phy-handle", prop, sizeof(prop));
	/*
	 * NOTE(review): this test is only true when the call returns 0.
	 * Other callers in this file treat PROM_ERROR as "property missing"
	 * and a positive value as its length, so this does not obviously
	 * implement "bail if it exists" - confirm the intended condition.
	 */
	if (!rv)
		return;

	/*
	 * At this point the ethernet device doesn't have a phy described.
	 * Now we need to add the missing phy node and linkage
	 */

	/* Check for an MDIO bus node - if missing then create one */
	node = call_prom("finddevice", 1, 1, ADDR("/builtin/mdio"));
	if (!PHANDLE_VALID(node)) {
		prom_printf("Adding Ethernet MDIO node\n");
		call_prom("interpret", 1, 1,
			" s\" /builtin\" find-device"
			" new-device"
				" 1 encode-int s\" #address-cells\" property"
				" 0 encode-int s\" #size-cells\" property"
				" s\" mdio\" device-name"
				" s\" fsl,mpc5200b-mdio\" encode-string"
				" s\" compatible\" property"
				" 0xf0003000 0x400 reg"
				" 0x2 encode-int"
				" 0x5 encode-int encode+"
				" 0x3 encode-int encode+"
				" s\" interrupts\" property"
			" finish-device");
	};

	/* Check for a PHY device node - if missing then create one and
	 * give it's phandle to the ethernet node */
	node = call_prom("finddevice", 1, 1,
			 ADDR("/builtin/mdio/ethernet-phy"));
	if (!PHANDLE_VALID(node)) {
		prom_printf("Adding Ethernet PHY node\n");
		call_prom("interpret", 1, 1,
			" s\" /builtin/mdio\" find-device"
			" new-device"
				" s\" ethernet-phy\" device-name"
				" 0x10 encode-int s\" reg\" property"
				" my-self"
				" ihandle>phandle"
			" finish-device"
			" s\" /builtin/ethernet\" find-device"
				" encode-int"
				" s\" phy-handle\" property"
			" device-end");
	}
}
3002
3003static void __init fixup_device_tree_efika(void)
3004{
3005 int sound_irq[3] = { 2, 2, 0 };
3006 int bcomm_irq[3*16] = { 3,0,0, 3,1,0, 3,2,0, 3,3,0,
3007 3,4,0, 3,5,0, 3,6,0, 3,7,0,
3008 3,8,0, 3,9,0, 3,10,0, 3,11,0,
3009 3,12,0, 3,13,0, 3,14,0, 3,15,0 };
3010 u32 node;
3011 char prop[64];
3012 int rv, len;
3013
3014 /* Check if we're really running on a EFIKA */
3015 node = call_prom("finddevice", 1, 1, ADDR("/"));
3016 if (!PHANDLE_VALID(node))
3017 return;
3018
3019 rv = prom_getprop(node, "model", prop, sizeof(prop));
3020 if (rv == PROM_ERROR)
3021 return;
3022 if (prom_strcmp(prop, "EFIKA5K2"))
3023 return;
3024
3025 prom_printf("Applying EFIKA device tree fixups\n");
3026
3027 /* Claiming to be 'chrp' is death */
3028 node = call_prom("finddevice", 1, 1, ADDR("/"));
3029 rv = prom_getprop(node, "device_type", prop, sizeof(prop));
3030 if (rv != PROM_ERROR && (prom_strcmp(prop, "chrp") == 0))
3031 prom_setprop(node, "/", "device_type", "efika", sizeof("efika"));
3032
3033 /* CODEGEN,description is exposed in /proc/cpuinfo so
3034 fix that too */
3035 rv = prom_getprop(node, "CODEGEN,description", prop, sizeof(prop));
3036 if (rv != PROM_ERROR && (prom_strstr(prop, "CHRP")))
3037 prom_setprop(node, "/", "CODEGEN,description",
3038 "Efika 5200B PowerPC System",
3039 sizeof("Efika 5200B PowerPC System"));
3040
3041 /* Fixup bestcomm interrupts property */
3042 node = call_prom("finddevice", 1, 1, ADDR("/builtin/bestcomm"));
3043 if (PHANDLE_VALID(node)) {
3044 len = prom_getproplen(node, "interrupts");
3045 if (len == 12) {
3046 prom_printf("Fixing bestcomm interrupts property\n");
3047 prom_setprop(node, "/builtin/bestcom", "interrupts",
3048 bcomm_irq, sizeof(bcomm_irq));
3049 }
3050 }
3051
3052 /* Fixup sound interrupts property */
3053 node = call_prom("finddevice", 1, 1, ADDR("/builtin/sound"));
3054 if (PHANDLE_VALID(node)) {
3055 rv = prom_getprop(node, "interrupts", prop, sizeof(prop));
3056 if (rv == PROM_ERROR) {
3057 prom_printf("Adding sound interrupts property\n");
3058 prom_setprop(node, "/builtin/sound", "interrupts",
3059 sound_irq, sizeof(sound_irq));
3060 }
3061 }
3062
3063 /* Make sure ethernet phy-handle property exists */
3064 fixup_device_tree_efika_add_phy();
3065}
3066#else
/* Without CONFIG_PPC_EFIKA the Efika fixup expands to nothing. */
#define fixup_device_tree_efika()
3068#endif
3069
3070#ifdef CONFIG_PPC_PASEMI_NEMO
3071/*
3072 * CFE supplied on Nemo is broken in several ways, biggest
3073 * problem is that it reassigns ISA interrupts to unused mpic ints.
3074 * Add an interrupt-controller property for the io-bridge to use
3075 * and correct the ints so we can attach them to an irq_domain
3076 */
3077static void __init fixup_device_tree_pasemi(void)
3078{
3079 u32 interrupts[2], parent, rval, val = 0;
3080 char *name, *pci_name;
3081 phandle iob, node;
3082
3083 /* Find the root pci node */
3084 name = "/pxp@0,e0000000";
3085 iob = call_prom("finddevice", 1, 1, ADDR(name));
3086 if (!PHANDLE_VALID(iob))
3087 return;
3088
3089 /* check if interrupt-controller node set yet */
3090 if (prom_getproplen(iob, "interrupt-controller") !=PROM_ERROR)
3091 return;
3092
3093 prom_printf("adding interrupt-controller property for SB600...\n");
3094
3095 prom_setprop(iob, name, "interrupt-controller", &val, 0);
3096
3097 pci_name = "/pxp@0,e0000000/pci@11";
3098 node = call_prom("finddevice", 1, 1, ADDR(pci_name));
3099 parent = ADDR(iob);
3100
3101 for( ; prom_next_node(&node); ) {
3102 /* scan each node for one with an interrupt */
3103 if (!PHANDLE_VALID(node))
3104 continue;
3105
3106 rval = prom_getproplen(node, "interrupts");
3107 if (rval == 0 || rval == PROM_ERROR)
3108 continue;
3109
3110 prom_getprop(node, "interrupts", &interrupts, sizeof(interrupts));
3111 if ((interrupts[0] < 212) || (interrupts[0] > 222))
3112 continue;
3113
3114 /* found a node, update both interrupts and interrupt-parent */
3115 if ((interrupts[0] >= 212) && (interrupts[0] <= 215))
3116 interrupts[0] -= 203;
3117 if ((interrupts[0] >= 216) && (interrupts[0] <= 220))
3118 interrupts[0] -= 213;
3119 if (interrupts[0] == 221)
3120 interrupts[0] = 14;
3121 if (interrupts[0] == 222)
3122 interrupts[0] = 8;
3123
3124 prom_setprop(node, pci_name, "interrupts", interrupts,
3125 sizeof(interrupts));
3126 prom_setprop(node, pci_name, "interrupt-parent", &parent,
3127 sizeof(parent));
3128 }
3129
3130 /*
3131 * The io-bridge has device_type set to 'io-bridge' change it to 'isa'
3132 * so that generic isa-bridge code can add the SB600 and its on-board
3133 * peripherals.
3134 */
3135 name = "/pxp@0,e0000000/io-bridge@0";
3136 iob = call_prom("finddevice", 1, 1, ADDR(name));
3137 if (!PHANDLE_VALID(iob))
3138 return;
3139
3140 /* device_type is already set, just change it. */
3141
3142 prom_printf("Changing device_type of SB600 node...\n");
3143
3144 prom_setprop(iob, name, "device_type", "isa", sizeof("isa"));
3145}
3146#else /* !CONFIG_PPC_PASEMI_NEMO */
/* Nothing to fix up when Nemo support is not configured. */
static inline void fixup_device_tree_pasemi(void)
{
}
3148#endif
3149
/*
 * Apply every platform-specific device-tree fixup, in a fixed order.  Each
 * entry is either a real function or, when the corresponding platform
 * support is not configured, an empty macro or inline stub.
 */
static void __init fixup_device_tree(void)
{
	fixup_device_tree_maple();
	fixup_device_tree_maple_memory_controller();
	fixup_device_tree_chrp();
	fixup_device_tree_pmac();
	fixup_device_tree_efika();
	fixup_device_tree_pasemi();
}
3159
3160static void __init prom_find_boot_cpu(void)
3161{
3162 __be32 rval;
3163 ihandle prom_cpu;
3164 phandle cpu_pkg;
3165
3166 rval = 0;
3167 if (prom_getprop(prom.chosen, "cpu", &rval, sizeof(rval)) <= 0)
3168 return;
3169 prom_cpu = be32_to_cpu(rval);
3170
3171 cpu_pkg = call_prom("instance-to-package", 1, 1, prom_cpu);
3172
3173 if (!PHANDLE_VALID(cpu_pkg))
3174 return;
3175
3176 prom_getprop(cpu_pkg, "reg", &rval, sizeof(rval));
3177 prom.cpu = be32_to_cpu(rval);
3178
3179 prom_debug("Booting CPU hw index = %d\n", prom.cpu);
3180}
3181
3182static void __init prom_check_initrd(unsigned long r3, unsigned long r4)
3183{
3184#ifdef CONFIG_BLK_DEV_INITRD
3185 if (r3 && r4 && r4 != 0xdeadbeef) {
3186 __be64 val;
3187
3188 prom_initrd_start = is_kernel_addr(r3) ? __pa(r3) : r3;
3189 prom_initrd_end = prom_initrd_start + r4;
3190
3191 val = cpu_to_be64(prom_initrd_start);
3192 prom_setprop(prom.chosen, "/chosen", "linux,initrd-start",
3193 &val, sizeof(val));
3194 val = cpu_to_be64(prom_initrd_end);
3195 prom_setprop(prom.chosen, "/chosen", "linux,initrd-end",
3196 &val, sizeof(val));
3197
3198 reserve_mem(prom_initrd_start,
3199 prom_initrd_end - prom_initrd_start);
3200
3201 prom_debug("initrd_start=0x%lx\n", prom_initrd_start);
3202 prom_debug("initrd_end=0x%lx\n", prom_initrd_end);
3203 }
3204#endif /* CONFIG_BLK_DEV_INITRD */
3205}
3206
3207#ifdef CONFIG_PPC64
3208#ifdef CONFIG_RELOCATABLE
/* CONFIG_RELOCATABLE variant: intentionally empty. */
static void reloc_toc(void)
{
	/* nothing to do */
}
3212
/* CONFIG_RELOCATABLE variant: intentionally empty. */
static void unreloc_toc(void)
{
	/* nothing to do */
}
3216#else
3217static void __reloc_toc(unsigned long offset, unsigned long nr_entries)
3218{
3219 unsigned long i;
3220 unsigned long *toc_entry;
3221
3222 /* Get the start of the TOC by using r2 directly. */
3223 asm volatile("addi %0,2,-0x8000" : "=b" (toc_entry));
3224
3225 for (i = 0; i < nr_entries; i++) {
3226 *toc_entry = *toc_entry + offset;
3227 toc_entry++;
3228 }
3229}
3230
3231static void reloc_toc(void)
3232{
3233 unsigned long offset = reloc_offset();
3234 unsigned long nr_entries =
3235 (__prom_init_toc_end - __prom_init_toc_start) / sizeof(long);
3236
3237 __reloc_toc(offset, nr_entries);
3238
3239 mb();
3240}
3241
3242static void unreloc_toc(void)
3243{
3244 unsigned long offset = reloc_offset();
3245 unsigned long nr_entries =
3246 (__prom_init_toc_end - __prom_init_toc_start) / sizeof(long);
3247
3248 mb();
3249
3250 __reloc_toc(-offset, nr_entries);
3251}
3252#endif
3253#endif
3254
3255#ifdef CONFIG_PPC_SVM
3256/*
3257 * Perform the Enter Secure Mode ultracall.
3258 */
/*
 * Perform the Enter Secure Mode ultracall.
 *
 * UV_ESM is placed in r3, @kbase in r4 and @fdt in r5 before "sc 2" is
 * executed.  r3 is both an input and an output of the asm statement; its
 * value afterwards is returned (narrowed to int).
 */
static int enter_secure_mode(unsigned long kbase, unsigned long fdt)
{
	/* Pin each argument to the register named in its declaration */
	register unsigned long r3 asm("r3") = UV_ESM;
	register unsigned long r4 asm("r4") = kbase;
	register unsigned long r5 asm("r5") = fdt;

	asm volatile("sc 2" : "+r"(r3) : "r"(r4), "r"(r5));

	return r3;
}
3269
3270/*
3271 * Call the Ultravisor to transfer us to secure memory if we have an ESM blob.
3272 */
3273static void __init setup_secure_guest(unsigned long kbase, unsigned long fdt)
3274{
3275 int ret;
3276
3277 if (!prom_svm_enable)
3278 return;
3279
3280 /* Switch to secure mode. */
3281 prom_printf("Switching to secure mode.\n");
3282
3283 /*
3284 * The ultravisor will do an integrity check of the kernel image but we
3285 * relocated it so the check will fail. Restore the original image by
3286 * relocating it back to the kernel virtual base address.
3287 */
3288 if (IS_ENABLED(CONFIG_RELOCATABLE))
3289 relocate(KERNELBASE);
3290
3291 ret = enter_secure_mode(kbase, fdt);
3292
3293 /* Relocate the kernel again. */
3294 if (IS_ENABLED(CONFIG_RELOCATABLE))
3295 relocate(kbase);
3296
3297 if (ret != U_SUCCESS) {
3298 prom_printf("Returned %d from switching to secure mode.\n", ret);
3299 prom_rtas_os_term("Switch to secure mode failed.\n");
3300 }
3301}
3302#else
3303static void __init setup_secure_guest(unsigned long kbase, unsigned long fdt)
3304{
3305}
3306#endif /* CONFIG_PPC_SVM */
3307
/*
 * We enter here early on, when the Open Firmware prom is still
 * handling exceptions and the MMU hash table for us.
 *
 * @r3, @r4: handed unchanged to prom_check_initrd().
 * @pp:      handed to prom_init_client_services().
 * @r6, @r7: not used by this function.
 * @kbase:   address the kernel is currently running at; source of the
 *           CPU hold code copy and second argument to __start().
 *
 * The steps below depend on each other and must stay in this order.
 * Control is handed to the kernel through __start(); the trailing
 * "return 0" is presumably never reached.
 */

unsigned long __init prom_init(unsigned long r3, unsigned long r4,
			       unsigned long pp,
			       unsigned long r6, unsigned long r7,
			       unsigned long kbase)
{
	unsigned long hdr;

	/* Fix up GOT/TOC references for the address we are running at. */
#ifdef CONFIG_PPC32
	unsigned long offset = reloc_offset();
	reloc_got2(offset);
#else
	reloc_toc();
#endif

	/*
	 * First zero the BSS
	 */
	memset(&__bss_start, 0, __bss_stop - __bss_start);

	/*
	 * Init interface to Open Firmware, get some node references,
	 * like /chosen
	 */
	prom_init_client_services(pp);

	/*
	 * See if this OF is old enough that we need to do explicit maps
	 * and other workarounds
	 */
	prom_find_mmu();

	/*
	 * Init prom stdout device
	 */
	prom_init_stdout();

	prom_printf("Preparing to boot %s", linux_banner);

	/*
	 * Get default machine type. At this point, we do not differentiate
	 * between pSeries SMP and pSeries LPAR
	 */
	of_platform = prom_find_machine_type();
	prom_printf("Detected machine type: %x\n", of_platform);

#ifndef CONFIG_NONSTATIC_KERNEL
	/* Bail if this is a kdump kernel. */
	if (PHYSICAL_START > 0)
		prom_panic("Error: You can't boot a kdump kernel from OF!\n");
#endif

	/*
	 * Check for an initrd
	 */
	prom_check_initrd(r3, r4);

	/*
	 * Do early parsing of command line
	 */
	early_cmdline_parse();

#ifdef CONFIG_PPC_PSERIES
	/*
	 * On pSeries, inform the firmware about our capabilities
	 */
	if (of_platform == PLATFORM_PSERIES ||
	    of_platform == PLATFORM_PSERIES_LPAR)
		prom_send_capabilities();
#endif

	/*
	 * Copy the CPU hold code (the first 0x100 bytes at kbase) down to
	 * address 0.
	 */
	if (of_platform != PLATFORM_POWERMAC)
		copy_and_flush(0, kbase, 0x100, 0);

	/*
	 * Initialize memory management within prom_init
	 */
	prom_init_mem();

	/*
	 * Determine which cpu is actually running right _now_
	 */
	prom_find_boot_cpu();

	/*
	 * Initialize display devices
	 */
	prom_check_displays();

#if defined(CONFIG_PPC64) && defined(__BIG_ENDIAN__)
	/*
	 * Initialize IOMMU (TCE tables) on pSeries. Do that before anything else
	 * that uses the allocator, we need to make sure we get the top of memory
	 * available for us here...
	 */
	if (of_platform == PLATFORM_PSERIES)
		prom_initialize_tce_table();
#endif

	/*
	 * On non-powermacs, try to instantiate RTAS. PowerMacs don't
	 * have a usable RTAS implementation.
	 */
	if (of_platform != PLATFORM_POWERMAC)
		prom_instantiate_rtas();

#ifdef CONFIG_PPC64
	/* instantiate sml */
	prom_instantiate_sml();
#endif

	/*
	 * On non-powermacs, put all CPUs in spin-loops.
	 *
	 * PowerMacs use a different mechanism to spin CPUs
	 *
	 * (This must be done after instantiating RTAS)
	 */
	if (of_platform != PLATFORM_POWERMAC)
		prom_hold_cpus();

	/*
	 * Fill in some info for use by the kernel later on: each value is
	 * published as a property of /chosen.
	 */
	if (prom_memory_limit) {
		__be64 val = cpu_to_be64(prom_memory_limit);
		prom_setprop(prom.chosen, "/chosen", "linux,memory-limit",
			     &val, sizeof(val));
	}
#ifdef CONFIG_PPC64
	if (prom_iommu_off)
		prom_setprop(prom.chosen, "/chosen", "linux,iommu-off",
			     NULL, 0);

	if (prom_iommu_force_on)
		prom_setprop(prom.chosen, "/chosen", "linux,iommu-force-on",
			     NULL, 0);

	if (prom_tce_alloc_start) {
		prom_setprop(prom.chosen, "/chosen", "linux,tce-alloc-start",
			     &prom_tce_alloc_start,
			     sizeof(prom_tce_alloc_start));
		prom_setprop(prom.chosen, "/chosen", "linux,tce-alloc-end",
			     &prom_tce_alloc_end,
			     sizeof(prom_tce_alloc_end));
	}
#endif

	/*
	 * Fixup any known bugs in the device-tree
	 */
	fixup_device_tree();

	/*
	 * Now finally create the flattened device-tree
	 */
	prom_printf("copying OF device tree...\n");
	flatten_device_tree();

	/*
	 * in case stdin is USB and still active on IBM machines...
	 * Unfortunately quiesce crashes on some powermacs if we have
	 * closed stdin already (in particular the powerbook 101).
	 */
	if (of_platform != PLATFORM_POWERMAC)
		prom_close_stdin();

	/*
	 * Call OF "quiesce" method to shut down pending DMA's from
	 * devices etc...
	 */
	prom_printf("Quiescing Open Firmware ...\n");
	call_prom("quiesce", 0, 0);

	/*
	 * And finally, call the kernel passing it the flattened device
	 * tree and NULL as r5, thus triggering the new entry point which
	 * is common to us and kexec
	 */
	hdr = dt_header_start;

	prom_printf("Booting Linux via __start() @ 0x%lx ...\n", kbase);
	prom_debug("->dt_header_start=0x%lx\n", hdr);

	/* Undo the GOT/TOC fix-up applied at the top of this function. */
#ifdef CONFIG_PPC32
	reloc_got2(-offset);
#else
	unreloc_toc();
#endif

	/* Move to secure memory if we're supposed to be secure guests. */
	setup_secure_guest(kbase, hdr);

	__start(hdr, kbase, 0, 0, 0, 0, 0);

	return 0;
}
1/*
2 * Procedures for interfacing to Open Firmware.
3 *
4 * Paul Mackerras August 1996.
5 * Copyright (C) 1996-2005 Paul Mackerras.
6 *
7 * Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner.
8 * {engebret|bergner}@us.ibm.com
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
14 */
15
16#undef DEBUG_PROM
17
18/* we cannot use FORTIFY as it brings in new symbols */
19#define __NO_FORTIFY
20
21#include <stdarg.h>
22#include <linux/kernel.h>
23#include <linux/string.h>
24#include <linux/init.h>
25#include <linux/threads.h>
26#include <linux/spinlock.h>
27#include <linux/types.h>
28#include <linux/pci.h>
29#include <linux/proc_fs.h>
30#include <linux/stringify.h>
31#include <linux/delay.h>
32#include <linux/initrd.h>
33#include <linux/bitops.h>
34#include <asm/prom.h>
35#include <asm/rtas.h>
36#include <asm/page.h>
37#include <asm/processor.h>
38#include <asm/irq.h>
39#include <asm/io.h>
40#include <asm/smp.h>
41#include <asm/mmu.h>
42#include <asm/pgtable.h>
43#include <asm/iommu.h>
44#include <asm/btext.h>
45#include <asm/sections.h>
46#include <asm/machdep.h>
47#include <asm/opal.h>
48#include <asm/asm-prototypes.h>
49
50#include <linux/linux_logo.h>
51
52/*
53 * Eventually bump that one up
54 */
55#define DEVTREE_CHUNK_SIZE 0x100000
56
57/*
58 * This is the size of the local memory reserve map that gets copied
59 * into the boot params passed to the kernel. That size is totally
60 * flexible as the kernel just reads the list until it encounters an
61 * entry with size 0, so it can be changed without breaking binary
62 * compatibility
63 */
64#define MEM_RESERVE_MAP_SIZE 8
65
66/*
67 * prom_init() is called very early on, before the kernel text
68 * and data have been mapped to KERNELBASE. At this point the code
69 * is running at whatever address it has been loaded at.
70 * On ppc32 we compile with -mrelocatable, which means that references
71 * to extern and static variables get relocated automatically.
72 * ppc64 objects are always relocatable, we just need to relocate the
73 * TOC.
74 *
75 * Because OF may have mapped I/O devices into the area starting at
76 * KERNELBASE, particularly on CHRP machines, we can't safely call
77 * OF once the kernel has been mapped to KERNELBASE. Therefore all
78 * OF calls must be done within prom_init().
79 *
80 * ADDR is used in calls to call_prom. The 4th and following
81 * arguments to call_prom should be 32-bit values.
82 * On ppc64, 64 bit values are truncated to 32 bits (and
83 * fortunately don't get interpreted as two arguments).
84 */
/* Narrow a pointer or integer to the 32-bit cell handed to call_prom(). */
#define ADDR(x)		(u32)(unsigned long)(x)

/*
 * Bitmask of firmware workarounds in effect (OF_WA_* below).  It is a
 * compile-time 0 on ppc64, so the workaround paths are dead code there;
 * otherwise it is the run-time variable of_workarounds.
 */
#ifdef CONFIG_PPC64
#define OF_WORKAROUNDS	0
#else
#define OF_WORKAROUNDS	of_workarounds
int of_workarounds;
#endif

#define OF_WA_CLAIM	1	/* do phys/virt claim separately, then map */
#define OF_WA_LONGTRAIL	2	/* work around longtrail bugs */

/*
 * Report the current file and line through prom_printf(), then execute the
 * BUG_ILLEGAL_INSTR word emitted inline.
 */
#define PROM_BUG() do {						\
	prom_printf("kernel BUG at %s line 0x%x!\n",		\
		    __FILE__, __LINE__);			\
	__asm__ __volatile__(".long " BUG_ILLEGAL_INSTR);	\
} while (0)

/* prom_debug() expands to prom_printf() only when DEBUG_PROM is defined. */
#ifdef DEBUG_PROM
#define prom_debug(x...)	prom_printf(x)
#else
#define prom_debug(x...)
#endif


/* Type used to fetch each variadic argument in call_prom()/call_prom_ret(). */
typedef u32 prom_arg_t;
111
/*
 * Argument block handed to enter_prom().  All cells are big-endian; see
 * call_prom() for how it is filled in.
 */
struct prom_args {
	__be32 service;		/* ADDR() of the service name string */
	__be32 nargs;		/* number of input cells in args[] */
	__be32 nret;		/* number of return cells following the inputs */
	__be32 args[10];	/* inputs first, then the return cells */
};
118
/* Firmware handles cached for use throughout prom_init. */
struct prom_t {
	ihandle root;		/* presumably the device tree root - TODO confirm */
	phandle chosen;		/* node whose "bootargs" is read; used with "/chosen" */
	int cpu;		/* NOTE(review): probably the boot cpu - confirm */
	ihandle stdout;		/* target of the "write" calls in prom_print*() */
	ihandle mmumap;		/* used for "claim"/"map" call-methods in prom_claim() */
	ihandle memory;		/* used for "claim"/"release" call-methods in prom_claim() */
};
127
/*
 * One entry of the memory reserve map (see mem_reserve_map[]).  Per the
 * MEM_RESERVE_MAP_SIZE comment, the kernel reads entries until it finds
 * one whose size is 0.
 */
struct mem_map_entry {
	__be64 base;
	__be64 size;
};
132
/* One big-endian 32-bit cell; regbuf[] is an array of these. */
typedef __be32 cell_t;

/*
 * Kernel entry point.  prom_init() calls it last, with the device tree
 * header address in r3, the kernel base in r4 and 0 in the rest.
 */
extern void __start(unsigned long r3, unsigned long r4, unsigned long r5,
		    unsigned long r6, unsigned long r7, unsigned long r8,
		    unsigned long r9);
138
#ifdef CONFIG_PPC64
/* On ppc64 the transition into the firmware is implemented elsewhere. */
extern int enter_prom(struct prom_args *args, unsigned long entry);
#else
/*
 * On ppc32 @entry is simply treated as the address of a function taking the
 * argument block, and is called directly.
 */
static inline int enter_prom(struct prom_args *args, unsigned long entry)
{
	int (*client_entry)(struct prom_args *);

	client_entry = (int (*)(struct prom_args *))entry;
	return client_entry(args);
}
#endif
147
extern void copy_and_flush(unsigned long dest, unsigned long src,
			   unsigned long size, unsigned long offset);

/* prom structure */
static struct prom_t __initdata prom;

/* Firmware entry address handed to enter_prom() on every call. */
static unsigned long prom_entry __initdata;

#define PROM_SCRATCH_SIZE 256

static char __initdata of_stdout_device[256];
static char __initdata prom_scratch[PROM_SCRATCH_SIZE];

/* dt_header_start is what prom_init() passes to __start() as the tree address. */
static unsigned long __initdata dt_header_start;
static unsigned long __initdata dt_struct_start, dt_struct_end;
static unsigned long __initdata dt_string_start, dt_string_end;

static unsigned long __initdata prom_initrd_start, prom_initrd_end;

#ifdef CONFIG_PPC64
/* Set by early_cmdline_parse() from "iommu=force" / "iommu=off". */
static int __initdata prom_iommu_force_on;
static int __initdata prom_iommu_off;
/* When non-zero, published by prom_init() as linux,tce-alloc-start/-end. */
static unsigned long __initdata prom_tce_alloc_start;
static unsigned long __initdata prom_tce_alloc_end;
#endif

/* Default follows the Kconfig choice; "disable_radix" on the command line overrides it. */
static bool prom_radix_disable __initdata = !IS_ENABLED(CONFIG_PPC_RADIX_MMU_DEFAULT);
175
/*
 * Capabilities collected by the prom_parse_*_model() helpers while
 * walking the platform-support bytes.
 */
struct platform_support {
	bool hash_mmu;		/* hash MMU is available */
	bool radix_mmu;		/* radix MMU is available (and not disabled) */
	bool radix_gtse;	/* radix GTSE extension is supported */
	bool xive;		/* XIVE exploitation mode is available */
};
182
/*
 * Platform codes are now obsolete in the kernel. They are only used within
 * this file and will ultimately go away too. Feel free to change them if you
 * need to; they are no longer shared with anything outside this file.
 */
#define PLATFORM_PSERIES	0x0100
#define PLATFORM_PSERIES_LPAR	0x0101
#define PLATFORM_LPAR		0x0001
#define PLATFORM_POWERMAC	0x0400
#define PLATFORM_GENERIC	0x0500
#define PLATFORM_OPAL		0x0600

/* One of the PLATFORM_* codes above; assigned in prom_init(). */
static int __initdata of_platform;

/* Command line used for early parsing; filled in by early_cmdline_parse(). */
static char __initdata prom_cmd_line[COMMAND_LINE_SIZE];

/* Value of "mem=" from the command line, 0 when not given. */
static unsigned long __initdata prom_memory_limit;

static unsigned long __initdata alloc_top;
static unsigned long __initdata alloc_top_high;
static unsigned long __initdata alloc_bottom;
static unsigned long __initdata rmo_top;
static unsigned long __initdata ram_top;

static struct mem_map_entry __initdata mem_reserve_map[MEM_RESERVE_MAP_SIZE];
static int __initdata mem_reserve_cnt;

static cell_t __initdata regbuf[1024];

static bool rtas_has_query_cpu_stopped;
212
213
/*
 * Error results: some OF calls return "-1" on error, some return 0, and
 * some may return either. To keep callers simple, use these macros on any
 * ihandle or phandle return value to check whether it is valid: a handle
 * is valid only if it is neither 0 nor PROM_ERROR.
 */

#define PROM_ERROR		(-1u)
#define PHANDLE_VALID(p)	((p) != 0 && (p) != PROM_ERROR)
#define IHANDLE_VALID(i)	((i) != 0 && (i) != PROM_ERROR)
224
225
226/* This is the one and *ONLY* place where we actually call open
227 * firmware.
228 */
229
230static int __init call_prom(const char *service, int nargs, int nret, ...)
231{
232 int i;
233 struct prom_args args;
234 va_list list;
235
236 args.service = cpu_to_be32(ADDR(service));
237 args.nargs = cpu_to_be32(nargs);
238 args.nret = cpu_to_be32(nret);
239
240 va_start(list, nret);
241 for (i = 0; i < nargs; i++)
242 args.args[i] = cpu_to_be32(va_arg(list, prom_arg_t));
243 va_end(list);
244
245 for (i = 0; i < nret; i++)
246 args.args[nargs+i] = 0;
247
248 if (enter_prom(&args, prom_entry) < 0)
249 return PROM_ERROR;
250
251 return (nret > 0) ? be32_to_cpu(args.args[nargs]) : 0;
252}
253
254static int __init call_prom_ret(const char *service, int nargs, int nret,
255 prom_arg_t *rets, ...)
256{
257 int i;
258 struct prom_args args;
259 va_list list;
260
261 args.service = cpu_to_be32(ADDR(service));
262 args.nargs = cpu_to_be32(nargs);
263 args.nret = cpu_to_be32(nret);
264
265 va_start(list, rets);
266 for (i = 0; i < nargs; i++)
267 args.args[i] = cpu_to_be32(va_arg(list, prom_arg_t));
268 va_end(list);
269
270 for (i = 0; i < nret; i++)
271 args.args[nargs+i] = 0;
272
273 if (enter_prom(&args, prom_entry) < 0)
274 return PROM_ERROR;
275
276 if (rets != NULL)
277 for (i = 1; i < nret; ++i)
278 rets[i-1] = be32_to_cpu(args.args[nargs+i]);
279
280 return (nret > 0) ? be32_to_cpu(args.args[nargs]) : 0;
281}
282
283
284static void __init prom_print(const char *msg)
285{
286 const char *p, *q;
287
288 if (prom.stdout == 0)
289 return;
290
291 for (p = msg; *p != 0; p = q) {
292 for (q = p; *q != 0 && *q != '\n'; ++q)
293 ;
294 if (q > p)
295 call_prom("write", 3, 1, prom.stdout, p, q - p);
296 if (*q == 0)
297 break;
298 ++q;
299 call_prom("write", 3, 1, prom.stdout, ADDR("\r\n"), 2);
300 }
301}
302
303
304static void __init prom_print_hex(unsigned long val)
305{
306 int i, nibbles = sizeof(val)*2;
307 char buf[sizeof(val)*2+1];
308
309 for (i = nibbles-1; i >= 0; i--) {
310 buf[i] = (val & 0xf) + '0';
311 if (buf[i] > '9')
312 buf[i] += ('a'-'0'-10);
313 val >>= 4;
314 }
315 buf[nibbles] = '\0';
316 call_prom("write", 3, 1, prom.stdout, buf, nibbles);
317}
318
319/* max number of decimal digits in an unsigned long */
320#define UL_DIGITS 21
321static void __init prom_print_dec(unsigned long val)
322{
323 int i, size;
324 char buf[UL_DIGITS+1];
325
326 for (i = UL_DIGITS-1; i >= 0; i--) {
327 buf[i] = (val % 10) + '0';
328 val = val/10;
329 if (val == 0)
330 break;
331 }
332 /* shift stuff down */
333 size = UL_DIGITS - i;
334 call_prom("write", 3, 1, prom.stdout, buf+i, size);
335}
336
337static void __init prom_printf(const char *format, ...)
338{
339 const char *p, *q, *s;
340 va_list args;
341 unsigned long v;
342 long vs;
343
344 va_start(args, format);
345 for (p = format; *p != 0; p = q) {
346 for (q = p; *q != 0 && *q != '\n' && *q != '%'; ++q)
347 ;
348 if (q > p)
349 call_prom("write", 3, 1, prom.stdout, p, q - p);
350 if (*q == 0)
351 break;
352 if (*q == '\n') {
353 ++q;
354 call_prom("write", 3, 1, prom.stdout,
355 ADDR("\r\n"), 2);
356 continue;
357 }
358 ++q;
359 if (*q == 0)
360 break;
361 switch (*q) {
362 case 's':
363 ++q;
364 s = va_arg(args, const char *);
365 prom_print(s);
366 break;
367 case 'x':
368 ++q;
369 v = va_arg(args, unsigned long);
370 prom_print_hex(v);
371 break;
372 case 'd':
373 ++q;
374 vs = va_arg(args, int);
375 if (vs < 0) {
376 prom_print("-");
377 vs = -vs;
378 }
379 prom_print_dec(vs);
380 break;
381 case 'l':
382 ++q;
383 if (*q == 0)
384 break;
385 else if (*q == 'x') {
386 ++q;
387 v = va_arg(args, unsigned long);
388 prom_print_hex(v);
389 } else if (*q == 'u') { /* '%lu' */
390 ++q;
391 v = va_arg(args, unsigned long);
392 prom_print_dec(v);
393 } else if (*q == 'd') { /* %ld */
394 ++q;
395 vs = va_arg(args, long);
396 if (vs < 0) {
397 prom_print("-");
398 vs = -vs;
399 }
400 prom_print_dec(vs);
401 }
402 break;
403 }
404 }
405 va_end(args);
406}
407
408
409static unsigned int __init prom_claim(unsigned long virt, unsigned long size,
410 unsigned long align)
411{
412
413 if (align == 0 && (OF_WORKAROUNDS & OF_WA_CLAIM)) {
414 /*
415 * Old OF requires we claim physical and virtual separately
416 * and then map explicitly (assuming virtual mode)
417 */
418 int ret;
419 prom_arg_t result;
420
421 ret = call_prom_ret("call-method", 5, 2, &result,
422 ADDR("claim"), prom.memory,
423 align, size, virt);
424 if (ret != 0 || result == -1)
425 return -1;
426 ret = call_prom_ret("call-method", 5, 2, &result,
427 ADDR("claim"), prom.mmumap,
428 align, size, virt);
429 if (ret != 0) {
430 call_prom("call-method", 4, 1, ADDR("release"),
431 prom.memory, size, virt);
432 return -1;
433 }
434 /* the 0x12 is M (coherence) + PP == read/write */
435 call_prom("call-method", 6, 1,
436 ADDR("map"), prom.mmumap, 0x12, size, virt, virt);
437 return virt;
438 }
439 return call_prom("claim", 3, 1, (prom_arg_t)virt, (prom_arg_t)size,
440 (prom_arg_t)align);
441}
442
443static void __init __attribute__((noreturn)) prom_panic(const char *reason)
444{
445 prom_print(reason);
446 /* Do not call exit because it clears the screen on pmac
447 * it also causes some sort of double-fault on early pmacs */
448 if (of_platform == PLATFORM_POWERMAC)
449 asm("trap\n");
450
451 /* ToDo: should put up an SRC here on pSeries */
452 call_prom("exit", 0, 0);
453
454 for (;;) /* should never get here */
455 ;
456}
457
458
459static int __init prom_next_node(phandle *nodep)
460{
461 phandle node;
462
463 if ((node = *nodep) != 0
464 && (*nodep = call_prom("child", 1, 1, node)) != 0)
465 return 1;
466 if ((*nodep = call_prom("peer", 1, 1, node)) != 0)
467 return 1;
468 for (;;) {
469 if ((node = call_prom("parent", 1, 1, node)) == 0)
470 return 0;
471 if ((*nodep = call_prom("peer", 1, 1, node)) != 0)
472 return 1;
473 }
474}
475
476static inline int prom_getprop(phandle node, const char *pname,
477 void *value, size_t valuelen)
478{
479 return call_prom("getprop", 4, 1, node, ADDR(pname),
480 (u32)(unsigned long) value, (u32) valuelen);
481}
482
483static inline int prom_getproplen(phandle node, const char *pname)
484{
485 return call_prom("getproplen", 2, 1, node, ADDR(pname));
486}
487
/*
 * Append @q followed by a single space at *@str and advance *@str past what
 * was written.  No terminating NUL is stored and no bounds are checked; the
 * caller provides enough room.
 */
static void add_string(char **str, const char *q)
{
	char *out = *str;

	for (; *q != '\0'; q++)
		*out++ = *q;
	*out++ = ' ';

	*str = out;
}
497
/*
 * Format @x as lower-case hexadecimal without leading zeros ("0" for 0).
 * The returned pointer refers to a static buffer that is overwritten by the
 * next call.
 */
static char *tohex(unsigned int x)
{
	static char digits[] = "0123456789abcdef";
	static char result[9];
	char *out = &result[8];

	*out = 0;
	for (;;) {
		*--out = digits[x & 0xf];
		x >>= 4;
		if (x == 0 || out == result)
			break;
	}
	return out;
}
513
514static int __init prom_setprop(phandle node, const char *nodename,
515 const char *pname, void *value, size_t valuelen)
516{
517 char cmd[256], *p;
518
519 if (!(OF_WORKAROUNDS & OF_WA_LONGTRAIL))
520 return call_prom("setprop", 4, 1, node, ADDR(pname),
521 (u32)(unsigned long) value, (u32) valuelen);
522
523 /* gah... setprop doesn't work on longtrail, have to use interpret */
524 p = cmd;
525 add_string(&p, "dev");
526 add_string(&p, nodename);
527 add_string(&p, tohex((u32)(unsigned long) value));
528 add_string(&p, tohex(valuelen));
529 add_string(&p, tohex(ADDR(pname)));
530 add_string(&p, tohex(strlen(pname)));
531 add_string(&p, "property");
532 *p = 0;
533 return call_prom("interpret", 1, 1, (u32)(unsigned long) cmd);
534}
535
/*
 * We can't use the standard versions because of relocation headaches.
 * These are function-like macros that evaluate their argument more than
 * once, so only pass expressions without side effects.
 */
#define isxdigit(c)	(('0' <= (c) && (c) <= '9') \
			 || ('a' <= (c) && (c) <= 'f') \
			 || ('A' <= (c) && (c) <= 'F'))

#define isdigit(c)	('0' <= (c) && (c) <= '9')
#define islower(c)	('a' <= (c) && (c) <= 'z')
#define toupper(c)	(islower(c) ? ((c) - 'a' + 'A') : (c))
544
/*
 * Parse an unsigned number at @cp.  A leading "0x"/"0X" selects base 16, any
 * other leading "0" selects base 8, and everything else is base 10.
 * Parsing stops at the first character that is not a digit of that base.
 *
 * If @endp is not NULL, *@endp is set to that first unparsed character.
 * Overflow is not detected.
 */
static unsigned long prom_strtoul(const char *cp, const char **endp)
{
	unsigned long base = 10;
	unsigned long acc = 0;

	if (*cp == '0') {
		cp++;
		if (toupper(*cp) == 'X') {
			cp++;
			base = 16;
		} else {
			base = 8;
		}
	}

	for (;; cp++) {
		unsigned long digit;

		if (!isxdigit(*cp))
			break;

		if (isdigit(*cp))
			digit = *cp - '0';
		else
			digit = toupper(*cp) - 'A' + 10;

		/* A hex letter (or 8/9 in octal) ends a number of a smaller base. */
		if (digit >= base)
			break;

		acc = acc * base + digit;
	}

	if (endp)
		*endp = cp;

	return acc;
}
569
/*
 * Parse a size at @ptr: a number as understood by prom_strtoul(), optionally
 * followed by one of K/k, M/m or G/g, which scale it by 2^10, 2^20 or 2^30.
 *
 * If @retptr is not NULL, *@retptr is set to the first character after the
 * number and its suffix.  @retptr may be NULL when the caller does not need
 * the end position, matching what prom_strtoul() allows for its @endp.
 */
static unsigned long prom_memparse(const char *ptr, const char **retptr)
{
	const char *end;
	unsigned long ret = prom_strtoul(ptr, &end);
	int shift = 0;

	/*
	 * We can't use a switch here because GCC *may* generate a
	 * jump table which won't work, because we're not running at
	 * the address we're linked at.
	 */
	if ('G' == *end || 'g' == *end)
		shift = 30;
	else if ('M' == *end || 'm' == *end)
		shift = 20;
	else if ('K' == *end || 'k' == *end)
		shift = 10;

	if (shift) {
		ret <<= shift;
		end++;
	}

	/* Only report the end position when the caller asked for it. */
	if (retptr)
		*retptr = end;

	return ret;
}
596
597/*
598 * Early parsing of the command line passed to the kernel, used for
599 * "mem=x" and the options that affect the iommu
600 */
601static void __init early_cmdline_parse(void)
602{
603 const char *opt;
604
605 char *p;
606 int l = 0;
607
608 prom_cmd_line[0] = 0;
609 p = prom_cmd_line;
610 if ((long)prom.chosen > 0)
611 l = prom_getprop(prom.chosen, "bootargs", p, COMMAND_LINE_SIZE-1);
612#ifdef CONFIG_CMDLINE
613 if (l <= 0 || p[0] == '\0') /* dbl check */
614 strlcpy(prom_cmd_line,
615 CONFIG_CMDLINE, sizeof(prom_cmd_line));
616#endif /* CONFIG_CMDLINE */
617 prom_printf("command line: %s\n", prom_cmd_line);
618
619#ifdef CONFIG_PPC64
620 opt = strstr(prom_cmd_line, "iommu=");
621 if (opt) {
622 prom_printf("iommu opt is: %s\n", opt);
623 opt += 6;
624 while (*opt && *opt == ' ')
625 opt++;
626 if (!strncmp(opt, "off", 3))
627 prom_iommu_off = 1;
628 else if (!strncmp(opt, "force", 5))
629 prom_iommu_force_on = 1;
630 }
631#endif
632 opt = strstr(prom_cmd_line, "mem=");
633 if (opt) {
634 opt += 4;
635 prom_memory_limit = prom_memparse(opt, (const char **)&opt);
636#ifdef CONFIG_PPC64
637 /* Align to 16 MB == size of ppc64 large page */
638 prom_memory_limit = ALIGN(prom_memory_limit, 0x1000000);
639#endif
640 }
641
642 opt = strstr(prom_cmd_line, "disable_radix");
643 if (opt) {
644 opt += 13;
645 if (*opt && *opt == '=') {
646 bool val;
647
648 if (kstrtobool(++opt, &val))
649 prom_radix_disable = false;
650 else
651 prom_radix_disable = val;
652 } else
653 prom_radix_disable = true;
654 }
655 if (prom_radix_disable)
656 prom_debug("Radix disabled from cmdline\n");
657}
658
659#if defined(CONFIG_PPC_PSERIES) || defined(CONFIG_PPC_POWERNV)
/*
 * The architecture vector has an array of PVR mask/value pairs,
 * followed by # option vectors - 1, followed by the option vectors.
 *
 * See prom.h for the definition of the bits specified in the
 * architecture vector.
 */

/* Firmware expects the value to be n - 1, where n is the # of vectors */
#define NUM_VECTORS(n)		((n) - 1)

/*
 * Firmware expects 1 + n - 2, where n is the length of the option vector in
 * bytes. The 1 accounts for the length byte itself; the reason for the - 2
 * is not documented here.
 */
#define VECTOR_LENGTH(n)	(1 + (n) - 2)
676
/* Option vector 1: bitmasks of the architecture versions supported (OV1_PPC_*). */
struct option_vector1 {
	u8 byte1;
	u8 arch_versions;	/* OV1_PPC_2_00 ... OV1_PPC_2_07 */
	u8 arch_versions3;	/* OV1_PPC_3_00 */
} __packed;
682
/*
 * Option vector 2: Open Firmware options supported.  Multi-byte fields are
 * big-endian; the structure is packed because it is a byte-exact layout.
 */
struct option_vector2 {
	u8 byte1;
	__be16 reserved;
	__be32 real_base;
	__be32 real_size;
	__be32 virt_base;
	__be32 virt_size;
	__be32 load_base;
	__be32 min_rma;		/* minimum RMA, in MB */
	__be32 min_load;
	u8 min_rma_percent;	/* min RMA percentage of total RAM */
	u8 max_pft_size;	/* max log_2(hash table size) */
} __packed;
696
/* Option vector 3: processor options supported (OV3_* bits in byte2). */
struct option_vector3 {
	u8 byte1;
	u8 byte2;
} __packed;
701
/* Option vector 4: IBM PAPR implementation. */
struct option_vector4 {
	u8 byte1;
	u8 min_vp_cap;		/* minimum VP entitled capacity */
} __packed;
706
/*
 * Option vector 5: PAPR/OF options.  Feature bits are set with
 * OV5_FEAT(); see prom.h for their definitions.
 */
struct option_vector5 {
	u8 byte1;
	u8 byte2;
	u8 byte3;
	u8 cmo;
	u8 associativity;
	u8 bin_opts;
	u8 micro_checkpoint;
	u8 reserved0;
	__be32 max_cpus;	/* number of cores supported */
	__be16 papr_level;
	__be16 reserved1;
	u8 platform_facilities;
	u8 reserved2;
	__be16 reserved3;
	u8 subprocessors;
	u8 byte22;
	u8 intarch;
	u8 mmu;
	u8 hash_ext;
	u8 radix_ext;
} __packed;
729
/* Option vector 6: IBM PAPR hints. */
struct option_vector6 {
	u8 reserved;
	u8 secondary_pteg;
	u8 os_name;		/* OV6_LINUX for this kernel */
} __packed;
735
736struct ibm_arch_vec {
737 struct { u32 mask, val; } pvrs[12];
738
739 u8 num_vectors;
740
741 u8 vec1_len;
742 struct option_vector1 vec1;
743
744 u8 vec2_len;
745 struct option_vector2 vec2;
746
747 u8 vec3_len;
748 struct option_vector3 vec3;
749
750 u8 vec4_len;
751 struct option_vector4 vec4;
752
753 u8 vec5_len;
754 struct option_vector5 vec5;
755
756 u8 vec6_len;
757 struct option_vector6 vec6;
758} __packed;
759
/*
 * The architecture vector instance: the list of processor PVRs this kernel
 * declares, followed by six option vectors.  All multi-byte values are
 * stored big-endian.  The MMU, interrupt-architecture and related bytes of
 * vector 5 start out as 0 here.
 */
struct ibm_arch_vec __cacheline_aligned ibm_architecture_vec = {
	.pvrs = {
		{
			.mask = cpu_to_be32(0xfffe0000), /* POWER5/POWER5+ */
			.val  = cpu_to_be32(0x003a0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER6 */
			.val  = cpu_to_be32(0x003e0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER7 */
			.val  = cpu_to_be32(0x003f0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER8E */
			.val  = cpu_to_be32(0x004b0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER8NVL */
			.val  = cpu_to_be32(0x004c0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER8 */
			.val  = cpu_to_be32(0x004d0000),
		},
		{
			.mask = cpu_to_be32(0xffff0000), /* POWER9 */
			.val  = cpu_to_be32(0x004e0000),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 3.00-compliant */
			.val  = cpu_to_be32(0x0f000005),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 2.07-compliant */
			.val  = cpu_to_be32(0x0f000004),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 2.06-compliant */
			.val  = cpu_to_be32(0x0f000003),
		},
		{
			.mask = cpu_to_be32(0xffffffff), /* all 2.05-compliant */
			.val  = cpu_to_be32(0x0f000002),
		},
		{
			.mask = cpu_to_be32(0xfffffffe), /* all 2.04-compliant and earlier */
			.val  = cpu_to_be32(0x0f000001),
		},
	},

	.num_vectors = NUM_VECTORS(6),

	/* option vector 1: architecture versions supported */
	.vec1_len = VECTOR_LENGTH(sizeof(struct option_vector1)),
	.vec1 = {
		.byte1 = 0,
		.arch_versions = OV1_PPC_2_00 | OV1_PPC_2_01 | OV1_PPC_2_02 | OV1_PPC_2_03 |
				 OV1_PPC_2_04 | OV1_PPC_2_05 | OV1_PPC_2_06 | OV1_PPC_2_07,
		.arch_versions3 = OV1_PPC_3_00,
	},

	.vec2_len = VECTOR_LENGTH(sizeof(struct option_vector2)),
	/* option vector 2: Open Firmware options supported */
	.vec2 = {
		.byte1 = OV2_REAL_MODE,
		.reserved = 0,
		.real_base = cpu_to_be32(0xffffffff),
		.real_size = cpu_to_be32(0xffffffff),
		.virt_base = cpu_to_be32(0xffffffff),
		.virt_size = cpu_to_be32(0xffffffff),
		.load_base = cpu_to_be32(0xffffffff),
		.min_rma = cpu_to_be32(512),		/* 512MB min RMA */
		.min_load = cpu_to_be32(0xffffffff),	/* full client load */
		.min_rma_percent = 0,	/* min RMA percentage of total RAM */
		.max_pft_size = 48,	/* max log_2(hash table size) */
	},

	.vec3_len = VECTOR_LENGTH(sizeof(struct option_vector3)),
	/* option vector 3: processor options supported */
	.vec3 = {
		.byte1 = 0,			/* don't ignore, don't halt */
		.byte2 = OV3_FP | OV3_VMX | OV3_DFP,
	},

	.vec4_len = VECTOR_LENGTH(sizeof(struct option_vector4)),
	/* option vector 4: IBM PAPR implementation */
	.vec4 = {
		.byte1 = 0,			/* don't halt */
		.min_vp_cap = OV4_MIN_ENT_CAP,	/* minimum VP entitled capacity */
	},

	.vec5_len = VECTOR_LENGTH(sizeof(struct option_vector5)),
	/* option vector 5: PAPR/OF options */
	.vec5 = {
		.byte1 = 0,				/* don't ignore, don't halt */
		.byte2 = OV5_FEAT(OV5_LPAR) | OV5_FEAT(OV5_SPLPAR) | OV5_FEAT(OV5_LARGE_PAGES) |
		OV5_FEAT(OV5_DRCONF_MEMORY) | OV5_FEAT(OV5_DONATE_DEDICATE_CPU) |
#ifdef CONFIG_PCI_MSI
		/* PCIe/MSI support.  Without MSI full PCIe is not supported */
		OV5_FEAT(OV5_MSI),
#else
		0,
#endif
		.byte3 = 0,
		.cmo =
#ifdef CONFIG_PPC_SMLPAR
		OV5_FEAT(OV5_CMO) | OV5_FEAT(OV5_XCMO),
#else
		0,
#endif
		.associativity = OV5_FEAT(OV5_TYPE1_AFFINITY) | OV5_FEAT(OV5_PRRN),
		.bin_opts = OV5_FEAT(OV5_RESIZE_HPT) | OV5_FEAT(OV5_HP_EVT),
		.micro_checkpoint = 0,
		.reserved0 = 0,
		.max_cpus = cpu_to_be32(NR_CPUS),	/* number of cores supported */
		.papr_level = 0,
		.reserved1 = 0,
		.platform_facilities = OV5_FEAT(OV5_PFO_HW_RNG) | OV5_FEAT(OV5_PFO_HW_ENCR) | OV5_FEAT(OV5_PFO_HW_842),
		.reserved2 = 0,
		.reserved3 = 0,
		.subprocessors = 1,
		.byte22 = OV5_FEAT(OV5_DRMEM_V2),
		.intarch = 0,
		.mmu = 0,
		.hash_ext = 0,
		.radix_ext = 0,
	},

	/* option vector 6: IBM PAPR hints */
	.vec6_len = VECTOR_LENGTH(sizeof(struct option_vector6)),
	.vec6 = {
		.reserved = 0,
		.secondary_pteg = 0,
		.os_name = OV6_LINUX,
	},
};
897
/*
 * Old method - ELF header with PT_NOTE sections; only works on BE.
 *
 * fake_elf is a minimal 32-bit big-endian ELF image made of an ELF header,
 * two PT_NOTE program headers and the two notes they point at: a "PowerPC"
 * (CHRP) note and an "IBM,RPA-Client-Config" note.
 */
#ifdef __BIG_ENDIAN__
static struct fake_elf {
	Elf32_Ehdr	elfhdr;
	Elf32_Phdr	phdr[2];
	struct chrpnote {
		u32	namesz;
		u32	descsz;
		u32	type;
		char	name[8];	/* "PowerPC" */
		struct chrpdesc {
			u32	real_mode;
			u32	real_base;
			u32	real_size;
			u32	virt_base;
			u32	virt_size;
			u32	load_base;
		} chrpdesc;
	} chrpnote;
	struct rpanote {
		u32	namesz;
		u32	descsz;
		u32	type;
		char	name[24];	/* "IBM,RPA-Client-Config" */
		struct rpadesc {
			u32	lpar_affinity;
			u32	min_rmo_size;
			u32	min_rmo_percent;
			u32	max_pft_size;
			u32	splpar;
			u32	min_load;
			u32	new_mem_def;
			u32	ignore_me;
		} rpadesc;
	} rpanote;
} fake_elf = {
	.elfhdr = {
		.e_ident = { 0x7f, 'E', 'L', 'F',
			     ELFCLASS32, ELFDATA2MSB, EV_CURRENT },
		.e_type = ET_EXEC,	/* yeah right */
		.e_machine = EM_PPC,
		.e_version = EV_CURRENT,
		.e_phoff = offsetof(struct fake_elf, phdr),
		.e_phentsize = sizeof(Elf32_Phdr),
		.e_phnum = 2
	},
	.phdr = {
		/* Each program header covers exactly one of the notes below. */
		[0] = {
			.p_type = PT_NOTE,
			.p_offset = offsetof(struct fake_elf, chrpnote),
			.p_filesz = sizeof(struct chrpnote)
		}, [1] = {
			.p_type = PT_NOTE,
			.p_offset = offsetof(struct fake_elf, rpanote),
			.p_filesz = sizeof(struct rpanote)
		}
	},
	.chrpnote = {
		.namesz = sizeof("PowerPC"),
		.descsz = sizeof(struct chrpdesc),
		.type = 0x1275,
		.name = "PowerPC",
		.chrpdesc = {
			.real_mode = ~0U,	/* ~0 means "don't care" */
			.real_base = ~0U,
			.real_size = ~0U,
			.virt_base = ~0U,
			.virt_size = ~0U,
			.load_base = ~0U
		},
	},
	.rpanote = {
		.namesz = sizeof("IBM,RPA-Client-Config"),
		.descsz = sizeof(struct rpadesc),
		.type = 0x12759999,
		.name = "IBM,RPA-Client-Config",
		.rpadesc = {
			.lpar_affinity = 0,
			.min_rmo_size = 64,	/* in megabytes */
			.min_rmo_percent = 0,
			.max_pft_size = 48,	/* 2^48 bytes max PFT size */
			.splpar = 1,
			.min_load = ~0U,
			.new_mem_def = 0
		}
	}
};
#endif /* __BIG_ENDIAN__ */
986
987static int __init prom_count_smt_threads(void)
988{
989 phandle node;
990 char type[64];
991 unsigned int plen;
992
993 /* Pick up th first CPU node we can find */
994 for (node = 0; prom_next_node(&node); ) {
995 type[0] = 0;
996 prom_getprop(node, "device_type", type, sizeof(type));
997
998 if (strcmp(type, "cpu"))
999 continue;
1000 /*
1001 * There is an entry for each smt thread, each entry being
1002 * 4 bytes long. All cpus should have the same number of
1003 * smt threads, so return after finding the first.
1004 */
1005 plen = prom_getproplen(node, "ibm,ppc-interrupt-server#s");
1006 if (plen == PROM_ERROR)
1007 break;
1008 plen >>= 2;
1009 prom_debug("Found %lu smt threads per core\n", (unsigned long)plen);
1010
1011 /* Sanity check */
1012 if (plen < 1 || plen > 64) {
1013 prom_printf("Threads per core %lu out of bounds, assuming 1\n",
1014 (unsigned long)plen);
1015 return 1;
1016 }
1017 return plen;
1018 }
1019 prom_debug("No threads found, assuming 1 per core\n");
1020
1021 return 1;
1022
1023}
1024
1025static void __init prom_parse_mmu_model(u8 val,
1026 struct platform_support *support)
1027{
1028 switch (val) {
1029 case OV5_FEAT(OV5_MMU_DYNAMIC):
1030 case OV5_FEAT(OV5_MMU_EITHER): /* Either Available */
1031 prom_debug("MMU - either supported\n");
1032 support->radix_mmu = !prom_radix_disable;
1033 support->hash_mmu = true;
1034 break;
1035 case OV5_FEAT(OV5_MMU_RADIX): /* Only Radix */
1036 prom_debug("MMU - radix only\n");
1037 if (prom_radix_disable) {
1038 /*
1039 * If we __have__ to do radix, we're better off ignoring
1040 * the command line rather than not booting.
1041 */
1042 prom_printf("WARNING: Ignoring cmdline option disable_radix\n");
1043 }
1044 support->radix_mmu = true;
1045 break;
1046 case OV5_FEAT(OV5_MMU_HASH):
1047 prom_debug("MMU - hash only\n");
1048 support->hash_mmu = true;
1049 break;
1050 default:
1051 prom_debug("Unknown mmu support option: 0x%x\n", val);
1052 break;
1053 }
1054}
1055
1056static void __init prom_parse_xive_model(u8 val,
1057 struct platform_support *support)
1058{
1059 switch (val) {
1060 case OV5_FEAT(OV5_XIVE_EITHER): /* Either Available */
1061 prom_debug("XIVE - either mode supported\n");
1062 support->xive = true;
1063 break;
1064 case OV5_FEAT(OV5_XIVE_EXPLOIT): /* Only Exploitation mode */
1065 prom_debug("XIVE - exploitation mode supported\n");
1066 support->xive = true;
1067 break;
1068 case OV5_FEAT(OV5_XIVE_LEGACY): /* Only Legacy mode */
1069 prom_debug("XIVE - legacy mode supported\n");
1070 break;
1071 default:
1072 prom_debug("Unknown xive support option: 0x%x\n", val);
1073 break;
1074 }
1075}
1076
1077static void __init prom_parse_platform_support(u8 index, u8 val,
1078 struct platform_support *support)
1079{
1080 switch (index) {
1081 case OV5_INDX(OV5_MMU_SUPPORT): /* MMU Model */
1082 prom_parse_mmu_model(val & OV5_FEAT(OV5_MMU_SUPPORT), support);
1083 break;
1084 case OV5_INDX(OV5_RADIX_GTSE): /* Radix Extensions */
1085 if (val & OV5_FEAT(OV5_RADIX_GTSE)) {
1086 prom_debug("Radix - GTSE supported\n");
1087 support->radix_gtse = true;
1088 }
1089 break;
1090 case OV5_INDX(OV5_XIVE_SUPPORT): /* Interrupt mode */
1091 prom_parse_xive_model(val & OV5_FEAT(OV5_XIVE_SUPPORT),
1092 support);
1093 break;
1094 }
1095}
1096
1097static void __init prom_check_platform_support(void)
1098{
1099 struct platform_support supported = {
1100 .hash_mmu = false,
1101 .radix_mmu = false,
1102 .radix_gtse = false,
1103 .xive = false
1104 };
1105 int prop_len = prom_getproplen(prom.chosen,
1106 "ibm,arch-vec-5-platform-support");
1107 if (prop_len > 1) {
1108 int i;
1109 u8 vec[prop_len];
1110 prom_debug("Found ibm,arch-vec-5-platform-support, len: %d\n",
1111 prop_len);
1112 prom_getprop(prom.chosen, "ibm,arch-vec-5-platform-support",
1113 &vec, sizeof(vec));
1114 for (i = 0; i < prop_len; i += 2) {
1115 prom_debug("%d: index = 0x%x val = 0x%x\n", i / 2
1116 , vec[i]
1117 , vec[i + 1]);
1118 prom_parse_platform_support(vec[i], vec[i + 1],
1119 &supported);
1120 }
1121 }
1122
1123 if (supported.radix_mmu && supported.radix_gtse &&
1124 IS_ENABLED(CONFIG_PPC_RADIX_MMU)) {
1125 /* Radix preferred - but we require GTSE for now */
1126 prom_debug("Asking for radix with GTSE\n");
1127 ibm_architecture_vec.vec5.mmu = OV5_FEAT(OV5_MMU_RADIX);
1128 ibm_architecture_vec.vec5.radix_ext = OV5_FEAT(OV5_RADIX_GTSE);
1129 } else if (supported.hash_mmu) {
1130 /* Default to hash mmu (if we can) */
1131 prom_debug("Asking for hash\n");
1132 ibm_architecture_vec.vec5.mmu = OV5_FEAT(OV5_MMU_HASH);
1133 } else {
1134 /* We're probably on a legacy hypervisor */
1135 prom_debug("Assuming legacy hash support\n");
1136 }
1137
1138 if (supported.xive) {
1139 prom_debug("Asking for XIVE\n");
1140 ibm_architecture_vec.vec5.intarch = OV5_FEAT(OV5_XIVE_EXPLOIT);
1141 }
1142}
1143
1144static void __init prom_send_capabilities(void)
1145{
1146 ihandle root;
1147 prom_arg_t ret;
1148 u32 cores;
1149
1150 /* Check ibm,arch-vec-5-platform-support and fixup vec5 if required */
1151 prom_check_platform_support();
1152
1153 root = call_prom("open", 1, 1, ADDR("/"));
1154 if (root != 0) {
1155 /* We need to tell the FW about the number of cores we support.
1156 *
1157 * To do that, we count the number of threads on the first core
1158 * (we assume this is the same for all cores) and use it to
1159 * divide NR_CPUS.
1160 */
1161
1162 cores = DIV_ROUND_UP(NR_CPUS, prom_count_smt_threads());
1163 prom_printf("Max number of cores passed to firmware: %lu (NR_CPUS = %lu)\n",
1164 cores, NR_CPUS);
1165
1166 ibm_architecture_vec.vec5.max_cpus = cpu_to_be32(cores);
1167
1168 /* try calling the ibm,client-architecture-support method */
1169 prom_printf("Calling ibm,client-architecture-support...");
1170 if (call_prom_ret("call-method", 3, 2, &ret,
1171 ADDR("ibm,client-architecture-support"),
1172 root,
1173 ADDR(&ibm_architecture_vec)) == 0) {
1174 /* the call exists... */
1175 if (ret)
1176 prom_printf("\nWARNING: ibm,client-architecture"
1177 "-support call FAILED!\n");
1178 call_prom("close", 1, 0, root);
1179 prom_printf(" done\n");
1180 return;
1181 }
1182 call_prom("close", 1, 0, root);
1183 prom_printf(" not implemented\n");
1184 }
1185
1186#ifdef __BIG_ENDIAN__
1187 {
1188 ihandle elfloader;
1189
1190 /* no ibm,client-architecture-support call, try the old way */
1191 elfloader = call_prom("open", 1, 1,
1192 ADDR("/packages/elf-loader"));
1193 if (elfloader == 0) {
1194 prom_printf("couldn't open /packages/elf-loader\n");
1195 return;
1196 }
1197 call_prom("call-method", 3, 1, ADDR("process-elf-header"),
1198 elfloader, ADDR(&fake_elf));
1199 call_prom("close", 1, 0, elfloader);
1200 }
1201#endif /* __BIG_ENDIAN__ */
1202}
1203#endif /* #if defined(CONFIG_PPC_PSERIES) || defined(CONFIG_PPC_POWERNV) */
1204
1205/*
1206 * Memory allocation strategy... our layout is normally:
1207 *
1208 * at 14Mb or more we have vmlinux, then a gap and initrd. In some
1209 * rare cases, initrd might end up being before the kernel though.
1210 * We assume this won't override the final kernel at 0, we have no
1211 * provision to handle that in this version, but it should hopefully
1212 * never happen.
1213 *
 * alloc_top is set to the top of RMO, and is eventually shrunk down if
 * the TCEs overlap
1216 *
1217 * alloc_bottom is set to the top of kernel/initrd
1218 *
1219 * from there, allocations are done this way : rtas is allocated
1220 * topmost, and the device-tree is allocated from the bottom. We try
1221 * to grow the device-tree allocation as we progress. If we can't,
1222 * then we fail, we don't currently have a facility to restart
1223 * elsewhere, but that shouldn't be necessary.
1224 *
1225 * Note that calls to reserve_mem have to be done explicitly, memory
1226 * allocated with either alloc_up or alloc_down isn't automatically
1227 * reserved.
1228 */
1229
1230
1231/*
1232 * Allocates memory in the RMO upward from the kernel/initrd
1233 *
1234 * When align is 0, this is a special case, it means to allocate in place
1235 * at the current location of alloc_bottom or fail (that is basically
1236 * extending the previous allocation). Used for the device-tree flattening
1237 */
1238static unsigned long __init alloc_up(unsigned long size, unsigned long align)
1239{
1240 unsigned long base = alloc_bottom;
1241 unsigned long addr = 0;
1242
1243 if (align)
1244 base = _ALIGN_UP(base, align);
1245 prom_debug("alloc_up(%x, %x)\n", size, align);
1246 if (ram_top == 0)
1247 prom_panic("alloc_up() called with mem not initialized\n");
1248
1249 if (align)
1250 base = _ALIGN_UP(alloc_bottom, align);
1251 else
1252 base = alloc_bottom;
1253
1254 for(; (base + size) <= alloc_top;
1255 base = _ALIGN_UP(base + 0x100000, align)) {
1256 prom_debug(" trying: 0x%x\n\r", base);
1257 addr = (unsigned long)prom_claim(base, size, 0);
1258 if (addr != PROM_ERROR && addr != 0)
1259 break;
1260 addr = 0;
1261 if (align == 0)
1262 break;
1263 }
1264 if (addr == 0)
1265 return 0;
1266 alloc_bottom = addr + size;
1267
1268 prom_debug(" -> %x\n", addr);
1269 prom_debug(" alloc_bottom : %x\n", alloc_bottom);
1270 prom_debug(" alloc_top : %x\n", alloc_top);
1271 prom_debug(" alloc_top_hi : %x\n", alloc_top_high);
1272 prom_debug(" rmo_top : %x\n", rmo_top);
1273 prom_debug(" ram_top : %x\n", ram_top);
1274
1275 return addr;
1276}
1277
1278/*
1279 * Allocates memory downward, either from top of RMO, or if highmem
1280 * is set, from the top of RAM. Note that this one doesn't handle
1281 * failures. It does claim memory if highmem is not set.
1282 */
1283static unsigned long __init alloc_down(unsigned long size, unsigned long align,
1284 int highmem)
1285{
1286 unsigned long base, addr = 0;
1287
1288 prom_debug("alloc_down(%x, %x, %s)\n", size, align,
1289 highmem ? "(high)" : "(low)");
1290 if (ram_top == 0)
1291 prom_panic("alloc_down() called with mem not initialized\n");
1292
1293 if (highmem) {
1294 /* Carve out storage for the TCE table. */
1295 addr = _ALIGN_DOWN(alloc_top_high - size, align);
1296 if (addr <= alloc_bottom)
1297 return 0;
1298 /* Will we bump into the RMO ? If yes, check out that we
1299 * didn't overlap existing allocations there, if we did,
1300 * we are dead, we must be the first in town !
1301 */
1302 if (addr < rmo_top) {
1303 /* Good, we are first */
1304 if (alloc_top == rmo_top)
1305 alloc_top = rmo_top = addr;
1306 else
1307 return 0;
1308 }
1309 alloc_top_high = addr;
1310 goto bail;
1311 }
1312
1313 base = _ALIGN_DOWN(alloc_top - size, align);
1314 for (; base > alloc_bottom;
1315 base = _ALIGN_DOWN(base - 0x100000, align)) {
1316 prom_debug(" trying: 0x%x\n\r", base);
1317 addr = (unsigned long)prom_claim(base, size, 0);
1318 if (addr != PROM_ERROR && addr != 0)
1319 break;
1320 addr = 0;
1321 }
1322 if (addr == 0)
1323 return 0;
1324 alloc_top = addr;
1325
1326 bail:
1327 prom_debug(" -> %x\n", addr);
1328 prom_debug(" alloc_bottom : %x\n", alloc_bottom);
1329 prom_debug(" alloc_top : %x\n", alloc_top);
1330 prom_debug(" alloc_top_hi : %x\n", alloc_top_high);
1331 prom_debug(" rmo_top : %x\n", rmo_top);
1332 prom_debug(" ram_top : %x\n", ram_top);
1333
1334 return addr;
1335}
1336
1337/*
1338 * Parse a "reg" cell
1339 */
1340static unsigned long __init prom_next_cell(int s, cell_t **cellp)
1341{
1342 cell_t *p = *cellp;
1343 unsigned long r = 0;
1344
1345 /* Ignore more than 2 cells */
1346 while (s > sizeof(unsigned long) / 4) {
1347 p++;
1348 s--;
1349 }
1350 r = be32_to_cpu(*p++);
1351#ifdef CONFIG_PPC64
1352 if (s > 1) {
1353 r <<= 32;
1354 r |= be32_to_cpu(*(p++));
1355 }
1356#endif
1357 *cellp = p;
1358 return r;
1359}
1360
1361/*
1362 * Very dumb function for adding to the memory reserve list, but
1363 * we don't need anything smarter at this point
1364 *
1365 * XXX Eventually check for collisions. They should NEVER happen.
1366 * If problems seem to show up, it would be a good start to track
1367 * them down.
1368 */
1369static void __init reserve_mem(u64 base, u64 size)
1370{
1371 u64 top = base + size;
1372 unsigned long cnt = mem_reserve_cnt;
1373
1374 if (size == 0)
1375 return;
1376
1377 /* We need to always keep one empty entry so that we
1378 * have our terminator with "size" set to 0 since we are
1379 * dumb and just copy this entire array to the boot params
1380 */
1381 base = _ALIGN_DOWN(base, PAGE_SIZE);
1382 top = _ALIGN_UP(top, PAGE_SIZE);
1383 size = top - base;
1384
1385 if (cnt >= (MEM_RESERVE_MAP_SIZE - 1))
1386 prom_panic("Memory reserve map exhausted !\n");
1387 mem_reserve_map[cnt].base = cpu_to_be64(base);
1388 mem_reserve_map[cnt].size = cpu_to_be64(size);
1389 mem_reserve_cnt = cnt + 1;
1390}
1391
1392/*
 * Initialize memory allocation mechanism, parse "memory" nodes and
 * obtain that way the top of memory and RMO to setup our local allocator
1395 */
1396static void __init prom_init_mem(void)
1397{
1398 phandle node;
1399 char *path, type[64];
1400 unsigned int plen;
1401 cell_t *p, *endp;
1402 __be32 val;
1403 u32 rac, rsc;
1404
1405 /*
1406 * We iterate the memory nodes to find
1407 * 1) top of RMO (first node)
1408 * 2) top of memory
1409 */
1410 val = cpu_to_be32(2);
1411 prom_getprop(prom.root, "#address-cells", &val, sizeof(val));
1412 rac = be32_to_cpu(val);
1413 val = cpu_to_be32(1);
1414 prom_getprop(prom.root, "#size-cells", &val, sizeof(rsc));
1415 rsc = be32_to_cpu(val);
1416 prom_debug("root_addr_cells: %x\n", rac);
1417 prom_debug("root_size_cells: %x\n", rsc);
1418
1419 prom_debug("scanning memory:\n");
1420 path = prom_scratch;
1421
1422 for (node = 0; prom_next_node(&node); ) {
1423 type[0] = 0;
1424 prom_getprop(node, "device_type", type, sizeof(type));
1425
1426 if (type[0] == 0) {
1427 /*
1428 * CHRP Longtrail machines have no device_type
1429 * on the memory node, so check the name instead...
1430 */
1431 prom_getprop(node, "name", type, sizeof(type));
1432 }
1433 if (strcmp(type, "memory"))
1434 continue;
1435
1436 plen = prom_getprop(node, "reg", regbuf, sizeof(regbuf));
1437 if (plen > sizeof(regbuf)) {
1438 prom_printf("memory node too large for buffer !\n");
1439 plen = sizeof(regbuf);
1440 }
1441 p = regbuf;
1442 endp = p + (plen / sizeof(cell_t));
1443
1444#ifdef DEBUG_PROM
1445 memset(path, 0, PROM_SCRATCH_SIZE);
1446 call_prom("package-to-path", 3, 1, node, path, PROM_SCRATCH_SIZE-1);
1447 prom_debug(" node %s :\n", path);
1448#endif /* DEBUG_PROM */
1449
1450 while ((endp - p) >= (rac + rsc)) {
1451 unsigned long base, size;
1452
1453 base = prom_next_cell(rac, &p);
1454 size = prom_next_cell(rsc, &p);
1455
1456 if (size == 0)
1457 continue;
1458 prom_debug(" %x %x\n", base, size);
1459 if (base == 0 && (of_platform & PLATFORM_LPAR))
1460 rmo_top = size;
1461 if ((base + size) > ram_top)
1462 ram_top = base + size;
1463 }
1464 }
1465
1466 alloc_bottom = PAGE_ALIGN((unsigned long)&_end + 0x4000);
1467
1468 /*
1469 * If prom_memory_limit is set we reduce the upper limits *except* for
1470 * alloc_top_high. This must be the real top of RAM so we can put
1471 * TCE's up there.
1472 */
1473
1474 alloc_top_high = ram_top;
1475
1476 if (prom_memory_limit) {
1477 if (prom_memory_limit <= alloc_bottom) {
1478 prom_printf("Ignoring mem=%x <= alloc_bottom.\n",
1479 prom_memory_limit);
1480 prom_memory_limit = 0;
1481 } else if (prom_memory_limit >= ram_top) {
1482 prom_printf("Ignoring mem=%x >= ram_top.\n",
1483 prom_memory_limit);
1484 prom_memory_limit = 0;
1485 } else {
1486 ram_top = prom_memory_limit;
1487 rmo_top = min(rmo_top, prom_memory_limit);
1488 }
1489 }
1490
1491 /*
1492 * Setup our top alloc point, that is top of RMO or top of
1493 * segment 0 when running non-LPAR.
1494 * Some RS64 machines have buggy firmware where claims up at
1495 * 1GB fail. Cap at 768MB as a workaround.
1496 * Since 768MB is plenty of room, and we need to cap to something
1497 * reasonable on 32-bit, cap at 768MB on all machines.
1498 */
1499 if (!rmo_top)
1500 rmo_top = ram_top;
1501 rmo_top = min(0x30000000ul, rmo_top);
1502 alloc_top = rmo_top;
1503 alloc_top_high = ram_top;
1504
1505 /*
1506 * Check if we have an initrd after the kernel but still inside
1507 * the RMO. If we do move our bottom point to after it.
1508 */
1509 if (prom_initrd_start &&
1510 prom_initrd_start < rmo_top &&
1511 prom_initrd_end > alloc_bottom)
1512 alloc_bottom = PAGE_ALIGN(prom_initrd_end);
1513
1514 prom_printf("memory layout at init:\n");
1515 prom_printf(" memory_limit : %x (16 MB aligned)\n", prom_memory_limit);
1516 prom_printf(" alloc_bottom : %x\n", alloc_bottom);
1517 prom_printf(" alloc_top : %x\n", alloc_top);
1518 prom_printf(" alloc_top_hi : %x\n", alloc_top_high);
1519 prom_printf(" rmo_top : %x\n", rmo_top);
1520 prom_printf(" ram_top : %x\n", ram_top);
1521}
1522
1523static void __init prom_close_stdin(void)
1524{
1525 __be32 val;
1526 ihandle stdin;
1527
1528 if (prom_getprop(prom.chosen, "stdin", &val, sizeof(val)) > 0) {
1529 stdin = be32_to_cpu(val);
1530 call_prom("close", 1, 0, stdin);
1531 }
1532}
1533
1534#ifdef CONFIG_PPC_POWERNV
1535
1536#ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
/* OPAL runtime base address, saved by prom_instantiate_opal() */
1537static u64 __initdata prom_opal_base;
/* OPAL runtime entry point, saved by prom_instantiate_opal() */
1538static u64 __initdata prom_opal_entry;
1539#endif
1540
1541/*
1542 * Allocate room for and instantiate OPAL
1543 */
1544static void __init prom_instantiate_opal(void)
1545{
1546 phandle opal_node;
1547 ihandle opal_inst;
1548 u64 base, entry;
1549 u64 size = 0, align = 0x10000;
1550 __be64 val64;
1551 u32 rets[2];
1552
1553 prom_debug("prom_instantiate_opal: start...\n");
1554
1555 opal_node = call_prom("finddevice", 1, 1, ADDR("/ibm,opal"));
1556 prom_debug("opal_node: %x\n", opal_node);
1557 if (!PHANDLE_VALID(opal_node))
1558 return;
1559
1560 val64 = 0;
1561 prom_getprop(opal_node, "opal-runtime-size", &val64, sizeof(val64));
1562 size = be64_to_cpu(val64);
1563 if (size == 0)
1564 return;
1565 val64 = 0;
1566 prom_getprop(opal_node, "opal-runtime-alignment", &val64,sizeof(val64));
1567 align = be64_to_cpu(val64);
1568
1569 base = alloc_down(size, align, 0);
1570 if (base == 0) {
1571 prom_printf("OPAL allocation failed !\n");
1572 return;
1573 }
1574
1575 opal_inst = call_prom("open", 1, 1, ADDR("/ibm,opal"));
1576 if (!IHANDLE_VALID(opal_inst)) {
1577 prom_printf("opening opal package failed (%x)\n", opal_inst);
1578 return;
1579 }
1580
1581 prom_printf("instantiating opal at 0x%x...", base);
1582
1583 if (call_prom_ret("call-method", 4, 3, rets,
1584 ADDR("load-opal-runtime"),
1585 opal_inst,
1586 base >> 32, base & 0xffffffff) != 0
1587 || (rets[0] == 0 && rets[1] == 0)) {
1588 prom_printf(" failed\n");
1589 return;
1590 }
1591 entry = (((u64)rets[0]) << 32) | rets[1];
1592
1593 prom_printf(" done\n");
1594
1595 reserve_mem(base, size);
1596
1597 prom_debug("opal base = 0x%x\n", base);
1598 prom_debug("opal align = 0x%x\n", align);
1599 prom_debug("opal entry = 0x%x\n", entry);
1600 prom_debug("opal size = 0x%x\n", (long)size);
1601
1602 prom_setprop(opal_node, "/ibm,opal", "opal-base-address",
1603 &base, sizeof(base));
1604 prom_setprop(opal_node, "/ibm,opal", "opal-entry-address",
1605 &entry, sizeof(entry));
1606
1607#ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
1608 prom_opal_base = base;
1609 prom_opal_entry = entry;
1610#endif
1611 prom_debug("prom_instantiate_opal: end...\n");
1612}
1613
1614#endif /* CONFIG_PPC_POWERNV */
1615
1616/*
1617 * Allocate room for and instantiate RTAS
1618 */
1619static void __init prom_instantiate_rtas(void)
1620{
1621 phandle rtas_node;
1622 ihandle rtas_inst;
1623 u32 base, entry = 0;
1624 __be32 val;
1625 u32 size = 0;
1626
1627 prom_debug("prom_instantiate_rtas: start...\n");
1628
1629 rtas_node = call_prom("finddevice", 1, 1, ADDR("/rtas"));
1630 prom_debug("rtas_node: %x\n", rtas_node);
1631 if (!PHANDLE_VALID(rtas_node))
1632 return;
1633
1634 val = 0;
1635 prom_getprop(rtas_node, "rtas-size", &val, sizeof(size));
1636 size = be32_to_cpu(val);
1637 if (size == 0)
1638 return;
1639
1640 base = alloc_down(size, PAGE_SIZE, 0);
1641 if (base == 0)
1642 prom_panic("Could not allocate memory for RTAS\n");
1643
1644 rtas_inst = call_prom("open", 1, 1, ADDR("/rtas"));
1645 if (!IHANDLE_VALID(rtas_inst)) {
1646 prom_printf("opening rtas package failed (%x)\n", rtas_inst);
1647 return;
1648 }
1649
1650 prom_printf("instantiating rtas at 0x%x...", base);
1651
1652 if (call_prom_ret("call-method", 3, 2, &entry,
1653 ADDR("instantiate-rtas"),
1654 rtas_inst, base) != 0
1655 || entry == 0) {
1656 prom_printf(" failed\n");
1657 return;
1658 }
1659 prom_printf(" done\n");
1660
1661 reserve_mem(base, size);
1662
1663 val = cpu_to_be32(base);
1664 prom_setprop(rtas_node, "/rtas", "linux,rtas-base",
1665 &val, sizeof(val));
1666 val = cpu_to_be32(entry);
1667 prom_setprop(rtas_node, "/rtas", "linux,rtas-entry",
1668 &val, sizeof(val));
1669
1670 /* Check if it supports "query-cpu-stopped-state" */
1671 if (prom_getprop(rtas_node, "query-cpu-stopped-state",
1672 &val, sizeof(val)) != PROM_ERROR)
1673 rtas_has_query_cpu_stopped = true;
1674
1675 prom_debug("rtas base = 0x%x\n", base);
1676 prom_debug("rtas entry = 0x%x\n", entry);
1677 prom_debug("rtas size = 0x%x\n", (long)size);
1678
1679 prom_debug("prom_instantiate_rtas: end...\n");
1680}
1681
1682#ifdef CONFIG_PPC64
1683/*
1684 * Allocate room for and instantiate Stored Measurement Log (SML)
1685 */
1686static void __init prom_instantiate_sml(void)
1687{
1688 phandle ibmvtpm_node;
1689 ihandle ibmvtpm_inst;
1690 u32 entry = 0, size = 0, succ = 0;
1691 u64 base;
1692 __be32 val;
1693
1694 prom_debug("prom_instantiate_sml: start...\n");
1695
1696 ibmvtpm_node = call_prom("finddevice", 1, 1, ADDR("/vdevice/vtpm"));
1697 prom_debug("ibmvtpm_node: %x\n", ibmvtpm_node);
1698 if (!PHANDLE_VALID(ibmvtpm_node))
1699 return;
1700
1701 ibmvtpm_inst = call_prom("open", 1, 1, ADDR("/vdevice/vtpm"));
1702 if (!IHANDLE_VALID(ibmvtpm_inst)) {
1703 prom_printf("opening vtpm package failed (%x)\n", ibmvtpm_inst);
1704 return;
1705 }
1706
1707 if (prom_getprop(ibmvtpm_node, "ibm,sml-efi-reformat-supported",
1708 &val, sizeof(val)) != PROM_ERROR) {
1709 if (call_prom_ret("call-method", 2, 2, &succ,
1710 ADDR("reformat-sml-to-efi-alignment"),
1711 ibmvtpm_inst) != 0 || succ == 0) {
1712 prom_printf("Reformat SML to EFI alignment failed\n");
1713 return;
1714 }
1715
1716 if (call_prom_ret("call-method", 2, 2, &size,
1717 ADDR("sml-get-allocated-size"),
1718 ibmvtpm_inst) != 0 || size == 0) {
1719 prom_printf("SML get allocated size failed\n");
1720 return;
1721 }
1722 } else {
1723 if (call_prom_ret("call-method", 2, 2, &size,
1724 ADDR("sml-get-handover-size"),
1725 ibmvtpm_inst) != 0 || size == 0) {
1726 prom_printf("SML get handover size failed\n");
1727 return;
1728 }
1729 }
1730
1731 base = alloc_down(size, PAGE_SIZE, 0);
1732 if (base == 0)
1733 prom_panic("Could not allocate memory for sml\n");
1734
1735 prom_printf("instantiating sml at 0x%x...", base);
1736
1737 memset((void *)base, 0, size);
1738
1739 if (call_prom_ret("call-method", 4, 2, &entry,
1740 ADDR("sml-handover"),
1741 ibmvtpm_inst, size, base) != 0 || entry == 0) {
1742 prom_printf("SML handover failed\n");
1743 return;
1744 }
1745 prom_printf(" done\n");
1746
1747 reserve_mem(base, size);
1748
1749 prom_setprop(ibmvtpm_node, "/vdevice/vtpm", "linux,sml-base",
1750 &base, sizeof(base));
1751 prom_setprop(ibmvtpm_node, "/vdevice/vtpm", "linux,sml-size",
1752 &size, sizeof(size));
1753
1754 prom_debug("sml base = 0x%x\n", base);
1755 prom_debug("sml size = 0x%x\n", (long)size);
1756
1757 prom_debug("prom_instantiate_sml: end...\n");
1758}
1759
1760/*
1761 * Allocate room for and initialize TCE tables
1762 */
1763#ifdef __BIG_ENDIAN__
1764static void __init prom_initialize_tce_table(void)
1765{
1766 phandle node;
1767 ihandle phb_node;
1768 char compatible[64], type[64], model[64];
1769 char *path = prom_scratch;
1770 u64 base, align;
1771 u32 minalign, minsize;
1772 u64 tce_entry, *tce_entryp;
1773 u64 local_alloc_top, local_alloc_bottom;
1774 u64 i;
1775
1776 if (prom_iommu_off)
1777 return;
1778
1779 prom_debug("starting prom_initialize_tce_table\n");
1780
1781 /* Cache current top of allocs so we reserve a single block */
1782 local_alloc_top = alloc_top_high;
1783 local_alloc_bottom = local_alloc_top;
1784
1785 /* Search all nodes looking for PHBs. */
1786 for (node = 0; prom_next_node(&node); ) {
1787 compatible[0] = 0;
1788 type[0] = 0;
1789 model[0] = 0;
1790 prom_getprop(node, "compatible",
1791 compatible, sizeof(compatible));
1792 prom_getprop(node, "device_type", type, sizeof(type));
1793 prom_getprop(node, "model", model, sizeof(model));
1794
1795 if ((type[0] == 0) || (strstr(type, "pci") == NULL))
1796 continue;
1797
1798 /* Keep the old logic intact to avoid regression. */
1799 if (compatible[0] != 0) {
1800 if ((strstr(compatible, "python") == NULL) &&
1801 (strstr(compatible, "Speedwagon") == NULL) &&
1802 (strstr(compatible, "Winnipeg") == NULL))
1803 continue;
1804 } else if (model[0] != 0) {
1805 if ((strstr(model, "ython") == NULL) &&
1806 (strstr(model, "peedwagon") == NULL) &&
1807 (strstr(model, "innipeg") == NULL))
1808 continue;
1809 }
1810
1811 if (prom_getprop(node, "tce-table-minalign", &minalign,
1812 sizeof(minalign)) == PROM_ERROR)
1813 minalign = 0;
1814 if (prom_getprop(node, "tce-table-minsize", &minsize,
1815 sizeof(minsize)) == PROM_ERROR)
1816 minsize = 4UL << 20;
1817
1818 /*
1819 * Even though we read what OF wants, we just set the table
1820 * size to 4 MB. This is enough to map 2GB of PCI DMA space.
1821 * By doing this, we avoid the pitfalls of trying to DMA to
1822 * MMIO space and the DMA alias hole.
1823 */
1824 minsize = 4UL << 20;
1825
1826 /* Align to the greater of the align or size */
1827 align = max(minalign, minsize);
1828 base = alloc_down(minsize, align, 1);
1829 if (base == 0)
1830 prom_panic("ERROR, cannot find space for TCE table.\n");
1831 if (base < local_alloc_bottom)
1832 local_alloc_bottom = base;
1833
1834 /* It seems OF doesn't null-terminate the path :-( */
1835 memset(path, 0, PROM_SCRATCH_SIZE);
1836 /* Call OF to setup the TCE hardware */
1837 if (call_prom("package-to-path", 3, 1, node,
1838 path, PROM_SCRATCH_SIZE-1) == PROM_ERROR) {
1839 prom_printf("package-to-path failed\n");
1840 }
1841
1842 /* Save away the TCE table attributes for later use. */
1843 prom_setprop(node, path, "linux,tce-base", &base, sizeof(base));
1844 prom_setprop(node, path, "linux,tce-size", &minsize, sizeof(minsize));
1845
1846 prom_debug("TCE table: %s\n", path);
1847 prom_debug("\tnode = 0x%x\n", node);
1848 prom_debug("\tbase = 0x%x\n", base);
1849 prom_debug("\tsize = 0x%x\n", minsize);
1850
1851 /* Initialize the table to have a one-to-one mapping
1852 * over the allocated size.
1853 */
1854 tce_entryp = (u64 *)base;
1855 for (i = 0; i < (minsize >> 3) ;tce_entryp++, i++) {
1856 tce_entry = (i << PAGE_SHIFT);
1857 tce_entry |= 0x3;
1858 *tce_entryp = tce_entry;
1859 }
1860
1861 prom_printf("opening PHB %s", path);
1862 phb_node = call_prom("open", 1, 1, path);
1863 if (phb_node == 0)
1864 prom_printf("... failed\n");
1865 else
1866 prom_printf("... done\n");
1867
1868 call_prom("call-method", 6, 0, ADDR("set-64-bit-addressing"),
1869 phb_node, -1, minsize,
1870 (u32) base, (u32) (base >> 32));
1871 call_prom("close", 1, 0, phb_node);
1872 }
1873
1874 reserve_mem(local_alloc_bottom, local_alloc_top - local_alloc_bottom);
1875
1876 /* These are only really needed if there is a memory limit in
1877 * effect, but we don't know so export them always. */
1878 prom_tce_alloc_start = local_alloc_bottom;
1879 prom_tce_alloc_end = local_alloc_top;
1880
1881 /* Flag the first invalid entry */
1882 prom_debug("ending prom_initialize_tce_table\n");
1883}
1884#endif /* __BIG_ENDIAN__ */
1885#endif /* CONFIG_PPC64 */
1886
1887/*
1888 * With CHRP SMP we need to use the OF to start the other processors.
1889 * We can't wait until smp_boot_cpus (the OF is trashed by then)
1890 * so we have to put the processors into a holding pattern controlled
1891 * by the kernel (not OF) before we destroy the OF.
1892 *
1893 * This uses a chunk of low memory, puts some holding pattern
1894 * code there and sends the other processors off to there until
1895 * smp_boot_cpus tells them to do something. The holding pattern
1896 * checks that address until its cpu # is there, when it is that
1897 * cpu jumps to __secondary_start(). smp_boot_cpus() takes care
1898 * of setting those values.
1899 *
1900 * We also use physical address 0x4 here to tell when a cpu
1901 * is in its holding pattern code.
1902 *
1903 * -- Cort
1904 */
1905/*
1906 * We want to reference the copy of __secondary_hold_* in the
1907 * 0 - 0x100 address range
1908 */
1909#define LOW_ADDR(x) (((unsigned long) &(x)) & 0xff)
1910
1911static void __init prom_hold_cpus(void)
1912{
1913 unsigned long i;
1914 phandle node;
1915 char type[64];
1916 unsigned long *spinloop
1917 = (void *) LOW_ADDR(__secondary_hold_spinloop);
1918 unsigned long *acknowledge
1919 = (void *) LOW_ADDR(__secondary_hold_acknowledge);
1920 unsigned long secondary_hold = LOW_ADDR(__secondary_hold);
1921
1922 /*
1923 * On pseries, if RTAS supports "query-cpu-stopped-state",
1924 * we skip this stage, the CPUs will be started by the
1925 * kernel using RTAS.
1926 */
1927 if ((of_platform == PLATFORM_PSERIES ||
1928 of_platform == PLATFORM_PSERIES_LPAR) &&
1929 rtas_has_query_cpu_stopped) {
1930 prom_printf("prom_hold_cpus: skipped\n");
1931 return;
1932 }
1933
1934 prom_debug("prom_hold_cpus: start...\n");
1935 prom_debug(" 1) spinloop = 0x%x\n", (unsigned long)spinloop);
1936 prom_debug(" 1) *spinloop = 0x%x\n", *spinloop);
1937 prom_debug(" 1) acknowledge = 0x%x\n",
1938 (unsigned long)acknowledge);
1939 prom_debug(" 1) *acknowledge = 0x%x\n", *acknowledge);
1940 prom_debug(" 1) secondary_hold = 0x%x\n", secondary_hold);
1941
1942 /* Set the common spinloop variable, so all of the secondary cpus
1943 * will block when they are awakened from their OF spinloop.
1944 * This must occur for both SMP and non SMP kernels, since OF will
1945 * be trashed when we move the kernel.
1946 */
1947 *spinloop = 0;
1948
1949 /* look for cpus */
1950 for (node = 0; prom_next_node(&node); ) {
1951 unsigned int cpu_no;
1952 __be32 reg;
1953
1954 type[0] = 0;
1955 prom_getprop(node, "device_type", type, sizeof(type));
1956 if (strcmp(type, "cpu") != 0)
1957 continue;
1958
1959 /* Skip non-configured cpus. */
1960 if (prom_getprop(node, "status", type, sizeof(type)) > 0)
1961 if (strcmp(type, "okay") != 0)
1962 continue;
1963
1964 reg = cpu_to_be32(-1); /* make sparse happy */
1965 prom_getprop(node, "reg", ®, sizeof(reg));
1966 cpu_no = be32_to_cpu(reg);
1967
1968 prom_debug("cpu hw idx = %lu\n", cpu_no);
1969
1970 /* Init the acknowledge var which will be reset by
1971 * the secondary cpu when it awakens from its OF
1972 * spinloop.
1973 */
1974 *acknowledge = (unsigned long)-1;
1975
1976 if (cpu_no != prom.cpu) {
1977 /* Primary Thread of non-boot cpu or any thread */
1978 prom_printf("starting cpu hw idx %lu... ", cpu_no);
1979 call_prom("start-cpu", 3, 0, node,
1980 secondary_hold, cpu_no);
1981
1982 for (i = 0; (i < 100000000) &&
1983 (*acknowledge == ((unsigned long)-1)); i++ )
1984 mb();
1985
1986 if (*acknowledge == cpu_no)
1987 prom_printf("done\n");
1988 else
1989 prom_printf("failed: %x\n", *acknowledge);
1990 }
1991#ifdef CONFIG_SMP
1992 else
1993 prom_printf("boot cpu hw idx %lu\n", cpu_no);
1994#endif /* CONFIG_SMP */
1995 }
1996
1997 prom_debug("prom_hold_cpus: end...\n");
1998}
1999
2000
2001static void __init prom_init_client_services(unsigned long pp)
2002{
2003 /* Get a handle to the prom entry point before anything else */
2004 prom_entry = pp;
2005
2006 /* get a handle for the stdout device */
2007 prom.chosen = call_prom("finddevice", 1, 1, ADDR("/chosen"));
2008 if (!PHANDLE_VALID(prom.chosen))
2009 prom_panic("cannot find chosen"); /* msg won't be printed :( */
2010
2011 /* get device tree root */
2012 prom.root = call_prom("finddevice", 1, 1, ADDR("/"));
2013 if (!PHANDLE_VALID(prom.root))
2014 prom_panic("cannot find device tree root"); /* msg won't be printed :( */
2015
2016 prom.mmumap = 0;
2017}
2018
2019#ifdef CONFIG_PPC32
2020/*
2021 * For really old powermacs, we need to map things we claim.
2022 * For that, we need the ihandle of the mmu.
2023 * Also, on the longtrail, we need to work around other bugs.
2024 */
2025static void __init prom_find_mmu(void)
2026{
2027 phandle oprom;
2028 char version[64];
2029
2030 oprom = call_prom("finddevice", 1, 1, ADDR("/openprom"));
2031 if (!PHANDLE_VALID(oprom))
2032 return;
2033 if (prom_getprop(oprom, "model", version, sizeof(version)) <= 0)
2034 return;
2035 version[sizeof(version) - 1] = 0;
2036 /* XXX might need to add other versions here */
2037 if (strcmp(version, "Open Firmware, 1.0.5") == 0)
2038 of_workarounds = OF_WA_CLAIM;
2039 else if (strncmp(version, "FirmWorks,3.", 12) == 0) {
2040 of_workarounds = OF_WA_CLAIM | OF_WA_LONGTRAIL;
2041 call_prom("interpret", 1, 1, "dev /memory 0 to allow-reclaim");
2042 } else
2043 return;
2044 prom.memory = call_prom("open", 1, 1, ADDR("/memory"));
2045 prom_getprop(prom.chosen, "mmu", &prom.mmumap,
2046 sizeof(prom.mmumap));
2047 prom.mmumap = be32_to_cpu(prom.mmumap);
2048 if (!IHANDLE_VALID(prom.memory) || !IHANDLE_VALID(prom.mmumap))
2049 of_workarounds &= ~OF_WA_CLAIM; /* hmmm */
2050}
2051#else
2052#define prom_find_mmu()
2053#endif
2054
2055static void __init prom_init_stdout(void)
2056{
2057 char *path = of_stdout_device;
2058 char type[16];
2059 phandle stdout_node;
2060 __be32 val;
2061
2062 if (prom_getprop(prom.chosen, "stdout", &val, sizeof(val)) <= 0)
2063 prom_panic("cannot find stdout");
2064
2065 prom.stdout = be32_to_cpu(val);
2066
2067 /* Get the full OF pathname of the stdout device */
2068 memset(path, 0, 256);
2069 call_prom("instance-to-path", 3, 1, prom.stdout, path, 255);
2070 prom_printf("OF stdout device is: %s\n", of_stdout_device);
2071 prom_setprop(prom.chosen, "/chosen", "linux,stdout-path",
2072 path, strlen(path) + 1);
2073
2074 /* instance-to-package fails on PA-Semi */
2075 stdout_node = call_prom("instance-to-package", 1, 1, prom.stdout);
2076 if (stdout_node != PROM_ERROR) {
2077 val = cpu_to_be32(stdout_node);
2078 prom_setprop(prom.chosen, "/chosen", "linux,stdout-package",
2079 &val, sizeof(val));
2080
2081 /* If it's a display, note it */
2082 memset(type, 0, sizeof(type));
2083 prom_getprop(stdout_node, "device_type", type, sizeof(type));
2084 if (strcmp(type, "display") == 0)
2085 prom_setprop(stdout_node, path, "linux,boot-display", NULL, 0);
2086 }
2087}
2088
2089static int __init prom_find_machine_type(void)
2090{
2091 char compat[256];
2092 int len, i = 0;
2093#ifdef CONFIG_PPC64
2094 phandle rtas;
2095 int x;
2096#endif
2097
2098 /* Look for a PowerMac or a Cell */
2099 len = prom_getprop(prom.root, "compatible",
2100 compat, sizeof(compat)-1);
2101 if (len > 0) {
2102 compat[len] = 0;
2103 while (i < len) {
2104 char *p = &compat[i];
2105 int sl = strlen(p);
2106 if (sl == 0)
2107 break;
2108 if (strstr(p, "Power Macintosh") ||
2109 strstr(p, "MacRISC"))
2110 return PLATFORM_POWERMAC;
2111#ifdef CONFIG_PPC64
2112 /* We must make sure we don't detect the IBM Cell
2113 * blades as pSeries due to some firmware issues,
2114 * so we do it here.
2115 */
2116 if (strstr(p, "IBM,CBEA") ||
2117 strstr(p, "IBM,CPBW-1.0"))
2118 return PLATFORM_GENERIC;
2119#endif /* CONFIG_PPC64 */
2120 i += sl + 1;
2121 }
2122 }
2123#ifdef CONFIG_PPC64
2124 /* Try to detect OPAL */
2125 if (PHANDLE_VALID(call_prom("finddevice", 1, 1, ADDR("/ibm,opal"))))
2126 return PLATFORM_OPAL;
2127
2128 /* Try to figure out if it's an IBM pSeries or any other
2129 * PAPR compliant platform. We assume it is if :
2130 * - /device_type is "chrp" (please, do NOT use that for future
2131 * non-IBM designs !
2132 * - it has /rtas
2133 */
2134 len = prom_getprop(prom.root, "device_type",
2135 compat, sizeof(compat)-1);
2136 if (len <= 0)
2137 return PLATFORM_GENERIC;
2138 if (strcmp(compat, "chrp"))
2139 return PLATFORM_GENERIC;
2140
2141 /* Default to pSeries. We need to know if we are running LPAR */
2142 rtas = call_prom("finddevice", 1, 1, ADDR("/rtas"));
2143 if (!PHANDLE_VALID(rtas))
2144 return PLATFORM_GENERIC;
2145 x = prom_getproplen(rtas, "ibm,hypertas-functions");
2146 if (x != PROM_ERROR) {
2147 prom_debug("Hypertas detected, assuming LPAR !\n");
2148 return PLATFORM_PSERIES_LPAR;
2149 }
2150 return PLATFORM_PSERIES;
2151#else
2152 return PLATFORM_GENERIC;
2153#endif
2154}
2155
2156static int __init prom_set_color(ihandle ih, int i, int r, int g, int b)
2157{
2158 return call_prom("call-method", 6, 1, ADDR("color!"), ih, i, b, g, r);
2159}
2160
2161/*
2162 * If we have a display that we don't know how to drive,
2163 * we will want to try to execute OF's open method for it
2164 * later. However, OF will probably fall over if we do that
2165 * we've taken over the MMU.
2166 * So we check whether we will need to open the display,
2167 * and if so, open it now.
2168 */
2169static void __init prom_check_displays(void)
2170{
2171 char type[16], *path;
2172 phandle node;
2173 ihandle ih;
2174 int i;
2175
2176 static unsigned char default_colors[] = {
2177 0x00, 0x00, 0x00,
2178 0x00, 0x00, 0xaa,
2179 0x00, 0xaa, 0x00,
2180 0x00, 0xaa, 0xaa,
2181 0xaa, 0x00, 0x00,
2182 0xaa, 0x00, 0xaa,
2183 0xaa, 0xaa, 0x00,
2184 0xaa, 0xaa, 0xaa,
2185 0x55, 0x55, 0x55,
2186 0x55, 0x55, 0xff,
2187 0x55, 0xff, 0x55,
2188 0x55, 0xff, 0xff,
2189 0xff, 0x55, 0x55,
2190 0xff, 0x55, 0xff,
2191 0xff, 0xff, 0x55,
2192 0xff, 0xff, 0xff
2193 };
2194 const unsigned char *clut;
2195
2196 prom_debug("Looking for displays\n");
2197 for (node = 0; prom_next_node(&node); ) {
2198 memset(type, 0, sizeof(type));
2199 prom_getprop(node, "device_type", type, sizeof(type));
2200 if (strcmp(type, "display") != 0)
2201 continue;
2202
2203 /* It seems OF doesn't null-terminate the path :-( */
2204 path = prom_scratch;
2205 memset(path, 0, PROM_SCRATCH_SIZE);
2206
2207 /*
2208 * leave some room at the end of the path for appending extra
2209 * arguments
2210 */
2211 if (call_prom("package-to-path", 3, 1, node, path,
2212 PROM_SCRATCH_SIZE-10) == PROM_ERROR)
2213 continue;
2214 prom_printf("found display : %s, opening... ", path);
2215
2216 ih = call_prom("open", 1, 1, path);
2217 if (ih == 0) {
2218 prom_printf("failed\n");
2219 continue;
2220 }
2221
2222 /* Success */
2223 prom_printf("done\n");
2224 prom_setprop(node, path, "linux,opened", NULL, 0);
2225
2226 /* Setup a usable color table when the appropriate
2227 * method is available. Should update this to set-colors */
2228 clut = default_colors;
2229 for (i = 0; i < 16; i++, clut += 3)
2230 if (prom_set_color(ih, i, clut[0], clut[1],
2231 clut[2]) != 0)
2232 break;
2233
2234#ifdef CONFIG_LOGO_LINUX_CLUT224
2235 clut = PTRRELOC(logo_linux_clut224.clut);
2236 for (i = 0; i < logo_linux_clut224.clutsize; i++, clut += 3)
2237 if (prom_set_color(ih, i + 32, clut[0], clut[1],
2238 clut[2]) != 0)
2239 break;
2240#endif /* CONFIG_LOGO_LINUX_CLUT224 */
2241
2242#ifdef CONFIG_PPC_EARLY_DEBUG_BOOTX
2243 if (prom_getprop(node, "linux,boot-display", NULL, 0) !=
2244 PROM_ERROR) {
2245 u32 width, height, pitch, addr;
2246
2247 prom_printf("Setting btext !\n");
2248 prom_getprop(node, "width", &width, 4);
2249 prom_getprop(node, "height", &height, 4);
2250 prom_getprop(node, "linebytes", &pitch, 4);
2251 prom_getprop(node, "address", &addr, 4);
2252 prom_printf("W=%d H=%d LB=%d addr=0x%x\n",
2253 width, height, pitch, addr);
2254 btext_setup_display(width, height, 8, pitch, addr);
2255 }
2256#endif /* CONFIG_PPC_EARLY_DEBUG_BOOTX */
2257 }
2258}
2259
2260
2261/* Return (relocated) pointer to this much memory: moves initrd if reqd. */
2262static void __init *make_room(unsigned long *mem_start, unsigned long *mem_end,
2263 unsigned long needed, unsigned long align)
2264{
2265 void *ret;
2266
2267 *mem_start = _ALIGN(*mem_start, align);
2268 while ((*mem_start + needed) > *mem_end) {
2269 unsigned long room, chunk;
2270
2271 prom_debug("Chunk exhausted, claiming more at %x...\n",
2272 alloc_bottom);
2273 room = alloc_top - alloc_bottom;
2274 if (room > DEVTREE_CHUNK_SIZE)
2275 room = DEVTREE_CHUNK_SIZE;
2276 if (room < PAGE_SIZE)
2277 prom_panic("No memory for flatten_device_tree "
2278 "(no room)\n");
2279 chunk = alloc_up(room, 0);
2280 if (chunk == 0)
2281 prom_panic("No memory for flatten_device_tree "
2282 "(claim failed)\n");
2283 *mem_end = chunk + room;
2284 }
2285
2286 ret = (void *)*mem_start;
2287 *mem_start += needed;
2288
2289 return ret;
2290}
2291
/* Append @token as one 4-byte-aligned big-endian 32-bit cell */
#define dt_push_token(token, mem_start, mem_end) do {			\
		__be32 *dt_cell_ = make_room(mem_start, mem_end, 4, 4);	\
		*dt_cell_ = cpu_to_be32(token);				\
	} while (0)
2296
2297static unsigned long __init dt_find_string(char *str)
2298{
2299 char *s, *os;
2300
2301 s = os = (char *)dt_string_start;
2302 s += 4;
2303 while (s < (char *)dt_string_end) {
2304 if (strcmp(s, str) == 0)
2305 return s - os;
2306 s += strlen(s) + 1;
2307 }
2308 return 0;
2309}
2310
/*
 * The Open Firmware 1275 specification states property names must be
 * 31 bytes or less, however not all firmwares obey this. Make the name
 * buffers 64 bytes (terminating NUL included) to be safe.
 */
#define MAX_PROPERTY_NAME 64
2316
2317static void __init scan_dt_build_strings(phandle node,
2318 unsigned long *mem_start,
2319 unsigned long *mem_end)
2320{
2321 char *prev_name, *namep, *sstart;
2322 unsigned long soff;
2323 phandle child;
2324
2325 sstart = (char *)dt_string_start;
2326
2327 /* get and store all property names */
2328 prev_name = "";
2329 for (;;) {
2330 /* 64 is max len of name including nul. */
2331 namep = make_room(mem_start, mem_end, MAX_PROPERTY_NAME, 1);
2332 if (call_prom("nextprop", 3, 1, node, prev_name, namep) != 1) {
2333 /* No more nodes: unwind alloc */
2334 *mem_start = (unsigned long)namep;
2335 break;
2336 }
2337
2338 /* skip "name" */
2339 if (strcmp(namep, "name") == 0) {
2340 *mem_start = (unsigned long)namep;
2341 prev_name = "name";
2342 continue;
2343 }
2344 /* get/create string entry */
2345 soff = dt_find_string(namep);
2346 if (soff != 0) {
2347 *mem_start = (unsigned long)namep;
2348 namep = sstart + soff;
2349 } else {
2350 /* Trim off some if we can */
2351 *mem_start = (unsigned long)namep + strlen(namep) + 1;
2352 dt_string_end = *mem_start;
2353 }
2354 prev_name = namep;
2355 }
2356
2357 /* do all our children */
2358 child = call_prom("child", 1, 1, node);
2359 while (child != 0) {
2360 scan_dt_build_strings(child, mem_start, mem_end);
2361 child = call_prom("peer", 1, 1, child);
2362 }
2363}
2364
2365static void __init scan_dt_build_struct(phandle node, unsigned long *mem_start,
2366 unsigned long *mem_end)
2367{
2368 phandle child;
2369 char *namep, *prev_name, *sstart, *p, *ep, *lp, *path;
2370 unsigned long soff;
2371 unsigned char *valp;
2372 static char pname[MAX_PROPERTY_NAME];
2373 int l, room, has_phandle = 0;
2374
2375 dt_push_token(OF_DT_BEGIN_NODE, mem_start, mem_end);
2376
2377 /* get the node's full name */
2378 namep = (char *)*mem_start;
2379 room = *mem_end - *mem_start;
2380 if (room > 255)
2381 room = 255;
2382 l = call_prom("package-to-path", 3, 1, node, namep, room);
2383 if (l >= 0) {
2384 /* Didn't fit? Get more room. */
2385 if (l >= room) {
2386 if (l >= *mem_end - *mem_start)
2387 namep = make_room(mem_start, mem_end, l+1, 1);
2388 call_prom("package-to-path", 3, 1, node, namep, l);
2389 }
2390 namep[l] = '\0';
2391
2392 /* Fixup an Apple bug where they have bogus \0 chars in the
2393 * middle of the path in some properties, and extract
2394 * the unit name (everything after the last '/').
2395 */
2396 for (lp = p = namep, ep = namep + l; p < ep; p++) {
2397 if (*p == '/')
2398 lp = namep;
2399 else if (*p != 0)
2400 *lp++ = *p;
2401 }
2402 *lp = 0;
2403 *mem_start = _ALIGN((unsigned long)lp + 1, 4);
2404 }
2405
2406 /* get it again for debugging */
2407 path = prom_scratch;
2408 memset(path, 0, PROM_SCRATCH_SIZE);
2409 call_prom("package-to-path", 3, 1, node, path, PROM_SCRATCH_SIZE-1);
2410
2411 /* get and store all properties */
2412 prev_name = "";
2413 sstart = (char *)dt_string_start;
2414 for (;;) {
2415 if (call_prom("nextprop", 3, 1, node, prev_name,
2416 pname) != 1)
2417 break;
2418
2419 /* skip "name" */
2420 if (strcmp(pname, "name") == 0) {
2421 prev_name = "name";
2422 continue;
2423 }
2424
2425 /* find string offset */
2426 soff = dt_find_string(pname);
2427 if (soff == 0) {
2428 prom_printf("WARNING: Can't find string index for"
2429 " <%s>, node %s\n", pname, path);
2430 break;
2431 }
2432 prev_name = sstart + soff;
2433
2434 /* get length */
2435 l = call_prom("getproplen", 2, 1, node, pname);
2436
2437 /* sanity checks */
2438 if (l == PROM_ERROR)
2439 continue;
2440
2441 /* push property head */
2442 dt_push_token(OF_DT_PROP, mem_start, mem_end);
2443 dt_push_token(l, mem_start, mem_end);
2444 dt_push_token(soff, mem_start, mem_end);
2445
2446 /* push property content */
2447 valp = make_room(mem_start, mem_end, l, 4);
2448 call_prom("getprop", 4, 1, node, pname, valp, l);
2449 *mem_start = _ALIGN(*mem_start, 4);
2450
2451 if (!strcmp(pname, "phandle"))
2452 has_phandle = 1;
2453 }
2454
2455 /* Add a "linux,phandle" property if no "phandle" property already
2456 * existed (can happen with OPAL)
2457 */
2458 if (!has_phandle) {
2459 soff = dt_find_string("linux,phandle");
2460 if (soff == 0)
2461 prom_printf("WARNING: Can't find string index for"
2462 " <linux-phandle> node %s\n", path);
2463 else {
2464 dt_push_token(OF_DT_PROP, mem_start, mem_end);
2465 dt_push_token(4, mem_start, mem_end);
2466 dt_push_token(soff, mem_start, mem_end);
2467 valp = make_room(mem_start, mem_end, 4, 4);
2468 *(__be32 *)valp = cpu_to_be32(node);
2469 }
2470 }
2471
2472 /* do all our children */
2473 child = call_prom("child", 1, 1, node);
2474 while (child != 0) {
2475 scan_dt_build_struct(child, mem_start, mem_end);
2476 child = call_prom("peer", 1, 1, child);
2477 }
2478
2479 dt_push_token(OF_DT_END_NODE, mem_start, mem_end);
2480}
2481
2482static void __init flatten_device_tree(void)
2483{
2484 phandle root;
2485 unsigned long mem_start, mem_end, room;
2486 struct boot_param_header *hdr;
2487 char *namep;
2488 u64 *rsvmap;
2489
2490 /*
2491 * Check how much room we have between alloc top & bottom (+/- a
2492 * few pages), crop to 1MB, as this is our "chunk" size
2493 */
2494 room = alloc_top - alloc_bottom - 0x4000;
2495 if (room > DEVTREE_CHUNK_SIZE)
2496 room = DEVTREE_CHUNK_SIZE;
2497 prom_debug("starting device tree allocs at %x\n", alloc_bottom);
2498
2499 /* Now try to claim that */
2500 mem_start = (unsigned long)alloc_up(room, PAGE_SIZE);
2501 if (mem_start == 0)
2502 prom_panic("Can't allocate initial device-tree chunk\n");
2503 mem_end = mem_start + room;
2504
2505 /* Get root of tree */
2506 root = call_prom("peer", 1, 1, (phandle)0);
2507 if (root == (phandle)0)
2508 prom_panic ("couldn't get device tree root\n");
2509
2510 /* Build header and make room for mem rsv map */
2511 mem_start = _ALIGN(mem_start, 4);
2512 hdr = make_room(&mem_start, &mem_end,
2513 sizeof(struct boot_param_header), 4);
2514 dt_header_start = (unsigned long)hdr;
2515 rsvmap = make_room(&mem_start, &mem_end, sizeof(mem_reserve_map), 8);
2516
2517 /* Start of strings */
2518 mem_start = PAGE_ALIGN(mem_start);
2519 dt_string_start = mem_start;
2520 mem_start += 4; /* hole */
2521
2522 /* Add "linux,phandle" in there, we'll need it */
2523 namep = make_room(&mem_start, &mem_end, 16, 1);
2524 strcpy(namep, "linux,phandle");
2525 mem_start = (unsigned long)namep + strlen(namep) + 1;
2526
2527 /* Build string array */
2528 prom_printf("Building dt strings...\n");
2529 scan_dt_build_strings(root, &mem_start, &mem_end);
2530 dt_string_end = mem_start;
2531
2532 /* Build structure */
2533 mem_start = PAGE_ALIGN(mem_start);
2534 dt_struct_start = mem_start;
2535 prom_printf("Building dt structure...\n");
2536 scan_dt_build_struct(root, &mem_start, &mem_end);
2537 dt_push_token(OF_DT_END, &mem_start, &mem_end);
2538 dt_struct_end = PAGE_ALIGN(mem_start);
2539
2540 /* Finish header */
2541 hdr->boot_cpuid_phys = cpu_to_be32(prom.cpu);
2542 hdr->magic = cpu_to_be32(OF_DT_HEADER);
2543 hdr->totalsize = cpu_to_be32(dt_struct_end - dt_header_start);
2544 hdr->off_dt_struct = cpu_to_be32(dt_struct_start - dt_header_start);
2545 hdr->off_dt_strings = cpu_to_be32(dt_string_start - dt_header_start);
2546 hdr->dt_strings_size = cpu_to_be32(dt_string_end - dt_string_start);
2547 hdr->off_mem_rsvmap = cpu_to_be32(((unsigned long)rsvmap) - dt_header_start);
2548 hdr->version = cpu_to_be32(OF_DT_VERSION);
2549 /* Version 16 is not backward compatible */
2550 hdr->last_comp_version = cpu_to_be32(0x10);
2551
2552 /* Copy the reserve map in */
2553 memcpy(rsvmap, mem_reserve_map, sizeof(mem_reserve_map));
2554
2555#ifdef DEBUG_PROM
2556 {
2557 int i;
2558 prom_printf("reserved memory map:\n");
2559 for (i = 0; i < mem_reserve_cnt; i++)
2560 prom_printf(" %x - %x\n",
2561 be64_to_cpu(mem_reserve_map[i].base),
2562 be64_to_cpu(mem_reserve_map[i].size));
2563 }
2564#endif
2565 /* Bump mem_reserve_cnt to cause further reservations to fail
2566 * since it's too late.
2567 */
2568 mem_reserve_cnt = MEM_RESERVE_MAP_SIZE;
2569
2570 prom_printf("Device tree strings 0x%x -> 0x%x\n",
2571 dt_string_start, dt_string_end);
2572 prom_printf("Device tree struct 0x%x -> 0x%x\n",
2573 dt_struct_start, dt_struct_end);
2574}
2575
2576#ifdef CONFIG_PPC_MAPLE
2577/* PIBS Version 1.05.0000 04/26/2005 has an incorrect /ht/isa/ranges property.
2578 * The values are bad, and it doesn't even have the right number of cells. */
2579static void __init fixup_device_tree_maple(void)
2580{
2581 phandle isa;
2582 u32 rloc = 0x01002000; /* IO space; PCI device = 4 */
2583 u32 isa_ranges[6];
2584 char *name;
2585
2586 name = "/ht@0/isa@4";
2587 isa = call_prom("finddevice", 1, 1, ADDR(name));
2588 if (!PHANDLE_VALID(isa)) {
2589 name = "/ht@0/isa@6";
2590 isa = call_prom("finddevice", 1, 1, ADDR(name));
2591 rloc = 0x01003000; /* IO space; PCI device = 6 */
2592 }
2593 if (!PHANDLE_VALID(isa))
2594 return;
2595
2596 if (prom_getproplen(isa, "ranges") != 12)
2597 return;
2598 if (prom_getprop(isa, "ranges", isa_ranges, sizeof(isa_ranges))
2599 == PROM_ERROR)
2600 return;
2601
2602 if (isa_ranges[0] != 0x1 ||
2603 isa_ranges[1] != 0xf4000000 ||
2604 isa_ranges[2] != 0x00010000)
2605 return;
2606
2607 prom_printf("Fixing up bogus ISA range on Maple/Apache...\n");
2608
2609 isa_ranges[0] = 0x1;
2610 isa_ranges[1] = 0x0;
2611 isa_ranges[2] = rloc;
2612 isa_ranges[3] = 0x0;
2613 isa_ranges[4] = 0x0;
2614 isa_ranges[5] = 0x00010000;
2615 prom_setprop(isa, name, "ranges",
2616 isa_ranges, sizeof(isa_ranges));
2617}
2618
2619#define CPC925_MC_START 0xf8000000
2620#define CPC925_MC_LENGTH 0x1000000
2621/* The values for memory-controller don't have right number of cells */
2622static void __init fixup_device_tree_maple_memory_controller(void)
2623{
2624 phandle mc;
2625 u32 mc_reg[4];
2626 char *name = "/hostbridge@f8000000";
2627 u32 ac, sc;
2628
2629 mc = call_prom("finddevice", 1, 1, ADDR(name));
2630 if (!PHANDLE_VALID(mc))
2631 return;
2632
2633 if (prom_getproplen(mc, "reg") != 8)
2634 return;
2635
2636 prom_getprop(prom.root, "#address-cells", &ac, sizeof(ac));
2637 prom_getprop(prom.root, "#size-cells", &sc, sizeof(sc));
2638 if ((ac != 2) || (sc != 2))
2639 return;
2640
2641 if (prom_getprop(mc, "reg", mc_reg, sizeof(mc_reg)) == PROM_ERROR)
2642 return;
2643
2644 if (mc_reg[0] != CPC925_MC_START || mc_reg[1] != CPC925_MC_LENGTH)
2645 return;
2646
2647 prom_printf("Fixing up bogus hostbridge on Maple...\n");
2648
2649 mc_reg[0] = 0x0;
2650 mc_reg[1] = CPC925_MC_START;
2651 mc_reg[2] = 0x0;
2652 mc_reg[3] = CPC925_MC_LENGTH;
2653 prom_setprop(mc, name, "reg", mc_reg, sizeof(mc_reg));
2654}
2655#else
/* Without CONFIG_PPC_MAPLE both Maple fixups expand to nothing */
#define fixup_device_tree_maple()
#define fixup_device_tree_maple_memory_controller()
2658#endif
2659
2660#ifdef CONFIG_PPC_CHRP
2661/*
2662 * Pegasos and BriQ lacks the "ranges" property in the isa node
2663 * Pegasos needs decimal IRQ 14/15, not hexadecimal
2664 * Pegasos has the IDE configured in legacy mode, but advertised as native
2665 */
2666static void __init fixup_device_tree_chrp(void)
2667{
2668 phandle ph;
2669 u32 prop[6];
2670 u32 rloc = 0x01006000; /* IO space; PCI device = 12 */
2671 char *name;
2672 int rc;
2673
2674 name = "/pci@80000000/isa@c";
2675 ph = call_prom("finddevice", 1, 1, ADDR(name));
2676 if (!PHANDLE_VALID(ph)) {
2677 name = "/pci@ff500000/isa@6";
2678 ph = call_prom("finddevice", 1, 1, ADDR(name));
2679 rloc = 0x01003000; /* IO space; PCI device = 6 */
2680 }
2681 if (PHANDLE_VALID(ph)) {
2682 rc = prom_getproplen(ph, "ranges");
2683 if (rc == 0 || rc == PROM_ERROR) {
2684 prom_printf("Fixing up missing ISA range on Pegasos...\n");
2685
2686 prop[0] = 0x1;
2687 prop[1] = 0x0;
2688 prop[2] = rloc;
2689 prop[3] = 0x0;
2690 prop[4] = 0x0;
2691 prop[5] = 0x00010000;
2692 prom_setprop(ph, name, "ranges", prop, sizeof(prop));
2693 }
2694 }
2695
2696 name = "/pci@80000000/ide@C,1";
2697 ph = call_prom("finddevice", 1, 1, ADDR(name));
2698 if (PHANDLE_VALID(ph)) {
2699 prom_printf("Fixing up IDE interrupt on Pegasos...\n");
2700 prop[0] = 14;
2701 prop[1] = 0x0;
2702 prom_setprop(ph, name, "interrupts", prop, 2*sizeof(u32));
2703 prom_printf("Fixing up IDE class-code on Pegasos...\n");
2704 rc = prom_getprop(ph, "class-code", prop, sizeof(u32));
2705 if (rc == sizeof(u32)) {
2706 prop[0] &= ~0x5;
2707 prom_setprop(ph, name, "class-code", prop, sizeof(u32));
2708 }
2709 }
2710}
2711#else
/* Without CONFIG_PPC_CHRP the fixup expands to nothing */
#define fixup_device_tree_chrp()
2713#endif
2714
2715#if defined(CONFIG_PPC64) && defined(CONFIG_PPC_PMAC)
2716static void __init fixup_device_tree_pmac(void)
2717{
2718 phandle u3, i2c, mpic;
2719 u32 u3_rev;
2720 u32 interrupts[2];
2721 u32 parent;
2722
2723 /* Some G5s have a missing interrupt definition, fix it up here */
2724 u3 = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000"));
2725 if (!PHANDLE_VALID(u3))
2726 return;
2727 i2c = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000/i2c@f8001000"));
2728 if (!PHANDLE_VALID(i2c))
2729 return;
2730 mpic = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000/mpic@f8040000"));
2731 if (!PHANDLE_VALID(mpic))
2732 return;
2733
2734 /* check if proper rev of u3 */
2735 if (prom_getprop(u3, "device-rev", &u3_rev, sizeof(u3_rev))
2736 == PROM_ERROR)
2737 return;
2738 if (u3_rev < 0x35 || u3_rev > 0x39)
2739 return;
2740 /* does it need fixup ? */
2741 if (prom_getproplen(i2c, "interrupts") > 0)
2742 return;
2743
2744 prom_printf("fixing up bogus interrupts for u3 i2c...\n");
2745
2746 /* interrupt on this revision of u3 is number 0 and level */
2747 interrupts[0] = 0;
2748 interrupts[1] = 1;
2749 prom_setprop(i2c, "/u3@0,f8000000/i2c@f8001000", "interrupts",
2750 &interrupts, sizeof(interrupts));
2751 parent = (u32)mpic;
2752 prom_setprop(i2c, "/u3@0,f8000000/i2c@f8001000", "interrupt-parent",
2753 &parent, sizeof(parent));
2754}
2755#else
/* Unless both CONFIG_PPC64 and CONFIG_PPC_PMAC are set, the fixup expands to nothing */
#define fixup_device_tree_pmac()
2757#endif
2758
2759#ifdef CONFIG_PPC_EFIKA
2760/*
2761 * The MPC5200 FEC driver requires an phy-handle property to tell it how
2762 * to talk to the phy. If the phy-handle property is missing, then this
2763 * function is called to add the appropriate nodes and link it to the
2764 * ethernet node.
2765 */
2766static void __init fixup_device_tree_efika_add_phy(void)
2767{
2768 u32 node;
2769 char prop[64];
2770 int rv;
2771
2772 /* Check if /builtin/ethernet exists - bail if it doesn't */
2773 node = call_prom("finddevice", 1, 1, ADDR("/builtin/ethernet"));
2774 if (!PHANDLE_VALID(node))
2775 return;
2776
2777 /* Check if the phy-handle property exists - bail if it does */
2778 rv = prom_getprop(node, "phy-handle", prop, sizeof(prop));
2779 if (!rv)
2780 return;
2781
2782 /*
2783 * At this point the ethernet device doesn't have a phy described.
2784 * Now we need to add the missing phy node and linkage
2785 */
2786
2787 /* Check for an MDIO bus node - if missing then create one */
2788 node = call_prom("finddevice", 1, 1, ADDR("/builtin/mdio"));
2789 if (!PHANDLE_VALID(node)) {
2790 prom_printf("Adding Ethernet MDIO node\n");
2791 call_prom("interpret", 1, 1,
2792 " s\" /builtin\" find-device"
2793 " new-device"
2794 " 1 encode-int s\" #address-cells\" property"
2795 " 0 encode-int s\" #size-cells\" property"
2796 " s\" mdio\" device-name"
2797 " s\" fsl,mpc5200b-mdio\" encode-string"
2798 " s\" compatible\" property"
2799 " 0xf0003000 0x400 reg"
2800 " 0x2 encode-int"
2801 " 0x5 encode-int encode+"
2802 " 0x3 encode-int encode+"
2803 " s\" interrupts\" property"
2804 " finish-device");
2805 };
2806
2807 /* Check for a PHY device node - if missing then create one and
2808 * give it's phandle to the ethernet node */
2809 node = call_prom("finddevice", 1, 1,
2810 ADDR("/builtin/mdio/ethernet-phy"));
2811 if (!PHANDLE_VALID(node)) {
2812 prom_printf("Adding Ethernet PHY node\n");
2813 call_prom("interpret", 1, 1,
2814 " s\" /builtin/mdio\" find-device"
2815 " new-device"
2816 " s\" ethernet-phy\" device-name"
2817 " 0x10 encode-int s\" reg\" property"
2818 " my-self"
2819 " ihandle>phandle"
2820 " finish-device"
2821 " s\" /builtin/ethernet\" find-device"
2822 " encode-int"
2823 " s\" phy-handle\" property"
2824 " device-end");
2825 }
2826}
2827
2828static void __init fixup_device_tree_efika(void)
2829{
2830 int sound_irq[3] = { 2, 2, 0 };
2831 int bcomm_irq[3*16] = { 3,0,0, 3,1,0, 3,2,0, 3,3,0,
2832 3,4,0, 3,5,0, 3,6,0, 3,7,0,
2833 3,8,0, 3,9,0, 3,10,0, 3,11,0,
2834 3,12,0, 3,13,0, 3,14,0, 3,15,0 };
2835 u32 node;
2836 char prop[64];
2837 int rv, len;
2838
2839 /* Check if we're really running on a EFIKA */
2840 node = call_prom("finddevice", 1, 1, ADDR("/"));
2841 if (!PHANDLE_VALID(node))
2842 return;
2843
2844 rv = prom_getprop(node, "model", prop, sizeof(prop));
2845 if (rv == PROM_ERROR)
2846 return;
2847 if (strcmp(prop, "EFIKA5K2"))
2848 return;
2849
2850 prom_printf("Applying EFIKA device tree fixups\n");
2851
2852 /* Claiming to be 'chrp' is death */
2853 node = call_prom("finddevice", 1, 1, ADDR("/"));
2854 rv = prom_getprop(node, "device_type", prop, sizeof(prop));
2855 if (rv != PROM_ERROR && (strcmp(prop, "chrp") == 0))
2856 prom_setprop(node, "/", "device_type", "efika", sizeof("efika"));
2857
2858 /* CODEGEN,description is exposed in /proc/cpuinfo so
2859 fix that too */
2860 rv = prom_getprop(node, "CODEGEN,description", prop, sizeof(prop));
2861 if (rv != PROM_ERROR && (strstr(prop, "CHRP")))
2862 prom_setprop(node, "/", "CODEGEN,description",
2863 "Efika 5200B PowerPC System",
2864 sizeof("Efika 5200B PowerPC System"));
2865
2866 /* Fixup bestcomm interrupts property */
2867 node = call_prom("finddevice", 1, 1, ADDR("/builtin/bestcomm"));
2868 if (PHANDLE_VALID(node)) {
2869 len = prom_getproplen(node, "interrupts");
2870 if (len == 12) {
2871 prom_printf("Fixing bestcomm interrupts property\n");
2872 prom_setprop(node, "/builtin/bestcom", "interrupts",
2873 bcomm_irq, sizeof(bcomm_irq));
2874 }
2875 }
2876
2877 /* Fixup sound interrupts property */
2878 node = call_prom("finddevice", 1, 1, ADDR("/builtin/sound"));
2879 if (PHANDLE_VALID(node)) {
2880 rv = prom_getprop(node, "interrupts", prop, sizeof(prop));
2881 if (rv == PROM_ERROR) {
2882 prom_printf("Adding sound interrupts property\n");
2883 prom_setprop(node, "/builtin/sound", "interrupts",
2884 sound_irq, sizeof(sound_irq));
2885 }
2886 }
2887
2888 /* Make sure ethernet phy-handle property exists */
2889 fixup_device_tree_efika_add_phy();
2890}
2891#else
/* Without CONFIG_PPC_EFIKA the fixup expands to nothing */
#define fixup_device_tree_efika()
2893#endif
2894
2895#ifdef CONFIG_PPC_PASEMI_NEMO
2896/*
2897 * CFE supplied on Nemo is broken in several ways, biggest
2898 * problem is that it reassigns ISA interrupts to unused mpic ints.
2899 * Add an interrupt-controller property for the io-bridge to use
2900 * and correct the ints so we can attach them to an irq_domain
2901 */
2902static void __init fixup_device_tree_pasemi(void)
2903{
2904 u32 interrupts[2], parent, rval, val = 0;
2905 char *name, *pci_name;
2906 phandle iob, node;
2907
2908 /* Find the root pci node */
2909 name = "/pxp@0,e0000000";
2910 iob = call_prom("finddevice", 1, 1, ADDR(name));
2911 if (!PHANDLE_VALID(iob))
2912 return;
2913
2914 /* check if interrupt-controller node set yet */
2915 if (prom_getproplen(iob, "interrupt-controller") !=PROM_ERROR)
2916 return;
2917
2918 prom_printf("adding interrupt-controller property for SB600...\n");
2919
2920 prom_setprop(iob, name, "interrupt-controller", &val, 0);
2921
2922 pci_name = "/pxp@0,e0000000/pci@11";
2923 node = call_prom("finddevice", 1, 1, ADDR(pci_name));
2924 parent = ADDR(iob);
2925
2926 for( ; prom_next_node(&node); ) {
2927 /* scan each node for one with an interrupt */
2928 if (!PHANDLE_VALID(node))
2929 continue;
2930
2931 rval = prom_getproplen(node, "interrupts");
2932 if (rval == 0 || rval == PROM_ERROR)
2933 continue;
2934
2935 prom_getprop(node, "interrupts", &interrupts, sizeof(interrupts));
2936 if ((interrupts[0] < 212) || (interrupts[0] > 222))
2937 continue;
2938
2939 /* found a node, update both interrupts and interrupt-parent */
2940 if ((interrupts[0] >= 212) && (interrupts[0] <= 215))
2941 interrupts[0] -= 203;
2942 if ((interrupts[0] >= 216) && (interrupts[0] <= 220))
2943 interrupts[0] -= 213;
2944 if (interrupts[0] == 221)
2945 interrupts[0] = 14;
2946 if (interrupts[0] == 222)
2947 interrupts[0] = 8;
2948
2949 prom_setprop(node, pci_name, "interrupts", interrupts,
2950 sizeof(interrupts));
2951 prom_setprop(node, pci_name, "interrupt-parent", &parent,
2952 sizeof(parent));
2953 }
2954
2955 /*
2956 * The io-bridge has device_type set to 'io-bridge' change it to 'isa'
2957 * so that generic isa-bridge code can add the SB600 and its on-board
2958 * peripherals.
2959 */
2960 name = "/pxp@0,e0000000/io-bridge@0";
2961 iob = call_prom("finddevice", 1, 1, ADDR(name));
2962 if (!PHANDLE_VALID(iob))
2963 return;
2964
2965 /* device_type is already set, just change it. */
2966
2967 prom_printf("Changing device_type of SB600 node...\n");
2968
2969 prom_setprop(iob, name, "device_type", "isa", sizeof("isa"));
2970}
2971#else /* !CONFIG_PPC_PASEMI_NEMO */
/* Empty variant used when CONFIG_PPC_PASEMI_NEMO is not set */
static inline void fixup_device_tree_pasemi(void) { }
2973#endif
2974
/*
 * Run every platform-specific device tree fixup in turn.  A fixup
 * whose platform is not configured in is an empty macro or an empty
 * inline function, so its call costs nothing.
 */
static void __init fixup_device_tree(void)
{
	fixup_device_tree_maple();
	fixup_device_tree_maple_memory_controller();
	fixup_device_tree_chrp();
	fixup_device_tree_pmac();
	fixup_device_tree_efika();
	fixup_device_tree_pasemi();
}
2984
2985static void __init prom_find_boot_cpu(void)
2986{
2987 __be32 rval;
2988 ihandle prom_cpu;
2989 phandle cpu_pkg;
2990
2991 rval = 0;
2992 if (prom_getprop(prom.chosen, "cpu", &rval, sizeof(rval)) <= 0)
2993 return;
2994 prom_cpu = be32_to_cpu(rval);
2995
2996 cpu_pkg = call_prom("instance-to-package", 1, 1, prom_cpu);
2997
2998 if (!PHANDLE_VALID(cpu_pkg))
2999 return;
3000
3001 prom_getprop(cpu_pkg, "reg", &rval, sizeof(rval));
3002 prom.cpu = be32_to_cpu(rval);
3003
3004 prom_debug("Booting CPU hw index = %lu\n", prom.cpu);
3005}
3006
3007static void __init prom_check_initrd(unsigned long r3, unsigned long r4)
3008{
3009#ifdef CONFIG_BLK_DEV_INITRD
3010 if (r3 && r4 && r4 != 0xdeadbeef) {
3011 __be64 val;
3012
3013 prom_initrd_start = is_kernel_addr(r3) ? __pa(r3) : r3;
3014 prom_initrd_end = prom_initrd_start + r4;
3015
3016 val = cpu_to_be64(prom_initrd_start);
3017 prom_setprop(prom.chosen, "/chosen", "linux,initrd-start",
3018 &val, sizeof(val));
3019 val = cpu_to_be64(prom_initrd_end);
3020 prom_setprop(prom.chosen, "/chosen", "linux,initrd-end",
3021 &val, sizeof(val));
3022
3023 reserve_mem(prom_initrd_start,
3024 prom_initrd_end - prom_initrd_start);
3025
3026 prom_debug("initrd_start=0x%x\n", prom_initrd_start);
3027 prom_debug("initrd_end=0x%x\n", prom_initrd_end);
3028 }
3029#endif /* CONFIG_BLK_DEV_INITRD */
3030}
3031
3032#ifdef CONFIG_PPC64
3033#ifdef CONFIG_RELOCATABLE
/* With CONFIG_RELOCATABLE set, reloc_toc() is an empty function */
static void reloc_toc(void)
{
}

/* With CONFIG_RELOCATABLE set, unreloc_toc() is an empty function */
static void unreloc_toc(void)
{
}
3041#else
3042static void __reloc_toc(unsigned long offset, unsigned long nr_entries)
3043{
3044 unsigned long i;
3045 unsigned long *toc_entry;
3046
3047 /* Get the start of the TOC by using r2 directly. */
3048 asm volatile("addi %0,2,-0x8000" : "=b" (toc_entry));
3049
3050 for (i = 0; i < nr_entries; i++) {
3051 *toc_entry = *toc_entry + offset;
3052 toc_entry++;
3053 }
3054}
3055
3056static void reloc_toc(void)
3057{
3058 unsigned long offset = reloc_offset();
3059 unsigned long nr_entries =
3060 (__prom_init_toc_end - __prom_init_toc_start) / sizeof(long);
3061
3062 __reloc_toc(offset, nr_entries);
3063
3064 mb();
3065}
3066
3067static void unreloc_toc(void)
3068{
3069 unsigned long offset = reloc_offset();
3070 unsigned long nr_entries =
3071 (__prom_init_toc_end - __prom_init_toc_start) / sizeof(long);
3072
3073 mb();
3074
3075 __reloc_toc(-offset, nr_entries);
3076}
3077#endif
3078#endif
3079
3080/*
3081 * We enter here early on, when the Open Firmware prom is still
3082 * handling exceptions and the MMU hash table for us.
3083 */
3084
3085unsigned long __init prom_init(unsigned long r3, unsigned long r4,
3086 unsigned long pp,
3087 unsigned long r6, unsigned long r7,
3088 unsigned long kbase)
3089{
3090 unsigned long hdr;
3091
3092#ifdef CONFIG_PPC32
3093 unsigned long offset = reloc_offset();
3094 reloc_got2(offset);
3095#else
3096 reloc_toc();
3097#endif
3098
3099 /*
3100 * First zero the BSS
3101 */
3102 memset(&__bss_start, 0, __bss_stop - __bss_start);
3103
3104 /*
3105 * Init interface to Open Firmware, get some node references,
3106 * like /chosen
3107 */
3108 prom_init_client_services(pp);
3109
3110 /*
3111 * See if this OF is old enough that we need to do explicit maps
3112 * and other workarounds
3113 */
3114 prom_find_mmu();
3115
3116 /*
3117 * Init prom stdout device
3118 */
3119 prom_init_stdout();
3120
3121 prom_printf("Preparing to boot %s", linux_banner);
3122
3123 /*
3124 * Get default machine type. At this point, we do not differentiate
3125 * between pSeries SMP and pSeries LPAR
3126 */
3127 of_platform = prom_find_machine_type();
3128 prom_printf("Detected machine type: %x\n", of_platform);
3129
3130#ifndef CONFIG_NONSTATIC_KERNEL
3131 /* Bail if this is a kdump kernel. */
3132 if (PHYSICAL_START > 0)
3133 prom_panic("Error: You can't boot a kdump kernel from OF!\n");
3134#endif
3135
3136 /*
3137 * Check for an initrd
3138 */
3139 prom_check_initrd(r3, r4);
3140
3141 /*
3142 * Do early parsing of command line
3143 */
3144 early_cmdline_parse();
3145
3146#if defined(CONFIG_PPC_PSERIES) || defined(CONFIG_PPC_POWERNV)
3147 /*
3148 * On pSeries, inform the firmware about our capabilities
3149 */
3150 if (of_platform == PLATFORM_PSERIES ||
3151 of_platform == PLATFORM_PSERIES_LPAR)
3152 prom_send_capabilities();
3153#endif
3154
3155 /*
3156 * Copy the CPU hold code
3157 */
3158 if (of_platform != PLATFORM_POWERMAC)
3159 copy_and_flush(0, kbase, 0x100, 0);
3160
3161 /*
3162 * Initialize memory management within prom_init
3163 */
3164 prom_init_mem();
3165
3166 /*
3167 * Determine which cpu is actually running right _now_
3168 */
3169 prom_find_boot_cpu();
3170
3171 /*
3172 * Initialize display devices
3173 */
3174 prom_check_displays();
3175
3176#if defined(CONFIG_PPC64) && defined(__BIG_ENDIAN__)
3177 /*
3178 * Initialize IOMMU (TCE tables) on pSeries. Do that before anything else
3179 * that uses the allocator, we need to make sure we get the top of memory
3180 * available for us here...
3181 */
3182 if (of_platform == PLATFORM_PSERIES)
3183 prom_initialize_tce_table();
3184#endif
3185
3186 /*
3187 * On non-powermacs, try to instantiate RTAS. PowerMacs don't
3188 * have a usable RTAS implementation.
3189 */
3190 if (of_platform != PLATFORM_POWERMAC &&
3191 of_platform != PLATFORM_OPAL)
3192 prom_instantiate_rtas();
3193
3194#ifdef CONFIG_PPC_POWERNV
3195 if (of_platform == PLATFORM_OPAL)
3196 prom_instantiate_opal();
3197#endif /* CONFIG_PPC_POWERNV */
3198
3199#ifdef CONFIG_PPC64
3200 /* instantiate sml */
3201 prom_instantiate_sml();
3202#endif
3203
3204 /*
3205 * On non-powermacs, put all CPUs in spin-loops.
3206 *
3207 * PowerMacs use a different mechanism to spin CPUs
3208 *
3209 * (This must be done after instanciating RTAS)
3210 */
3211 if (of_platform != PLATFORM_POWERMAC &&
3212 of_platform != PLATFORM_OPAL)
3213 prom_hold_cpus();
3214
3215 /*
3216 * Fill in some infos for use by the kernel later on
3217 */
3218 if (prom_memory_limit) {
3219 __be64 val = cpu_to_be64(prom_memory_limit);
3220 prom_setprop(prom.chosen, "/chosen", "linux,memory-limit",
3221 &val, sizeof(val));
3222 }
3223#ifdef CONFIG_PPC64
3224 if (prom_iommu_off)
3225 prom_setprop(prom.chosen, "/chosen", "linux,iommu-off",
3226 NULL, 0);
3227
3228 if (prom_iommu_force_on)
3229 prom_setprop(prom.chosen, "/chosen", "linux,iommu-force-on",
3230 NULL, 0);
3231
3232 if (prom_tce_alloc_start) {
3233 prom_setprop(prom.chosen, "/chosen", "linux,tce-alloc-start",
3234 &prom_tce_alloc_start,
3235 sizeof(prom_tce_alloc_start));
3236 prom_setprop(prom.chosen, "/chosen", "linux,tce-alloc-end",
3237 &prom_tce_alloc_end,
3238 sizeof(prom_tce_alloc_end));
3239 }
3240#endif
3241
3242 /*
3243 * Fixup any known bugs in the device-tree
3244 */
3245 fixup_device_tree();
3246
3247 /*
3248 * Now finally create the flattened device-tree
3249 */
3250 prom_printf("copying OF device tree...\n");
3251 flatten_device_tree();
3252
3253 /*
3254 * in case stdin is USB and still active on IBM machines...
3255 * Unfortunately quiesce crashes on some powermacs if we have
3256 * closed stdin already (in particular the powerbook 101). It
3257 * appears that the OPAL version of OFW doesn't like it either.
3258 */
3259 if (of_platform != PLATFORM_POWERMAC &&
3260 of_platform != PLATFORM_OPAL)
3261 prom_close_stdin();
3262
3263 /*
3264 * Call OF "quiesce" method to shut down pending DMA's from
3265 * devices etc...
3266 */
3267 prom_printf("Quiescing Open Firmware ...\n");
3268 call_prom("quiesce", 0, 0);
3269
3270 /*
3271 * And finally, call the kernel passing it the flattened device
3272 * tree and NULL as r5, thus triggering the new entry point which
3273 * is common to us and kexec
3274 */
3275 hdr = dt_header_start;
3276
3277 /* Don't print anything after quiesce under OPAL, it crashes OFW */
3278 if (of_platform != PLATFORM_OPAL) {
3279 prom_printf("Booting Linux via __start() @ 0x%lx ...\n", kbase);
3280 prom_debug("->dt_header_start=0x%x\n", hdr);
3281 }
3282
3283#ifdef CONFIG_PPC32
3284 reloc_got2(-offset);
3285#else
3286 unreloc_toc();
3287#endif
3288
3289#ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
3290 /* OPAL early debug gets the OPAL base & entry in r8 and r9 */
3291 __start(hdr, kbase, 0, 0, 0,
3292 prom_opal_base, prom_opal_entry);
3293#else
3294 __start(hdr, kbase, 0, 0, 0, 0, 0);
3295#endif
3296
3297 return 0;
3298}