GNU Linux-libre 4.19.304-gnu1
[releases.git] / arch / powerpc / kernel / prom_init.c
1 /*
2  * Procedures for interfacing to Open Firmware.
3  *
4  * Paul Mackerras       August 1996.
5  * Copyright (C) 1996-2005 Paul Mackerras.
6  * 
7  *  Adapted for 64bit PowerPC by Dave Engebretsen and Peter Bergner.
8  *    {engebret|bergner}@us.ibm.com 
9  *
10  *      This program is free software; you can redistribute it and/or
11  *      modify it under the terms of the GNU General Public License
12  *      as published by the Free Software Foundation; either version
13  *      2 of the License, or (at your option) any later version.
14  */
15
16 #undef DEBUG_PROM
17
18 /* we cannot use FORTIFY as it brings in new symbols */
19 #define __NO_FORTIFY
20
21 #include <stdarg.h>
22 #include <linux/kernel.h>
23 #include <linux/string.h>
24 #include <linux/init.h>
25 #include <linux/threads.h>
26 #include <linux/spinlock.h>
27 #include <linux/types.h>
28 #include <linux/pci.h>
29 #include <linux/proc_fs.h>
30 #include <linux/delay.h>
31 #include <linux/initrd.h>
32 #include <linux/bitops.h>
33 #include <asm/prom.h>
34 #include <asm/rtas.h>
35 #include <asm/page.h>
36 #include <asm/processor.h>
37 #include <asm/irq.h>
38 #include <asm/io.h>
39 #include <asm/smp.h>
40 #include <asm/mmu.h>
41 #include <asm/pgtable.h>
42 #include <asm/iommu.h>
43 #include <asm/btext.h>
44 #include <asm/sections.h>
45 #include <asm/machdep.h>
46 #include <asm/opal.h>
47 #include <asm/asm-prototypes.h>
48
49 #include <linux/linux_logo.h>
50
51 /*
52  * Eventually bump that one up
53  */
54 #define DEVTREE_CHUNK_SIZE      0x100000
55
56 /*
57  * This is the size of the local memory reserve map that gets copied
58  * into the boot params passed to the kernel. That size is totally
59  * flexible as the kernel just reads the list until it encounters an
60  * entry with size 0, so it can be changed without breaking binary
61  * compatibility
62  */
63 #define MEM_RESERVE_MAP_SIZE    8
64
65 /*
66  * prom_init() is called very early on, before the kernel text
67  * and data have been mapped to KERNELBASE.  At this point the code
68  * is running at whatever address it has been loaded at.
69  * On ppc32 we compile with -mrelocatable, which means that references
70  * to extern and static variables get relocated automatically.
71  * ppc64 objects are always relocatable, we just need to relocate the
72  * TOC.
73  *
74  * Because OF may have mapped I/O devices into the area starting at
75  * KERNELBASE, particularly on CHRP machines, we can't safely call
76  * OF once the kernel has been mapped to KERNELBASE.  Therefore all
77  * OF calls must be done within prom_init().
78  *
79  * ADDR is used in calls to call_prom.  The 4th and following
80  * arguments to call_prom should be 32-bit values.
81  * On ppc64, 64 bit values are truncated to 32 bits (and
82  * fortunately don't get interpreted as two arguments).
83  */
84 #define ADDR(x)         (u32)(unsigned long)(x)
85
86 #ifdef CONFIG_PPC64
87 #define OF_WORKAROUNDS  0
88 #else
89 #define OF_WORKAROUNDS  of_workarounds
90 int of_workarounds;
91 #endif
92
93 #define OF_WA_CLAIM     1       /* do phys/virt claim separately, then map */
94 #define OF_WA_LONGTRAIL 2       /* work around longtrail bugs */
95
96 #define PROM_BUG() do {                                         \
97         prom_printf("kernel BUG at %s line 0x%x!\n",            \
98                     __FILE__, __LINE__);                        \
99         __asm__ __volatile__(".long " BUG_ILLEGAL_INSTR);       \
100 } while (0)
101
102 #ifdef DEBUG_PROM
103 #define prom_debug(x...)        prom_printf(x)
104 #else
105 #define prom_debug(x...)        do { } while (0)
106 #endif
107
108
109 typedef u32 prom_arg_t;
110
111 struct prom_args {
112         __be32 service;
113         __be32 nargs;
114         __be32 nret;
115         __be32 args[10];
116 };
117
118 struct prom_t {
119         ihandle root;
120         phandle chosen;
121         int cpu;
122         ihandle stdout;
123         ihandle mmumap;
124         ihandle memory;
125 };
126
127 struct mem_map_entry {
128         __be64  base;
129         __be64  size;
130 };
131
132 typedef __be32 cell_t;
133
134 extern void __start(unsigned long r3, unsigned long r4, unsigned long r5,
135                     unsigned long r6, unsigned long r7, unsigned long r8,
136                     unsigned long r9);
137
138 #ifdef CONFIG_PPC64
139 extern int enter_prom(struct prom_args *args, unsigned long entry);
140 #else
141 static inline int enter_prom(struct prom_args *args, unsigned long entry)
142 {
143         return ((int (*)(struct prom_args *))entry)(args);
144 }
145 #endif
146
147 extern void copy_and_flush(unsigned long dest, unsigned long src,
148                            unsigned long size, unsigned long offset);
149
150 /* prom structure */
151 static struct prom_t __initdata prom;
152
153 static unsigned long prom_entry __initdata;
154
155 #define PROM_SCRATCH_SIZE 256
156
157 static char __initdata of_stdout_device[256];
158 static char __initdata prom_scratch[PROM_SCRATCH_SIZE];
159
160 static unsigned long __initdata dt_header_start;
161 static unsigned long __initdata dt_struct_start, dt_struct_end;
162 static unsigned long __initdata dt_string_start, dt_string_end;
163
164 static unsigned long __initdata prom_initrd_start, prom_initrd_end;
165
166 #ifdef CONFIG_PPC64
167 static int __initdata prom_iommu_force_on;
168 static int __initdata prom_iommu_off;
169 static unsigned long __initdata prom_tce_alloc_start;
170 static unsigned long __initdata prom_tce_alloc_end;
171 #endif
172
173 static bool prom_radix_disable __initdata = !IS_ENABLED(CONFIG_PPC_RADIX_MMU_DEFAULT);
174
175 struct platform_support {
176         bool hash_mmu;
177         bool radix_mmu;
178         bool radix_gtse;
179         bool xive;
180 };
181
182 /* Platforms codes are now obsolete in the kernel. Now only used within this
183  * file and ultimately gone too. Feel free to change them if you need, they
184  * are not shared with anything outside of this file anymore
185  */
186 #define PLATFORM_PSERIES        0x0100
187 #define PLATFORM_PSERIES_LPAR   0x0101
188 #define PLATFORM_LPAR           0x0001
189 #define PLATFORM_POWERMAC       0x0400
190 #define PLATFORM_GENERIC        0x0500
191 #define PLATFORM_OPAL           0x0600
192
193 static int __initdata of_platform;
194
195 static char __initdata prom_cmd_line[COMMAND_LINE_SIZE];
196
197 static unsigned long __initdata prom_memory_limit;
198
199 static unsigned long __initdata alloc_top;
200 static unsigned long __initdata alloc_top_high;
201 static unsigned long __initdata alloc_bottom;
202 static unsigned long __initdata rmo_top;
203 static unsigned long __initdata ram_top;
204
205 static struct mem_map_entry __initdata mem_reserve_map[MEM_RESERVE_MAP_SIZE];
206 static int __initdata mem_reserve_cnt;
207
208 static cell_t __initdata regbuf[1024];
209
210 static bool rtas_has_query_cpu_stopped;
211
212
213 /*
214  * Error results ... some OF calls will return "-1" on error, some
215  * will return 0, some will return either. To simplify, here are
216  * macros to use with any ihandle or phandle return value to check if
217  * it is valid
218  */
219
220 #define PROM_ERROR              (-1u)
221 #define PHANDLE_VALID(p)        ((p) != 0 && (p) != PROM_ERROR)
222 #define IHANDLE_VALID(i)        ((i) != 0 && (i) != PROM_ERROR)
223
224
225 /* This is the one and *ONLY* place where we actually call open
226  * firmware.
227  */
228
229 static int __init call_prom(const char *service, int nargs, int nret, ...)
230 {
231         int i;
232         struct prom_args args;
233         va_list list;
234
235         args.service = cpu_to_be32(ADDR(service));
236         args.nargs = cpu_to_be32(nargs);
237         args.nret = cpu_to_be32(nret);
238
239         va_start(list, nret);
240         for (i = 0; i < nargs; i++)
241                 args.args[i] = cpu_to_be32(va_arg(list, prom_arg_t));
242         va_end(list);
243
244         for (i = 0; i < nret; i++)
245                 args.args[nargs+i] = 0;
246
247         if (enter_prom(&args, prom_entry) < 0)
248                 return PROM_ERROR;
249
250         return (nret > 0) ? be32_to_cpu(args.args[nargs]) : 0;
251 }
252
253 static int __init call_prom_ret(const char *service, int nargs, int nret,
254                                 prom_arg_t *rets, ...)
255 {
256         int i;
257         struct prom_args args;
258         va_list list;
259
260         args.service = cpu_to_be32(ADDR(service));
261         args.nargs = cpu_to_be32(nargs);
262         args.nret = cpu_to_be32(nret);
263
264         va_start(list, rets);
265         for (i = 0; i < nargs; i++)
266                 args.args[i] = cpu_to_be32(va_arg(list, prom_arg_t));
267         va_end(list);
268
269         for (i = 0; i < nret; i++)
270                 args.args[nargs+i] = 0;
271
272         if (enter_prom(&args, prom_entry) < 0)
273                 return PROM_ERROR;
274
275         if (rets != NULL)
276                 for (i = 1; i < nret; ++i)
277                         rets[i-1] = be32_to_cpu(args.args[nargs+i]);
278
279         return (nret > 0) ? be32_to_cpu(args.args[nargs]) : 0;
280 }
281
282
283 static void __init prom_print(const char *msg)
284 {
285         const char *p, *q;
286
287         if (prom.stdout == 0)
288                 return;
289
290         for (p = msg; *p != 0; p = q) {
291                 for (q = p; *q != 0 && *q != '\n'; ++q)
292                         ;
293                 if (q > p)
294                         call_prom("write", 3, 1, prom.stdout, p, q - p);
295                 if (*q == 0)
296                         break;
297                 ++q;
298                 call_prom("write", 3, 1, prom.stdout, ADDR("\r\n"), 2);
299         }
300 }
301
302
303 /*
304  * Both prom_print_hex & prom_print_dec takes an unsigned long as input so that
305  * we do not need __udivdi3 or __umoddi3 on 32bits.
306  */
307 static void __init prom_print_hex(unsigned long val)
308 {
309         int i, nibbles = sizeof(val)*2;
310         char buf[sizeof(val)*2+1];
311
312         for (i = nibbles-1;  i >= 0;  i--) {
313                 buf[i] = (val & 0xf) + '0';
314                 if (buf[i] > '9')
315                         buf[i] += ('a'-'0'-10);
316                 val >>= 4;
317         }
318         buf[nibbles] = '\0';
319         call_prom("write", 3, 1, prom.stdout, buf, nibbles);
320 }
321
322 /* max number of decimal digits in an unsigned long */
323 #define UL_DIGITS 21
324 static void __init prom_print_dec(unsigned long val)
325 {
326         int i, size;
327         char buf[UL_DIGITS+1];
328
329         for (i = UL_DIGITS-1; i >= 0;  i--) {
330                 buf[i] = (val % 10) + '0';
331                 val = val/10;
332                 if (val == 0)
333                         break;
334         }
335         /* shift stuff down */
336         size = UL_DIGITS - i;
337         call_prom("write", 3, 1, prom.stdout, buf+i, size);
338 }
339
340 __printf(1, 2)
341 static void __init prom_printf(const char *format, ...)
342 {
343         const char *p, *q, *s;
344         va_list args;
345         unsigned long v;
346         long vs;
347         int n = 0;
348
349         va_start(args, format);
350         for (p = format; *p != 0; p = q) {
351                 for (q = p; *q != 0 && *q != '\n' && *q != '%'; ++q)
352                         ;
353                 if (q > p)
354                         call_prom("write", 3, 1, prom.stdout, p, q - p);
355                 if (*q == 0)
356                         break;
357                 if (*q == '\n') {
358                         ++q;
359                         call_prom("write", 3, 1, prom.stdout,
360                                   ADDR("\r\n"), 2);
361                         continue;
362                 }
363                 ++q;
364                 if (*q == 0)
365                         break;
366                 while (*q == 'l') {
367                         ++q;
368                         ++n;
369                 }
370                 switch (*q) {
371                 case 's':
372                         ++q;
373                         s = va_arg(args, const char *);
374                         prom_print(s);
375                         break;
376                 case 'x':
377                         ++q;
378                         switch (n) {
379                         case 0:
380                                 v = va_arg(args, unsigned int);
381                                 break;
382                         case 1:
383                                 v = va_arg(args, unsigned long);
384                                 break;
385                         case 2:
386                         default:
387                                 v = va_arg(args, unsigned long long);
388                                 break;
389                         }
390                         prom_print_hex(v);
391                         break;
392                 case 'u':
393                         ++q;
394                         switch (n) {
395                         case 0:
396                                 v = va_arg(args, unsigned int);
397                                 break;
398                         case 1:
399                                 v = va_arg(args, unsigned long);
400                                 break;
401                         case 2:
402                         default:
403                                 v = va_arg(args, unsigned long long);
404                                 break;
405                         }
406                         prom_print_dec(v);
407                         break;
408                 case 'd':
409                         ++q;
410                         switch (n) {
411                         case 0:
412                                 vs = va_arg(args, int);
413                                 break;
414                         case 1:
415                                 vs = va_arg(args, long);
416                                 break;
417                         case 2:
418                         default:
419                                 vs = va_arg(args, long long);
420                                 break;
421                         }
422                         if (vs < 0) {
423                                 prom_print("-");
424                                 vs = -vs;
425                         }
426                         prom_print_dec(vs);
427                         break;
428                 }
429         }
430         va_end(args);
431 }
432
433
434 static unsigned int __init prom_claim(unsigned long virt, unsigned long size,
435                                 unsigned long align)
436 {
437
438         if (align == 0 && (OF_WORKAROUNDS & OF_WA_CLAIM)) {
439                 /*
440                  * Old OF requires we claim physical and virtual separately
441                  * and then map explicitly (assuming virtual mode)
442                  */
443                 int ret;
444                 prom_arg_t result;
445
446                 ret = call_prom_ret("call-method", 5, 2, &result,
447                                     ADDR("claim"), prom.memory,
448                                     align, size, virt);
449                 if (ret != 0 || result == -1)
450                         return -1;
451                 ret = call_prom_ret("call-method", 5, 2, &result,
452                                     ADDR("claim"), prom.mmumap,
453                                     align, size, virt);
454                 if (ret != 0) {
455                         call_prom("call-method", 4, 1, ADDR("release"),
456                                   prom.memory, size, virt);
457                         return -1;
458                 }
459                 /* the 0x12 is M (coherence) + PP == read/write */
460                 call_prom("call-method", 6, 1,
461                           ADDR("map"), prom.mmumap, 0x12, size, virt, virt);
462                 return virt;
463         }
464         return call_prom("claim", 3, 1, (prom_arg_t)virt, (prom_arg_t)size,
465                          (prom_arg_t)align);
466 }
467
468 static void __init __attribute__((noreturn)) prom_panic(const char *reason)
469 {
470         prom_print(reason);
471         /* Do not call exit because it clears the screen on pmac
472          * it also causes some sort of double-fault on early pmacs */
473         if (of_platform == PLATFORM_POWERMAC)
474                 asm("trap\n");
475
476         /* ToDo: should put up an SRC here on pSeries */
477         call_prom("exit", 0, 0);
478
479         for (;;)                        /* should never get here */
480                 ;
481 }
482
483
484 static int __init prom_next_node(phandle *nodep)
485 {
486         phandle node;
487
488         if ((node = *nodep) != 0
489             && (*nodep = call_prom("child", 1, 1, node)) != 0)
490                 return 1;
491         if ((*nodep = call_prom("peer", 1, 1, node)) != 0)
492                 return 1;
493         for (;;) {
494                 if ((node = call_prom("parent", 1, 1, node)) == 0)
495                         return 0;
496                 if ((*nodep = call_prom("peer", 1, 1, node)) != 0)
497                         return 1;
498         }
499 }
500
501 static inline int prom_getprop(phandle node, const char *pname,
502                                void *value, size_t valuelen)
503 {
504         return call_prom("getprop", 4, 1, node, ADDR(pname),
505                          (u32)(unsigned long) value, (u32) valuelen);
506 }
507
508 static inline int prom_getproplen(phandle node, const char *pname)
509 {
510         return call_prom("getproplen", 2, 1, node, ADDR(pname));
511 }
512
513 static void add_string(char **str, const char *q)
514 {
515         char *p = *str;
516
517         while (*q)
518                 *p++ = *q++;
519         *p++ = ' ';
520         *str = p;
521 }
522
523 static char *tohex(unsigned int x)
524 {
525         static char digits[] = "0123456789abcdef";
526         static char result[9];
527         int i;
528
529         result[8] = 0;
530         i = 8;
531         do {
532                 --i;
533                 result[i] = digits[x & 0xf];
534                 x >>= 4;
535         } while (x != 0 && i > 0);
536         return &result[i];
537 }
538
539 static int __init prom_setprop(phandle node, const char *nodename,
540                                const char *pname, void *value, size_t valuelen)
541 {
542         char cmd[256], *p;
543
544         if (!(OF_WORKAROUNDS & OF_WA_LONGTRAIL))
545                 return call_prom("setprop", 4, 1, node, ADDR(pname),
546                                  (u32)(unsigned long) value, (u32) valuelen);
547
548         /* gah... setprop doesn't work on longtrail, have to use interpret */
549         p = cmd;
550         add_string(&p, "dev");
551         add_string(&p, nodename);
552         add_string(&p, tohex((u32)(unsigned long) value));
553         add_string(&p, tohex(valuelen));
554         add_string(&p, tohex(ADDR(pname)));
555         add_string(&p, tohex(strlen(pname)));
556         add_string(&p, "property");
557         *p = 0;
558         return call_prom("interpret", 1, 1, (u32)(unsigned long) cmd);
559 }
560
561 /* We can't use the standard versions because of relocation headaches. */
562 #define isxdigit(c)     (('0' <= (c) && (c) <= '9') \
563                          || ('a' <= (c) && (c) <= 'f') \
564                          || ('A' <= (c) && (c) <= 'F'))
565
566 #define isdigit(c)      ('0' <= (c) && (c) <= '9')
567 #define islower(c)      ('a' <= (c) && (c) <= 'z')
568 #define toupper(c)      (islower(c) ? ((c) - 'a' + 'A') : (c))
569
570 static unsigned long prom_strtoul(const char *cp, const char **endp)
571 {
572         unsigned long result = 0, base = 10, value;
573
574         if (*cp == '0') {
575                 base = 8;
576                 cp++;
577                 if (toupper(*cp) == 'X') {
578                         cp++;
579                         base = 16;
580                 }
581         }
582
583         while (isxdigit(*cp) &&
584                (value = isdigit(*cp) ? *cp - '0' : toupper(*cp) - 'A' + 10) < base) {
585                 result = result * base + value;
586                 cp++;
587         }
588
589         if (endp)
590                 *endp = cp;
591
592         return result;
593 }
594
595 static unsigned long prom_memparse(const char *ptr, const char **retptr)
596 {
597         unsigned long ret = prom_strtoul(ptr, retptr);
598         int shift = 0;
599
600         /*
601          * We can't use a switch here because GCC *may* generate a
602          * jump table which won't work, because we're not running at
603          * the address we're linked at.
604          */
605         if ('G' == **retptr || 'g' == **retptr)
606                 shift = 30;
607
608         if ('M' == **retptr || 'm' == **retptr)
609                 shift = 20;
610
611         if ('K' == **retptr || 'k' == **retptr)
612                 shift = 10;
613
614         if (shift) {
615                 ret <<= shift;
616                 (*retptr)++;
617         }
618
619         return ret;
620 }
621
622 /*
623  * Early parsing of the command line passed to the kernel, used for
624  * "mem=x" and the options that affect the iommu
625  */
626 static void __init early_cmdline_parse(void)
627 {
628         const char *opt;
629
630         char *p;
631         int l __maybe_unused = 0;
632
633         prom_cmd_line[0] = 0;
634         p = prom_cmd_line;
635         if ((long)prom.chosen > 0)
636                 l = prom_getprop(prom.chosen, "bootargs", p, COMMAND_LINE_SIZE-1);
637 #ifdef CONFIG_CMDLINE
638         if (l <= 0 || p[0] == '\0') /* dbl check */
639                 strlcpy(prom_cmd_line,
640                         CONFIG_CMDLINE, sizeof(prom_cmd_line));
641 #endif /* CONFIG_CMDLINE */
642         prom_printf("command line: %s\n", prom_cmd_line);
643
644 #ifdef CONFIG_PPC64
645         opt = strstr(prom_cmd_line, "iommu=");
646         if (opt) {
647                 prom_printf("iommu opt is: %s\n", opt);
648                 opt += 6;
649                 while (*opt && *opt == ' ')
650                         opt++;
651                 if (!strncmp(opt, "off", 3))
652                         prom_iommu_off = 1;
653                 else if (!strncmp(opt, "force", 5))
654                         prom_iommu_force_on = 1;
655         }
656 #endif
657         opt = strstr(prom_cmd_line, "mem=");
658         if (opt) {
659                 opt += 4;
660                 prom_memory_limit = prom_memparse(opt, (const char **)&opt);
661 #ifdef CONFIG_PPC64
662                 /* Align to 16 MB == size of ppc64 large page */
663                 prom_memory_limit = ALIGN(prom_memory_limit, 0x1000000);
664 #endif
665         }
666
667         opt = strstr(prom_cmd_line, "disable_radix");
668         if (opt) {
669                 opt += 13;
670                 if (*opt && *opt == '=') {
671                         bool val;
672
673                         if (kstrtobool(++opt, &val))
674                                 prom_radix_disable = false;
675                         else
676                                 prom_radix_disable = val;
677                 } else
678                         prom_radix_disable = true;
679         }
680         if (prom_radix_disable)
681                 prom_debug("Radix disabled from cmdline\n");
682 }
683
684 #if defined(CONFIG_PPC_PSERIES) || defined(CONFIG_PPC_POWERNV)
685 /*
686  * The architecture vector has an array of PVR mask/value pairs,
687  * followed by # option vectors - 1, followed by the option vectors.
688  *
689  * See prom.h for the definition of the bits specified in the
690  * architecture vector.
691  */
692
693 /* Firmware expects the value to be n - 1, where n is the # of vectors */
694 #define NUM_VECTORS(n)          ((n) - 1)
695
696 /*
697  * Firmware expects 1 + n - 2, where n is the length of the option vector in
698  * bytes. The 1 accounts for the length byte itself, the - 2 .. ?
699  */
700 #define VECTOR_LENGTH(n)        (1 + (n) - 2)
701
702 struct option_vector1 {
703         u8 byte1;
704         u8 arch_versions;
705         u8 arch_versions3;
706 } __packed;
707
708 struct option_vector2 {
709         u8 byte1;
710         __be16 reserved;
711         __be32 real_base;
712         __be32 real_size;
713         __be32 virt_base;
714         __be32 virt_size;
715         __be32 load_base;
716         __be32 min_rma;
717         __be32 min_load;
718         u8 min_rma_percent;
719         u8 max_pft_size;
720 } __packed;
721
722 struct option_vector3 {
723         u8 byte1;
724         u8 byte2;
725 } __packed;
726
727 struct option_vector4 {
728         u8 byte1;
729         u8 min_vp_cap;
730 } __packed;
731
732 struct option_vector5 {
733         u8 byte1;
734         u8 byte2;
735         u8 byte3;
736         u8 cmo;
737         u8 associativity;
738         u8 bin_opts;
739         u8 micro_checkpoint;
740         u8 reserved0;
741         __be32 max_cpus;
742         __be16 papr_level;
743         __be16 reserved1;
744         u8 platform_facilities;
745         u8 reserved2;
746         __be16 reserved3;
747         u8 subprocessors;
748         u8 byte22;
749         u8 intarch;
750         u8 mmu;
751         u8 hash_ext;
752         u8 radix_ext;
753 } __packed;
754
755 struct option_vector6 {
756         u8 reserved;
757         u8 secondary_pteg;
758         u8 os_name;
759 } __packed;
760
761 struct ibm_arch_vec {
762         struct { u32 mask, val; } pvrs[12];
763
764         u8 num_vectors;
765
766         u8 vec1_len;
767         struct option_vector1 vec1;
768
769         u8 vec2_len;
770         struct option_vector2 vec2;
771
772         u8 vec3_len;
773         struct option_vector3 vec3;
774
775         u8 vec4_len;
776         struct option_vector4 vec4;
777
778         u8 vec5_len;
779         struct option_vector5 vec5;
780
781         u8 vec6_len;
782         struct option_vector6 vec6;
783 } __packed;
784
785 struct ibm_arch_vec __cacheline_aligned ibm_architecture_vec = {
786         .pvrs = {
787                 {
788                         .mask = cpu_to_be32(0xfffe0000), /* POWER5/POWER5+ */
789                         .val  = cpu_to_be32(0x003a0000),
790                 },
791                 {
792                         .mask = cpu_to_be32(0xffff0000), /* POWER6 */
793                         .val  = cpu_to_be32(0x003e0000),
794                 },
795                 {
796                         .mask = cpu_to_be32(0xffff0000), /* POWER7 */
797                         .val  = cpu_to_be32(0x003f0000),
798                 },
799                 {
800                         .mask = cpu_to_be32(0xffff0000), /* POWER8E */
801                         .val  = cpu_to_be32(0x004b0000),
802                 },
803                 {
804                         .mask = cpu_to_be32(0xffff0000), /* POWER8NVL */
805                         .val  = cpu_to_be32(0x004c0000),
806                 },
807                 {
808                         .mask = cpu_to_be32(0xffff0000), /* POWER8 */
809                         .val  = cpu_to_be32(0x004d0000),
810                 },
811                 {
812                         .mask = cpu_to_be32(0xffff0000), /* POWER9 */
813                         .val  = cpu_to_be32(0x004e0000),
814                 },
815                 {
816                         .mask = cpu_to_be32(0xffffffff), /* all 3.00-compliant */
817                         .val  = cpu_to_be32(0x0f000005),
818                 },
819                 {
820                         .mask = cpu_to_be32(0xffffffff), /* all 2.07-compliant */
821                         .val  = cpu_to_be32(0x0f000004),
822                 },
823                 {
824                         .mask = cpu_to_be32(0xffffffff), /* all 2.06-compliant */
825                         .val  = cpu_to_be32(0x0f000003),
826                 },
827                 {
828                         .mask = cpu_to_be32(0xffffffff), /* all 2.05-compliant */
829                         .val  = cpu_to_be32(0x0f000002),
830                 },
831                 {
832                         .mask = cpu_to_be32(0xfffffffe), /* all 2.04-compliant and earlier */
833                         .val  = cpu_to_be32(0x0f000001),
834                 },
835         },
836
837         .num_vectors = NUM_VECTORS(6),
838
839         .vec1_len = VECTOR_LENGTH(sizeof(struct option_vector1)),
840         .vec1 = {
841                 .byte1 = 0,
842                 .arch_versions = OV1_PPC_2_00 | OV1_PPC_2_01 | OV1_PPC_2_02 | OV1_PPC_2_03 |
843                                  OV1_PPC_2_04 | OV1_PPC_2_05 | OV1_PPC_2_06 | OV1_PPC_2_07,
844                 .arch_versions3 = OV1_PPC_3_00,
845         },
846
847         .vec2_len = VECTOR_LENGTH(sizeof(struct option_vector2)),
848         /* option vector 2: Open Firmware options supported */
849         .vec2 = {
850                 .byte1 = OV2_REAL_MODE,
851                 .reserved = 0,
852                 .real_base = cpu_to_be32(0xffffffff),
853                 .real_size = cpu_to_be32(0xffffffff),
854                 .virt_base = cpu_to_be32(0xffffffff),
855                 .virt_size = cpu_to_be32(0xffffffff),
856                 .load_base = cpu_to_be32(0xffffffff),
857                 .min_rma = cpu_to_be32(512),            /* 512MB min RMA */
858                 .min_load = cpu_to_be32(0xffffffff),    /* full client load */
859                 .min_rma_percent = 0,   /* min RMA percentage of total RAM */
860                 .max_pft_size = 48,     /* max log_2(hash table size) */
861         },
862
863         .vec3_len = VECTOR_LENGTH(sizeof(struct option_vector3)),
864         /* option vector 3: processor options supported */
865         .vec3 = {
866                 .byte1 = 0,                     /* don't ignore, don't halt */
867                 .byte2 = OV3_FP | OV3_VMX | OV3_DFP,
868         },
869
870         .vec4_len = VECTOR_LENGTH(sizeof(struct option_vector4)),
871         /* option vector 4: IBM PAPR implementation */
872         .vec4 = {
873                 .byte1 = 0,                     /* don't halt */
874                 .min_vp_cap = OV4_MIN_ENT_CAP,  /* minimum VP entitled capacity */
875         },
876
877         .vec5_len = VECTOR_LENGTH(sizeof(struct option_vector5)),
878         /* option vector 5: PAPR/OF options */
879         .vec5 = {
880                 .byte1 = 0,                             /* don't ignore, don't halt */
881                 .byte2 = OV5_FEAT(OV5_LPAR) | OV5_FEAT(OV5_SPLPAR) | OV5_FEAT(OV5_LARGE_PAGES) |
882                 OV5_FEAT(OV5_DRCONF_MEMORY) | OV5_FEAT(OV5_DONATE_DEDICATE_CPU) |
883 #ifdef CONFIG_PCI_MSI
884                 /* PCIe/MSI support.  Without MSI full PCIe is not supported */
885                 OV5_FEAT(OV5_MSI),
886 #else
887                 0,
888 #endif
889                 .byte3 = 0,
890                 .cmo =
891 #ifdef CONFIG_PPC_SMLPAR
892                 OV5_FEAT(OV5_CMO) | OV5_FEAT(OV5_XCMO),
893 #else
894                 0,
895 #endif
896                 .associativity = OV5_FEAT(OV5_TYPE1_AFFINITY) | OV5_FEAT(OV5_PRRN),
897                 .bin_opts = OV5_FEAT(OV5_RESIZE_HPT) | OV5_FEAT(OV5_HP_EVT),
898                 .micro_checkpoint = 0,
899                 .reserved0 = 0,
900                 .max_cpus = cpu_to_be32(NR_CPUS),       /* number of cores supported */
901                 .papr_level = 0,
902                 .reserved1 = 0,
903                 .platform_facilities = OV5_FEAT(OV5_PFO_HW_RNG) | OV5_FEAT(OV5_PFO_HW_ENCR) | OV5_FEAT(OV5_PFO_HW_842),
904                 .reserved2 = 0,
905                 .reserved3 = 0,
906                 .subprocessors = 1,
907                 .byte22 = OV5_FEAT(OV5_DRMEM_V2) | OV5_FEAT(OV5_DRC_INFO),
908                 .intarch = 0,
909                 .mmu = 0,
910                 .hash_ext = 0,
911                 .radix_ext = 0,
912         },
913
914         /* option vector 6: IBM PAPR hints */
915         .vec6_len = VECTOR_LENGTH(sizeof(struct option_vector6)),
916         .vec6 = {
917                 .reserved = 0,
918                 .secondary_pteg = 0,
919                 .os_name = OV6_LINUX,
920         },
921 };
922
923 /* Old method - ELF header with PT_NOTE sections only works on BE */
924 #ifdef __BIG_ENDIAN__
925 static struct fake_elf {
926         Elf32_Ehdr      elfhdr;
927         Elf32_Phdr      phdr[2];
928         struct chrpnote {
929                 u32     namesz;
930                 u32     descsz;
931                 u32     type;
932                 char    name[8];        /* "PowerPC" */
933                 struct chrpdesc {
934                         u32     real_mode;
935                         u32     real_base;
936                         u32     real_size;
937                         u32     virt_base;
938                         u32     virt_size;
939                         u32     load_base;
940                 } chrpdesc;
941         } chrpnote;
942         struct rpanote {
943                 u32     namesz;
944                 u32     descsz;
945                 u32     type;
946                 char    name[24];       /* "IBM,RPA-Client-Config" */
947                 struct rpadesc {
948                         u32     lpar_affinity;
949                         u32     min_rmo_size;
950                         u32     min_rmo_percent;
951                         u32     max_pft_size;
952                         u32     splpar;
953                         u32     min_load;
954                         u32     new_mem_def;
955                         u32     ignore_me;
956                 } rpadesc;
957         } rpanote;
958 } fake_elf = {
959         .elfhdr = {
960                 .e_ident = { 0x7f, 'E', 'L', 'F',
961                              ELFCLASS32, ELFDATA2MSB, EV_CURRENT },
962                 .e_type = ET_EXEC,      /* yeah right */
963                 .e_machine = EM_PPC,
964                 .e_version = EV_CURRENT,
965                 .e_phoff = offsetof(struct fake_elf, phdr),
966                 .e_phentsize = sizeof(Elf32_Phdr),
967                 .e_phnum = 2
968         },
969         .phdr = {
970                 [0] = {
971                         .p_type = PT_NOTE,
972                         .p_offset = offsetof(struct fake_elf, chrpnote),
973                         .p_filesz = sizeof(struct chrpnote)
974                 }, [1] = {
975                         .p_type = PT_NOTE,
976                         .p_offset = offsetof(struct fake_elf, rpanote),
977                         .p_filesz = sizeof(struct rpanote)
978                 }
979         },
980         .chrpnote = {
981                 .namesz = sizeof("PowerPC"),
982                 .descsz = sizeof(struct chrpdesc),
983                 .type = 0x1275,
984                 .name = "PowerPC",
985                 .chrpdesc = {
986                         .real_mode = ~0U,       /* ~0 means "don't care" */
987                         .real_base = ~0U,
988                         .real_size = ~0U,
989                         .virt_base = ~0U,
990                         .virt_size = ~0U,
991                         .load_base = ~0U
992                 },
993         },
994         .rpanote = {
995                 .namesz = sizeof("IBM,RPA-Client-Config"),
996                 .descsz = sizeof(struct rpadesc),
997                 .type = 0x12759999,
998                 .name = "IBM,RPA-Client-Config",
999                 .rpadesc = {
1000                         .lpar_affinity = 0,
1001                         .min_rmo_size = 64,     /* in megabytes */
1002                         .min_rmo_percent = 0,
1003                         .max_pft_size = 48,     /* 2^48 bytes max PFT size */
1004                         .splpar = 1,
1005                         .min_load = ~0U,
1006                         .new_mem_def = 0
1007                 }
1008         }
1009 };
1010 #endif /* __BIG_ENDIAN__ */
1011
1012 static int __init prom_count_smt_threads(void)
1013 {
1014         phandle node;
1015         char type[64];
1016         unsigned int plen;
1017
1018         /* Pick up th first CPU node we can find */
1019         for (node = 0; prom_next_node(&node); ) {
1020                 type[0] = 0;
1021                 prom_getprop(node, "device_type", type, sizeof(type));
1022
1023                 if (strcmp(type, "cpu"))
1024                         continue;
1025                 /*
1026                  * There is an entry for each smt thread, each entry being
1027                  * 4 bytes long.  All cpus should have the same number of
1028                  * smt threads, so return after finding the first.
1029                  */
1030                 plen = prom_getproplen(node, "ibm,ppc-interrupt-server#s");
1031                 if (plen == PROM_ERROR)
1032                         break;
1033                 plen >>= 2;
1034                 prom_debug("Found %lu smt threads per core\n", (unsigned long)plen);
1035
1036                 /* Sanity check */
1037                 if (plen < 1 || plen > 64) {
1038                         prom_printf("Threads per core %lu out of bounds, assuming 1\n",
1039                                     (unsigned long)plen);
1040                         return 1;
1041                 }
1042                 return plen;
1043         }
1044         prom_debug("No threads found, assuming 1 per core\n");
1045
1046         return 1;
1047
1048 }
1049
1050 static void __init prom_parse_mmu_model(u8 val,
1051                                         struct platform_support *support)
1052 {
1053         switch (val) {
1054         case OV5_FEAT(OV5_MMU_DYNAMIC):
1055         case OV5_FEAT(OV5_MMU_EITHER): /* Either Available */
1056                 prom_debug("MMU - either supported\n");
1057                 support->radix_mmu = !prom_radix_disable;
1058                 support->hash_mmu = true;
1059                 break;
1060         case OV5_FEAT(OV5_MMU_RADIX): /* Only Radix */
1061                 prom_debug("MMU - radix only\n");
1062                 if (prom_radix_disable) {
1063                         /*
1064                          * If we __have__ to do radix, we're better off ignoring
1065                          * the command line rather than not booting.
1066                          */
1067                         prom_printf("WARNING: Ignoring cmdline option disable_radix\n");
1068                 }
1069                 support->radix_mmu = true;
1070                 break;
1071         case OV5_FEAT(OV5_MMU_HASH):
1072                 prom_debug("MMU - hash only\n");
1073                 support->hash_mmu = true;
1074                 break;
1075         default:
1076                 prom_debug("Unknown mmu support option: 0x%x\n", val);
1077                 break;
1078         }
1079 }
1080
1081 static void __init prom_parse_xive_model(u8 val,
1082                                          struct platform_support *support)
1083 {
1084         switch (val) {
1085         case OV5_FEAT(OV5_XIVE_EITHER): /* Either Available */
1086                 prom_debug("XIVE - either mode supported\n");
1087                 support->xive = true;
1088                 break;
1089         case OV5_FEAT(OV5_XIVE_EXPLOIT): /* Only Exploitation mode */
1090                 prom_debug("XIVE - exploitation mode supported\n");
1091                 support->xive = true;
1092                 break;
1093         case OV5_FEAT(OV5_XIVE_LEGACY): /* Only Legacy mode */
1094                 prom_debug("XIVE - legacy mode supported\n");
1095                 break;
1096         default:
1097                 prom_debug("Unknown xive support option: 0x%x\n", val);
1098                 break;
1099         }
1100 }
1101
1102 static void __init prom_parse_platform_support(u8 index, u8 val,
1103                                                struct platform_support *support)
1104 {
1105         switch (index) {
1106         case OV5_INDX(OV5_MMU_SUPPORT): /* MMU Model */
1107                 prom_parse_mmu_model(val & OV5_FEAT(OV5_MMU_SUPPORT), support);
1108                 break;
1109         case OV5_INDX(OV5_RADIX_GTSE): /* Radix Extensions */
1110                 if (val & OV5_FEAT(OV5_RADIX_GTSE)) {
1111                         prom_debug("Radix - GTSE supported\n");
1112                         support->radix_gtse = true;
1113                 }
1114                 break;
1115         case OV5_INDX(OV5_XIVE_SUPPORT): /* Interrupt mode */
1116                 prom_parse_xive_model(val & OV5_FEAT(OV5_XIVE_SUPPORT),
1117                                       support);
1118                 break;
1119         }
1120 }
1121
1122 static void __init prom_check_platform_support(void)
1123 {
1124         struct platform_support supported = {
1125                 .hash_mmu = false,
1126                 .radix_mmu = false,
1127                 .radix_gtse = false,
1128                 .xive = false
1129         };
1130         int prop_len = prom_getproplen(prom.chosen,
1131                                        "ibm,arch-vec-5-platform-support");
1132         if (prop_len > 1) {
1133                 int i;
1134                 u8 vec[prop_len];
1135                 prom_debug("Found ibm,arch-vec-5-platform-support, len: %d\n",
1136                            prop_len);
1137                 prom_getprop(prom.chosen, "ibm,arch-vec-5-platform-support",
1138                              &vec, sizeof(vec));
1139                 for (i = 0; i < prop_len; i += 2) {
1140                         prom_debug("%d: index = 0x%x val = 0x%x\n", i / 2
1141                                                                   , vec[i]
1142                                                                   , vec[i + 1]);
1143                         prom_parse_platform_support(vec[i], vec[i + 1],
1144                                                     &supported);
1145                 }
1146         }
1147
1148         if (supported.radix_mmu && supported.radix_gtse &&
1149             IS_ENABLED(CONFIG_PPC_RADIX_MMU)) {
1150                 /* Radix preferred - but we require GTSE for now */
1151                 prom_debug("Asking for radix with GTSE\n");
1152                 ibm_architecture_vec.vec5.mmu = OV5_FEAT(OV5_MMU_RADIX);
1153                 ibm_architecture_vec.vec5.radix_ext = OV5_FEAT(OV5_RADIX_GTSE);
1154         } else if (supported.hash_mmu) {
1155                 /* Default to hash mmu (if we can) */
1156                 prom_debug("Asking for hash\n");
1157                 ibm_architecture_vec.vec5.mmu = OV5_FEAT(OV5_MMU_HASH);
1158         } else {
1159                 /* We're probably on a legacy hypervisor */
1160                 prom_debug("Assuming legacy hash support\n");
1161         }
1162
1163         if (supported.xive) {
1164                 prom_debug("Asking for XIVE\n");
1165                 ibm_architecture_vec.vec5.intarch = OV5_FEAT(OV5_XIVE_EXPLOIT);
1166         }
1167 }
1168
1169 static void __init prom_send_capabilities(void)
1170 {
1171         ihandle root;
1172         prom_arg_t ret;
1173         u32 cores;
1174
1175         /* Check ibm,arch-vec-5-platform-support and fixup vec5 if required */
1176         prom_check_platform_support();
1177
1178         root = call_prom("open", 1, 1, ADDR("/"));
1179         if (root != 0) {
1180                 /* We need to tell the FW about the number of cores we support.
1181                  *
1182                  * To do that, we count the number of threads on the first core
1183                  * (we assume this is the same for all cores) and use it to
1184                  * divide NR_CPUS.
1185                  */
1186
1187                 cores = DIV_ROUND_UP(NR_CPUS, prom_count_smt_threads());
1188                 prom_printf("Max number of cores passed to firmware: %u (NR_CPUS = %d)\n",
1189                             cores, NR_CPUS);
1190
1191                 ibm_architecture_vec.vec5.max_cpus = cpu_to_be32(cores);
1192
1193                 /* try calling the ibm,client-architecture-support method */
1194                 prom_printf("Calling ibm,client-architecture-support...");
1195                 if (call_prom_ret("call-method", 3, 2, &ret,
1196                                   ADDR("ibm,client-architecture-support"),
1197                                   root,
1198                                   ADDR(&ibm_architecture_vec)) == 0) {
1199                         /* the call exists... */
1200                         if (ret)
1201                                 prom_printf("\nWARNING: ibm,client-architecture"
1202                                             "-support call FAILED!\n");
1203                         call_prom("close", 1, 0, root);
1204                         prom_printf(" done\n");
1205                         return;
1206                 }
1207                 call_prom("close", 1, 0, root);
1208                 prom_printf(" not implemented\n");
1209         }
1210
1211 #ifdef __BIG_ENDIAN__
1212         {
1213                 ihandle elfloader;
1214
1215                 /* no ibm,client-architecture-support call, try the old way */
1216                 elfloader = call_prom("open", 1, 1,
1217                                       ADDR("/packages/elf-loader"));
1218                 if (elfloader == 0) {
1219                         prom_printf("couldn't open /packages/elf-loader\n");
1220                         return;
1221                 }
1222                 call_prom("call-method", 3, 1, ADDR("process-elf-header"),
1223                           elfloader, ADDR(&fake_elf));
1224                 call_prom("close", 1, 0, elfloader);
1225         }
1226 #endif /* __BIG_ENDIAN__ */
1227 }
1228 #endif /* #if defined(CONFIG_PPC_PSERIES) || defined(CONFIG_PPC_POWERNV) */
1229
1230 /*
1231  * Memory allocation strategy... our layout is normally:
1232  *
1233  *  at 14Mb or more we have vmlinux, then a gap and initrd.  In some
1234  *  rare cases, initrd might end up being before the kernel though.
1235  *  We assume this won't override the final kernel at 0, we have no
1236  *  provision to handle that in this version, but it should hopefully
1237  *  never happen.
1238  *
1239  *  alloc_top is set to the top of RMO, eventually shrink down if the
1240  *  TCEs overlap
1241  *
1242  *  alloc_bottom is set to the top of kernel/initrd
1243  *
1244  *  from there, allocations are done this way : rtas is allocated
1245  *  topmost, and the device-tree is allocated from the bottom. We try
1246  *  to grow the device-tree allocation as we progress. If we can't,
1247  *  then we fail, we don't currently have a facility to restart
1248  *  elsewhere, but that shouldn't be necessary.
1249  *
1250  *  Note that calls to reserve_mem have to be done explicitly, memory
1251  *  allocated with either alloc_up or alloc_down isn't automatically
1252  *  reserved.
1253  */
1254
1255
1256 /*
1257  * Allocates memory in the RMO upward from the kernel/initrd
1258  *
1259  * When align is 0, this is a special case, it means to allocate in place
1260  * at the current location of alloc_bottom or fail (that is basically
1261  * extending the previous allocation). Used for the device-tree flattening
1262  */
1263 static unsigned long __init alloc_up(unsigned long size, unsigned long align)
1264 {
1265         unsigned long base = alloc_bottom;
1266         unsigned long addr = 0;
1267
1268         if (align)
1269                 base = _ALIGN_UP(base, align);
1270         prom_debug("%s(%lx, %lx)\n", __func__, size, align);
1271         if (ram_top == 0)
1272                 prom_panic("alloc_up() called with mem not initialized\n");
1273
1274         if (align)
1275                 base = _ALIGN_UP(alloc_bottom, align);
1276         else
1277                 base = alloc_bottom;
1278
1279         for(; (base + size) <= alloc_top; 
1280             base = _ALIGN_UP(base + 0x100000, align)) {
1281                 prom_debug("    trying: 0x%lx\n\r", base);
1282                 addr = (unsigned long)prom_claim(base, size, 0);
1283                 if (addr != PROM_ERROR && addr != 0)
1284                         break;
1285                 addr = 0;
1286                 if (align == 0)
1287                         break;
1288         }
1289         if (addr == 0)
1290                 return 0;
1291         alloc_bottom = addr + size;
1292
1293         prom_debug(" -> %lx\n", addr);
1294         prom_debug("  alloc_bottom : %lx\n", alloc_bottom);
1295         prom_debug("  alloc_top    : %lx\n", alloc_top);
1296         prom_debug("  alloc_top_hi : %lx\n", alloc_top_high);
1297         prom_debug("  rmo_top      : %lx\n", rmo_top);
1298         prom_debug("  ram_top      : %lx\n", ram_top);
1299
1300         return addr;
1301 }
1302
1303 /*
1304  * Allocates memory downward, either from top of RMO, or if highmem
1305  * is set, from the top of RAM.  Note that this one doesn't handle
1306  * failures.  It does claim memory if highmem is not set.
1307  */
1308 static unsigned long __init alloc_down(unsigned long size, unsigned long align,
1309                                        int highmem)
1310 {
1311         unsigned long base, addr = 0;
1312
1313         prom_debug("%s(%lx, %lx, %s)\n", __func__, size, align,
1314                    highmem ? "(high)" : "(low)");
1315         if (ram_top == 0)
1316                 prom_panic("alloc_down() called with mem not initialized\n");
1317
1318         if (highmem) {
1319                 /* Carve out storage for the TCE table. */
1320                 addr = _ALIGN_DOWN(alloc_top_high - size, align);
1321                 if (addr <= alloc_bottom)
1322                         return 0;
1323                 /* Will we bump into the RMO ? If yes, check out that we
1324                  * didn't overlap existing allocations there, if we did,
1325                  * we are dead, we must be the first in town !
1326                  */
1327                 if (addr < rmo_top) {
1328                         /* Good, we are first */
1329                         if (alloc_top == rmo_top)
1330                                 alloc_top = rmo_top = addr;
1331                         else
1332                                 return 0;
1333                 }
1334                 alloc_top_high = addr;
1335                 goto bail;
1336         }
1337
1338         base = _ALIGN_DOWN(alloc_top - size, align);
1339         for (; base > alloc_bottom;
1340              base = _ALIGN_DOWN(base - 0x100000, align))  {
1341                 prom_debug("    trying: 0x%lx\n\r", base);
1342                 addr = (unsigned long)prom_claim(base, size, 0);
1343                 if (addr != PROM_ERROR && addr != 0)
1344                         break;
1345                 addr = 0;
1346         }
1347         if (addr == 0)
1348                 return 0;
1349         alloc_top = addr;
1350
1351  bail:
1352         prom_debug(" -> %lx\n", addr);
1353         prom_debug("  alloc_bottom : %lx\n", alloc_bottom);
1354         prom_debug("  alloc_top    : %lx\n", alloc_top);
1355         prom_debug("  alloc_top_hi : %lx\n", alloc_top_high);
1356         prom_debug("  rmo_top      : %lx\n", rmo_top);
1357         prom_debug("  ram_top      : %lx\n", ram_top);
1358
1359         return addr;
1360 }
1361
1362 /*
1363  * Parse a "reg" cell
1364  */
1365 static unsigned long __init prom_next_cell(int s, cell_t **cellp)
1366 {
1367         cell_t *p = *cellp;
1368         unsigned long r = 0;
1369
1370         /* Ignore more than 2 cells */
1371         while (s > sizeof(unsigned long) / 4) {
1372                 p++;
1373                 s--;
1374         }
1375         r = be32_to_cpu(*p++);
1376 #ifdef CONFIG_PPC64
1377         if (s > 1) {
1378                 r <<= 32;
1379                 r |= be32_to_cpu(*(p++));
1380         }
1381 #endif
1382         *cellp = p;
1383         return r;
1384 }
1385
1386 /*
1387  * Very dumb function for adding to the memory reserve list, but
1388  * we don't need anything smarter at this point
1389  *
1390  * XXX Eventually check for collisions.  They should NEVER happen.
1391  * If problems seem to show up, it would be a good start to track
1392  * them down.
1393  */
1394 static void __init reserve_mem(u64 base, u64 size)
1395 {
1396         u64 top = base + size;
1397         unsigned long cnt = mem_reserve_cnt;
1398
1399         if (size == 0)
1400                 return;
1401
1402         /* We need to always keep one empty entry so that we
1403          * have our terminator with "size" set to 0 since we are
1404          * dumb and just copy this entire array to the boot params
1405          */
1406         base = _ALIGN_DOWN(base, PAGE_SIZE);
1407         top = _ALIGN_UP(top, PAGE_SIZE);
1408         size = top - base;
1409
1410         if (cnt >= (MEM_RESERVE_MAP_SIZE - 1))
1411                 prom_panic("Memory reserve map exhausted !\n");
1412         mem_reserve_map[cnt].base = cpu_to_be64(base);
1413         mem_reserve_map[cnt].size = cpu_to_be64(size);
1414         mem_reserve_cnt = cnt + 1;
1415 }
1416
1417 /*
1418  * Initialize memory allocation mechanism, parse "memory" nodes and
1419  * obtain that way the top of memory and RMO to setup out local allocator
1420  */
1421 static void __init prom_init_mem(void)
1422 {
1423         phandle node;
1424 #ifdef DEBUG_PROM
1425         char *path;
1426 #endif
1427         char type[64];
1428         unsigned int plen;
1429         cell_t *p, *endp;
1430         __be32 val;
1431         u32 rac, rsc;
1432
1433         /*
1434          * We iterate the memory nodes to find
1435          * 1) top of RMO (first node)
1436          * 2) top of memory
1437          */
1438         val = cpu_to_be32(2);
1439         prom_getprop(prom.root, "#address-cells", &val, sizeof(val));
1440         rac = be32_to_cpu(val);
1441         val = cpu_to_be32(1);
1442         prom_getprop(prom.root, "#size-cells", &val, sizeof(rsc));
1443         rsc = be32_to_cpu(val);
1444         prom_debug("root_addr_cells: %x\n", rac);
1445         prom_debug("root_size_cells: %x\n", rsc);
1446
1447         prom_debug("scanning memory:\n");
1448 #ifdef DEBUG_PROM
1449         path = prom_scratch;
1450 #endif
1451
1452         for (node = 0; prom_next_node(&node); ) {
1453                 type[0] = 0;
1454                 prom_getprop(node, "device_type", type, sizeof(type));
1455
1456                 if (type[0] == 0) {
1457                         /*
1458                          * CHRP Longtrail machines have no device_type
1459                          * on the memory node, so check the name instead...
1460                          */
1461                         prom_getprop(node, "name", type, sizeof(type));
1462                 }
1463                 if (strcmp(type, "memory"))
1464                         continue;
1465
1466                 plen = prom_getprop(node, "reg", regbuf, sizeof(regbuf));
1467                 if (plen > sizeof(regbuf)) {
1468                         prom_printf("memory node too large for buffer !\n");
1469                         plen = sizeof(regbuf);
1470                 }
1471                 p = regbuf;
1472                 endp = p + (plen / sizeof(cell_t));
1473
1474 #ifdef DEBUG_PROM
1475                 memset(path, 0, PROM_SCRATCH_SIZE);
1476                 call_prom("package-to-path", 3, 1, node, path, PROM_SCRATCH_SIZE-1);
1477                 prom_debug("  node %s :\n", path);
1478 #endif /* DEBUG_PROM */
1479
1480                 while ((endp - p) >= (rac + rsc)) {
1481                         unsigned long base, size;
1482
1483                         base = prom_next_cell(rac, &p);
1484                         size = prom_next_cell(rsc, &p);
1485
1486                         if (size == 0)
1487                                 continue;
1488                         prom_debug("    %lx %lx\n", base, size);
1489                         if (base == 0 && (of_platform & PLATFORM_LPAR))
1490                                 rmo_top = size;
1491                         if ((base + size) > ram_top)
1492                                 ram_top = base + size;
1493                 }
1494         }
1495
1496         alloc_bottom = PAGE_ALIGN((unsigned long)&_end + 0x4000);
1497
1498         /*
1499          * If prom_memory_limit is set we reduce the upper limits *except* for
1500          * alloc_top_high. This must be the real top of RAM so we can put
1501          * TCE's up there.
1502          */
1503
1504         alloc_top_high = ram_top;
1505
1506         if (prom_memory_limit) {
1507                 if (prom_memory_limit <= alloc_bottom) {
1508                         prom_printf("Ignoring mem=%lx <= alloc_bottom.\n",
1509                                     prom_memory_limit);
1510                         prom_memory_limit = 0;
1511                 } else if (prom_memory_limit >= ram_top) {
1512                         prom_printf("Ignoring mem=%lx >= ram_top.\n",
1513                                     prom_memory_limit);
1514                         prom_memory_limit = 0;
1515                 } else {
1516                         ram_top = prom_memory_limit;
1517                         rmo_top = min(rmo_top, prom_memory_limit);
1518                 }
1519         }
1520
1521         /*
1522          * Setup our top alloc point, that is top of RMO or top of
1523          * segment 0 when running non-LPAR.
1524          * Some RS64 machines have buggy firmware where claims up at
1525          * 1GB fail.  Cap at 768MB as a workaround.
1526          * Since 768MB is plenty of room, and we need to cap to something
1527          * reasonable on 32-bit, cap at 768MB on all machines.
1528          */
1529         if (!rmo_top)
1530                 rmo_top = ram_top;
1531         rmo_top = min(0x30000000ul, rmo_top);
1532         alloc_top = rmo_top;
1533         alloc_top_high = ram_top;
1534
1535         /*
1536          * Check if we have an initrd after the kernel but still inside
1537          * the RMO.  If we do move our bottom point to after it.
1538          */
1539         if (prom_initrd_start &&
1540             prom_initrd_start < rmo_top &&
1541             prom_initrd_end > alloc_bottom)
1542                 alloc_bottom = PAGE_ALIGN(prom_initrd_end);
1543
1544         prom_printf("memory layout at init:\n");
1545         prom_printf("  memory_limit : %lx (16 MB aligned)\n",
1546                     prom_memory_limit);
1547         prom_printf("  alloc_bottom : %lx\n", alloc_bottom);
1548         prom_printf("  alloc_top    : %lx\n", alloc_top);
1549         prom_printf("  alloc_top_hi : %lx\n", alloc_top_high);
1550         prom_printf("  rmo_top      : %lx\n", rmo_top);
1551         prom_printf("  ram_top      : %lx\n", ram_top);
1552 }
1553
1554 static void __init prom_close_stdin(void)
1555 {
1556         __be32 val;
1557         ihandle stdin;
1558
1559         if (prom_getprop(prom.chosen, "stdin", &val, sizeof(val)) > 0) {
1560                 stdin = be32_to_cpu(val);
1561                 call_prom("close", 1, 0, stdin);
1562         }
1563 }
1564
1565 #ifdef CONFIG_PPC_POWERNV
1566
1567 #ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
1568 static u64 __initdata prom_opal_base;
1569 static u64 __initdata prom_opal_entry;
1570 #endif
1571
1572 /*
1573  * Allocate room for and instantiate OPAL
1574  */
1575 static void __init prom_instantiate_opal(void)
1576 {
1577         phandle opal_node;
1578         ihandle opal_inst;
1579         u64 base, entry;
1580         u64 size = 0, align = 0x10000;
1581         __be64 val64;
1582         u32 rets[2];
1583
1584         prom_debug("prom_instantiate_opal: start...\n");
1585
1586         opal_node = call_prom("finddevice", 1, 1, ADDR("/ibm,opal"));
1587         prom_debug("opal_node: %x\n", opal_node);
1588         if (!PHANDLE_VALID(opal_node))
1589                 return;
1590
1591         val64 = 0;
1592         prom_getprop(opal_node, "opal-runtime-size", &val64, sizeof(val64));
1593         size = be64_to_cpu(val64);
1594         if (size == 0)
1595                 return;
1596         val64 = 0;
1597         prom_getprop(opal_node, "opal-runtime-alignment", &val64,sizeof(val64));
1598         align = be64_to_cpu(val64);
1599
1600         base = alloc_down(size, align, 0);
1601         if (base == 0) {
1602                 prom_printf("OPAL allocation failed !\n");
1603                 return;
1604         }
1605
1606         opal_inst = call_prom("open", 1, 1, ADDR("/ibm,opal"));
1607         if (!IHANDLE_VALID(opal_inst)) {
1608                 prom_printf("opening opal package failed (%x)\n", opal_inst);
1609                 return;
1610         }
1611
1612         prom_printf("instantiating opal at 0x%llx...", base);
1613
1614         if (call_prom_ret("call-method", 4, 3, rets,
1615                           ADDR("load-opal-runtime"),
1616                           opal_inst,
1617                           base >> 32, base & 0xffffffff) != 0
1618             || (rets[0] == 0 && rets[1] == 0)) {
1619                 prom_printf(" failed\n");
1620                 return;
1621         }
1622         entry = (((u64)rets[0]) << 32) | rets[1];
1623
1624         prom_printf(" done\n");
1625
1626         reserve_mem(base, size);
1627
1628         prom_debug("opal base     = 0x%llx\n", base);
1629         prom_debug("opal align    = 0x%llx\n", align);
1630         prom_debug("opal entry    = 0x%llx\n", entry);
1631         prom_debug("opal size     = 0x%llx\n", size);
1632
1633         prom_setprop(opal_node, "/ibm,opal", "opal-base-address",
1634                      &base, sizeof(base));
1635         prom_setprop(opal_node, "/ibm,opal", "opal-entry-address",
1636                      &entry, sizeof(entry));
1637
1638 #ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
1639         prom_opal_base = base;
1640         prom_opal_entry = entry;
1641 #endif
1642         prom_debug("prom_instantiate_opal: end...\n");
1643 }
1644
1645 #endif /* CONFIG_PPC_POWERNV */
1646
1647 /*
1648  * Allocate room for and instantiate RTAS
1649  */
1650 static void __init prom_instantiate_rtas(void)
1651 {
1652         phandle rtas_node;
1653         ihandle rtas_inst;
1654         u32 base, entry = 0;
1655         __be32 val;
1656         u32 size = 0;
1657
1658         prom_debug("prom_instantiate_rtas: start...\n");
1659
1660         rtas_node = call_prom("finddevice", 1, 1, ADDR("/rtas"));
1661         prom_debug("rtas_node: %x\n", rtas_node);
1662         if (!PHANDLE_VALID(rtas_node))
1663                 return;
1664
1665         val = 0;
1666         prom_getprop(rtas_node, "rtas-size", &val, sizeof(size));
1667         size = be32_to_cpu(val);
1668         if (size == 0)
1669                 return;
1670
1671         base = alloc_down(size, PAGE_SIZE, 0);
1672         if (base == 0)
1673                 prom_panic("Could not allocate memory for RTAS\n");
1674
1675         rtas_inst = call_prom("open", 1, 1, ADDR("/rtas"));
1676         if (!IHANDLE_VALID(rtas_inst)) {
1677                 prom_printf("opening rtas package failed (%x)\n", rtas_inst);
1678                 return;
1679         }
1680
1681         prom_printf("instantiating rtas at 0x%x...", base);
1682
1683         if (call_prom_ret("call-method", 3, 2, &entry,
1684                           ADDR("instantiate-rtas"),
1685                           rtas_inst, base) != 0
1686             || entry == 0) {
1687                 prom_printf(" failed\n");
1688                 return;
1689         }
1690         prom_printf(" done\n");
1691
1692         reserve_mem(base, size);
1693
1694         val = cpu_to_be32(base);
1695         prom_setprop(rtas_node, "/rtas", "linux,rtas-base",
1696                      &val, sizeof(val));
1697         val = cpu_to_be32(entry);
1698         prom_setprop(rtas_node, "/rtas", "linux,rtas-entry",
1699                      &val, sizeof(val));
1700
1701         /* Check if it supports "query-cpu-stopped-state" */
1702         if (prom_getprop(rtas_node, "query-cpu-stopped-state",
1703                          &val, sizeof(val)) != PROM_ERROR)
1704                 rtas_has_query_cpu_stopped = true;
1705
1706         prom_debug("rtas base     = 0x%x\n", base);
1707         prom_debug("rtas entry    = 0x%x\n", entry);
1708         prom_debug("rtas size     = 0x%x\n", size);
1709
1710         prom_debug("prom_instantiate_rtas: end...\n");
1711 }
1712
1713 #ifdef CONFIG_PPC64
1714 /*
1715  * Allocate room for and instantiate Stored Measurement Log (SML)
1716  */
1717 static void __init prom_instantiate_sml(void)
1718 {
1719         phandle ibmvtpm_node;
1720         ihandle ibmvtpm_inst;
1721         u32 entry = 0, size = 0, succ = 0;
1722         u64 base;
1723         __be32 val;
1724
1725         prom_debug("prom_instantiate_sml: start...\n");
1726
1727         ibmvtpm_node = call_prom("finddevice", 1, 1, ADDR("/vdevice/vtpm"));
1728         prom_debug("ibmvtpm_node: %x\n", ibmvtpm_node);
1729         if (!PHANDLE_VALID(ibmvtpm_node))
1730                 return;
1731
1732         ibmvtpm_inst = call_prom("open", 1, 1, ADDR("/vdevice/vtpm"));
1733         if (!IHANDLE_VALID(ibmvtpm_inst)) {
1734                 prom_printf("opening vtpm package failed (%x)\n", ibmvtpm_inst);
1735                 return;
1736         }
1737
1738         if (prom_getprop(ibmvtpm_node, "ibm,sml-efi-reformat-supported",
1739                          &val, sizeof(val)) != PROM_ERROR) {
1740                 if (call_prom_ret("call-method", 2, 2, &succ,
1741                                   ADDR("reformat-sml-to-efi-alignment"),
1742                                   ibmvtpm_inst) != 0 || succ == 0) {
1743                         prom_printf("Reformat SML to EFI alignment failed\n");
1744                         return;
1745                 }
1746
1747                 if (call_prom_ret("call-method", 2, 2, &size,
1748                                   ADDR("sml-get-allocated-size"),
1749                                   ibmvtpm_inst) != 0 || size == 0) {
1750                         prom_printf("SML get allocated size failed\n");
1751                         return;
1752                 }
1753         } else {
1754                 if (call_prom_ret("call-method", 2, 2, &size,
1755                                   ADDR("sml-get-handover-size"),
1756                                   ibmvtpm_inst) != 0 || size == 0) {
1757                         prom_printf("SML get handover size failed\n");
1758                         return;
1759                 }
1760         }
1761
1762         base = alloc_down(size, PAGE_SIZE, 0);
1763         if (base == 0)
1764                 prom_panic("Could not allocate memory for sml\n");
1765
1766         prom_printf("instantiating sml at 0x%llx...", base);
1767
1768         memset((void *)base, 0, size);
1769
1770         if (call_prom_ret("call-method", 4, 2, &entry,
1771                           ADDR("sml-handover"),
1772                           ibmvtpm_inst, size, base) != 0 || entry == 0) {
1773                 prom_printf("SML handover failed\n");
1774                 return;
1775         }
1776         prom_printf(" done\n");
1777
1778         reserve_mem(base, size);
1779
1780         prom_setprop(ibmvtpm_node, "/vdevice/vtpm", "linux,sml-base",
1781                      &base, sizeof(base));
1782         prom_setprop(ibmvtpm_node, "/vdevice/vtpm", "linux,sml-size",
1783                      &size, sizeof(size));
1784
1785         prom_debug("sml base     = 0x%llx\n", base);
1786         prom_debug("sml size     = 0x%x\n", size);
1787
1788         prom_debug("prom_instantiate_sml: end...\n");
1789 }
1790
1791 /*
1792  * Allocate room for and initialize TCE tables
1793  */
1794 #ifdef __BIG_ENDIAN__
1795 static void __init prom_initialize_tce_table(void)
1796 {
1797         phandle node;
1798         ihandle phb_node;
1799         char compatible[64], type[64], model[64];
1800         char *path = prom_scratch;
1801         u64 base, align;
1802         u32 minalign, minsize;
1803         u64 tce_entry, *tce_entryp;
1804         u64 local_alloc_top, local_alloc_bottom;
1805         u64 i;
1806
1807         if (prom_iommu_off)
1808                 return;
1809
1810         prom_debug("starting prom_initialize_tce_table\n");
1811
1812         /* Cache current top of allocs so we reserve a single block */
1813         local_alloc_top = alloc_top_high;
1814         local_alloc_bottom = local_alloc_top;
1815
1816         /* Search all nodes looking for PHBs. */
1817         for (node = 0; prom_next_node(&node); ) {
1818                 compatible[0] = 0;
1819                 type[0] = 0;
1820                 model[0] = 0;
1821                 prom_getprop(node, "compatible",
1822                              compatible, sizeof(compatible));
1823                 prom_getprop(node, "device_type", type, sizeof(type));
1824                 prom_getprop(node, "model", model, sizeof(model));
1825
1826                 if ((type[0] == 0) || (strstr(type, "pci") == NULL))
1827                         continue;
1828
1829                 /* Keep the old logic intact to avoid regression. */
1830                 if (compatible[0] != 0) {
1831                         if ((strstr(compatible, "python") == NULL) &&
1832                             (strstr(compatible, "Speedwagon") == NULL) &&
1833                             (strstr(compatible, "Winnipeg") == NULL))
1834                                 continue;
1835                 } else if (model[0] != 0) {
1836                         if ((strstr(model, "ython") == NULL) &&
1837                             (strstr(model, "peedwagon") == NULL) &&
1838                             (strstr(model, "innipeg") == NULL))
1839                                 continue;
1840                 }
1841
1842                 if (prom_getprop(node, "tce-table-minalign", &minalign,
1843                                  sizeof(minalign)) == PROM_ERROR)
1844                         minalign = 0;
1845                 if (prom_getprop(node, "tce-table-minsize", &minsize,
1846                                  sizeof(minsize)) == PROM_ERROR)
1847                         minsize = 4UL << 20;
1848
1849                 /*
1850                  * Even though we read what OF wants, we just set the table
1851                  * size to 4 MB.  This is enough to map 2GB of PCI DMA space.
1852                  * By doing this, we avoid the pitfalls of trying to DMA to
1853                  * MMIO space and the DMA alias hole.
1854                  */
1855                 minsize = 4UL << 20;
1856
1857                 /* Align to the greater of the align or size */
1858                 align = max(minalign, minsize);
1859                 base = alloc_down(minsize, align, 1);
1860                 if (base == 0)
1861                         prom_panic("ERROR, cannot find space for TCE table.\n");
1862                 if (base < local_alloc_bottom)
1863                         local_alloc_bottom = base;
1864
1865                 /* It seems OF doesn't null-terminate the path :-( */
1866                 memset(path, 0, PROM_SCRATCH_SIZE);
1867                 /* Call OF to setup the TCE hardware */
1868                 if (call_prom("package-to-path", 3, 1, node,
1869                               path, PROM_SCRATCH_SIZE-1) == PROM_ERROR) {
1870                         prom_printf("package-to-path failed\n");
1871                 }
1872
1873                 /* Save away the TCE table attributes for later use. */
1874                 prom_setprop(node, path, "linux,tce-base", &base, sizeof(base));
1875                 prom_setprop(node, path, "linux,tce-size", &minsize, sizeof(minsize));
1876
1877                 prom_debug("TCE table: %s\n", path);
1878                 prom_debug("\tnode = 0x%x\n", node);
1879                 prom_debug("\tbase = 0x%llx\n", base);
1880                 prom_debug("\tsize = 0x%x\n", minsize);
1881
1882                 /* Initialize the table to have a one-to-one mapping
1883                  * over the allocated size.
1884                  */
1885                 tce_entryp = (u64 *)base;
1886                 for (i = 0; i < (minsize >> 3) ;tce_entryp++, i++) {
1887                         tce_entry = (i << PAGE_SHIFT);
1888                         tce_entry |= 0x3;
1889                         *tce_entryp = tce_entry;
1890                 }
1891
1892                 prom_printf("opening PHB %s", path);
1893                 phb_node = call_prom("open", 1, 1, path);
1894                 if (phb_node == 0)
1895                         prom_printf("... failed\n");
1896                 else
1897                         prom_printf("... done\n");
1898
1899                 call_prom("call-method", 6, 0, ADDR("set-64-bit-addressing"),
1900                           phb_node, -1, minsize,
1901                           (u32) base, (u32) (base >> 32));
1902                 call_prom("close", 1, 0, phb_node);
1903         }
1904
1905         reserve_mem(local_alloc_bottom, local_alloc_top - local_alloc_bottom);
1906
1907         /* These are only really needed if there is a memory limit in
1908          * effect, but we don't know so export them always. */
1909         prom_tce_alloc_start = local_alloc_bottom;
1910         prom_tce_alloc_end = local_alloc_top;
1911
1912         /* Flag the first invalid entry */
1913         prom_debug("ending prom_initialize_tce_table\n");
1914 }
1915 #endif /* __BIG_ENDIAN__ */
1916 #endif /* CONFIG_PPC64 */
1917
1918 /*
1919  * With CHRP SMP we need to use the OF to start the other processors.
1920  * We can't wait until smp_boot_cpus (the OF is trashed by then)
1921  * so we have to put the processors into a holding pattern controlled
1922  * by the kernel (not OF) before we destroy the OF.
1923  *
1924  * This uses a chunk of low memory, puts some holding pattern
1925  * code there and sends the other processors off to there until
1926  * smp_boot_cpus tells them to do something.  The holding pattern
1927  * checks that address until its cpu # is there, when it is that
1928  * cpu jumps to __secondary_start().  smp_boot_cpus() takes care
1929  * of setting those values.
1930  *
1931  * We also use physical address 0x4 here to tell when a cpu
1932  * is in its holding pattern code.
1933  *
1934  * -- Cort
1935  */
1936 /*
1937  * We want to reference the copy of __secondary_hold_* in the
1938  * 0 - 0x100 address range
1939  */
1940 #define LOW_ADDR(x)     (((unsigned long) &(x)) & 0xff)
1941
1942 static void __init prom_hold_cpus(void)
1943 {
1944         unsigned long i;
1945         phandle node;
1946         char type[64];
1947         unsigned long *spinloop
1948                 = (void *) LOW_ADDR(__secondary_hold_spinloop);
1949         unsigned long *acknowledge
1950                 = (void *) LOW_ADDR(__secondary_hold_acknowledge);
1951         unsigned long secondary_hold = LOW_ADDR(__secondary_hold);
1952
1953         /*
1954          * On pseries, if RTAS supports "query-cpu-stopped-state",
1955          * we skip this stage, the CPUs will be started by the
1956          * kernel using RTAS.
1957          */
1958         if ((of_platform == PLATFORM_PSERIES ||
1959              of_platform == PLATFORM_PSERIES_LPAR) &&
1960             rtas_has_query_cpu_stopped) {
1961                 prom_printf("prom_hold_cpus: skipped\n");
1962                 return;
1963         }
1964
1965         prom_debug("prom_hold_cpus: start...\n");
1966         prom_debug("    1) spinloop       = 0x%lx\n", (unsigned long)spinloop);
1967         prom_debug("    1) *spinloop      = 0x%lx\n", *spinloop);
1968         prom_debug("    1) acknowledge    = 0x%lx\n",
1969                    (unsigned long)acknowledge);
1970         prom_debug("    1) *acknowledge   = 0x%lx\n", *acknowledge);
1971         prom_debug("    1) secondary_hold = 0x%lx\n", secondary_hold);
1972
1973         /* Set the common spinloop variable, so all of the secondary cpus
1974          * will block when they are awakened from their OF spinloop.
1975          * This must occur for both SMP and non SMP kernels, since OF will
1976          * be trashed when we move the kernel.
1977          */
1978         *spinloop = 0;
1979
1980         /* look for cpus */
1981         for (node = 0; prom_next_node(&node); ) {
1982                 unsigned int cpu_no;
1983                 __be32 reg;
1984
1985                 type[0] = 0;
1986                 prom_getprop(node, "device_type", type, sizeof(type));
1987                 if (strcmp(type, "cpu") != 0)
1988                         continue;
1989
1990                 /* Skip non-configured cpus. */
1991                 if (prom_getprop(node, "status", type, sizeof(type)) > 0)
1992                         if (strcmp(type, "okay") != 0)
1993                                 continue;
1994
1995                 reg = cpu_to_be32(-1); /* make sparse happy */
1996                 prom_getprop(node, "reg", &reg, sizeof(reg));
1997                 cpu_no = be32_to_cpu(reg);
1998
1999                 prom_debug("cpu hw idx   = %u\n", cpu_no);
2000
2001                 /* Init the acknowledge var which will be reset by
2002                  * the secondary cpu when it awakens from its OF
2003                  * spinloop.
2004                  */
2005                 *acknowledge = (unsigned long)-1;
2006
2007                 if (cpu_no != prom.cpu) {
2008                         /* Primary Thread of non-boot cpu or any thread */
2009                         prom_printf("starting cpu hw idx %u... ", cpu_no);
2010                         call_prom("start-cpu", 3, 0, node,
2011                                   secondary_hold, cpu_no);
2012
2013                         for (i = 0; (i < 100000000) && 
2014                              (*acknowledge == ((unsigned long)-1)); i++ )
2015                                 mb();
2016
2017                         if (*acknowledge == cpu_no)
2018                                 prom_printf("done\n");
2019                         else
2020                                 prom_printf("failed: %lx\n", *acknowledge);
2021                 }
2022 #ifdef CONFIG_SMP
2023                 else
2024                         prom_printf("boot cpu hw idx %u\n", cpu_no);
2025 #endif /* CONFIG_SMP */
2026         }
2027
2028         prom_debug("prom_hold_cpus: end...\n");
2029 }
2030
2031
2032 static void __init prom_init_client_services(unsigned long pp)
2033 {
2034         /* Get a handle to the prom entry point before anything else */
2035         prom_entry = pp;
2036
2037         /* get a handle for the stdout device */
2038         prom.chosen = call_prom("finddevice", 1, 1, ADDR("/chosen"));
2039         if (!PHANDLE_VALID(prom.chosen))
2040                 prom_panic("cannot find chosen"); /* msg won't be printed :( */
2041
2042         /* get device tree root */
2043         prom.root = call_prom("finddevice", 1, 1, ADDR("/"));
2044         if (!PHANDLE_VALID(prom.root))
2045                 prom_panic("cannot find device tree root"); /* msg won't be printed :( */
2046
2047         prom.mmumap = 0;
2048 }
2049
2050 #ifdef CONFIG_PPC32
2051 /*
2052  * For really old powermacs, we need to map things we claim.
2053  * For that, we need the ihandle of the mmu.
2054  * Also, on the longtrail, we need to work around other bugs.
2055  */
2056 static void __init prom_find_mmu(void)
2057 {
2058         phandle oprom;
2059         char version[64];
2060
2061         oprom = call_prom("finddevice", 1, 1, ADDR("/openprom"));
2062         if (!PHANDLE_VALID(oprom))
2063                 return;
2064         if (prom_getprop(oprom, "model", version, sizeof(version)) <= 0)
2065                 return;
2066         version[sizeof(version) - 1] = 0;
2067         /* XXX might need to add other versions here */
2068         if (strcmp(version, "Open Firmware, 1.0.5") == 0)
2069                 of_workarounds = OF_WA_CLAIM;
2070         else if (strncmp(version, "FirmWorks,3.", 12) == 0) {
2071                 of_workarounds = OF_WA_CLAIM | OF_WA_LONGTRAIL;
2072                 call_prom("interpret", 1, 1, "dev /memory 0 to allow-reclaim");
2073         } else
2074                 return;
2075         prom.memory = call_prom("open", 1, 1, ADDR("/memory"));
2076         prom_getprop(prom.chosen, "mmu", &prom.mmumap,
2077                      sizeof(prom.mmumap));
2078         prom.mmumap = be32_to_cpu(prom.mmumap);
2079         if (!IHANDLE_VALID(prom.memory) || !IHANDLE_VALID(prom.mmumap))
2080                 of_workarounds &= ~OF_WA_CLAIM;         /* hmmm */
2081 }
2082 #else
2083 #define prom_find_mmu()
2084 #endif
2085
2086 static void __init prom_init_stdout(void)
2087 {
2088         char *path = of_stdout_device;
2089         char type[16];
2090         phandle stdout_node;
2091         __be32 val;
2092
2093         if (prom_getprop(prom.chosen, "stdout", &val, sizeof(val)) <= 0)
2094                 prom_panic("cannot find stdout");
2095
2096         prom.stdout = be32_to_cpu(val);
2097
2098         /* Get the full OF pathname of the stdout device */
2099         memset(path, 0, 256);
2100         call_prom("instance-to-path", 3, 1, prom.stdout, path, 255);
2101         prom_printf("OF stdout device is: %s\n", of_stdout_device);
2102         prom_setprop(prom.chosen, "/chosen", "linux,stdout-path",
2103                      path, strlen(path) + 1);
2104
2105         /* instance-to-package fails on PA-Semi */
2106         stdout_node = call_prom("instance-to-package", 1, 1, prom.stdout);
2107         if (stdout_node != PROM_ERROR) {
2108                 val = cpu_to_be32(stdout_node);
2109
2110                 /* If it's a display, note it */
2111                 memset(type, 0, sizeof(type));
2112                 prom_getprop(stdout_node, "device_type", type, sizeof(type));
2113                 if (strcmp(type, "display") == 0)
2114                         prom_setprop(stdout_node, path, "linux,boot-display", NULL, 0);
2115         }
2116 }
2117
2118 static int __init prom_find_machine_type(void)
2119 {
2120         char compat[256];
2121         int len, i = 0;
2122 #ifdef CONFIG_PPC64
2123         phandle rtas;
2124         int x;
2125 #endif
2126
2127         /* Look for a PowerMac or a Cell */
2128         len = prom_getprop(prom.root, "compatible",
2129                            compat, sizeof(compat)-1);
2130         if (len > 0) {
2131                 compat[len] = 0;
2132                 while (i < len) {
2133                         char *p = &compat[i];
2134                         int sl = strlen(p);
2135                         if (sl == 0)
2136                                 break;
2137                         if (strstr(p, "Power Macintosh") ||
2138                             strstr(p, "MacRISC"))
2139                                 return PLATFORM_POWERMAC;
2140 #ifdef CONFIG_PPC64
2141                         /* We must make sure we don't detect the IBM Cell
2142                          * blades as pSeries due to some firmware issues,
2143                          * so we do it here.
2144                          */
2145                         if (strstr(p, "IBM,CBEA") ||
2146                             strstr(p, "IBM,CPBW-1.0"))
2147                                 return PLATFORM_GENERIC;
2148 #endif /* CONFIG_PPC64 */
2149                         i += sl + 1;
2150                 }
2151         }
2152 #ifdef CONFIG_PPC64
2153         /* Try to detect OPAL */
2154         if (PHANDLE_VALID(call_prom("finddevice", 1, 1, ADDR("/ibm,opal"))))
2155                 return PLATFORM_OPAL;
2156
2157         /* Try to figure out if it's an IBM pSeries or any other
2158          * PAPR compliant platform. We assume it is if :
2159          *  - /device_type is "chrp" (please, do NOT use that for future
2160          *    non-IBM designs !
2161          *  - it has /rtas
2162          */
2163         len = prom_getprop(prom.root, "device_type",
2164                            compat, sizeof(compat)-1);
2165         if (len <= 0)
2166                 return PLATFORM_GENERIC;
2167         if (strcmp(compat, "chrp"))
2168                 return PLATFORM_GENERIC;
2169
2170         /* Default to pSeries. We need to know if we are running LPAR */
2171         rtas = call_prom("finddevice", 1, 1, ADDR("/rtas"));
2172         if (!PHANDLE_VALID(rtas))
2173                 return PLATFORM_GENERIC;
2174         x = prom_getproplen(rtas, "ibm,hypertas-functions");
2175         if (x != PROM_ERROR) {
2176                 prom_debug("Hypertas detected, assuming LPAR !\n");
2177                 return PLATFORM_PSERIES_LPAR;
2178         }
2179         return PLATFORM_PSERIES;
2180 #else
2181         return PLATFORM_GENERIC;
2182 #endif
2183 }
2184
2185 static int __init prom_set_color(ihandle ih, int i, int r, int g, int b)
2186 {
2187         return call_prom("call-method", 6, 1, ADDR("color!"), ih, i, b, g, r);
2188 }
2189
2190 /*
2191  * If we have a display that we don't know how to drive,
2192  * we will want to try to execute OF's open method for it
2193  * later.  However, OF will probably fall over if we do that
2194  * we've taken over the MMU.
2195  * So we check whether we will need to open the display,
2196  * and if so, open it now.
2197  */
2198 static void __init prom_check_displays(void)
2199 {
2200         char type[16], *path;
2201         phandle node;
2202         ihandle ih;
2203         int i;
2204
2205         static unsigned char default_colors[] = {
2206                 0x00, 0x00, 0x00,
2207                 0x00, 0x00, 0xaa,
2208                 0x00, 0xaa, 0x00,
2209                 0x00, 0xaa, 0xaa,
2210                 0xaa, 0x00, 0x00,
2211                 0xaa, 0x00, 0xaa,
2212                 0xaa, 0xaa, 0x00,
2213                 0xaa, 0xaa, 0xaa,
2214                 0x55, 0x55, 0x55,
2215                 0x55, 0x55, 0xff,
2216                 0x55, 0xff, 0x55,
2217                 0x55, 0xff, 0xff,
2218                 0xff, 0x55, 0x55,
2219                 0xff, 0x55, 0xff,
2220                 0xff, 0xff, 0x55,
2221                 0xff, 0xff, 0xff
2222         };
2223         const unsigned char *clut;
2224
2225         prom_debug("Looking for displays\n");
2226         for (node = 0; prom_next_node(&node); ) {
2227                 memset(type, 0, sizeof(type));
2228                 prom_getprop(node, "device_type", type, sizeof(type));
2229                 if (strcmp(type, "display") != 0)
2230                         continue;
2231
2232                 /* It seems OF doesn't null-terminate the path :-( */
2233                 path = prom_scratch;
2234                 memset(path, 0, PROM_SCRATCH_SIZE);
2235
2236                 /*
2237                  * leave some room at the end of the path for appending extra
2238                  * arguments
2239                  */
2240                 if (call_prom("package-to-path", 3, 1, node, path,
2241                               PROM_SCRATCH_SIZE-10) == PROM_ERROR)
2242                         continue;
2243                 prom_printf("found display   : %s, opening... ", path);
2244                 
2245                 ih = call_prom("open", 1, 1, path);
2246                 if (ih == 0) {
2247                         prom_printf("failed\n");
2248                         continue;
2249                 }
2250
2251                 /* Success */
2252                 prom_printf("done\n");
2253                 prom_setprop(node, path, "linux,opened", NULL, 0);
2254
2255                 /* Setup a usable color table when the appropriate
2256                  * method is available. Should update this to set-colors */
2257                 clut = default_colors;
2258                 for (i = 0; i < 16; i++, clut += 3)
2259                         if (prom_set_color(ih, i, clut[0], clut[1],
2260                                            clut[2]) != 0)
2261                                 break;
2262
2263 #ifdef CONFIG_LOGO_LINUX_CLUT224
2264                 clut = PTRRELOC(logo_linux_clut224.clut);
2265                 for (i = 0; i < logo_linux_clut224.clutsize; i++, clut += 3)
2266                         if (prom_set_color(ih, i + 32, clut[0], clut[1],
2267                                            clut[2]) != 0)
2268                                 break;
2269 #endif /* CONFIG_LOGO_LINUX_CLUT224 */
2270
2271 #ifdef CONFIG_PPC_EARLY_DEBUG_BOOTX
2272                 if (prom_getprop(node, "linux,boot-display", NULL, 0) !=
2273                     PROM_ERROR) {
2274                         u32 width, height, pitch, addr;
2275
2276                         prom_printf("Setting btext !\n");
2277                         prom_getprop(node, "width", &width, 4);
2278                         prom_getprop(node, "height", &height, 4);
2279                         prom_getprop(node, "linebytes", &pitch, 4);
2280                         prom_getprop(node, "address", &addr, 4);
2281                         prom_printf("W=%d H=%d LB=%d addr=0x%x\n",
2282                                     width, height, pitch, addr);
2283                         btext_setup_display(width, height, 8, pitch, addr);
2284                 }
2285 #endif /* CONFIG_PPC_EARLY_DEBUG_BOOTX */
2286         }
2287 }
2288
2289
2290 /* Return (relocated) pointer to this much memory: moves initrd if reqd. */
2291 static void __init *make_room(unsigned long *mem_start, unsigned long *mem_end,
2292                               unsigned long needed, unsigned long align)
2293 {
2294         void *ret;
2295
2296         *mem_start = _ALIGN(*mem_start, align);
2297         while ((*mem_start + needed) > *mem_end) {
2298                 unsigned long room, chunk;
2299
2300                 prom_debug("Chunk exhausted, claiming more at %lx...\n",
2301                            alloc_bottom);
2302                 room = alloc_top - alloc_bottom;
2303                 if (room > DEVTREE_CHUNK_SIZE)
2304                         room = DEVTREE_CHUNK_SIZE;
2305                 if (room < PAGE_SIZE)
2306                         prom_panic("No memory for flatten_device_tree "
2307                                    "(no room)\n");
2308                 chunk = alloc_up(room, 0);
2309                 if (chunk == 0)
2310                         prom_panic("No memory for flatten_device_tree "
2311                                    "(claim failed)\n");
2312                 *mem_end = chunk + room;
2313         }
2314
2315         ret = (void *)*mem_start;
2316         *mem_start += needed;
2317
2318         return ret;
2319 }
2320
2321 #define dt_push_token(token, mem_start, mem_end) do {                   \
2322                 void *room = make_room(mem_start, mem_end, 4, 4);       \
2323                 *(__be32 *)room = cpu_to_be32(token);                   \
2324         } while(0)
2325
2326 static unsigned long __init dt_find_string(char *str)
2327 {
2328         char *s, *os;
2329
2330         s = os = (char *)dt_string_start;
2331         s += 4;
2332         while (s <  (char *)dt_string_end) {
2333                 if (strcmp(s, str) == 0)
2334                         return s - os;
2335                 s += strlen(s) + 1;
2336         }
2337         return 0;
2338 }
2339
2340 /*
2341  * The Open Firmware 1275 specification states properties must be 31 bytes or
2342  * less, however not all firmwares obey this. Make it 64 bytes to be safe.
2343  */
2344 #define MAX_PROPERTY_NAME 64
2345
2346 static void __init scan_dt_build_strings(phandle node,
2347                                          unsigned long *mem_start,
2348                                          unsigned long *mem_end)
2349 {
2350         char *prev_name, *namep, *sstart;
2351         unsigned long soff;
2352         phandle child;
2353
2354         sstart =  (char *)dt_string_start;
2355
2356         /* get and store all property names */
2357         prev_name = "";
2358         for (;;) {
2359                 /* 64 is max len of name including nul. */
2360                 namep = make_room(mem_start, mem_end, MAX_PROPERTY_NAME, 1);
2361                 if (call_prom("nextprop", 3, 1, node, prev_name, namep) != 1) {
2362                         /* No more nodes: unwind alloc */
2363                         *mem_start = (unsigned long)namep;
2364                         break;
2365                 }
2366
2367                 /* skip "name" */
2368                 if (strcmp(namep, "name") == 0) {
2369                         *mem_start = (unsigned long)namep;
2370                         prev_name = "name";
2371                         continue;
2372                 }
2373                 /* get/create string entry */
2374                 soff = dt_find_string(namep);
2375                 if (soff != 0) {
2376                         *mem_start = (unsigned long)namep;
2377                         namep = sstart + soff;
2378                 } else {
2379                         /* Trim off some if we can */
2380                         *mem_start = (unsigned long)namep + strlen(namep) + 1;
2381                         dt_string_end = *mem_start;
2382                 }
2383                 prev_name = namep;
2384         }
2385
2386         /* do all our children */
2387         child = call_prom("child", 1, 1, node);
2388         while (child != 0) {
2389                 scan_dt_build_strings(child, mem_start, mem_end);
2390                 child = call_prom("peer", 1, 1, child);
2391         }
2392 }
2393
2394 static void __init scan_dt_build_struct(phandle node, unsigned long *mem_start,
2395                                         unsigned long *mem_end)
2396 {
2397         phandle child;
2398         char *namep, *prev_name, *sstart, *p, *ep, *lp, *path;
2399         unsigned long soff;
2400         unsigned char *valp;
2401         static char pname[MAX_PROPERTY_NAME];
2402         int l, room, has_phandle = 0;
2403
2404         dt_push_token(OF_DT_BEGIN_NODE, mem_start, mem_end);
2405
2406         /* get the node's full name */
2407         namep = (char *)*mem_start;
2408         room = *mem_end - *mem_start;
2409         if (room > 255)
2410                 room = 255;
2411         l = call_prom("package-to-path", 3, 1, node, namep, room);
2412         if (l >= 0) {
2413                 /* Didn't fit?  Get more room. */
2414                 if (l >= room) {
2415                         if (l >= *mem_end - *mem_start)
2416                                 namep = make_room(mem_start, mem_end, l+1, 1);
2417                         call_prom("package-to-path", 3, 1, node, namep, l);
2418                 }
2419                 namep[l] = '\0';
2420
2421                 /* Fixup an Apple bug where they have bogus \0 chars in the
2422                  * middle of the path in some properties, and extract
2423                  * the unit name (everything after the last '/').
2424                  */
2425                 for (lp = p = namep, ep = namep + l; p < ep; p++) {
2426                         if (*p == '/')
2427                                 lp = namep;
2428                         else if (*p != 0)
2429                                 *lp++ = *p;
2430                 }
2431                 *lp = 0;
2432                 *mem_start = _ALIGN((unsigned long)lp + 1, 4);
2433         }
2434
2435         /* get it again for debugging */
2436         path = prom_scratch;
2437         memset(path, 0, PROM_SCRATCH_SIZE);
2438         call_prom("package-to-path", 3, 1, node, path, PROM_SCRATCH_SIZE-1);
2439
2440         /* get and store all properties */
2441         prev_name = "";
2442         sstart = (char *)dt_string_start;
2443         for (;;) {
2444                 if (call_prom("nextprop", 3, 1, node, prev_name,
2445                               pname) != 1)
2446                         break;
2447
2448                 /* skip "name" */
2449                 if (strcmp(pname, "name") == 0) {
2450                         prev_name = "name";
2451                         continue;
2452                 }
2453
2454                 /* find string offset */
2455                 soff = dt_find_string(pname);
2456                 if (soff == 0) {
2457                         prom_printf("WARNING: Can't find string index for"
2458                                     " <%s>, node %s\n", pname, path);
2459                         break;
2460                 }
2461                 prev_name = sstart + soff;
2462
2463                 /* get length */
2464                 l = call_prom("getproplen", 2, 1, node, pname);
2465
2466                 /* sanity checks */
2467                 if (l == PROM_ERROR)
2468                         continue;
2469
2470                 /* push property head */
2471                 dt_push_token(OF_DT_PROP, mem_start, mem_end);
2472                 dt_push_token(l, mem_start, mem_end);
2473                 dt_push_token(soff, mem_start, mem_end);
2474
2475                 /* push property content */
2476                 valp = make_room(mem_start, mem_end, l, 4);
2477                 call_prom("getprop", 4, 1, node, pname, valp, l);
2478                 *mem_start = _ALIGN(*mem_start, 4);
2479
2480                 if (!strcmp(pname, "phandle"))
2481                         has_phandle = 1;
2482         }
2483
2484         /* Add a "linux,phandle" property if no "phandle" property already
2485          * existed (can happen with OPAL)
2486          */
2487         if (!has_phandle) {
2488                 soff = dt_find_string("linux,phandle");
2489                 if (soff == 0)
2490                         prom_printf("WARNING: Can't find string index for"
2491                                     " <linux-phandle> node %s\n", path);
2492                 else {
2493                         dt_push_token(OF_DT_PROP, mem_start, mem_end);
2494                         dt_push_token(4, mem_start, mem_end);
2495                         dt_push_token(soff, mem_start, mem_end);
2496                         valp = make_room(mem_start, mem_end, 4, 4);
2497                         *(__be32 *)valp = cpu_to_be32(node);
2498                 }
2499         }
2500
2501         /* do all our children */
2502         child = call_prom("child", 1, 1, node);
2503         while (child != 0) {
2504                 scan_dt_build_struct(child, mem_start, mem_end);
2505                 child = call_prom("peer", 1, 1, child);
2506         }
2507
2508         dt_push_token(OF_DT_END_NODE, mem_start, mem_end);
2509 }
2510
2511 static void __init flatten_device_tree(void)
2512 {
2513         phandle root;
2514         unsigned long mem_start, mem_end, room;
2515         struct boot_param_header *hdr;
2516         char *namep;
2517         u64 *rsvmap;
2518
2519         /*
2520          * Check how much room we have between alloc top & bottom (+/- a
2521          * few pages), crop to 1MB, as this is our "chunk" size
2522          */
2523         room = alloc_top - alloc_bottom - 0x4000;
2524         if (room > DEVTREE_CHUNK_SIZE)
2525                 room = DEVTREE_CHUNK_SIZE;
2526         prom_debug("starting device tree allocs at %lx\n", alloc_bottom);
2527
2528         /* Now try to claim that */
2529         mem_start = (unsigned long)alloc_up(room, PAGE_SIZE);
2530         if (mem_start == 0)
2531                 prom_panic("Can't allocate initial device-tree chunk\n");
2532         mem_end = mem_start + room;
2533
2534         /* Get root of tree */
2535         root = call_prom("peer", 1, 1, (phandle)0);
2536         if (root == (phandle)0)
2537                 prom_panic ("couldn't get device tree root\n");
2538
2539         /* Build header and make room for mem rsv map */ 
2540         mem_start = _ALIGN(mem_start, 4);
2541         hdr = make_room(&mem_start, &mem_end,
2542                         sizeof(struct boot_param_header), 4);
2543         dt_header_start = (unsigned long)hdr;
2544         rsvmap = make_room(&mem_start, &mem_end, sizeof(mem_reserve_map), 8);
2545
2546         /* Start of strings */
2547         mem_start = PAGE_ALIGN(mem_start);
2548         dt_string_start = mem_start;
2549         mem_start += 4; /* hole */
2550
2551         /* Add "linux,phandle" in there, we'll need it */
2552         namep = make_room(&mem_start, &mem_end, 16, 1);
2553         strcpy(namep, "linux,phandle");
2554         mem_start = (unsigned long)namep + strlen(namep) + 1;
2555
2556         /* Build string array */
2557         prom_printf("Building dt strings...\n"); 
2558         scan_dt_build_strings(root, &mem_start, &mem_end);
2559         dt_string_end = mem_start;
2560
2561         /* Build structure */
2562         mem_start = PAGE_ALIGN(mem_start);
2563         dt_struct_start = mem_start;
2564         prom_printf("Building dt structure...\n"); 
2565         scan_dt_build_struct(root, &mem_start, &mem_end);
2566         dt_push_token(OF_DT_END, &mem_start, &mem_end);
2567         dt_struct_end = PAGE_ALIGN(mem_start);
2568
2569         /* Finish header */
2570         hdr->boot_cpuid_phys = cpu_to_be32(prom.cpu);
2571         hdr->magic = cpu_to_be32(OF_DT_HEADER);
2572         hdr->totalsize = cpu_to_be32(dt_struct_end - dt_header_start);
2573         hdr->off_dt_struct = cpu_to_be32(dt_struct_start - dt_header_start);
2574         hdr->off_dt_strings = cpu_to_be32(dt_string_start - dt_header_start);
2575         hdr->dt_strings_size = cpu_to_be32(dt_string_end - dt_string_start);
2576         hdr->off_mem_rsvmap = cpu_to_be32(((unsigned long)rsvmap) - dt_header_start);
2577         hdr->version = cpu_to_be32(OF_DT_VERSION);
2578         /* Version 16 is not backward compatible */
2579         hdr->last_comp_version = cpu_to_be32(0x10);
2580
2581         /* Copy the reserve map in */
2582         memcpy(rsvmap, mem_reserve_map, sizeof(mem_reserve_map));
2583
2584 #ifdef DEBUG_PROM
2585         {
2586                 int i;
2587                 prom_printf("reserved memory map:\n");
2588                 for (i = 0; i < mem_reserve_cnt; i++)
2589                         prom_printf("  %llx - %llx\n",
2590                                     be64_to_cpu(mem_reserve_map[i].base),
2591                                     be64_to_cpu(mem_reserve_map[i].size));
2592         }
2593 #endif
2594         /* Bump mem_reserve_cnt to cause further reservations to fail
2595          * since it's too late.
2596          */
2597         mem_reserve_cnt = MEM_RESERVE_MAP_SIZE;
2598
2599         prom_printf("Device tree strings 0x%lx -> 0x%lx\n",
2600                     dt_string_start, dt_string_end);
2601         prom_printf("Device tree struct  0x%lx -> 0x%lx\n",
2602                     dt_struct_start, dt_struct_end);
2603 }
2604
2605 #ifdef CONFIG_PPC_MAPLE
2606 /* PIBS Version 1.05.0000 04/26/2005 has an incorrect /ht/isa/ranges property.
2607  * The values are bad, and it doesn't even have the right number of cells. */
2608 static void __init fixup_device_tree_maple(void)
2609 {
2610         phandle isa;
2611         u32 rloc = 0x01002000; /* IO space; PCI device = 4 */
2612         u32 isa_ranges[6];
2613         char *name;
2614
2615         name = "/ht@0/isa@4";
2616         isa = call_prom("finddevice", 1, 1, ADDR(name));
2617         if (!PHANDLE_VALID(isa)) {
2618                 name = "/ht@0/isa@6";
2619                 isa = call_prom("finddevice", 1, 1, ADDR(name));
2620                 rloc = 0x01003000; /* IO space; PCI device = 6 */
2621         }
2622         if (!PHANDLE_VALID(isa))
2623                 return;
2624
2625         if (prom_getproplen(isa, "ranges") != 12)
2626                 return;
2627         if (prom_getprop(isa, "ranges", isa_ranges, sizeof(isa_ranges))
2628                 == PROM_ERROR)
2629                 return;
2630
2631         if (isa_ranges[0] != 0x1 ||
2632                 isa_ranges[1] != 0xf4000000 ||
2633                 isa_ranges[2] != 0x00010000)
2634                 return;
2635
2636         prom_printf("Fixing up bogus ISA range on Maple/Apache...\n");
2637
2638         isa_ranges[0] = 0x1;
2639         isa_ranges[1] = 0x0;
2640         isa_ranges[2] = rloc;
2641         isa_ranges[3] = 0x0;
2642         isa_ranges[4] = 0x0;
2643         isa_ranges[5] = 0x00010000;
2644         prom_setprop(isa, name, "ranges",
2645                         isa_ranges, sizeof(isa_ranges));
2646 }
2647
2648 #define CPC925_MC_START         0xf8000000
2649 #define CPC925_MC_LENGTH        0x1000000
2650 /* The values for memory-controller don't have right number of cells */
2651 static void __init fixup_device_tree_maple_memory_controller(void)
2652 {
2653         phandle mc;
2654         u32 mc_reg[4];
2655         char *name = "/hostbridge@f8000000";
2656         u32 ac, sc;
2657
2658         mc = call_prom("finddevice", 1, 1, ADDR(name));
2659         if (!PHANDLE_VALID(mc))
2660                 return;
2661
2662         if (prom_getproplen(mc, "reg") != 8)
2663                 return;
2664
2665         prom_getprop(prom.root, "#address-cells", &ac, sizeof(ac));
2666         prom_getprop(prom.root, "#size-cells", &sc, sizeof(sc));
2667         if ((ac != 2) || (sc != 2))
2668                 return;
2669
2670         if (prom_getprop(mc, "reg", mc_reg, sizeof(mc_reg)) == PROM_ERROR)
2671                 return;
2672
2673         if (mc_reg[0] != CPC925_MC_START || mc_reg[1] != CPC925_MC_LENGTH)
2674                 return;
2675
2676         prom_printf("Fixing up bogus hostbridge on Maple...\n");
2677
2678         mc_reg[0] = 0x0;
2679         mc_reg[1] = CPC925_MC_START;
2680         mc_reg[2] = 0x0;
2681         mc_reg[3] = CPC925_MC_LENGTH;
2682         prom_setprop(mc, name, "reg", mc_reg, sizeof(mc_reg));
2683 }
2684 #else
2685 #define fixup_device_tree_maple()
2686 #define fixup_device_tree_maple_memory_controller()
2687 #endif
2688
2689 #ifdef CONFIG_PPC_CHRP
2690 /*
2691  * Pegasos and BriQ lacks the "ranges" property in the isa node
2692  * Pegasos needs decimal IRQ 14/15, not hexadecimal
2693  * Pegasos has the IDE configured in legacy mode, but advertised as native
2694  */
2695 static void __init fixup_device_tree_chrp(void)
2696 {
2697         phandle ph;
2698         u32 prop[6];
2699         u32 rloc = 0x01006000; /* IO space; PCI device = 12 */
2700         char *name;
2701         int rc;
2702
2703         name = "/pci@80000000/isa@c";
2704         ph = call_prom("finddevice", 1, 1, ADDR(name));
2705         if (!PHANDLE_VALID(ph)) {
2706                 name = "/pci@ff500000/isa@6";
2707                 ph = call_prom("finddevice", 1, 1, ADDR(name));
2708                 rloc = 0x01003000; /* IO space; PCI device = 6 */
2709         }
2710         if (PHANDLE_VALID(ph)) {
2711                 rc = prom_getproplen(ph, "ranges");
2712                 if (rc == 0 || rc == PROM_ERROR) {
2713                         prom_printf("Fixing up missing ISA range on Pegasos...\n");
2714
2715                         prop[0] = 0x1;
2716                         prop[1] = 0x0;
2717                         prop[2] = rloc;
2718                         prop[3] = 0x0;
2719                         prop[4] = 0x0;
2720                         prop[5] = 0x00010000;
2721                         prom_setprop(ph, name, "ranges", prop, sizeof(prop));
2722                 }
2723         }
2724
2725         name = "/pci@80000000/ide@C,1";
2726         ph = call_prom("finddevice", 1, 1, ADDR(name));
2727         if (PHANDLE_VALID(ph)) {
2728                 prom_printf("Fixing up IDE interrupt on Pegasos...\n");
2729                 prop[0] = 14;
2730                 prop[1] = 0x0;
2731                 prom_setprop(ph, name, "interrupts", prop, 2*sizeof(u32));
2732                 prom_printf("Fixing up IDE class-code on Pegasos...\n");
2733                 rc = prom_getprop(ph, "class-code", prop, sizeof(u32));
2734                 if (rc == sizeof(u32)) {
2735                         prop[0] &= ~0x5;
2736                         prom_setprop(ph, name, "class-code", prop, sizeof(u32));
2737                 }
2738         }
2739 }
2740 #else
2741 #define fixup_device_tree_chrp()
2742 #endif
2743
2744 #if defined(CONFIG_PPC64) && defined(CONFIG_PPC_PMAC)
2745 static void __init fixup_device_tree_pmac(void)
2746 {
2747         phandle u3, i2c, mpic;
2748         u32 u3_rev;
2749         u32 interrupts[2];
2750         u32 parent;
2751
2752         /* Some G5s have a missing interrupt definition, fix it up here */
2753         u3 = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000"));
2754         if (!PHANDLE_VALID(u3))
2755                 return;
2756         i2c = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000/i2c@f8001000"));
2757         if (!PHANDLE_VALID(i2c))
2758                 return;
2759         mpic = call_prom("finddevice", 1, 1, ADDR("/u3@0,f8000000/mpic@f8040000"));
2760         if (!PHANDLE_VALID(mpic))
2761                 return;
2762
2763         /* check if proper rev of u3 */
2764         if (prom_getprop(u3, "device-rev", &u3_rev, sizeof(u3_rev))
2765             == PROM_ERROR)
2766                 return;
2767         if (u3_rev < 0x35 || u3_rev > 0x39)
2768                 return;
2769         /* does it need fixup ? */
2770         if (prom_getproplen(i2c, "interrupts") > 0)
2771                 return;
2772
2773         prom_printf("fixing up bogus interrupts for u3 i2c...\n");
2774
2775         /* interrupt on this revision of u3 is number 0 and level */
2776         interrupts[0] = 0;
2777         interrupts[1] = 1;
2778         prom_setprop(i2c, "/u3@0,f8000000/i2c@f8001000", "interrupts",
2779                      &interrupts, sizeof(interrupts));
2780         parent = (u32)mpic;
2781         prom_setprop(i2c, "/u3@0,f8000000/i2c@f8001000", "interrupt-parent",
2782                      &parent, sizeof(parent));
2783 }
2784 #else
2785 #define fixup_device_tree_pmac()
2786 #endif
2787
2788 #ifdef CONFIG_PPC_EFIKA
2789 /*
2790  * The MPC5200 FEC driver requires an phy-handle property to tell it how
2791  * to talk to the phy.  If the phy-handle property is missing, then this
2792  * function is called to add the appropriate nodes and link it to the
2793  * ethernet node.
2794  */
2795 static void __init fixup_device_tree_efika_add_phy(void)
2796 {
2797         u32 node;
2798         char prop[64];
2799         int rv;
2800
2801         /* Check if /builtin/ethernet exists - bail if it doesn't */
2802         node = call_prom("finddevice", 1, 1, ADDR("/builtin/ethernet"));
2803         if (!PHANDLE_VALID(node))
2804                 return;
2805
2806         /* Check if the phy-handle property exists - bail if it does */
2807         rv = prom_getprop(node, "phy-handle", prop, sizeof(prop));
2808         if (rv <= 0)
2809                 return;
2810
2811         /*
2812          * At this point the ethernet device doesn't have a phy described.
2813          * Now we need to add the missing phy node and linkage
2814          */
2815
2816         /* Check for an MDIO bus node - if missing then create one */
2817         node = call_prom("finddevice", 1, 1, ADDR("/builtin/mdio"));
2818         if (!PHANDLE_VALID(node)) {
2819                 prom_printf("Adding Ethernet MDIO node\n");
2820                 call_prom("interpret", 1, 1,
2821                         " s\" /builtin\" find-device"
2822                         " new-device"
2823                                 " 1 encode-int s\" #address-cells\" property"
2824                                 " 0 encode-int s\" #size-cells\" property"
2825                                 " s\" mdio\" device-name"
2826                                 " s\" fsl,mpc5200b-mdio\" encode-string"
2827                                 " s\" compatible\" property"
2828                                 " 0xf0003000 0x400 reg"
2829                                 " 0x2 encode-int"
2830                                 " 0x5 encode-int encode+"
2831                                 " 0x3 encode-int encode+"
2832                                 " s\" interrupts\" property"
2833                         " finish-device");
2834         };
2835
2836         /* Check for a PHY device node - if missing then create one and
2837          * give it's phandle to the ethernet node */
2838         node = call_prom("finddevice", 1, 1,
2839                          ADDR("/builtin/mdio/ethernet-phy"));
2840         if (!PHANDLE_VALID(node)) {
2841                 prom_printf("Adding Ethernet PHY node\n");
2842                 call_prom("interpret", 1, 1,
2843                         " s\" /builtin/mdio\" find-device"
2844                         " new-device"
2845                                 " s\" ethernet-phy\" device-name"
2846                                 " 0x10 encode-int s\" reg\" property"
2847                                 " my-self"
2848                                 " ihandle>phandle"
2849                         " finish-device"
2850                         " s\" /builtin/ethernet\" find-device"
2851                                 " encode-int"
2852                                 " s\" phy-handle\" property"
2853                         " device-end");
2854         }
2855 }
2856
2857 static void __init fixup_device_tree_efika(void)
2858 {
2859         int sound_irq[3] = { 2, 2, 0 };
2860         int bcomm_irq[3*16] = { 3,0,0, 3,1,0, 3,2,0, 3,3,0,
2861                                 3,4,0, 3,5,0, 3,6,0, 3,7,0,
2862                                 3,8,0, 3,9,0, 3,10,0, 3,11,0,
2863                                 3,12,0, 3,13,0, 3,14,0, 3,15,0 };
2864         u32 node;
2865         char prop[64];
2866         int rv, len;
2867
2868         /* Check if we're really running on a EFIKA */
2869         node = call_prom("finddevice", 1, 1, ADDR("/"));
2870         if (!PHANDLE_VALID(node))
2871                 return;
2872
2873         rv = prom_getprop(node, "model", prop, sizeof(prop));
2874         if (rv == PROM_ERROR)
2875                 return;
2876         if (strcmp(prop, "EFIKA5K2"))
2877                 return;
2878
2879         prom_printf("Applying EFIKA device tree fixups\n");
2880
2881         /* Claiming to be 'chrp' is death */
2882         node = call_prom("finddevice", 1, 1, ADDR("/"));
2883         rv = prom_getprop(node, "device_type", prop, sizeof(prop));
2884         if (rv != PROM_ERROR && (strcmp(prop, "chrp") == 0))
2885                 prom_setprop(node, "/", "device_type", "efika", sizeof("efika"));
2886
2887         /* CODEGEN,description is exposed in /proc/cpuinfo so
2888            fix that too */
2889         rv = prom_getprop(node, "CODEGEN,description", prop, sizeof(prop));
2890         if (rv != PROM_ERROR && (strstr(prop, "CHRP")))
2891                 prom_setprop(node, "/", "CODEGEN,description",
2892                              "Efika 5200B PowerPC System",
2893                              sizeof("Efika 5200B PowerPC System"));
2894
2895         /* Fixup bestcomm interrupts property */
2896         node = call_prom("finddevice", 1, 1, ADDR("/builtin/bestcomm"));
2897         if (PHANDLE_VALID(node)) {
2898                 len = prom_getproplen(node, "interrupts");
2899                 if (len == 12) {
2900                         prom_printf("Fixing bestcomm interrupts property\n");
2901                         prom_setprop(node, "/builtin/bestcom", "interrupts",
2902                                      bcomm_irq, sizeof(bcomm_irq));
2903                 }
2904         }
2905
2906         /* Fixup sound interrupts property */
2907         node = call_prom("finddevice", 1, 1, ADDR("/builtin/sound"));
2908         if (PHANDLE_VALID(node)) {
2909                 rv = prom_getprop(node, "interrupts", prop, sizeof(prop));
2910                 if (rv == PROM_ERROR) {
2911                         prom_printf("Adding sound interrupts property\n");
2912                         prom_setprop(node, "/builtin/sound", "interrupts",
2913                                      sound_irq, sizeof(sound_irq));
2914                 }
2915         }
2916
2917         /* Make sure ethernet phy-handle property exists */
2918         fixup_device_tree_efika_add_phy();
2919 }
2920 #else
2921 #define fixup_device_tree_efika()
2922 #endif
2923
2924 #ifdef CONFIG_PPC_PASEMI_NEMO
2925 /*
2926  * CFE supplied on Nemo is broken in several ways, biggest
2927  * problem is that it reassigns ISA interrupts to unused mpic ints.
2928  * Add an interrupt-controller property for the io-bridge to use
2929  * and correct the ints so we can attach them to an irq_domain
2930  */
2931 static void __init fixup_device_tree_pasemi(void)
2932 {
2933         u32 interrupts[2], parent, rval, val = 0;
2934         char *name, *pci_name;
2935         phandle iob, node;
2936
2937         /* Find the root pci node */
2938         name = "/pxp@0,e0000000";
2939         iob = call_prom("finddevice", 1, 1, ADDR(name));
2940         if (!PHANDLE_VALID(iob))
2941                 return;
2942
2943         /* check if interrupt-controller node set yet */
2944         if (prom_getproplen(iob, "interrupt-controller") !=PROM_ERROR)
2945                 return;
2946
2947         prom_printf("adding interrupt-controller property for SB600...\n");
2948
2949         prom_setprop(iob, name, "interrupt-controller", &val, 0);
2950
2951         pci_name = "/pxp@0,e0000000/pci@11";
2952         node = call_prom("finddevice", 1, 1, ADDR(pci_name));
2953         parent = ADDR(iob);
2954
2955         for( ; prom_next_node(&node); ) {
2956                 /* scan each node for one with an interrupt */
2957                 if (!PHANDLE_VALID(node))
2958                         continue;
2959
2960                 rval = prom_getproplen(node, "interrupts");
2961                 if (rval == 0 || rval == PROM_ERROR)
2962                         continue;
2963
2964                 prom_getprop(node, "interrupts", &interrupts, sizeof(interrupts));
2965                 if ((interrupts[0] < 212) || (interrupts[0] > 222))
2966                         continue;
2967
2968                 /* found a node, update both interrupts and interrupt-parent */
2969                 if ((interrupts[0] >= 212) && (interrupts[0] <= 215))
2970                         interrupts[0] -= 203;
2971                 if ((interrupts[0] >= 216) && (interrupts[0] <= 220))
2972                         interrupts[0] -= 213;
2973                 if (interrupts[0] == 221)
2974                         interrupts[0] = 14;
2975                 if (interrupts[0] == 222)
2976                         interrupts[0] = 8;
2977
2978                 prom_setprop(node, pci_name, "interrupts", interrupts,
2979                                         sizeof(interrupts));
2980                 prom_setprop(node, pci_name, "interrupt-parent", &parent,
2981                                         sizeof(parent));
2982         }
2983
2984         /*
2985          * The io-bridge has device_type set to 'io-bridge' change it to 'isa'
2986          * so that generic isa-bridge code can add the SB600 and its on-board
2987          * peripherals.
2988          */
2989         name = "/pxp@0,e0000000/io-bridge@0";
2990         iob = call_prom("finddevice", 1, 1, ADDR(name));
2991         if (!PHANDLE_VALID(iob))
2992                 return;
2993
2994         /* device_type is already set, just change it. */
2995
2996         prom_printf("Changing device_type of SB600 node...\n");
2997
2998         prom_setprop(iob, name, "device_type", "isa", sizeof("isa"));
2999 }
3000 #else   /* !CONFIG_PPC_PASEMI_NEMO */
3001 static inline void fixup_device_tree_pasemi(void) { }
3002 #endif
3003
3004 static void __init fixup_device_tree(void)
3005 {
3006         fixup_device_tree_maple();
3007         fixup_device_tree_maple_memory_controller();
3008         fixup_device_tree_chrp();
3009         fixup_device_tree_pmac();
3010         fixup_device_tree_efika();
3011         fixup_device_tree_pasemi();
3012 }
3013
3014 static void __init prom_find_boot_cpu(void)
3015 {
3016         __be32 rval;
3017         ihandle prom_cpu;
3018         phandle cpu_pkg;
3019
3020         rval = 0;
3021         if (prom_getprop(prom.chosen, "cpu", &rval, sizeof(rval)) <= 0)
3022                 return;
3023         prom_cpu = be32_to_cpu(rval);
3024
3025         cpu_pkg = call_prom("instance-to-package", 1, 1, prom_cpu);
3026
3027         if (!PHANDLE_VALID(cpu_pkg))
3028                 return;
3029
3030         prom_getprop(cpu_pkg, "reg", &rval, sizeof(rval));
3031         prom.cpu = be32_to_cpu(rval);
3032
3033         prom_debug("Booting CPU hw index = %d\n", prom.cpu);
3034 }
3035
3036 static void __init prom_check_initrd(unsigned long r3, unsigned long r4)
3037 {
3038 #ifdef CONFIG_BLK_DEV_INITRD
3039         if (r3 && r4 && r4 != 0xdeadbeef) {
3040                 __be64 val;
3041
3042                 prom_initrd_start = is_kernel_addr(r3) ? __pa(r3) : r3;
3043                 prom_initrd_end = prom_initrd_start + r4;
3044
3045                 val = cpu_to_be64(prom_initrd_start);
3046                 prom_setprop(prom.chosen, "/chosen", "linux,initrd-start",
3047                              &val, sizeof(val));
3048                 val = cpu_to_be64(prom_initrd_end);
3049                 prom_setprop(prom.chosen, "/chosen", "linux,initrd-end",
3050                              &val, sizeof(val));
3051
3052                 reserve_mem(prom_initrd_start,
3053                             prom_initrd_end - prom_initrd_start);
3054
3055                 prom_debug("initrd_start=0x%lx\n", prom_initrd_start);
3056                 prom_debug("initrd_end=0x%lx\n", prom_initrd_end);
3057         }
3058 #endif /* CONFIG_BLK_DEV_INITRD */
3059 }
3060
3061 #ifdef CONFIG_PPC64
3062 #ifdef CONFIG_RELOCATABLE
3063 static void reloc_toc(void)
3064 {
3065 }
3066
3067 static void unreloc_toc(void)
3068 {
3069 }
3070 #else
3071 static void __reloc_toc(unsigned long offset, unsigned long nr_entries)
3072 {
3073         unsigned long i;
3074         unsigned long *toc_entry;
3075
3076         /* Get the start of the TOC by using r2 directly. */
3077         asm volatile("addi %0,2,-0x8000" : "=b" (toc_entry));
3078
3079         for (i = 0; i < nr_entries; i++) {
3080                 *toc_entry = *toc_entry + offset;
3081                 toc_entry++;
3082         }
3083 }
3084
3085 static void reloc_toc(void)
3086 {
3087         unsigned long offset = reloc_offset();
3088         unsigned long nr_entries =
3089                 (__prom_init_toc_end - __prom_init_toc_start) / sizeof(long);
3090
3091         __reloc_toc(offset, nr_entries);
3092
3093         mb();
3094 }
3095
3096 static void unreloc_toc(void)
3097 {
3098         unsigned long offset = reloc_offset();
3099         unsigned long nr_entries =
3100                 (__prom_init_toc_end - __prom_init_toc_start) / sizeof(long);
3101
3102         mb();
3103
3104         __reloc_toc(-offset, nr_entries);
3105 }
3106 #endif
3107 #endif
3108
3109 /*
3110  * We enter here early on, when the Open Firmware prom is still
3111  * handling exceptions and the MMU hash table for us.
3112  */
3113
3114 unsigned long __init prom_init(unsigned long r3, unsigned long r4,
3115                                unsigned long pp,
3116                                unsigned long r6, unsigned long r7,
3117                                unsigned long kbase)
3118 {       
3119         unsigned long hdr;
3120
3121 #ifdef CONFIG_PPC32
3122         unsigned long offset = reloc_offset();
3123         reloc_got2(offset);
3124 #else
3125         reloc_toc();
3126 #endif
3127
3128         /*
3129          * First zero the BSS
3130          */
3131         memset(&__bss_start, 0, __bss_stop - __bss_start);
3132
3133         /*
3134          * Init interface to Open Firmware, get some node references,
3135          * like /chosen
3136          */
3137         prom_init_client_services(pp);
3138
3139         /*
3140          * See if this OF is old enough that we need to do explicit maps
3141          * and other workarounds
3142          */
3143         prom_find_mmu();
3144
3145         /*
3146          * Init prom stdout device
3147          */
3148         prom_init_stdout();
3149
3150         prom_printf("Preparing to boot %s", linux_banner);
3151
3152         /*
3153          * Get default machine type. At this point, we do not differentiate
3154          * between pSeries SMP and pSeries LPAR
3155          */
3156         of_platform = prom_find_machine_type();
3157         prom_printf("Detected machine type: %x\n", of_platform);
3158
3159 #ifndef CONFIG_NONSTATIC_KERNEL
3160         /* Bail if this is a kdump kernel. */
3161         if (PHYSICAL_START > 0)
3162                 prom_panic("Error: You can't boot a kdump kernel from OF!\n");
3163 #endif
3164
3165         /*
3166          * Check for an initrd
3167          */
3168         prom_check_initrd(r3, r4);
3169
3170         /*
3171          * Do early parsing of command line
3172          */
3173         early_cmdline_parse();
3174
3175 #if defined(CONFIG_PPC_PSERIES) || defined(CONFIG_PPC_POWERNV)
3176         /*
3177          * On pSeries, inform the firmware about our capabilities
3178          */
3179         if (of_platform == PLATFORM_PSERIES ||
3180             of_platform == PLATFORM_PSERIES_LPAR)
3181                 prom_send_capabilities();
3182 #endif
3183
3184         /*
3185          * Copy the CPU hold code
3186          */
3187         if (of_platform != PLATFORM_POWERMAC)
3188                 copy_and_flush(0, kbase, 0x100, 0);
3189
3190         /*
3191          * Initialize memory management within prom_init
3192          */
3193         prom_init_mem();
3194
3195         /*
3196          * Determine which cpu is actually running right _now_
3197          */
3198         prom_find_boot_cpu();
3199
3200         /* 
3201          * Initialize display devices
3202          */
3203         prom_check_displays();
3204
3205 #if defined(CONFIG_PPC64) && defined(__BIG_ENDIAN__)
3206         /*
3207          * Initialize IOMMU (TCE tables) on pSeries. Do that before anything else
3208          * that uses the allocator, we need to make sure we get the top of memory
3209          * available for us here...
3210          */
3211         if (of_platform == PLATFORM_PSERIES)
3212                 prom_initialize_tce_table();
3213 #endif
3214
3215         /*
3216          * On non-powermacs, try to instantiate RTAS. PowerMacs don't
3217          * have a usable RTAS implementation.
3218          */
3219         if (of_platform != PLATFORM_POWERMAC &&
3220             of_platform != PLATFORM_OPAL)
3221                 prom_instantiate_rtas();
3222
3223 #ifdef CONFIG_PPC_POWERNV
3224         if (of_platform == PLATFORM_OPAL)
3225                 prom_instantiate_opal();
3226 #endif /* CONFIG_PPC_POWERNV */
3227
3228 #ifdef CONFIG_PPC64
3229         /* instantiate sml */
3230         prom_instantiate_sml();
3231 #endif
3232
3233         /*
3234          * On non-powermacs, put all CPUs in spin-loops.
3235          *
3236          * PowerMacs use a different mechanism to spin CPUs
3237          *
3238          * (This must be done after instanciating RTAS)
3239          */
3240         if (of_platform != PLATFORM_POWERMAC &&
3241             of_platform != PLATFORM_OPAL)
3242                 prom_hold_cpus();
3243
3244         /*
3245          * Fill in some infos for use by the kernel later on
3246          */
3247         if (prom_memory_limit) {
3248                 __be64 val = cpu_to_be64(prom_memory_limit);
3249                 prom_setprop(prom.chosen, "/chosen", "linux,memory-limit",
3250                              &val, sizeof(val));
3251         }
3252 #ifdef CONFIG_PPC64
3253         if (prom_iommu_off)
3254                 prom_setprop(prom.chosen, "/chosen", "linux,iommu-off",
3255                              NULL, 0);
3256
3257         if (prom_iommu_force_on)
3258                 prom_setprop(prom.chosen, "/chosen", "linux,iommu-force-on",
3259                              NULL, 0);
3260
3261         if (prom_tce_alloc_start) {
3262                 prom_setprop(prom.chosen, "/chosen", "linux,tce-alloc-start",
3263                              &prom_tce_alloc_start,
3264                              sizeof(prom_tce_alloc_start));
3265                 prom_setprop(prom.chosen, "/chosen", "linux,tce-alloc-end",
3266                              &prom_tce_alloc_end,
3267                              sizeof(prom_tce_alloc_end));
3268         }
3269 #endif
3270
3271         /*
3272          * Fixup any known bugs in the device-tree
3273          */
3274         fixup_device_tree();
3275
3276         /*
3277          * Now finally create the flattened device-tree
3278          */
3279         prom_printf("copying OF device tree...\n");
3280         flatten_device_tree();
3281
3282         /*
3283          * in case stdin is USB and still active on IBM machines...
3284          * Unfortunately quiesce crashes on some powermacs if we have
3285          * closed stdin already (in particular the powerbook 101). It
3286          * appears that the OPAL version of OFW doesn't like it either.
3287          */
3288         if (of_platform != PLATFORM_POWERMAC &&
3289             of_platform != PLATFORM_OPAL)
3290                 prom_close_stdin();
3291
3292         /*
3293          * Call OF "quiesce" method to shut down pending DMA's from
3294          * devices etc...
3295          */
3296         prom_printf("Quiescing Open Firmware ...\n");
3297         call_prom("quiesce", 0, 0);
3298
3299         /*
3300          * And finally, call the kernel passing it the flattened device
3301          * tree and NULL as r5, thus triggering the new entry point which
3302          * is common to us and kexec
3303          */
3304         hdr = dt_header_start;
3305
3306         /* Don't print anything after quiesce under OPAL, it crashes OFW */
3307         if (of_platform != PLATFORM_OPAL) {
3308                 prom_printf("Booting Linux via __start() @ 0x%lx ...\n", kbase);
3309                 prom_debug("->dt_header_start=0x%lx\n", hdr);
3310         }
3311
3312 #ifdef CONFIG_PPC32
3313         reloc_got2(-offset);
3314 #else
3315         unreloc_toc();
3316 #endif
3317
3318 #ifdef CONFIG_PPC_EARLY_DEBUG_OPAL
3319         /* OPAL early debug gets the OPAL base & entry in r8 and r9 */
3320         __start(hdr, kbase, 0, 0, 0,
3321                 prom_opal_base, prom_opal_entry);
3322 #else
3323         __start(hdr, kbase, 0, 0, 0, 0, 0);
3324 #endif
3325
3326         return 0;
3327 }