2 * Copyright (C) 1995-1999 Gary Thomas, Paul Mackerras, Cort Dougan.
4 #ifndef _ASM_POWERPC_PPC_ASM_H
5 #define _ASM_POWERPC_PPC_ASM_H
7 #include <linux/stringify.h>
8 #include <asm/asm-compat.h>
9 #include <asm/processor.h>
10 #include <asm/ppc-opcode.h>
11 #include <asm/firmware.h>
14 #error __FILE__ should only be used in assembler files
17 #define SZL (BITS_PER_LONG/8)
20 * Stuff for accurate CPU time accounting.
21 * These macros handle transitions between user and system state
22 * in exception entry and exit and accumulate time to the
23 * user_time and system_time fields in the paca.
26 #ifndef CONFIG_VIRT_CPU_ACCOUNTING_NATIVE
/*
 * CONFIG_VIRT_CPU_ACCOUNTING_NATIVE is not defined on this branch: the three
 * accounting hooks are defined with empty bodies, so every use of them
 * expands to nothing and the (ra, rb) arguments are discarded.
 */
27 #define ACCOUNT_CPU_USER_ENTRY(ra, rb)
28 #define ACCOUNT_CPU_USER_EXIT(ra, rb)
29 #define ACCOUNT_STOLEN_TIME
/*
 * ACCOUNT_CPU_USER_ENTRY(ra, rb) - add the elapsed interval to user time.
 *
 * ra, rb: scratch registers; both are overwritten.
 *
 * Reads the timebase into ra, records it in PACA_STARTTIME, and adds
 * (timebase - PACA_STARTTIME_USER) to PACA_USER_TIME. Every paca field is
 * addressed relative to r13.
 *
 * The final line carries no trailing backslash on purpose: a continuation
 * there would splice whatever line follows the macro into its body.
 */
31 #define ACCOUNT_CPU_USER_ENTRY(ra, rb) \
32 MFTB(ra); /* get timebase */ \
33 ld rb,PACA_STARTTIME_USER(r13); \
34 std ra,PACA_STARTTIME(r13); \
35 subf rb,rb,ra; /* subtract start value */ \
36 ld ra,PACA_USER_TIME(r13); \
37 add ra,ra,rb; /* add on to user time */ \
38 std ra,PACA_USER_TIME(r13);
/*
 * ACCOUNT_CPU_USER_EXIT(ra, rb) - add the elapsed interval to system time.
 *
 * ra, rb: scratch registers; both are overwritten.
 *
 * Reads the timebase into ra, records it in PACA_STARTTIME_USER, and adds
 * (timebase - PACA_STARTTIME) to PACA_SYSTEM_TIME. Every paca field is
 * addressed relative to r13.
 */
40 #define ACCOUNT_CPU_USER_EXIT(ra, rb) \
41 MFTB(ra); /* get timebase */ \
42 ld rb,PACA_STARTTIME(r13); \
43 std ra,PACA_STARTTIME_USER(r13); \
44 subf rb,rb,ra; /* subtract start value */ \
45 ld ra,PACA_SYSTEM_TIME(r13); \
46 add ra,ra,rb; /* add on to system time */ \
47 std ra,PACA_SYSTEM_TIME(r13)
49 #ifdef CONFIG_PPC_SPLPAR
50 #define ACCOUNT_STOLEN_TIME \
51 BEGIN_FW_FTR_SECTION; \
53 /* from user - see if there are any DTL entries to process */ \
54 ld r10,PACALPPACAPTR(r13); /* get ptr to VPA */ \
55 ld r11,PACA_DTL_RIDX(r13); /* get log read index */ \
56 addi r10,r10,LPPACA_DTLIDX; \
57 LDX_BE r10,0,r10; /* get log write index */ \
60 bl accumulate_stolen_time; \
62 andi. r10,r12,MSR_PR; /* Restore cr0 (coming from user) */ \
64 END_FW_FTR_SECTION_IFSET(FW_FEATURE_SPLPAR)
66 #else /* CONFIG_PPC_SPLPAR */
67 #define ACCOUNT_STOLEN_TIME
69 #endif /* CONFIG_PPC_SPLPAR */
71 #endif /* CONFIG_VIRT_CPU_ACCOUNTING_NATIVE */
74 * Macros for storing registers into and loading registers from
/*
 * Doubleword (std/ld) variants: GPR n lives at offset GPR0 + 8*n from 'base'.
 * SAVE_NVGPRS/REST_NVGPRS cover r14..r31 (8 registers from 14, then 10
 * registers from 22).
 */
78 #define SAVE_GPR(n, base) std n,GPR0+8*(n)(base)
79 #define REST_GPR(n, base) ld n,GPR0+8*(n)(base)
80 #define SAVE_NVGPRS(base) SAVE_8GPRS(14, base); SAVE_10GPRS(22, base)
81 #define REST_NVGPRS(base) REST_8GPRS(14, base); REST_10GPRS(22, base)
83 #define SAVE_GPR(n, base) stw n,GPR0+4*(n)(base)
84 #define REST_GPR(n, base) lwz n,GPR0+4*(n)(base)
85 #define SAVE_NVGPRS(base) SAVE_GPR(13, base); SAVE_8GPRS(14, base); \
87 #define REST_NVGPRS(base) REST_GPR(13, base); REST_8GPRS(14, base); \
/*
 * Multi-register helpers built by doubling: SAVE_kGPRS(n, base) expands to
 * SAVE_GPR for the k consecutive registers n .. n+k-1, in ascending order
 * (REST_kGPRS likewise with REST_GPR). 'n' is pasted textually, so the
 * arguments passed down are expressions such as n+1 or n+4, not evaluated
 * numbers.
 */
91 #define SAVE_2GPRS(n, base) SAVE_GPR(n, base); SAVE_GPR(n+1, base)
92 #define SAVE_4GPRS(n, base) SAVE_2GPRS(n, base); SAVE_2GPRS(n+2, base)
93 #define SAVE_8GPRS(n, base) SAVE_4GPRS(n, base); SAVE_4GPRS(n+4, base)
94 #define SAVE_10GPRS(n, base) SAVE_8GPRS(n, base); SAVE_2GPRS(n+8, base)
95 #define REST_2GPRS(n, base) REST_GPR(n, base); REST_GPR(n+1, base)
96 #define REST_4GPRS(n, base) REST_2GPRS(n, base); REST_2GPRS(n+2, base)
97 #define REST_8GPRS(n, base) REST_4GPRS(n, base); REST_4GPRS(n+4, base)
98 #define REST_10GPRS(n, base) REST_8GPRS(n, base); REST_2GPRS(n+8, base)
/*
 * Floating point register save/restore.
 *
 * SAVE_FPR/REST_FPR store/load FPR n with stfd/lfd at byte offset
 * 8*TS_FPRWIDTH*n from 'base'. The _2/_4/_8/_16/_32 variants expand to the
 * single-register macro for that many consecutive registers starting at n,
 * in ascending order.
 */
100 #define SAVE_FPR(n, base) stfd n,8*TS_FPRWIDTH*(n)(base)
101 #define SAVE_2FPRS(n, base) SAVE_FPR(n, base); SAVE_FPR(n+1, base)
102 #define SAVE_4FPRS(n, base) SAVE_2FPRS(n, base); SAVE_2FPRS(n+2, base)
103 #define SAVE_8FPRS(n, base) SAVE_4FPRS(n, base); SAVE_4FPRS(n+4, base)
104 #define SAVE_16FPRS(n, base) SAVE_8FPRS(n, base); SAVE_8FPRS(n+8, base)
105 #define SAVE_32FPRS(n, base) SAVE_16FPRS(n, base); SAVE_16FPRS(n+16, base)
106 #define REST_FPR(n, base) lfd n,8*TS_FPRWIDTH*(n)(base)
107 #define REST_2FPRS(n, base) REST_FPR(n, base); REST_FPR(n+1, base)
108 #define REST_4FPRS(n, base) REST_2FPRS(n, base); REST_2FPRS(n+2, base)
109 #define REST_8FPRS(n, base) REST_4FPRS(n, base); REST_4FPRS(n+4, base)
110 #define REST_16FPRS(n, base) REST_8FPRS(n, base); REST_8FPRS(n+8, base)
111 #define REST_32FPRS(n, base) REST_16FPRS(n, base); REST_16FPRS(n+16, base)
/*
 * Vector register save/restore.
 *
 * n    = first vector register
 * b    = scratch GPR; overwritten with the byte offset 16*n by every
 *        single-register expansion
 * base = GPR holding the base address of the save area
 *
 * stvx/lvx are indexed-form, so the offset is first loaded into b with li.
 * The _2 .. _32 variants repeat the single-register macro for consecutive
 * registers in ascending order.
 */
113 #define SAVE_VR(n,b,base) li b,16*(n); stvx n,base,b
114 #define SAVE_2VRS(n,b,base) SAVE_VR(n,b,base); SAVE_VR(n+1,b,base)
115 #define SAVE_4VRS(n,b,base) SAVE_2VRS(n,b,base); SAVE_2VRS(n+2,b,base)
116 #define SAVE_8VRS(n,b,base) SAVE_4VRS(n,b,base); SAVE_4VRS(n+4,b,base)
117 #define SAVE_16VRS(n,b,base) SAVE_8VRS(n,b,base); SAVE_8VRS(n+8,b,base)
118 #define SAVE_32VRS(n,b,base) SAVE_16VRS(n,b,base); SAVE_16VRS(n+16,b,base)
119 #define REST_VR(n,b,base) li b,16*(n); lvx n,base,b
120 #define REST_2VRS(n,b,base) REST_VR(n,b,base); REST_VR(n+1,b,base)
121 #define REST_4VRS(n,b,base) REST_2VRS(n,b,base); REST_2VRS(n+2,b,base)
122 #define REST_8VRS(n,b,base) REST_4VRS(n,b,base); REST_4VRS(n+4,b,base)
123 #define REST_16VRS(n,b,base) REST_8VRS(n,b,base); REST_8VRS(n+8,b,base)
124 #define REST_32VRS(n,b,base) REST_16VRS(n,b,base); REST_16VRS(n+16,b,base)
126 #ifdef __BIG_ENDIAN__
127 #define STXVD2X_ROT(n,b,base) STXVD2X(n,b,base)
128 #define LXVD2X_ROT(n,b,base) LXVD2X(n,b,base)
130 #define STXVD2X_ROT(n,b,base) XXSWAPD(n,n); \
134 #define LXVD2X_ROT(n,b,base) LXVD2X(n,b,base); \
137 /* Save the lower 32 VSRs in the thread VSR region */
/*
 * VSX register save/restore.
 *
 * n    = first VSR
 * b    = scratch GPR; overwritten with the byte offset 16*n
 * base = GPR holding the base address of the save area
 *
 * The GPR arguments are token-pasted onto an 'R' prefix (R##base, R##b)
 * before being handed to STXVD2X_ROT/LXVD2X_ROT, so callers must pass names
 * for which the pasted R-prefixed symbol exists.
 * NOTE(review): presumably callers pass lower-case rN names so that the
 * paste yields RrN - confirm against the register definitions.
 *
 * The _2 .. _32 variants repeat the single-register macro for consecutive
 * registers in ascending order.
 */
138 #define SAVE_VSR(n,b,base) li b,16*(n); STXVD2X_ROT(n,R##base,R##b)
139 #define SAVE_2VSRS(n,b,base) SAVE_VSR(n,b,base); SAVE_VSR(n+1,b,base)
140 #define SAVE_4VSRS(n,b,base) SAVE_2VSRS(n,b,base); SAVE_2VSRS(n+2,b,base)
141 #define SAVE_8VSRS(n,b,base) SAVE_4VSRS(n,b,base); SAVE_4VSRS(n+4,b,base)
142 #define SAVE_16VSRS(n,b,base) SAVE_8VSRS(n,b,base); SAVE_8VSRS(n+8,b,base)
143 #define SAVE_32VSRS(n,b,base) SAVE_16VSRS(n,b,base); SAVE_16VSRS(n+16,b,base)
144 #define REST_VSR(n,b,base) li b,16*(n); LXVD2X_ROT(n,R##base,R##b)
145 #define REST_2VSRS(n,b,base) REST_VSR(n,b,base); REST_VSR(n+1,b,base)
146 #define REST_4VSRS(n,b,base) REST_2VSRS(n,b,base); REST_2VSRS(n+2,b,base)
147 #define REST_8VSRS(n,b,base) REST_4VSRS(n,b,base); REST_4VSRS(n+4,b,base)
148 #define REST_16VSRS(n,b,base) REST_8VSRS(n,b,base); REST_8VSRS(n+8,b,base)
149 #define REST_32VSRS(n,b,base) REST_16VSRS(n,b,base); REST_16VSRS(n+16,b,base)
152 * b = base register for addressing, o = base offset from register of 1st EVR
153 * n = first EVR, s = scratch
/*
 * SPE register save/restore; one 32-bit word per register at o + 4*n from b.
 *
 * SAVE_EVR: evmergehi places a word derived from register n into scratch s,
 *           which is then stored with stw.
 * REST_EVR: the word is loaded into scratch s with lwz and merged back into
 *           register n with evmergelo.
 * NOTE(review): presumably the word saved/restored is the upper half of the
 * 64-bit register, the lower half being handled as an ordinary GPR - confirm
 * against the SPE instruction definitions.
 *
 * Scratch s is overwritten by every expansion. The _2 .. _32 variants repeat
 * the single-register macro for consecutive registers in ascending order.
 */
155 #define SAVE_EVR(n,s,b,o) evmergehi s,s,n; stw s,o+4*(n)(b)
156 #define SAVE_2EVRS(n,s,b,o) SAVE_EVR(n,s,b,o); SAVE_EVR(n+1,s,b,o)
157 #define SAVE_4EVRS(n,s,b,o) SAVE_2EVRS(n,s,b,o); SAVE_2EVRS(n+2,s,b,o)
158 #define SAVE_8EVRS(n,s,b,o) SAVE_4EVRS(n,s,b,o); SAVE_4EVRS(n+4,s,b,o)
159 #define SAVE_16EVRS(n,s,b,o) SAVE_8EVRS(n,s,b,o); SAVE_8EVRS(n+8,s,b,o)
160 #define SAVE_32EVRS(n,s,b,o) SAVE_16EVRS(n,s,b,o); SAVE_16EVRS(n+16,s,b,o)
161 #define REST_EVR(n,s,b,o) lwz s,o+4*(n)(b); evmergelo n,s,n
162 #define REST_2EVRS(n,s,b,o) REST_EVR(n,s,b,o); REST_EVR(n+1,s,b,o)
163 #define REST_4EVRS(n,s,b,o) REST_2EVRS(n,s,b,o); REST_2EVRS(n+2,s,b,o)
164 #define REST_8EVRS(n,s,b,o) REST_4EVRS(n,s,b,o); REST_4EVRS(n+4,s,b,o)
165 #define REST_16EVRS(n,s,b,o) REST_8EVRS(n,s,b,o); REST_8EVRS(n+8,s,b,o)
166 #define REST_32EVRS(n,s,b,o) REST_16EVRS(n,s,b,o); REST_16EVRS(n+16,s,b,o)
168 /* Macros to adjust thread priority for hardware multithreading */
/*
 * Each macro expands to a single "or N,N,N" instruction, which ORs a
 * register with itself and therefore leaves its value unchanged. The macros
 * differ only in the register number used (31, 1, 6, 2, 5, 3, 7).
 * NOTE(review): presumably the hardware decodes these specific no-op forms
 * as priority hints - confirm against the processor documentation.
 */
169 #define HMT_VERY_LOW or 31,31,31 # very low priority
170 #define HMT_LOW or 1,1,1
171 #define HMT_MEDIUM_LOW or 6,6,6 # medium low priority
172 #define HMT_MEDIUM or 2,2,2
173 #define HMT_MEDIUM_HIGH or 5,5,5 # medium high priority
174 #define HMT_HIGH or 3,3,3
175 #define HMT_EXTRA_HIGH or 7,7,7 # power7 only
/*
 * __VCPU_GPR(n) - byte offset of slot n in the VCPU GPR array: VCPU_GPRS
 *                 plus n slots of ULONG_SIZE bytes each.
 * VCPU_GPR(n)   - same, but takes a register name; the name is pasted onto
 *                 __REG_ to obtain the register number.
 *
 * The parameter is parenthesized so that an expression argument (e.g. a sum)
 * is multiplied as a whole, matching __STK_REG() and __STK_PARAM().
 */
182 #define __VCPU_GPR(n) (VCPU_GPRS + ((n) * ULONG_SIZE))
183 #define VCPU_GPR(n) __VCPU_GPR(__REG_##n)
/*
 * STACKFRAMESIZE - frame size constant, 256 bytes.
 * __STK_REG(i)   - frame offset of the slot for register number i:
 *                  register 14 maps to offset 112, each following register
 *                  is 8 bytes further on.
 * STK_REG(i)     - same, but takes a register name; the name is pasted onto
 *                  __REG_ to obtain the register number.
 */
188 #define STACKFRAMESIZE 256
189 #define __STK_REG(i) (112 + ((i)-14)*8)
190 #define STK_REG(i) __STK_REG(__REG_##i)
192 #if defined(_CALL_ELF) && _CALL_ELF == 2
194 #define __STK_PARAM(i) (32 + ((i)-3)*8)
197 #define __STK_PARAM(i) (48 + ((i)-3)*8)
199 #define STK_PARAM(i) __STK_PARAM(__REG_##i)
201 #if defined(_CALL_ELF) && _CALL_ELF == 2
203 #define _GLOBAL(name) \
206 .type name,@function; \
210 #define _GLOBAL_TOC(name) \
213 .type name,@function; \
216 0: addis r2,r12,(.TOC.-0b)@ha; \
217 addi r2,r2,(.TOC.-0b)@l; \
218 .localentry name,.-name
220 #define _KPROBE(name) \
221 .section ".kprobes.text","a"; \
223 .type name,@function; \
227 #define _KPROBE_TOC(name) \
228 .section ".kprobes.text","a"; \
230 .type name,@function; \
233 0: addis r2,r12,(.TOC.-0b)@ha; \
234 addi r2,r2,(.TOC.-0b)@l; \
235 .localentry name,.-name
/*
 * Token pasting helpers. XGLUE pastes its arguments exactly as written;
 * GLUE goes through XGLUE so that macro arguments are expanded first and
 * the results are pasted.
 */
241 #define XGLUE(a,b) a##b
242 #define GLUE(a,b) XGLUE(a,b)
244 #define _GLOBAL(name) \
248 .globl GLUE(.,name); \
249 .section ".opd","aw"; \
251 .quad GLUE(.,name); \
252 .quad .TOC.@tocbase; \
255 .type GLUE(.,name),@function; \
258 #define _GLOBAL_TOC(name) _GLOBAL(name)
260 #define _KPROBE(name) \
261 .section ".kprobes.text","a"; \
264 .globl GLUE(.,name); \
265 .section ".opd","aw"; \
267 .quad GLUE(.,name); \
268 .quad .TOC.@tocbase; \
271 .type GLUE(.,name),@function; \
274 #define _KPROBE_TOC(n) _KPROBE(n)
276 #define DOTSYM(a) GLUE(.,a)
288 .stabs __stringify(n:F-1),N_FUN,0,0,n;\
292 #define _GLOBAL_TOC(name) _GLOBAL(name)
295 .section ".kprobes.text","a"; \
302 * LOAD_REG_IMMEDIATE(rn, expr)
303 * Loads the value of the constant expression 'expr' into register 'rn'
304 * using immediate instructions only. Use this when it's important not
305 * to reference other data (i.e. on ppc64 when the TOC pointer is not
306 * valid) and when 'expr' is a constant or absolute address.
308 * LOAD_REG_ADDR(rn, name)
309 * Loads the address of label 'name' into register 'rn'. Use this when
310 * you don't particularly need immediate instructions only, but you need
311 * the whole address in one register (e.g. it's a structure address and
312 * you want to access various offsets within it). On ppc32 this is
313 * identical to LOAD_REG_IMMEDIATE.
315 * LOAD_REG_ADDR_PIC(rn, name)
316 * Loads the address of label 'name' into register 'rn'. Use this when
317 * the kernel doesn't run at the linked or relocated address. Please
318 * note that this macro will clobber the lr register.
320 * LOAD_REG_ADDRBASE(rn, name)
322 * LOAD_REG_ADDRBASE loads part of the address of label 'name' into
323 * register 'rn'. ADDROFF(name) returns the remainder of the address as
324 * a constant expression. ADDROFF(name) is a signed expression < 16 bits
325 * in size, so is suitable for use directly as an offset in load and store
326 * instructions. Use this when loading/storing a single word or less as:
327 * LOAD_REG_ADDRBASE(rX, name)
328 * ld rY,ADDROFF(name)(rX)
331 /* Be careful, this will clobber the lr register. */
332 #define LOAD_REG_ADDR_PIC(reg, name) \
335 addis reg,reg,(name - 0b)@ha; \
336 addi reg,reg,(name - 0b)@l;
339 #ifdef HAVE_AS_ATHIGH
340 #define __AS_ATHIGH high
342 #define __AS_ATHIGH h
/*
 * LOAD_REG_IMMEDIATE(reg, expr) - build the value of 'expr' in 'reg' from
 * four 16-bit immediates, touching no memory:
 *
 *   lis/ori   place the @highest and @higher pieces in the low word,
 *   rldicr    rotates them left by 32 into the upper word (mask keeps
 *             bits 0..31, clearing the low word),
 *   oris/ori  fill in the __AS_ATHIGH (@high or @h) and @l pieces.
 *
 * Note that the expansion ends with a ';'.
 */
344 #define LOAD_REG_IMMEDIATE(reg,expr) \
345 lis reg,(expr)@highest; \
346 ori reg,reg,(expr)@higher; \
347 rldicr reg,reg,32,31; \
348 oris reg,reg,(expr)@__AS_ATHIGH; \
349 ori reg,reg,(expr)@l;
351 #define LOAD_REG_ADDR(reg,name) \
354 #define LOAD_REG_ADDRBASE(reg,name) LOAD_REG_ADDR(reg,name)
355 #define ADDROFF(name) 0
357 /* offsets for stack frame layout */
362 #define LOAD_REG_IMMEDIATE(reg,expr) \
364 addi reg,reg,(expr)@l;
366 #define LOAD_REG_ADDR(reg,name) LOAD_REG_IMMEDIATE(reg, name)
368 #define LOAD_REG_ADDRBASE(reg, name) lis reg,name@ha
369 #define ADDROFF(name) name@l
371 /* offsets for stack frame layout */
376 /* various errata or part fixups */
377 #ifdef CONFIG_PPC601_SYNC_FIX
382 END_FTR_SECTION_IFSET(CPU_FTR_601)
386 END_FTR_SECTION_IFSET(CPU_FTR_601)
390 END_FTR_SECTION_IFSET(CPU_FTR_601)
397 #if defined(CONFIG_PPC_CELL) || defined(CONFIG_PPC_FSL_BOOK3E)
399 90: mfspr dest, SPRN_TBRL; \
400 BEGIN_FTR_SECTION_NESTED(96); \
403 END_FTR_SECTION_NESTED(CPU_FTR_CELL_TB_BUG, CPU_FTR_CELL_TB_BUG, 96)
404 #elif defined(CONFIG_8xx)
405 #define MFTB(dest) mftb dest
407 #define MFTB(dest) mfspr dest, SPRN_TBRL
412 #else /* CONFIG_SMP */
413 /* tlbsync is not implemented on 601 */
418 END_FTR_SECTION_IFCLR(CPU_FTR_601)
422 #define MTOCRF(FXM, RS) \
423 BEGIN_FTR_SECTION_NESTED(848); \
425 FTR_SECTION_ELSE_NESTED(848); \
427 ALT_FTR_SECTION_END_NESTED_IFCLR(CPU_FTR_NOEXECUTE, 848)
430 * PPR restore macros used in entry_64.S
431 * Used for P7 or later processors
433 #define HMT_MEDIUM_LOW_HAS_PPR \
434 BEGIN_FTR_SECTION_NESTED(944) \
436 END_FTR_SECTION_NESTED(CPU_FTR_HAS_PPR,CPU_FTR_HAS_PPR,944)
/*
 * SET_DEFAULT_THREAD_PPR(ra, rb) - store the default PPR value.
 *
 * ra, rb: scratch registers; both are overwritten.
 *
 * Forms INIT_PPR in ra (its @highest 16 bits via lis, then shifted left by
 * 32 so they land in the top 16 bits of the doubleword), loads the pointer
 * held at PACACURRENT(r13) into rb, and stores ra at TASKTHREADPPR(rb).
 * The sequence is wrapped in a feature section keyed on CPU_FTR_HAS_PPR.
 */
438 #define SET_DEFAULT_THREAD_PPR(ra, rb) \
439 BEGIN_FTR_SECTION_NESTED(945) \
440 lis ra,INIT_PPR@highest; /* default ppr=3 */ \
441 ld rb,PACACURRENT(r13); \
442 sldi ra,ra,32; /* bits 11-13 are used for ppr */ \
443 std ra,TASKTHREADPPR(rb); \
444 END_FTR_SECTION_NESTED(CPU_FTR_HAS_PPR,CPU_FTR_HAS_PPR,945)
449 * This instruction is not implemented on the PPC 603 or 601; however, on
450 * the 403GCX and 405GP tlbia IS defined and tlbie is not.
451 * All of these instructions exist in the 8xx, they have magical powers,
452 * and they must be used.
455 #if !defined(CONFIG_4xx) && !defined(CONFIG_8xx)
459 lis r4,KERNELBASE@h; \
466 #ifdef CONFIG_IBM440EP_ERR42
467 #define PPC440EP_ERR42 isync
469 #define PPC440EP_ERR42
472 /* The following stops all load and store data streams associated with stream
473 * ID (ie. streams created explicitly). The embedded and server mnemonics for
474 * dcbt are different so we use machine "power4" here explicitly.
476 #define DCBT_STOP_ALL_STREAM_IDS(scratch) \
478 .machine "power4" ; \
479 lis scratch,0x60000000@h; \
480 dcbt r0,scratch,0b01010; \
484 * toreal/fromreal/tophys/tovirt macros. 32-bit BookE makes them
485 * keep the address intact to be compatible with code shared with
488 * On the other hand, I find it useful to have them behave as expected
489 * by their name (ie always do the addition) on 64-bit BookE
491 #if defined(CONFIG_BOOKE) && !defined(CONFIG_PPC64)
496 * We use addis to ensure compatibility with the "classic" ppc versions of
497 * these macros, which use rs = 0 to get the tophys offset in rd, rather than
498 * converting the address in r0, and so this version has to do that too
499 * (i.e. set register rd to 0 when rs == 0).
501 #define tophys(rd,rs) \
504 #define tovirt(rd,rs) \
507 #elif defined(CONFIG_PPC64)
508 #define toreal(rd) /* we can access c000... in real mode */
511 #define tophys(rd,rs) \
514 #define tovirt(rd,rs) \
516 ori rd,rd,((KERNELBASE>>48)&0xFFFF);\
520 * On APUS (Amiga PowerPC cpu upgrade board), we don't know the
521 * physical base address of RAM at compile time.
/*
 * In-place forms: toreal/fromreal convert the address held in rd by applying
 * tophys/tovirt with rd as both destination and source.
 */
523 #define toreal(rd) tophys(rd,rd)
524 #define fromreal(rd) tovirt(rd,rd)
526 #define tophys(rd,rs) \
527 0: addis rd,rs,-PAGE_OFFSET@h; \
528 .section ".vtop_fixup","aw"; \
533 #define tovirt(rd,rs) \
534 0: addis rd,rs,PAGE_OFFSET@h; \
535 .section ".ptov_fixup","aw"; \
541 #ifdef CONFIG_PPC_BOOK3S_64
543 #define MTMSRD(r) mtmsrd r
544 #define MTMSR_EERI(reg) mtmsrd reg,1
546 #define FIX_SRR1(ra, rb)
550 #define RFI rfi; b . /* Prevent prefetch past rfi */
552 #define MTMSRD(r) mtmsr r
553 #define MTMSR_EERI(reg) mtmsr reg
557 #endif /* __KERNEL__ */
559 /* The boring bits... */
561 /* Condition Register Bit Fields */
574 * General Purpose Registers (GPRs)
576 * The lower case r0-r31 should be used in preference to the upper
577 * case R0-R31 as they provide more error checking in the assembler.
578 * Use R0-31 only when really necessary.
615 /* Floating Point Registers (FPRs) */
650 /* AltiVec Registers (VPRs) */
685 /* VSX Registers (VSRs) */
752 /* SPE Registers (EVPRs) */
787 /* some stab codes */
794 * Create an endian fixup trampoline
796 * This starts with a "tdi 0,0,0x48" instruction which is
797 * essentially a "trap never", and thus akin to a nop.
799 * The opcode for this instruction read with the wrong endian
800 * however results in a b . + 8
802 * So essentially we use that trick to execute the following
803 * trampoline in "reverse endian" if we are running with the
804 * MSR_LE bit set the "wrong" way for whatever endianness the
805 * kernel is built for.
808 #ifdef CONFIG_PPC_BOOK3E
/*
 * FIXUP_ENDIAN layout: two native-endian instructions followed by eight
 * trampoline instructions emitted as byte-swapped .long words. r10 and r11
 * are overwritten when the trampoline runs.
 */
811 #define FIXUP_ENDIAN \
812 tdi 0,0,0x48; /* Reverse endian of b . + 8 */ \
813 b $+36; /* Skip trampoline if endian is good: 36 = this branch + the 8 words below */ \
814 .long 0x05009f42; /* bcl 20,31,$+4: puts the address of the next word in lr */ \
815 .long 0xa602487d; /* mflr r10 */ \
816 .long 0x1c004a39; /* addi r10,r10,28: 7 words on, i.e. just past the rfid */ \
817 .long 0xa600607d; /* mfmsr r11 */ \
818 .long 0x01006b69; /* xori r11,r11,1: flip the lowest bit of the MSR copy */ \
819 .long 0xa6035a7d; /* mtsrr0 r10 */ \
820 .long 0xa6037b7d; /* mtsrr1 r11 */ \
821 .long 0x2400004c /* rfid */
822 #endif /* !CONFIG_PPC_BOOK3E */
823 #endif /* __ASSEMBLY__ */
825 #ifdef CONFIG_PPC_FSL_BOOK3E
826 #define BTB_FLUSH(reg) \
827 lis reg,BUCSR_INIT@h; \
828 ori reg,reg,BUCSR_INIT@l; \
829 mtspr SPRN_BUCSR,reg; \
832 #define BTB_FLUSH(reg)
833 #endif /* CONFIG_PPC_FSL_BOOK3E */
835 #endif /* _ASM_POWERPC_PPC_ASM_H */