]> git.proxmox.com Git - mirror_ubuntu-artful-kernel.git/blob - arch/powerpc/kernel/misc_64.S
Merge branch 'for-4.7/wacom' into for-linus
[mirror_ubuntu-artful-kernel.git] / arch / powerpc / kernel / misc_64.S
1 /*
2 * This file contains miscellaneous low-level functions.
3 * Copyright (C) 1995-1996 Gary Thomas (gdt@linuxppc.org)
4 *
5 * Largely rewritten by Cort Dougan (cort@cs.nmt.edu)
6 * and Paul Mackerras.
7 * Adapted for iSeries by Mike Corrigan (mikejc@us.ibm.com)
8 * PPC64 updates by Dave Engebretsen (engebret@us.ibm.com)
9 *
10 * This program is free software; you can redistribute it and/or
11 * modify it under the terms of the GNU General Public License
12 * as published by the Free Software Foundation; either version
13 * 2 of the License, or (at your option) any later version.
14 *
15 */
16
17 #include <linux/sys.h>
18 #include <asm/unistd.h>
19 #include <asm/errno.h>
20 #include <asm/processor.h>
21 #include <asm/page.h>
22 #include <asm/cache.h>
23 #include <asm/ppc_asm.h>
24 #include <asm/asm-offsets.h>
25 #include <asm/cputable.h>
26 #include <asm/thread_info.h>
27 #include <asm/kexec.h>
28 #include <asm/ptrace.h>
29 #include <asm/mmu.h>
30
31 .text
32
33 _GLOBAL(call_do_softirq)
34 mflr r0
35 std r0,16(r1)
36 stdu r1,THREAD_SIZE-STACK_FRAME_OVERHEAD(r3)
37 mr r1,r3
38 bl __do_softirq
39 ld r1,0(r1)
40 ld r0,16(r1)
41 mtlr r0
42 blr
43
44 _GLOBAL(call_do_irq)
45 mflr r0
46 std r0,16(r1)
47 stdu r1,THREAD_SIZE-STACK_FRAME_OVERHEAD(r4)
48 mr r1,r4
49 bl __do_irq
50 ld r1,0(r1)
51 ld r0,16(r1)
52 mtlr r0
53 blr
54
55 .section ".toc","aw"
56 PPC64_CACHES:
57 .tc ppc64_caches[TC],ppc64_caches
58 .section ".text"
59
60 /*
61 * Write any modified data cache blocks out to memory
62 * and invalidate the corresponding instruction cache blocks.
63 *
64 * flush_icache_range(unsigned long start, unsigned long stop)
65 *
66 * flush all bytes from start through stop-1 inclusive
67 */
68
69 _KPROBE(flush_icache_range)
70 BEGIN_FTR_SECTION
71 PURGE_PREFETCHED_INS
72 blr
73 END_FTR_SECTION_IFSET(CPU_FTR_COHERENT_ICACHE)
74 /*
75 * Flush the data cache to memory
76 *
77 * Different systems have different cache line sizes
78 * and in some cases i-cache and d-cache line sizes differ from
79 * each other.
80 */
81 ld r10,PPC64_CACHES@toc(r2)
82 lwz r7,DCACHEL1LINESIZE(r10)/* Get cache line size */
83 addi r5,r7,-1
84 andc r6,r3,r5 /* round low to line bdy */
85 subf r8,r6,r4 /* compute length */
86 add r8,r8,r5 /* ensure we get enough */
87 lwz r9,DCACHEL1LOGLINESIZE(r10) /* Get log-2 of cache line size */
88 srw. r8,r8,r9 /* compute line count */
89 beqlr /* nothing to do? */
90 mtctr r8
91 1: dcbst 0,r6
92 add r6,r6,r7
93 bdnz 1b
94 sync
95
96 /* Now invalidate the instruction cache */
97
98 lwz r7,ICACHEL1LINESIZE(r10) /* Get Icache line size */
99 addi r5,r7,-1
100 andc r6,r3,r5 /* round low to line bdy */
101 subf r8,r6,r4 /* compute length */
102 add r8,r8,r5
103 lwz r9,ICACHEL1LOGLINESIZE(r10) /* Get log-2 of Icache line size */
104 srw. r8,r8,r9 /* compute line count */
105 beqlr /* nothing to do? */
106 mtctr r8
107 2: icbi 0,r6
108 add r6,r6,r7
109 bdnz 2b
110 isync
111 blr
112 .previous .text
113 /*
114 * Like above, but only do the D-cache.
115 *
116 * flush_dcache_range(unsigned long start, unsigned long stop)
117 *
118 * flush all bytes from start to stop-1 inclusive
119 */
120 _GLOBAL(flush_dcache_range)
121
122 /*
123 * Flush the data cache to memory
124 *
125 * Different systems have different cache line sizes
126 */
127 ld r10,PPC64_CACHES@toc(r2)
128 lwz r7,DCACHEL1LINESIZE(r10) /* Get dcache line size */
129 addi r5,r7,-1
130 andc r6,r3,r5 /* round low to line bdy */
131 subf r8,r6,r4 /* compute length */
132 add r8,r8,r5 /* ensure we get enough */
133 lwz r9,DCACHEL1LOGLINESIZE(r10) /* Get log-2 of dcache line size */
134 srw. r8,r8,r9 /* compute line count */
135 beqlr /* nothing to do? */
136 mtctr r8
137 0: dcbst 0,r6
138 add r6,r6,r7
139 bdnz 0b
140 sync
141 blr
142
143 /*
144 * Like above, but works on non-mapped physical addresses.
145 * Use only for non-LPAR setups ! It also assumes real mode
146 * is cacheable. Used for flushing out the DART before using
147 * it as uncacheable memory
148 *
149 * flush_dcache_phys_range(unsigned long start, unsigned long stop)
150 *
151 * flush all bytes from start to stop-1 inclusive
152 */
153 _GLOBAL(flush_dcache_phys_range)
154 ld r10,PPC64_CACHES@toc(r2)
155 lwz r7,DCACHEL1LINESIZE(r10) /* Get dcache line size */
156 addi r5,r7,-1
157 andc r6,r3,r5 /* round low to line bdy */
158 subf r8,r6,r4 /* compute length */
159 add r8,r8,r5 /* ensure we get enough */
160 lwz r9,DCACHEL1LOGLINESIZE(r10) /* Get log-2 of dcache line size */
161 srw. r8,r8,r9 /* compute line count */
162 beqlr /* nothing to do? */
163 mfmsr r5 /* Disable MMU Data Relocation */
164 ori r0,r5,MSR_DR
165 xori r0,r0,MSR_DR
166 sync
167 mtmsr r0
168 sync
169 isync
170 mtctr r8
171 0: dcbst 0,r6
172 add r6,r6,r7
173 bdnz 0b
174 sync
175 isync
176 mtmsr r5 /* Re-enable MMU Data Relocation */
177 sync
178 isync
179 blr
180
181 _GLOBAL(flush_inval_dcache_range)
182 ld r10,PPC64_CACHES@toc(r2)
183 lwz r7,DCACHEL1LINESIZE(r10) /* Get dcache line size */
184 addi r5,r7,-1
185 andc r6,r3,r5 /* round low to line bdy */
186 subf r8,r6,r4 /* compute length */
187 add r8,r8,r5 /* ensure we get enough */
188 lwz r9,DCACHEL1LOGLINESIZE(r10)/* Get log-2 of dcache line size */
189 srw. r8,r8,r9 /* compute line count */
190 beqlr /* nothing to do? */
191 sync
192 isync
193 mtctr r8
194 0: dcbf 0,r6
195 add r6,r6,r7
196 bdnz 0b
197 sync
198 isync
199 blr
200
201
202 /*
203 * Flush a particular page from the data cache to RAM.
204 * Note: this is necessary because the instruction cache does *not*
205 * snoop from the data cache.
206 *
207 * void __flush_dcache_icache(void *page)
208 */
209 _GLOBAL(__flush_dcache_icache)
210 /*
211 * Flush the data cache to memory
212 *
213 * Different systems have different cache line sizes
214 */
215
216 BEGIN_FTR_SECTION
217 PURGE_PREFETCHED_INS
218 blr
219 END_FTR_SECTION_IFSET(CPU_FTR_COHERENT_ICACHE)
220
221 /* Flush the dcache */
222 ld r7,PPC64_CACHES@toc(r2)
223 clrrdi r3,r3,PAGE_SHIFT /* Page align */
224 lwz r4,DCACHEL1LINESPERPAGE(r7) /* Get # dcache lines per page */
225 lwz r5,DCACHEL1LINESIZE(r7) /* Get dcache line size */
226 mr r6,r3
227 mtctr r4
228 0: dcbst 0,r6
229 add r6,r6,r5
230 bdnz 0b
231 sync
232
233 /* Now invalidate the icache */
234
235 lwz r4,ICACHEL1LINESPERPAGE(r7) /* Get # icache lines per page */
236 lwz r5,ICACHEL1LINESIZE(r7) /* Get icache line size */
237 mtctr r4
238 1: icbi 0,r3
239 add r3,r3,r5
240 bdnz 1b
241 isync
242 blr
243
244 _GLOBAL(__bswapdi2)
245 srdi r8,r3,32
246 rlwinm r7,r3,8,0xffffffff
247 rlwimi r7,r3,24,0,7
248 rlwinm r9,r8,8,0xffffffff
249 rlwimi r7,r3,24,16,23
250 rlwimi r9,r8,24,0,7
251 rlwimi r9,r8,24,16,23
252 sldi r7,r7,32
253 or r3,r7,r9
254 blr
255
256
257 #ifdef CONFIG_PPC_EARLY_DEBUG_BOOTX
258 _GLOBAL(rmci_on)
259 sync
260 isync
261 li r3,0x100
262 rldicl r3,r3,32,0
263 mfspr r5,SPRN_HID4
264 or r5,r5,r3
265 sync
266 mtspr SPRN_HID4,r5
267 isync
268 slbia
269 isync
270 sync
271 blr
272
273 _GLOBAL(rmci_off)
274 sync
275 isync
276 li r3,0x100
277 rldicl r3,r3,32,0
278 mfspr r5,SPRN_HID4
279 andc r5,r5,r3
280 sync
281 mtspr SPRN_HID4,r5
282 isync
283 slbia
284 isync
285 sync
286 blr
287 #endif /* CONFIG_PPC_EARLY_DEBUG_BOOTX */
288
289 #if defined(CONFIG_PPC_PMAC) || defined(CONFIG_PPC_MAPLE)
290
291 /*
292 * Do an IO access in real mode
293 */
294 _GLOBAL(real_readb)
295 mfmsr r7
296 ori r0,r7,MSR_DR
297 xori r0,r0,MSR_DR
298 sync
299 mtmsrd r0
300 sync
301 isync
302 mfspr r6,SPRN_HID4
303 rldicl r5,r6,32,0
304 ori r5,r5,0x100
305 rldicl r5,r5,32,0
306 sync
307 mtspr SPRN_HID4,r5
308 isync
309 slbia
310 isync
311 lbz r3,0(r3)
312 sync
313 mtspr SPRN_HID4,r6
314 isync
315 slbia
316 isync
317 mtmsrd r7
318 sync
319 isync
320 blr
321
322 /*
323 * Do an IO access in real mode
324 */
325 _GLOBAL(real_writeb)
326 mfmsr r7
327 ori r0,r7,MSR_DR
328 xori r0,r0,MSR_DR
329 sync
330 mtmsrd r0
331 sync
332 isync
333 mfspr r6,SPRN_HID4
334 rldicl r5,r6,32,0
335 ori r5,r5,0x100
336 rldicl r5,r5,32,0
337 sync
338 mtspr SPRN_HID4,r5
339 isync
340 slbia
341 isync
342 stb r3,0(r4)
343 sync
344 mtspr SPRN_HID4,r6
345 isync
346 slbia
347 isync
348 mtmsrd r7
349 sync
350 isync
351 blr
352 #endif /* defined(CONFIG_PPC_PMAC) || defined(CONFIG_PPC_MAPLE) */
353
354 #ifdef CONFIG_PPC_PASEMI
355
356 _GLOBAL(real_205_readb)
357 mfmsr r7
358 ori r0,r7,MSR_DR
359 xori r0,r0,MSR_DR
360 sync
361 mtmsrd r0
362 sync
363 isync
364 LBZCIX(R3,R0,R3)
365 isync
366 mtmsrd r7
367 sync
368 isync
369 blr
370
371 _GLOBAL(real_205_writeb)
372 mfmsr r7
373 ori r0,r7,MSR_DR
374 xori r0,r0,MSR_DR
375 sync
376 mtmsrd r0
377 sync
378 isync
379 STBCIX(R3,R0,R4)
380 isync
381 mtmsrd r7
382 sync
383 isync
384 blr
385
386 #endif /* CONFIG_PPC_PASEMI */
387
388
389 #if defined(CONFIG_CPU_FREQ_PMAC64) || defined(CONFIG_CPU_FREQ_MAPLE)
390 /*
391 * SCOM access functions for 970 (FX only for now)
392 *
393 * unsigned long scom970_read(unsigned int address);
394 * void scom970_write(unsigned int address, unsigned long value);
395 *
396 * The address passed in is the 24 bits register address. This code
397 * is 970 specific and will not check the status bits, so you should
398 * know what you are doing.
399 */
400 _GLOBAL(scom970_read)
401 /* interrupts off */
402 mfmsr r4
403 ori r0,r4,MSR_EE
404 xori r0,r0,MSR_EE
405 mtmsrd r0,1
406
407 /* rotate 24 bits SCOM address 8 bits left and mask out it's low 8 bits
408 * (including parity). On current CPUs they must be 0'd,
409 * and finally or in RW bit
410 */
411 rlwinm r3,r3,8,0,15
412 ori r3,r3,0x8000
413
414 /* do the actual scom read */
415 sync
416 mtspr SPRN_SCOMC,r3
417 isync
418 mfspr r3,SPRN_SCOMD
419 isync
420 mfspr r0,SPRN_SCOMC
421 isync
422
423 /* XXX: fixup result on some buggy 970's (ouch ! we lost a bit, bah
424 * that's the best we can do). Not implemented yet as we don't use
425 * the scom on any of the bogus CPUs yet, but may have to be done
426 * ultimately
427 */
428
429 /* restore interrupts */
430 mtmsrd r4,1
431 blr
432
433
434 _GLOBAL(scom970_write)
435 /* interrupts off */
436 mfmsr r5
437 ori r0,r5,MSR_EE
438 xori r0,r0,MSR_EE
439 mtmsrd r0,1
440
441 /* rotate 24 bits SCOM address 8 bits left and mask out it's low 8 bits
442 * (including parity). On current CPUs they must be 0'd.
443 */
444
445 rlwinm r3,r3,8,0,15
446
447 sync
448 mtspr SPRN_SCOMD,r4 /* write data */
449 isync
450 mtspr SPRN_SCOMC,r3 /* write command */
451 isync
452 mfspr 3,SPRN_SCOMC
453 isync
454
455 /* restore interrupts */
456 mtmsrd r5,1
457 blr
458 #endif /* CONFIG_CPU_FREQ_PMAC64 || CONFIG_CPU_FREQ_MAPLE */
459
460 /* kexec_wait(phys_cpu)
461 *
462 * wait for the flag to change, indicating this kernel is going away but
463 * the slave code for the next one is at addresses 0 to 100.
464 *
465 * This is used by all slaves, even those that did not find a matching
466 * paca in the secondary startup code.
467 *
468 * Physical (hardware) cpu id should be in r3.
469 */
470 _GLOBAL(kexec_wait)
471 bl 1f
472 1: mflr r5
473 addi r5,r5,kexec_flag-1b
474
475 99: HMT_LOW
476 #ifdef CONFIG_KEXEC /* use no memory without kexec */
477 lwz r4,0(r5)
478 cmpwi 0,r4,0
479 beq 99b
480 #ifdef CONFIG_PPC_BOOK3S_64
481 li r10,0x60
482 mfmsr r11
483 clrrdi r11,r11,1 /* Clear MSR_LE */
484 mtsrr0 r10
485 mtsrr1 r11
486 rfid
487 #else
488 /* Create TLB entry in book3e_secondary_core_init */
489 li r4,0
490 ba 0x60
491 #endif
492 #endif
493
494 /* this can be in text because we won't change it until we are
495 * running in real anyways
496 */
497 kexec_flag:
498 .long 0
499
500
501 #ifdef CONFIG_KEXEC
502 #ifdef CONFIG_PPC_BOOK3E
503 /*
504 * BOOK3E has no real MMU mode, so we have to setup the initial TLB
505 * for a core to identity map v:0 to p:0. This current implementation
506 * assumes that 1G is enough for kexec.
507 */
508 kexec_create_tlb:
509 /*
510 * Invalidate all non-IPROT TLB entries to avoid any TLB conflict.
511 * IPROT TLB entries should be >= PAGE_OFFSET and thus not conflict.
512 */
513 PPC_TLBILX_ALL(0,R0)
514 sync
515 isync
516
517 mfspr r10,SPRN_TLB1CFG
518 andi. r10,r10,TLBnCFG_N_ENTRY /* Extract # entries */
519 subi r10,r10,1 /* Last entry: no conflict with kernel text */
520 lis r9,MAS0_TLBSEL(1)@h
521 rlwimi r9,r10,16,4,15 /* Setup MAS0 = TLBSEL | ESEL(r9) */
522
523 /* Set up a temp identity mapping v:0 to p:0 and return to it. */
524 #if defined(CONFIG_SMP) || defined(CONFIG_PPC_E500MC)
525 #define M_IF_NEEDED MAS2_M
526 #else
527 #define M_IF_NEEDED 0
528 #endif
529 mtspr SPRN_MAS0,r9
530
531 lis r9,(MAS1_VALID|MAS1_IPROT)@h
532 ori r9,r9,(MAS1_TSIZE(BOOK3E_PAGESZ_1GB))@l
533 mtspr SPRN_MAS1,r9
534
535 LOAD_REG_IMMEDIATE(r9, 0x0 | M_IF_NEEDED)
536 mtspr SPRN_MAS2,r9
537
538 LOAD_REG_IMMEDIATE(r9, 0x0 | MAS3_SR | MAS3_SW | MAS3_SX)
539 mtspr SPRN_MAS3,r9
540 li r9,0
541 mtspr SPRN_MAS7,r9
542
543 tlbwe
544 isync
545 blr
546 #endif
547
548 /* kexec_smp_wait(void)
549 *
550 * call with interrupts off
551 * note: this is a terminal routine, it does not save lr
552 *
553 * get phys id from paca
554 * switch to real mode
555 * mark the paca as no longer used
556 * join other cpus in kexec_wait(phys_id)
557 */
558 _GLOBAL(kexec_smp_wait)
559 lhz r3,PACAHWCPUID(r13)
560 bl real_mode
561
562 li r4,KEXEC_STATE_REAL_MODE
563 stb r4,PACAKEXECSTATE(r13)
564 SYNC
565
566 b kexec_wait
567
568 /*
569 * switch to real mode (turn mmu off)
570 * we use the early kernel trick that the hardware ignores bits
571 * 0 and 1 (big endian) of the effective address in real mode
572 *
573 * don't overwrite r3 here, it is live for kexec_wait above.
574 */
575 real_mode: /* assume normal blr return */
576 #ifdef CONFIG_PPC_BOOK3E
577 /* Create an identity mapping. */
578 b kexec_create_tlb
579 #else
580 1: li r9,MSR_RI
581 li r10,MSR_DR|MSR_IR
582 mflr r11 /* return address to SRR0 */
583 mfmsr r12
584 andc r9,r12,r9
585 andc r10,r12,r10
586
587 mtmsrd r9,1
588 mtspr SPRN_SRR1,r10
589 mtspr SPRN_SRR0,r11
590 rfid
591 #endif
592
593 /*
594 * kexec_sequence(newstack, start, image, control, clear_all())
595 *
596 * does the grungy work with stack switching and real mode switches
597 * also does simple calls to other code
598 */
599
600 _GLOBAL(kexec_sequence)
601 mflr r0
602 std r0,16(r1)
603
604 /* switch stacks to newstack -- &kexec_stack.stack */
605 stdu r1,THREAD_SIZE-STACK_FRAME_OVERHEAD(r3)
606 mr r1,r3
607
608 li r0,0
609 std r0,16(r1)
610
611 /* save regs for local vars on new stack.
612 * yes, we won't go back, but ...
613 */
614 std r31,-8(r1)
615 std r30,-16(r1)
616 std r29,-24(r1)
617 std r28,-32(r1)
618 std r27,-40(r1)
619 std r26,-48(r1)
620 std r25,-56(r1)
621
622 stdu r1,-STACK_FRAME_OVERHEAD-64(r1)
623
624 /* save args into preserved regs */
625 mr r31,r3 /* newstack (both) */
626 mr r30,r4 /* start (real) */
627 mr r29,r5 /* image (virt) */
628 mr r28,r6 /* control, unused */
629 mr r27,r7 /* clear_all() fn desc */
630 mr r26,r8 /* spare */
631 lhz r25,PACAHWCPUID(r13) /* get our phys cpu from paca */
632
633 /* disable interrupts, we are overwriting kernel data next */
634 #ifdef CONFIG_PPC_BOOK3E
635 wrteei 0
636 #else
637 mfmsr r3
638 rlwinm r3,r3,0,17,15
639 mtmsrd r3,1
640 #endif
641
642 /* copy dest pages, flush whole dest image */
643 mr r3,r29
644 bl kexec_copy_flush /* (image) */
645
646 /* turn off mmu */
647 bl real_mode
648
649 /* copy 0x100 bytes starting at start to 0 */
650 li r3,0
651 mr r4,r30 /* start, aka phys mem offset */
652 li r5,0x100
653 li r6,0
654 bl copy_and_flush /* (dest, src, copy limit, start offset) */
655 1: /* assume normal blr return */
656
657 /* release other cpus to the new kernel secondary start at 0x60 */
658 mflr r5
659 li r6,1
660 stw r6,kexec_flag-1b(5)
661
662 #ifndef CONFIG_PPC_BOOK3E
663 /* clear out hardware hash page table and tlb */
664 #if !defined(_CALL_ELF) || _CALL_ELF != 2
665 ld r12,0(r27) /* deref function descriptor */
666 #else
667 mr r12,r27
668 #endif
669 mtctr r12
670 bctrl /* ppc_md.hpte_clear_all(void); */
671 #endif /* !CONFIG_PPC_BOOK3E */
672
673 /*
674 * kexec image calling is:
675 * the first 0x100 bytes of the entry point are copied to 0
676 *
677 * all slaves branch to slave = 0x60 (absolute)
678 * slave(phys_cpu_id);
679 *
680 * master goes to start = entry point
681 * start(phys_cpu_id, start, 0);
682 *
683 *
684 * a wrapper is needed to call existing kernels, here is an approximate
685 * description of one method:
686 *
687 * v2: (2.6.10)
688 * start will be near the boot_block (maybe 0x100 bytes before it?)
689 * it will have a 0x60, which will b to boot_block, where it will wait
690 * and 0 will store phys into struct boot-block and load r3 from there,
691 * copy kernel 0-0x100 and tell slaves to back down to 0x60 again
692 *
693 * v1: (2.6.9)
694 * boot block will have all cpus scanning device tree to see if they
695 * are the boot cpu ?????
696 * other device tree differences (prop sizes, va vs pa, etc)...
697 */
698 mr r3,r25 # my phys cpu
699 mr r4,r30 # start, aka phys mem offset
700 mtlr 4
701 li r5,0
702 blr /* image->start(physid, image->start, 0); */
703 #endif /* CONFIG_KEXEC */