2 * PARISC TLB and cache flushing support
3 * Copyright (C) 2000-2001 Hewlett-Packard (John Marvin)
4 * Copyright (C) 2001 Matthew Wilcox (willy at parisc-linux.org)
5 * Copyright (C) 2002 Richard Hirst (rhirst with parisc-linux.org)
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License as published by
9 * the Free Software Foundation; either version 2, or (at your option)
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with this program; if not, write to the Free Software
19 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 * NOTE: fdc,fic, and pdc instructions that use base register modification
24 * should only use index and base registers that are not shadowed,
25 * so that the fast path emulation in the non access miss handler
43 #include <linux/config.h>
46 #include <asm/assembly.h>
47 #include <asm/pgtable.h>
48 #include <asm/cache.h>
53 .export flush_tlb_all_local,code
61 * The pitlbe and pdtlbe instructions should only be used to
62 * flush the entire tlb. Also, there needs to be no intervening
63 * tlb operations, e.g. tlb misses, so the operation needs
64 * to happen in real mode with all interruptions disabled.
67 /* pcxt_ssm_bug - relied upon translation! PA 2.0 Arch. F-4 and F-5 */
68 rsm PSW_SM_I, %r19 /* save I-bit state */
76 rsm PSW_SM_Q, %r0 /* prep to load iia queue */
77 mtctl %r0, %cr17 /* Clear IIASQ tail */
78 mtctl %r0, %cr17 /* Clear IIASQ head */
79 mtctl %r1, %cr18 /* IIAOQ head */
81 mtctl %r1, %cr18 /* IIAOQ tail */
82 load32 REAL_MODE_PSW, %r1
87 1: ldil L%PA(cache_info), %r1
88 ldo R%PA(cache_info)(%r1), %r1
90 /* Flush Instruction Tlb */
92 LDREG ITLB_SID_BASE(%r1), %r20
93 LDREG ITLB_SID_STRIDE(%r1), %r21
94 LDREG ITLB_SID_COUNT(%r1), %r22
95 LDREG ITLB_OFF_BASE(%r1), %arg0
96 LDREG ITLB_OFF_STRIDE(%r1), %arg1
97 LDREG ITLB_OFF_COUNT(%r1), %arg2
98 LDREG ITLB_LOOP(%r1), %arg3
100 ADDIB= -1, %arg3, fitoneloop /* Preadjust and test */
101 movb,<,n %arg3, %r31, fitdone /* If loop < 0, skip */
102 copy %arg0, %r28 /* Init base addr */
104 fitmanyloop: /* Loop if LOOP >= 2 */
106 add %r21, %r20, %r20 /* increment space */
107 copy %arg2, %r29 /* Init middle loop count */
109 fitmanymiddle: /* Loop if LOOP >= 2 */
110 ADDIB> -1, %r31, fitmanymiddle /* Adjusted inner loop decr */
112 pitlbe,m %arg1(%sr1, %r28) /* Last pitlbe and addr adjust */
113 ADDIB> -1, %r29, fitmanymiddle /* Middle loop decr */
114 copy %arg3, %r31 /* Re-init inner loop count */
116 movb,tr %arg0, %r28, fitmanyloop /* Re-init base addr */
117 ADDIB<=,n -1, %r22, fitdone /* Outer loop count decr */
119 fitoneloop: /* Loop if LOOP = 1 */
121 copy %arg0, %r28 /* init base addr */
122 copy %arg2, %r29 /* init middle loop count */
124 fitonemiddle: /* Loop if LOOP = 1 */
125 ADDIB> -1, %r29, fitonemiddle /* Middle loop count decr */
126 pitlbe,m %arg1(%sr1, %r28) /* pitlbe for one loop */
128 ADDIB> -1, %r22, fitoneloop /* Outer loop count decr */
129 add %r21, %r20, %r20 /* increment space */
135 LDREG DTLB_SID_BASE(%r1), %r20
136 LDREG DTLB_SID_STRIDE(%r1), %r21
137 LDREG DTLB_SID_COUNT(%r1), %r22
138 LDREG DTLB_OFF_BASE(%r1), %arg0
139 LDREG DTLB_OFF_STRIDE(%r1), %arg1
140 LDREG DTLB_OFF_COUNT(%r1), %arg2
141 LDREG DTLB_LOOP(%r1), %arg3
143 ADDIB= -1, %arg3, fdtoneloop /* Preadjust and test */
144 movb,<,n %arg3, %r31, fdtdone /* If loop < 0, skip */
145 copy %arg0, %r28 /* Init base addr */
147 fdtmanyloop: /* Loop if LOOP >= 2 */
149 add %r21, %r20, %r20 /* increment space */
150 copy %arg2, %r29 /* Init middle loop count */
152 fdtmanymiddle: /* Loop if LOOP >= 2 */
153 ADDIB> -1, %r31, fdtmanymiddle /* Adjusted inner loop decr */
155 pdtlbe,m %arg1(%sr1, %r28) /* Last pdtlbe and addr adjust */
156 ADDIB> -1, %r29, fdtmanymiddle /* Middle loop decr */
157 copy %arg3, %r31 /* Re-init inner loop count */
159 movb,tr %arg0, %r28, fdtmanyloop /* Re-init base addr */
160 ADDIB<=,n -1, %r22,fdtdone /* Outer loop count decr */
162 fdtoneloop: /* Loop if LOOP = 1 */
164 copy %arg0, %r28 /* init base addr */
165 copy %arg2, %r29 /* init middle loop count */
167 fdtonemiddle: /* Loop if LOOP = 1 */
168 ADDIB> -1, %r29, fdtonemiddle /* Middle loop count decr */
169 pdtlbe,m %arg1(%sr1, %r28) /* pdtlbe for one loop */
171 ADDIB> -1, %r22, fdtoneloop /* Outer loop count decr */
172 add %r21, %r20, %r20 /* increment space */
177 * Switch back to virtual mode
188 rsm PSW_SM_Q, %r0 /* prep to load iia queue */
189 mtctl %r0, %cr17 /* Clear IIASQ tail */
190 mtctl %r0, %cr17 /* Clear IIASQ head */
191 mtctl %r1, %cr18 /* IIAOQ head */
193 mtctl %r1, %cr18 /* IIAOQ tail */
194 load32 KERNEL_PSW, %r1
195 or %r1, %r19, %r1 /* I-bit to state on entry */
196 mtctl %r1, %ipsw /* restore I-bit (entire PSW) */
206 .export flush_instruction_cache_local,code
207 .import cache_info,data
209 flush_instruction_cache_local:
215 ldil L%cache_info, %r1
216 ldo R%cache_info(%r1), %r1
218 /* Flush Instruction Cache */
220 LDREG ICACHE_BASE(%r1), %arg0
221 LDREG ICACHE_STRIDE(%r1), %arg1
222 LDREG ICACHE_COUNT(%r1), %arg2
223 LDREG ICACHE_LOOP(%r1), %arg3
224 rsm PSW_SM_I, %r22 /* No mmgt ops during loop*/
225 ADDIB= -1, %arg3, fioneloop /* Preadjust and test */
226 movb,<,n %arg3, %r31, fisync /* If loop < 0, do sync */
228 fimanyloop: /* Loop if LOOP >= 2 */
229 ADDIB> -1, %r31, fimanyloop /* Adjusted inner loop decr */
230 fice %r0(%sr1, %arg0)
231 fice,m %arg1(%sr1, %arg0) /* Last fice and addr adjust */
232 movb,tr %arg3, %r31, fimanyloop /* Re-init inner loop count */
233 ADDIB<=,n -1, %arg2, fisync /* Outer loop decr */
235 fioneloop: /* Loop if LOOP = 1 */
236 ADDIB> -1, %arg2, fioneloop /* Outer loop count decr */
237 fice,m %arg1(%sr1, %arg0) /* Fice for one loop */
241 mtsm %r22 /* restore I-bit */
248 .export flush_data_cache_local, code
249 .import cache_info, data
251 flush_data_cache_local:
257 ldil L%cache_info, %r1
258 ldo R%cache_info(%r1), %r1
260 /* Flush Data Cache */
262 LDREG DCACHE_BASE(%r1), %arg0
263 LDREG DCACHE_STRIDE(%r1), %arg1
264 LDREG DCACHE_COUNT(%r1), %arg2
265 LDREG DCACHE_LOOP(%r1), %arg3
267 ADDIB= -1, %arg3, fdoneloop /* Preadjust and test */
268 movb,<,n %arg3, %r31, fdsync /* If loop < 0, do sync */
270 fdmanyloop: /* Loop if LOOP >= 2 */
271 ADDIB> -1, %r31, fdmanyloop /* Adjusted inner loop decr */
272 fdce %r0(%sr1, %arg0)
273 fdce,m %arg1(%sr1, %arg0) /* Last fdce and addr adjust */
274 movb,tr %arg3, %r31, fdmanyloop /* Re-init inner loop count */
275 ADDIB<=,n -1, %arg2, fdsync /* Outer loop decr */
277 fdoneloop: /* Loop if LOOP = 1 */
278 ADDIB> -1, %arg2, fdoneloop /* Outer loop count decr */
279 fdce,m %arg1(%sr1, %arg0) /* Fdce for one loop */
284 mtsm %r22 /* restore I-bit */
291 .export copy_user_page_asm,code
300 /* PA8x00 CPUs can consume 2 loads or 1 store per cycle.
301 * Unroll the loop by hand and arrange insn appropriately.
302 * GCC probably can do this just as well.
306 ldi 32, %r1 /* PAGE_SIZE/128 == 32 */
307 ldw 64(%r25), %r0 /* prefetch 1 cacheline ahead */
308 ldw 128(%r25), %r0 /* prefetch 2 */
311 ldw 192(%r25), %r0 /* prefetch 3 */
312 ldw 256(%r25), %r0 /* prefetch 4 */
354 /* conditional branches nullify on forward taken branch, and on
355 * non-taken backward branch. Note that .+4 is a backwards branch.
356 * The ldd should only get executed if the branch is taken.
358 ADDIB>,n -1, %r1, 1b /* bundle 10 */
359 ldd 0(%r25), %r19 /* start next loads */
364 * This loop is optimized for PCXL/PCXL2 ldw/ldw and stw/stw
365 * bundles (very restricted rules for bundling).
366 * Note that until (if) we start saving
367 * the full 64 bit register values on interrupt, we can't
368 * use ldd/std on a 32 bit kernel.
371 ldi 64, %r1 /* PAGE_SIZE/64 == 64 */
417 * NOTE: Code in clear_user_page has a hard coded dependency on the
418 * maximum alias boundary being 4 Mb. We've been assured by the
419 * parisc chip designers that there will not ever be a parisc
420 * chip with a larger alias boundary (Never say never :-) ).
422 * Subtle: the dtlb miss handlers support the temp alias region by
423 * "knowing" that if a dtlb miss happens within the temp alias
424 * region it must have occurred while in clear_user_page. Since
425 * this routine makes use of processor local translations, we
426 * don't want to insert them into the kernel page table. Instead,
427 * we load up some general registers (they need to be registers
428 * which aren't shadowed) with the physical page numbers (preshifted
429 * for tlb insertion) needed to insert the translations. When we
430 * miss on the translation, the dtlb miss handler inserts the
431 * translation into the tlb using these values:
433 * %r26 physical page (shifted for tlb insert) of "to" translation
434 * %r23 physical page (shifted for tlb insert) of "from" translation
440 * We can't do this since copy_user_page is used to bring in
441 * file data that might have instructions. Since the data would
442 * then need to be flushed out so the i-fetch can see it, it
443 * makes more sense to just copy through the kernel translation
446 * I'm still keeping this around because it may be possible to
447 * use it if more information is passed into copy_user_page().
448 * Have to do some measurements to see if it is worthwhile to
449 * lobby for such a change.
452 .export copy_user_page_asm,code
459 ldil L%(__PAGE_OFFSET), %r1
461 sub %r25, %r1, %r23 /* move physical addr into non shadowed reg */
463 ldil L%(TMPALIAS_MAP_START), %r28
465 extrd,u %r26,56,32, %r26 /* convert phys addr to tlb insert format */
466 extrd,u %r23,56,32, %r23 /* convert phys addr to tlb insert format */
467 depd %r24,63,22, %r28 /* Form aliased virtual address 'to' */
468 depdi 0, 63,12, %r28 /* Clear any offset bits */
470 depdi 1, 41,1, %r29 /* Form aliased virtual address 'from' */
472 extrw,u %r26, 24,25, %r26 /* convert phys addr to tlb insert format */
473 extrw,u %r23, 24,25, %r23 /* convert phys addr to tlb insert format */
474 depw %r24, 31,22, %r28 /* Form aliased virtual address 'to' */
475 depwi 0, 31,12, %r28 /* Clear any offset bits */
477 depwi 1, 9,1, %r29 /* Form aliased virtual address 'from' */
480 /* Purge any old translations */
488 * This loop is optimized for PCXL/PCXL2 ldw/ldw and stw/stw
489 * bundles (very restricted rules for bundling). It probably
490 * does OK on PCXU and better, but we could do better with
491 * ldd/std instructions. Note that until (if) we start saving
492 * the full 64 bit register values on interrupt, we can't
493 * use ldd/std on a 32 bit kernel.
541 .export __clear_user_page_asm,code
543 __clear_user_page_asm:
550 ldil L%(TMPALIAS_MAP_START), %r28
552 #if (TMPALIAS_MAP_START >= 0x80000000)
553 depdi 0, 31,32, %r28 /* clear any sign extension */
555 extrd,u %r26, 56,32, %r26 /* convert phys addr to tlb insert format */
556 depd %r25, 63,22, %r28 /* Form aliased virtual address 'to' */
557 depdi 0, 63,12, %r28 /* Clear any offset bits */
559 extrw,u %r26, 24,25, %r26 /* convert phys addr to tlb insert format */
560 depw %r25, 31,22, %r28 /* Form aliased virtual address 'to' */
561 depwi 0, 31,12, %r28 /* Clear any offset bits */
564 /* Purge any old translation */
569 ldi 32, %r1 /* PAGE_SIZE/128 == 32 */
571 /* PREFETCH (Write) has not (yet) been proven to help here */
572 /* #define PREFETCHW_OP ldd 256(%0), %r0 */
593 #else /* ! CONFIG_64BIT */
595 ldi 64, %r1 /* PAGE_SIZE/64 == 64 */
616 #endif /* CONFIG_64BIT */
624 .export flush_kernel_dcache_page_asm
626 flush_kernel_dcache_page_asm:
631 ldil L%dcache_stride, %r1
632 ldw R%dcache_stride(%r1), %r23
635 depdi,z 1, 63-PAGE_SHIFT,1, %r25
637 depwi,z 1, 31-PAGE_SHIFT,1, %r25
668 .export flush_user_dcache_page
670 flush_user_dcache_page:
675 ldil L%dcache_stride, %r1
676 ldw R%dcache_stride(%r1), %r23
679 depdi,z 1,63-PAGE_SHIFT,1, %r25
681 depwi,z 1,31-PAGE_SHIFT,1, %r25
687 1: fdc,m %r23(%sr3, %r26)
688 fdc,m %r23(%sr3, %r26)
689 fdc,m %r23(%sr3, %r26)
690 fdc,m %r23(%sr3, %r26)
691 fdc,m %r23(%sr3, %r26)
692 fdc,m %r23(%sr3, %r26)
693 fdc,m %r23(%sr3, %r26)
694 fdc,m %r23(%sr3, %r26)
695 fdc,m %r23(%sr3, %r26)
696 fdc,m %r23(%sr3, %r26)
697 fdc,m %r23(%sr3, %r26)
698 fdc,m %r23(%sr3, %r26)
699 fdc,m %r23(%sr3, %r26)
700 fdc,m %r23(%sr3, %r26)
701 fdc,m %r23(%sr3, %r26)
703 fdc,m %r23(%sr3, %r26)
712 .export flush_user_icache_page
714 flush_user_icache_page:
719 ldil L%dcache_stride, %r1
720 ldw R%dcache_stride(%r1), %r23
723 depdi,z 1, 63-PAGE_SHIFT,1, %r25
725 depwi,z 1, 31-PAGE_SHIFT,1, %r25
731 1: fic,m %r23(%sr3, %r26)
732 fic,m %r23(%sr3, %r26)
733 fic,m %r23(%sr3, %r26)
734 fic,m %r23(%sr3, %r26)
735 fic,m %r23(%sr3, %r26)
736 fic,m %r23(%sr3, %r26)
737 fic,m %r23(%sr3, %r26)
738 fic,m %r23(%sr3, %r26)
739 fic,m %r23(%sr3, %r26)
740 fic,m %r23(%sr3, %r26)
741 fic,m %r23(%sr3, %r26)
742 fic,m %r23(%sr3, %r26)
743 fic,m %r23(%sr3, %r26)
744 fic,m %r23(%sr3, %r26)
745 fic,m %r23(%sr3, %r26)
747 fic,m %r23(%sr3, %r26)
757 .export purge_kernel_dcache_page
759 purge_kernel_dcache_page:
764 ldil L%dcache_stride, %r1
765 ldw R%dcache_stride(%r1), %r23
768 depdi,z 1, 63-PAGE_SHIFT,1, %r25
770 depwi,z 1, 31-PAGE_SHIFT,1, %r25
790 CMPB<< %r26, %r25, 1b
801 /* Currently not used, but it still is a possible alternate
805 .export flush_alias_page
814 ldil L%(TMPALIAS_MAP_START), %r28
816 extrd,u %r26, 56,32, %r26 /* convert phys addr to tlb insert format */
817 depd %r25, 63,22, %r28 /* Form aliased virtual address 'to' */
818 depdi 0, 63,12, %r28 /* Clear any offset bits */
820 extrw,u %r26, 24,25, %r26 /* convert phys addr to tlb insert format */
821 depw %r25, 31,22, %r28 /* Form aliased virtual address 'to' */
822 depwi 0, 31,12, %r28 /* Clear any offset bits */
825 /* Purge any old translation */
829 ldil L%dcache_stride, %r1
830 ldw R%dcache_stride(%r1), %r23
833 depdi,z 1, 63-PAGE_SHIFT,1, %r29
835 depwi,z 1, 31-PAGE_SHIFT,1, %r29
855 CMPB<< %r28, %r29, 1b
866 .export flush_user_dcache_range_asm
868 flush_user_dcache_range_asm:
873 ldil L%dcache_stride, %r1
874 ldw R%dcache_stride(%r1), %r23
876 ANDCM %r26, %r21, %r26
878 1: CMPB<<,n %r26, %r25, 1b
879 fdc,m %r23(%sr3, %r26)
888 .export flush_kernel_dcache_range_asm
890 flush_kernel_dcache_range_asm:
895 ldil L%dcache_stride, %r1
896 ldw R%dcache_stride(%r1), %r23
898 ANDCM %r26, %r21, %r26
900 1: CMPB<<,n %r26, %r25,1b
911 .export flush_user_icache_range_asm
913 flush_user_icache_range_asm:
918 ldil L%icache_stride, %r1
919 ldw R%icache_stride(%r1), %r23
921 ANDCM %r26, %r21, %r26
923 1: CMPB<<,n %r26, %r25,1b
924 fic,m %r23(%sr3, %r26)
933 .export flush_kernel_icache_page
935 flush_kernel_icache_page:
940 ldil L%icache_stride, %r1
941 ldw R%icache_stride(%r1), %r23
944 depdi,z 1, 63-PAGE_SHIFT,1, %r25
946 depwi,z 1, 31-PAGE_SHIFT,1, %r25
952 1: fic,m %r23(%sr4, %r26)
953 fic,m %r23(%sr4, %r26)
954 fic,m %r23(%sr4, %r26)
955 fic,m %r23(%sr4, %r26)
956 fic,m %r23(%sr4, %r26)
957 fic,m %r23(%sr4, %r26)
958 fic,m %r23(%sr4, %r26)
959 fic,m %r23(%sr4, %r26)
960 fic,m %r23(%sr4, %r26)
961 fic,m %r23(%sr4, %r26)
962 fic,m %r23(%sr4, %r26)
963 fic,m %r23(%sr4, %r26)
964 fic,m %r23(%sr4, %r26)
965 fic,m %r23(%sr4, %r26)
966 fic,m %r23(%sr4, %r26)
967 CMPB<< %r26, %r25, 1b
968 fic,m %r23(%sr4, %r26)
977 .export flush_kernel_icache_range_asm
979 flush_kernel_icache_range_asm:
984 ldil L%icache_stride, %r1
985 ldw R%icache_stride(%r1), %r23
987 ANDCM %r26, %r21, %r26
989 1: CMPB<<,n %r26, %r25, 1b
990 fic,m %r23(%sr4, %r26)
998 /* align should cover use of rfi in disable_sr_hashing_asm and
1002 .export disable_sr_hashing_asm,code
1004 disable_sr_hashing_asm:
1010 * Switch to real mode
1021 rsm PSW_SM_Q, %r0 /* prep to load iia queue */
1022 mtctl %r0, %cr17 /* Clear IIASQ tail */
1023 mtctl %r0, %cr17 /* Clear IIASQ head */
1024 mtctl %r1, %cr18 /* IIAOQ head */
1026 mtctl %r1, %cr18 /* IIAOQ tail */
1027 load32 REAL_MODE_PSW, %r1
1032 1: cmpib,=,n SRHASH_PCXST, %r26,srdis_pcxs
1033 cmpib,=,n SRHASH_PCXL, %r26,srdis_pcxl
1034 cmpib,=,n SRHASH_PA20, %r26,srdis_pa20
1039 /* Disable Space Register Hashing for PCXS,PCXT,PCXT' */
1041 .word 0x141c1a00 /* mfdiag %dr0, %r28 */
1042 .word 0x141c1a00 /* must issue twice */
1043 depwi 0,18,1, %r28 /* Clear DHE (dcache hash enable) */
1044 depwi 0,20,1, %r28 /* Clear IHE (icache hash enable) */
1045 .word 0x141c1600 /* mtdiag %r28, %dr0 */
1046 .word 0x141c1600 /* must issue twice */
1051 /* Disable Space Register Hashing for PCXL */
1053 .word 0x141c0600 /* mfdiag %dr0, %r28 */
1054 depwi 0,28,2, %r28 /* Clear DHASH_EN & IHASH_EN */
1055 .word 0x141c0240 /* mtdiag %r28, %dr0 */
1060 /* Disable Space Register Hashing for PCXU,PCXU+,PCXW,PCXW+,PCXW2 */
1062 .word 0x144008bc /* mfdiag %dr2, %r28 */
1063 depdi 0, 54,1, %r28 /* clear DIAG_SPHASH_ENAB (bit 54) */
1064 .word 0x145c1840 /* mtdiag %r28, %dr2 */
1068 /* Switch back to virtual mode */
1069 rsm PSW_SM_I, %r0 /* prep to load iia queue */
1077 rsm PSW_SM_Q, %r0 /* prep to load iia queue */
1078 mtctl %r0, %cr17 /* Clear IIASQ tail */
1079 mtctl %r0, %cr17 /* Clear IIASQ head */
1080 mtctl %r1, %cr18 /* IIAOQ head */
1082 mtctl %r1, %cr18 /* IIAOQ tail */
1083 load32 KERNEL_PSW, %r1