/* SPDX-License-Identifier: GPL-2.0-or-later */
/*
* PARISC TLB and cache flushing support
* Copyright (C) 2000-2001 Hewlett-Packard (John Marvin)
* Copyright (C) 2001 Matthew Wilcox (willy at parisc-linux.org)
* Copyright (C) 2002 Richard Hirst (rhirst with parisc-linux.org)
*/
/*
* NOTE: fdc,fic, and pdc instructions that use base register modification
* should only use index and base registers that are not shadowed,
* so that the fast path emulation in the non access miss handler
* can be used.
*/
#ifdef CONFIG_64BIT
.level 2 .0 w
#else
.level 2 .0
#endif
#include <asm/psw.h>
#include <asm/assembly.h>
#include <asm/cache.h>
#include <asm/ldcw.h>
#include <asm/alternative.h>
#include <linux/linkage.h>
#include <linux/init.h>
#include <linux/pgtable.h>
.section .text.hot
.align 16
ENTRY_CFI(flush_tlb_all_local)
/*
* The pitlbe and pdtlbe instructions should only be used to
* flush the entire tlb. Also, there needs to be no intervening
* tlb operations, e.g. tlb misses, so the operation needs
* to happen in real mode with all interruptions disabled.
*/
/* pcxt_ssm_bug - relied upon translation! PA 2.0 Arch. F-4 and F-5 */
rsm PSW_SM_I, %r19 /* save I-bit state */
load32 PA(1 f), %r1
nop
nop
nop
nop
nop
rsm PSW_SM_Q, %r0 /* prep to load iia queue */
mtctl %r0, %cr17 /* Clear IIASQ tail */
mtctl %r0, %cr17 /* Clear IIASQ head */
mtctl %r1, %cr18 /* IIAOQ head */
ldo 4 (%r1), %r1
mtctl %r1, %cr18 /* IIAOQ tail */
load32 REAL_MODE_PSW, %r1
mtctl %r1, %ipsw
rfi
nop
1 : load32 PA(cache_info), %r1
/* Flush Instruction Tlb */
88 : LDREG ITLB_SID_BASE(%r1), %r20
LDREG ITLB_SID_STRIDE(%r1), %r21
LDREG ITLB_SID_COUNT(%r1), %r22
LDREG ITLB_OFF_BASE(%r1), %arg0
LDREG ITLB_OFF_STRIDE(%r1), %arg1
LDREG ITLB_OFF_COUNT(%r1), %arg2
LDREG ITLB_LOOP(%r1), %arg3
addib,COND(=) -1 , %arg3, fitoneloop /* Preadjust and test */
movb,<,n %arg3, %r31, fitdone /* If loop < 0, skip */
copy %arg0, %r28 /* Init base addr */
fitmanyloop: /* Loop if LOOP >= 2 */
mtsp %r20, %sr1
add %r21, %r20, %r20 /* increment space */
copy %arg2, %r29 /* Init middle loop count */
fitmanymiddle: /* Loop if LOOP >= 2 */
addib,COND(>) -1 , %r31, fitmanymiddle /* Adjusted inner loop decr */
pitlbe %r0(%sr1, %r28)
pitlbe,m %arg1(%sr1, %r28) /* Last pitlbe and addr adjust */
addib,COND(>) -1 , %r29, fitmanymiddle /* Middle loop decr */
copy %arg3, %r31 /* Re-init inner loop count */
movb,tr %arg0, %r28, fitmanyloop /* Re-init base addr */
addib,COND(<=),n -1 , %r22, fitdone /* Outer loop count decr */
fitoneloop: /* Loop if LOOP = 1 */
mtsp %r20, %sr1
copy %arg0, %r28 /* init base addr */
copy %arg2, %r29 /* init middle loop count */
fitonemiddle: /* Loop if LOOP = 1 */
addib,COND(>) -1 , %r29, fitonemiddle /* Middle loop count decr */
pitlbe,m %arg1(%sr1, %r28) /* pitlbe for one loop */
addib,COND(>) -1 , %r22, fitoneloop /* Outer loop count decr */
add %r21, %r20, %r20 /* increment space */
fitdone:
ALTERNATIVE(88 b, fitdone, ALT_COND_NO_SPLIT_TLB, INSN_NOP)
/* Flush Data Tlb */
LDREG DTLB_SID_BASE(%r1), %r20
LDREG DTLB_SID_STRIDE(%r1), %r21
LDREG DTLB_SID_COUNT(%r1), %r22
LDREG DTLB_OFF_BASE(%r1), %arg0
LDREG DTLB_OFF_STRIDE(%r1), %arg1
LDREG DTLB_OFF_COUNT(%r1), %arg2
LDREG DTLB_LOOP(%r1), %arg3
addib,COND(=) -1 , %arg3, fdtoneloop /* Preadjust and test */
movb,<,n %arg3, %r31, fdtdone /* If loop < 0, skip */
copy %arg0, %r28 /* Init base addr */
fdtmanyloop: /* Loop if LOOP >= 2 */
mtsp %r20, %sr1
add %r21, %r20, %r20 /* increment space */
copy %arg2, %r29 /* Init middle loop count */
fdtmanymiddle: /* Loop if LOOP >= 2 */
addib,COND(>) -1 , %r31, fdtmanymiddle /* Adjusted inner loop decr */
pdtlbe %r0(%sr1, %r28)
pdtlbe,m %arg1(%sr1, %r28) /* Last pdtlbe and addr adjust */
addib,COND(>) -1 , %r29, fdtmanymiddle /* Middle loop decr */
copy %arg3, %r31 /* Re-init inner loop count */
movb,tr %arg0, %r28, fdtmanyloop /* Re-init base addr */
addib,COND(<=),n -1 , %r22,fdtdone /* Outer loop count decr */
fdtoneloop: /* Loop if LOOP = 1 */
mtsp %r20, %sr1
copy %arg0, %r28 /* init base addr */
copy %arg2, %r29 /* init middle loop count */
fdtonemiddle: /* Loop if LOOP = 1 */
addib,COND(>) -1 , %r29, fdtonemiddle /* Middle loop count decr */
pdtlbe,m %arg1(%sr1, %r28) /* pdtlbe for one loop */
addib,COND(>) -1 , %r22, fdtoneloop /* Outer loop count decr */
add %r21, %r20, %r20 /* increment space */
fdtdone:
/*
* Switch back to virtual mode
*/
/* pcxt_ssm_bug */
rsm PSW_SM_I, %r0
load32 2 f, %r1
nop
nop
nop
nop
nop
rsm PSW_SM_Q, %r0 /* prep to load iia queue */
mtctl %r0, %cr17 /* Clear IIASQ tail */
mtctl %r0, %cr17 /* Clear IIASQ head */
mtctl %r1, %cr18 /* IIAOQ head */
ldo 4 (%r1), %r1
mtctl %r1, %cr18 /* IIAOQ tail */
load32 KERNEL_PSW, %r1
or %r1, %r19, %r1 /* I-bit to state on entry */
mtctl %r1, %ipsw /* restore I-bit (entire PSW) */
rfi
nop
2 : bv %r0(%r2)
nop
/*
* When running in qemu, drop whole flush_tlb_all_local function and
* replace by one pdtlbe instruction, for which QEMU will drop all
* local TLB entries.
*/
3 : pdtlbe %r0(%sr1,%r0)
bv,n %r0(%r2)
ALTERNATIVE_CODE(flush_tlb_all_local, 2 , ALT_COND_RUN_ON_QEMU, 3 b)
ENDPROC_CFI(flush_tlb_all_local)
.import cache_info,data
ENTRY_CFI(flush_instruction_cache_local)
88 : load32 cache_info, %r1
/* Flush Instruction Cache */
LDREG ICACHE_BASE(%r1), %arg0
LDREG ICACHE_STRIDE(%r1), %arg1
LDREG ICACHE_COUNT(%r1), %arg2
LDREG ICACHE_LOOP(%r1), %arg3
rsm PSW_SM_I, %r22 /* No mmgt ops during loop*/
mtsp %r0, %sr1
addib,COND(=) -1 , %arg3, fioneloop /* Preadjust and test */
movb,<,n %arg3, %r31, fisync /* If loop < 0, do sync */
fimanyloop: /* Loop if LOOP >= 2 */
addib,COND(>) -1 , %r31, fimanyloop /* Adjusted inner loop decr */
fice %r0(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0) /* Last fice and addr adjust */
movb,tr %arg3, %r31, fimanyloop /* Re-init inner loop count */
addib,COND(<=),n -1 , %arg2, fisync /* Outer loop decr */
fioneloop: /* Loop if LOOP = 1 */
/* Some implementations may flush with a single fice instruction */
cmpib,COND(>>=),n 15 , %arg2, fioneloop2
fioneloop1:
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
fice,m %arg1(%sr1, %arg0)
addib,COND(>) -16 , %arg2, fioneloop1
fice,m %arg1(%sr1, %arg0)
/* Check if done */
cmpb,COND(=),n %arg2, %r0, fisync /* Predict branch taken */
fioneloop2:
addib,COND(>) -1 , %arg2, fioneloop2 /* Outer loop count decr */
fice,m %arg1(%sr1, %arg0) /* Fice for one loop */
fisync:
sync
mtsm %r22 /* restore I-bit */
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_ICACHE, INSN_NOP)
bv %r0(%r2)
nop
ENDPROC_CFI(flush_instruction_cache_local)
.import cache_info, data
ENTRY_CFI(flush_data_cache_local)
88 : load32 cache_info, %r1
/* Flush Data Cache */
LDREG DCACHE_BASE(%r1), %arg0
LDREG DCACHE_STRIDE(%r1), %arg1
LDREG DCACHE_COUNT(%r1), %arg2
LDREG DCACHE_LOOP(%r1), %arg3
rsm PSW_SM_I, %r22 /* No mmgt ops during loop*/
mtsp %r0, %sr1
addib,COND(=) -1 , %arg3, fdoneloop /* Preadjust and test */
movb,<,n %arg3, %r31, fdsync /* If loop < 0, do sync */
fdmanyloop: /* Loop if LOOP >= 2 */
addib,COND(>) -1 , %r31, fdmanyloop /* Adjusted inner loop decr */
fdce %r0(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0) /* Last fdce and addr adjust */
movb,tr %arg3, %r31, fdmanyloop /* Re-init inner loop count */
addib,COND(<=),n -1 , %arg2, fdsync /* Outer loop decr */
fdoneloop: /* Loop if LOOP = 1 */
/* Some implementations may flush with a single fdce instruction */
cmpib,COND(>>=),n 15 , %arg2, fdoneloop2
fdoneloop1:
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
fdce,m %arg1(%sr1, %arg0)
addib,COND(>) -16 , %arg2, fdoneloop1
fdce,m %arg1(%sr1, %arg0)
/* Check if done */
cmpb,COND(=),n %arg2, %r0, fdsync /* Predict branch taken */
fdoneloop2:
addib,COND(>) -1 , %arg2, fdoneloop2 /* Outer loop count decr */
fdce,m %arg1(%sr1, %arg0) /* Fdce for one loop */
fdsync:
sync
mtsm %r22 /* restore I-bit */
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
bv %r0(%r2)
nop
ENDPROC_CFI(flush_data_cache_local)
/* Clear page using kernel mapping. */
ENTRY_CFI(clear_page_asm)
#ifdef CONFIG_64BIT
/* Unroll the loop. */
ldi (PAGE_SIZE / 128 ), %r1
1 :
std %r0, 0 (%r26)
std %r0, 8 (%r26)
std %r0, 16 (%r26)
std %r0, 24 (%r26)
std %r0, 32 (%r26)
std %r0, 40 (%r26)
std %r0, 48 (%r26)
std %r0, 56 (%r26)
std %r0, 64 (%r26)
std %r0, 72 (%r26)
std %r0, 80 (%r26)
std %r0, 88 (%r26)
std %r0, 96 (%r26)
std %r0, 104 (%r26)
std %r0, 112 (%r26)
std %r0, 120 (%r26)
/* Note reverse branch hint for addib is taken. */
addib,COND(>),n -1 , %r1, 1 b
ldo 128 (%r26), %r26
#else
/*
* Note that until (if) we start saving the full 64-bit register
* values on interrupt, we can't use std on a 32 bit kernel.
*/
ldi (PAGE_SIZE / 64 ), %r1
1 :
stw %r0, 0 (%r26)
stw %r0, 4 (%r26)
stw %r0, 8 (%r26)
stw %r0, 12 (%r26)
stw %r0, 16 (%r26)
stw %r0, 20 (%r26)
stw %r0, 24 (%r26)
stw %r0, 28 (%r26)
stw %r0, 32 (%r26)
stw %r0, 36 (%r26)
stw %r0, 40 (%r26)
stw %r0, 44 (%r26)
stw %r0, 48 (%r26)
stw %r0, 52 (%r26)
stw %r0, 56 (%r26)
stw %r0, 60 (%r26)
addib,COND(>),n -1 , %r1, 1 b
ldo 64 (%r26), %r26
#endif
bv %r0(%r2)
nop
ENDPROC_CFI(clear_page_asm)
/* Copy page using kernel mapping. */
ENTRY_CFI(copy_page_asm)
#ifdef CONFIG_64BIT
/* PA8x00 CPUs can consume 2 loads or 1 store per cycle.
* Unroll the loop by hand and arrange insn appropriately.
* Prefetch doesn't improve performance on rp3440.
* GCC probably can do this just as well...
*/
ldi (PAGE_SIZE / 128 ), %r1
1 : ldd 0 (%r25), %r19
ldd 8 (%r25), %r20
ldd 16 (%r25), %r21
ldd 24 (%r25), %r22
std %r19, 0 (%r26)
std %r20, 8 (%r26)
ldd 32 (%r25), %r19
ldd 40 (%r25), %r20
std %r21, 16 (%r26)
std %r22, 24 (%r26)
ldd 48 (%r25), %r21
ldd 56 (%r25), %r22
std %r19, 32 (%r26)
std %r20, 40 (%r26)
ldd 64 (%r25), %r19
ldd 72 (%r25), %r20
std %r21, 48 (%r26)
std %r22, 56 (%r26)
ldd 80 (%r25), %r21
ldd 88 (%r25), %r22
std %r19, 64 (%r26)
std %r20, 72 (%r26)
ldd 96 (%r25), %r19
ldd 104 (%r25), %r20
std %r21, 80 (%r26)
std %r22, 88 (%r26)
ldd 112 (%r25), %r21
ldd 120 (%r25), %r22
ldo 128 (%r25), %r25
std %r19, 96 (%r26)
std %r20, 104 (%r26)
std %r21, 112 (%r26)
std %r22, 120 (%r26)
/* Note reverse branch hint for addib is taken. */
addib,COND(>),n -1 , %r1, 1 b
ldo 128 (%r26), %r26
#else
/*
* This loop is optimized for PCXL/PCXL2 ldw/ldw and stw/stw
* bundles (very restricted rules for bundling).
* Note that until (if) we start saving
* the full 64 bit register values on interrupt, we can't
* use ldd/std on a 32 bit kernel.
*/
ldw 0 (%r25), %r19
ldi (PAGE_SIZE / 64 ), %r1
1 :
ldw 4 (%r25), %r20
ldw 8 (%r25), %r21
ldw 12 (%r25), %r22
stw %r19, 0 (%r26)
stw %r20, 4 (%r26)
stw %r21, 8 (%r26)
stw %r22, 12 (%r26)
ldw 16 (%r25), %r19
ldw 20 (%r25), %r20
ldw 24 (%r25), %r21
ldw 28 (%r25), %r22
stw %r19, 16 (%r26)
stw %r20, 20 (%r26)
stw %r21, 24 (%r26)
stw %r22, 28 (%r26)
ldw 32 (%r25), %r19
ldw 36 (%r25), %r20
ldw 40 (%r25), %r21
ldw 44 (%r25), %r22
stw %r19, 32 (%r26)
stw %r20, 36 (%r26)
stw %r21, 40 (%r26)
stw %r22, 44 (%r26)
ldw 48 (%r25), %r19
ldw 52 (%r25), %r20
ldw 56 (%r25), %r21
ldw 60 (%r25), %r22
stw %r19, 48 (%r26)
stw %r20, 52 (%r26)
ldo 64 (%r25), %r25
stw %r21, 56 (%r26)
stw %r22, 60 (%r26)
ldo 64 (%r26), %r26
addib,COND(>),n -1 , %r1, 1 b
ldw 0 (%r25), %r19
#endif
bv %r0(%r2)
nop
ENDPROC_CFI(copy_page_asm)
/*
* NOTE: Code in clear_user_page has a hard coded dependency on the
* maximum alias boundary being 4 Mb. We've been assured by the
* parisc chip designers that there will not ever be a parisc
* chip with a larger alias boundary (Never say never :-) ).
*
* Yah, what about the PA8800 and PA8900 processors?
*
* Subtle: the dtlb miss handlers support the temp alias region by
* "knowing" that if a dtlb miss happens within the temp alias
* region it must have occurred while in clear_user_page. Since
* this routine makes use of processor local translations, we
* don't want to insert them into the kernel page table. Instead,
* we load up some general registers (they need to be registers
* which aren't shadowed) with the physical page numbers (preshifted
* for tlb insertion) needed to insert the translations. When we
* miss on the translation, the dtlb miss handler inserts the
* translation into the tlb using these values:
*
* %r26 physical address of "to" translation
* %r23 physical address of "from" translation
*/
/*
* copy_user_page_asm() performs a page copy using mappings
* equivalent to the user page mappings. It can be used to
* implement copy_user_page() but unfortunately both the `from'
* and `to' pages need to be flushed through mappings equivalent
* to the user mappings after the copy because the kernel accesses
* the `from' page through the kmap kernel mapping and the `to'
* page needs to be flushed since code can be copied. As a
* result, this implementation is less efficient than the simpler
* copy using the kernel mapping. It only needs the `from' page
* to flushed via the user mapping. The kunmap routines handle
* the flushes needed for the kernel mapping.
*
* I'm still keeping this around because it may be possible to
* use it if more information is passed into copy_user_page().
* Have to do some measurements to see if it is worthwhile to
* lobby for such a change.
*
*/
ENTRY_CFI(copy_user_page_asm)
/* Convert virtual `to' and `from' addresses to physical addresses.
Move `from' physical address to non shadowed register. */
ldil L%(__PAGE_OFFSET), %r1
sub %r26, %r1, %r26
sub %r25, %r1, %r23
ldil L%(TMPALIAS_MAP_START), %r28
dep_safe %r24, 31 ,TMPALIAS_SIZE_BITS, %r28 /* Form aliased virtual address 'to' */
depi_safe 0 , 31 ,PAGE_SHIFT, %r28 /* Clear any offset bits */
copy %r28, %r29
depi_safe 1 , 31 -TMPALIAS_SIZE_BITS,1 , %r29 /* Form aliased virtual address 'from' */
/* Purge any old translations */
#ifdef CONFIG_PA20
pdtlb,l %r0(%r28)
pdtlb,l %r0(%r29)
#else
0 : pdtlb %r0(%r28)
1 : pdtlb %r0(%r29)
ALTERNATIVE(0 b, 0 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
ALTERNATIVE(1 b, 1 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
#endif
#ifdef CONFIG_64BIT
/* PA8x00 CPUs can consume 2 loads or 1 store per cycle.
* Unroll the loop by hand and arrange insn appropriately.
* GCC probably can do this just as well.
*/
ldd 0 (%r29), %r19
ldi (PAGE_SIZE / 128 ), %r1
1 : ldd 8 (%r29), %r20
ldd 16 (%r29), %r21
ldd 24 (%r29), %r22
std %r19, 0 (%r28)
std %r20, 8 (%r28)
ldd 32 (%r29), %r19
ldd 40 (%r29), %r20
std %r21, 16 (%r28)
std %r22, 24 (%r28)
ldd 48 (%r29), %r21
ldd 56 (%r29), %r22
std %r19, 32 (%r28)
std %r20, 40 (%r28)
ldd 64 (%r29), %r19
ldd 72 (%r29), %r20
std %r21, 48 (%r28)
std %r22, 56 (%r28)
ldd 80 (%r29), %r21
ldd 88 (%r29), %r22
std %r19, 64 (%r28)
std %r20, 72 (%r28)
ldd 96 (%r29), %r19
ldd 104 (%r29), %r20
std %r21, 80 (%r28)
std %r22, 88 (%r28)
ldd 112 (%r29), %r21
ldd 120 (%r29), %r22
std %r19, 96 (%r28)
std %r20, 104 (%r28)
ldo 128 (%r29), %r29
std %r21, 112 (%r28)
std %r22, 120 (%r28)
ldo 128 (%r28), %r28
/* conditional branches nullify on forward taken branch, and on
* non-taken backward branch. Note that .+4 is a backwards branch.
* The ldd should only get executed if the branch is taken.
*/
addib,COND(>),n -1 , %r1, 1 b /* bundle 10 */
ldd 0 (%r29), %r19 /* start next loads */
#else
ldi (PAGE_SIZE / 64 ), %r1
/*
* This loop is optimized for PCXL/PCXL2 ldw/ldw and stw/stw
* bundles (very restricted rules for bundling). It probably
* does OK on PCXU and better, but we could do better with
* ldd/std instructions. Note that until (if) we start saving
* the full 64 bit register values on interrupt, we can't
* use ldd/std on a 32 bit kernel.
*/
1 : ldw 0 (%r29), %r19
ldw 4 (%r29), %r20
ldw 8 (%r29), %r21
ldw 12 (%r29), %r22
stw %r19, 0 (%r28)
stw %r20, 4 (%r28)
stw %r21, 8 (%r28)
stw %r22, 12 (%r28)
ldw 16 (%r29), %r19
ldw 20 (%r29), %r20
ldw 24 (%r29), %r21
ldw 28 (%r29), %r22
stw %r19, 16 (%r28)
stw %r20, 20 (%r28)
stw %r21, 24 (%r28)
stw %r22, 28 (%r28)
ldw 32 (%r29), %r19
ldw 36 (%r29), %r20
ldw 40 (%r29), %r21
ldw 44 (%r29), %r22
stw %r19, 32 (%r28)
stw %r20, 36 (%r28)
stw %r21, 40 (%r28)
stw %r22, 44 (%r28)
ldw 48 (%r29), %r19
ldw 52 (%r29), %r20
ldw 56 (%r29), %r21
ldw 60 (%r29), %r22
stw %r19, 48 (%r28)
stw %r20, 52 (%r28)
stw %r21, 56 (%r28)
stw %r22, 60 (%r28)
ldo 64 (%r28), %r28
addib,COND(>) -1 , %r1,1 b
ldo 64 (%r29), %r29
#endif
bv %r0(%r2)
nop
ENDPROC_CFI(copy_user_page_asm)
ENTRY_CFI(clear_user_page_asm)
tophys_r1 %r26
ldil L%(TMPALIAS_MAP_START), %r28
dep_safe %r25, 31 ,TMPALIAS_SIZE_BITS, %r28 /* Form aliased virtual address 'to' */
depi_safe 0 , 31 ,PAGE_SHIFT, %r28 /* Clear any offset bits */
/* Purge any old translation */
#ifdef CONFIG_PA20
pdtlb,l %r0(%r28)
#else
0 : pdtlb %r0(%r28)
ALTERNATIVE(0 b, 0 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
#endif
#ifdef CONFIG_64BIT
ldi (PAGE_SIZE / 128 ), %r1
/* PREFETCH (Write) has not (yet) been proven to help here */
/* #define PREFETCHW_OP ldd 256(%0), %r0 */
1 : std %r0, 0 (%r28)
std %r0, 8 (%r28)
std %r0, 16 (%r28)
std %r0, 24 (%r28)
std %r0, 32 (%r28)
std %r0, 40 (%r28)
std %r0, 48 (%r28)
std %r0, 56 (%r28)
std %r0, 64 (%r28)
std %r0, 72 (%r28)
std %r0, 80 (%r28)
std %r0, 88 (%r28)
std %r0, 96 (%r28)
std %r0, 104 (%r28)
std %r0, 112 (%r28)
std %r0, 120 (%r28)
addib,COND(>) -1 , %r1, 1 b
ldo 128 (%r28), %r28
#else /* ! CONFIG_64BIT */
ldi (PAGE_SIZE / 64 ), %r1
1 : stw %r0, 0 (%r28)
stw %r0, 4 (%r28)
stw %r0, 8 (%r28)
stw %r0, 12 (%r28)
stw %r0, 16 (%r28)
stw %r0, 20 (%r28)
stw %r0, 24 (%r28)
stw %r0, 28 (%r28)
stw %r0, 32 (%r28)
stw %r0, 36 (%r28)
stw %r0, 40 (%r28)
stw %r0, 44 (%r28)
stw %r0, 48 (%r28)
stw %r0, 52 (%r28)
stw %r0, 56 (%r28)
stw %r0, 60 (%r28)
addib,COND(>) -1 , %r1, 1 b
ldo 64 (%r28), %r28
#endif /* CONFIG_64BIT */
bv %r0(%r2)
nop
ENDPROC_CFI(clear_user_page_asm)
ENTRY_CFI(flush_dcache_page_asm)
ldil L%(TMPALIAS_MAP_START), %r28
dep_safe %r25, 31 ,TMPALIAS_SIZE_BITS, %r28 /* Form aliased virtual address 'to' */
depi_safe 0 , 31 ,PAGE_SHIFT, %r28 /* Clear any offset bits */
/* Purge any old translation */
#ifdef CONFIG_PA20
pdtlb,l %r0(%r28)
#else
0 : pdtlb %r0(%r28)
ALTERNATIVE(0 b, 0 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
#endif
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), r31
#ifdef CONFIG_64BIT
depdi,z 1 , 63 -PAGE_SHIFT,1 , %r25
#else
depwi,z 1 , 31 -PAGE_SHIFT,1 , %r25
#endif
add %r28, %r25, %r25
sub %r25, r31, %r25
1 : fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
fdc,m r31(%r28)
cmpb,COND(>>) %r25, %r28, 1 b /* predict taken */
fdc,m r31(%r28)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_dcache_page_asm)
ENTRY_CFI(purge_dcache_page_asm)
ldil L%(TMPALIAS_MAP_START), %r28
dep_safe %r25, 31 ,TMPALIAS_SIZE_BITS, %r28 /* Form aliased virtual address 'to' */
depi_safe 0 , 31 ,PAGE_SHIFT, %r28 /* Clear any offset bits */
/* Purge any old translation */
#ifdef CONFIG_PA20
pdtlb,l %r0(%r28)
#else
0 : pdtlb %r0(%r28)
ALTERNATIVE(0 b, 0 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
#endif
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), r31
#ifdef CONFIG_64BIT
depdi,z 1 , 63 -PAGE_SHIFT,1 , %r25
#else
depwi,z 1 , 31 -PAGE_SHIFT,1 , %r25
#endif
add %r28, %r25, %r25
sub %r25, r31, %r25
1 : pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
pdc,m r31(%r28)
cmpb,COND(>>) %r25, %r28, 1 b /* predict taken */
pdc,m r31(%r28)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(purge_dcache_page_asm)
ENTRY_CFI(flush_icache_page_asm)
ldil L%(TMPALIAS_MAP_START), %r28
dep_safe %r25, 31 ,TMPALIAS_SIZE_BITS, %r28 /* Form aliased virtual address 'to' */
depi_safe 0 , 31 ,PAGE_SHIFT, %r28 /* Clear any offset bits */
/* Purge any old translation. Note that the FIC instruction
* may use either the instruction or data TLB. Given that we
* have a flat address space, it's not clear which TLB will be
* used. So, we purge both entries. */
#ifdef CONFIG_PA20
pdtlb,l %r0(%r28)
1 : pitlb,l %r0(%sr4,%r28)
ALTERNATIVE(1 b, 1 b+4 , ALT_COND_NO_SPLIT_TLB, INSN_NOP)
#else
0 : pdtlb %r0(%r28)
1 : pitlb %r0(%sr4,%r28)
ALTERNATIVE(0 b, 0 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
ALTERNATIVE(1 b, 1 b+4 , ALT_COND_NO_SMP, INSN_PxTLB)
ALTERNATIVE(1 b, 1 b+4 , ALT_COND_NO_SPLIT_TLB, INSN_NOP)
#endif
88 : ldil L%icache_stride, %r1
ldw R%icache_stride(%r1), %r31
#ifdef CONFIG_64BIT
depdi,z 1 , 63 -PAGE_SHIFT,1 , %r25
#else
depwi,z 1 , 31 -PAGE_SHIFT,1 , %r25
#endif
add %r28, %r25, %r25
sub %r25, %r31, %r25
/* fic only has the type 26 form on PA1.1, requiring an
* explicit space specification, so use %sr4 */
1 : fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
fic,m %r31(%sr4,%r28)
cmpb,COND(>>) %r25, %r28, 1 b /* predict taken */
fic,m %r31(%sr4,%r28)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_ICACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_icache_page_asm)
ENTRY_CFI(flush_kernel_dcache_page_asm)
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), %r23
depi_safe 0 , 31 ,PAGE_SHIFT, %r26 /* Clear any offset bits */
#ifdef CONFIG_64BIT
depdi,z 1 , 63 -PAGE_SHIFT,1 , %r25
#else
depwi,z 1 , 31 -PAGE_SHIFT,1 , %r25
#endif
add %r26, %r25, %r25
sub %r25, %r23, %r25
1 : fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
cmpb,COND(>>) %r25, %r26, 1 b /* predict taken */
fdc,m %r23(%r26)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_kernel_dcache_page_asm)
ENTRY_CFI(purge_kernel_dcache_page_asm)
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), %r23
depi_safe 0 , 31 ,PAGE_SHIFT, %r26 /* Clear any offset bits */
#ifdef CONFIG_64BIT
depdi,z 1 , 63 -PAGE_SHIFT,1 , %r25
#else
depwi,z 1 , 31 -PAGE_SHIFT,1 , %r25
#endif
add %r26, %r25, %r25
sub %r25, %r23, %r25
1 : pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
cmpb,COND(>>) %r25, %r26, 1 b /* predict taken */
pdc,m %r23(%r26)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(purge_kernel_dcache_page_asm)
ENTRY_CFI(flush_user_dcache_range_asm)
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), %r23
ldo -1 (%r23), %r21
ANDCM %r26, %r21, %r26
#ifdef CONFIG_64BIT
depd,z %r23, 59 , 60 , %r21
#else
depw,z %r23, 27 , 28 , %r21
#endif
add %r26, %r21, %r22
cmpb,COND(>>),n %r22, %r25, 2 f /* predict not taken */
1 : add %r22, %r21, %r22
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
fdc,m %r23(%sr3, %r26)
cmpb,COND(<<=) %r22, %r25, 1 b /* predict taken */
fdc,m %r23(%sr3, %r26)
2 : cmpb,COND(>>),n %r25, %r26, 2 b
fdc,m %r23(%sr3, %r26)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_user_dcache_range_asm)
ENTRY_CFI(flush_kernel_dcache_range_asm)
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), %r23
ldo -1 (%r23), %r21
ANDCM %r26, %r21, %r26
#ifdef CONFIG_64BIT
depd,z %r23, 59 , 60 , %r21
#else
depw,z %r23, 27 , 28 , %r21
#endif
add %r26, %r21, %r22
cmpb,COND(>>),n %r22, %r25, 2 f /* predict not taken */
1 : add %r22, %r21, %r22
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
fdc,m %r23(%r26)
cmpb,COND(<<=) %r22, %r25, 1 b /* predict taken */
fdc,m %r23(%r26)
2 : cmpb,COND(>>),n %r25, %r26, 2 b /* predict taken */
fdc,m %r23(%r26)
sync
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
bv %r0(%r2)
nop
ENDPROC_CFI(flush_kernel_dcache_range_asm)
ENTRY_CFI(purge_kernel_dcache_range_asm)
88 : ldil L%dcache_stride, %r1
ldw R%dcache_stride(%r1), %r23
ldo -1 (%r23), %r21
ANDCM %r26, %r21, %r26
#ifdef CONFIG_64BIT
depd,z %r23, 59 , 60 , %r21
#else
depw,z %r23, 27 , 28 , %r21
#endif
add %r26, %r21, %r22
cmpb,COND(>>),n %r22, %r25, 2 f /* predict not taken */
1 : add %r22, %r21, %r22
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
pdc,m %r23(%r26)
cmpb,COND(<<=) %r22, %r25, 1 b /* predict taken */
pdc,m %r23(%r26)
2 : cmpb,COND(>>),n %r25, %r26, 2 b /* predict taken */
pdc,m %r23(%r26)
sync
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_DCACHE, INSN_NOP)
bv %r0(%r2)
nop
ENDPROC_CFI(purge_kernel_dcache_range_asm)
ENTRY_CFI(flush_user_icache_range_asm)
88 : ldil L%icache_stride, %r1
ldw R%icache_stride(%r1), %r23
ldo -1 (%r23), %r21
ANDCM %r26, %r21, %r26
#ifdef CONFIG_64BIT
depd,z %r23, 59 , 60 , %r21
#else
depw,z %r23, 27 , 28 , %r21
#endif
add %r26, %r21, %r22
cmpb,COND(>>),n %r22, %r25, 2 f /* predict not taken */
1 : add %r22, %r21, %r22
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
fic,m %r23(%sr3, %r26)
cmpb,COND(<<=) %r22, %r25, 1 b /* predict taken */
fic,m %r23(%sr3, %r26)
2 : cmpb,COND(>>),n %r25, %r26, 2 b
fic,m %r23(%sr3, %r26)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_ICACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_user_icache_range_asm)
ENTRY_CFI(flush_kernel_icache_page)
88 : ldil L%icache_stride, %r1
ldw R%icache_stride(%r1), %r23
#ifdef CONFIG_64BIT
depdi,z 1 , 63 -PAGE_SHIFT,1 , %r25
#else
depwi,z 1 , 31 -PAGE_SHIFT,1 , %r25
#endif
add %r26, %r25, %r25
sub %r25, %r23, %r25
1 : fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
cmpb,COND(>>) %r25, %r26, 1 b /* predict taken */
fic,m %r23(%sr4, %r26)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_ICACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_kernel_icache_page)
ENTRY_CFI(flush_kernel_icache_range_asm)
88 : ldil L%icache_stride, %r1
ldw R%icache_stride(%r1), %r23
ldo -1 (%r23), %r21
ANDCM %r26, %r21, %r26
#ifdef CONFIG_64BIT
depd,z %r23, 59 , 60 , %r21
#else
depw,z %r23, 27 , 28 , %r21
#endif
add %r26, %r21, %r22
cmpb,COND(>>),n %r22, %r25, 2 f /* predict not taken */
1 : add %r22, %r21, %r22
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
fic,m %r23(%sr4, %r26)
cmpb,COND(<<=) %r22, %r25, 1 b /* predict taken */
fic,m %r23(%sr4, %r26)
2 : cmpb,COND(>>),n %r25, %r26, 2 b /* predict taken */
fic,m %r23(%sr4, %r26)
89 : ALTERNATIVE(88 b, 89 b, ALT_COND_NO_ICACHE, INSN_NOP)
sync
bv %r0(%r2)
nop
ENDPROC_CFI(flush_kernel_icache_range_asm)
.text
/* align should cover use of rfi in disable_sr_hashing_asm and
* srdis_done.
*/
.align 256
ENTRY_CFI(disable_sr_hashing_asm)
/*
* Switch to real mode
*/
/* pcxt_ssm_bug */
rsm PSW_SM_I, %r0
load32 PA(1 f), %r1
nop
nop
nop
nop
nop
rsm PSW_SM_Q, %r0 /* prep to load iia queue */
mtctl %r0, %cr17 /* Clear IIASQ tail */
mtctl %r0, %cr17 /* Clear IIASQ head */
mtctl %r1, %cr18 /* IIAOQ head */
ldo 4 (%r1), %r1
mtctl %r1, %cr18 /* IIAOQ tail */
load32 REAL_MODE_PSW, %r1
mtctl %r1, %ipsw
rfi
nop
1 : cmpib,=,n SRHASH_PCXST, %r26,srdis_pcxs
cmpib,=,n SRHASH_PCXL, %r26,srdis_pcxl
cmpib,=,n SRHASH_PA20, %r26,srdis_pa20
b,n srdis_done
srdis_pcxs:
/* Disable Space Register Hashing for PCXS,PCXT,PCXT' */
.word 0 x141c1a00 /* mfdiag %dr0, %r28 */
.word 0 x141c1a00 /* must issue twice */
depwi 0 ,18 ,1 , %r28 /* Clear DHE (dcache hash enable) */
depwi 0 ,20 ,1 , %r28 /* Clear IHE (icache hash enable) */
.word 0 x141c1600 /* mtdiag %r28, %dr0 */
.word 0 x141c1600 /* must issue twice */
b,n srdis_done
srdis_pcxl:
/* Disable Space Register Hashing for PCXL */
.word 0 x141c0600 /* mfdiag %dr0, %r28 */
depwi 0 ,28 ,2 , %r28 /* Clear DHASH_EN & IHASH_EN */
.word 0 x141c0240 /* mtdiag %r28, %dr0 */
b,n srdis_done
srdis_pa20:
/* Disable Space Register Hashing for PCXU,PCXU+,PCXW,PCXW+,PCXW2 */
.word 0 x144008bc /* mfdiag %dr2, %r28 */
depdi 0 , 54 ,1 , %r28 /* clear DIAG_SPHASH_ENAB (bit 54) */
.word 0 x145c1840 /* mtdiag %r28, %dr2 */
srdis_done:
/* Switch back to virtual mode */
rsm PSW_SM_I, %r0 /* prep to load iia queue */
load32 2 f, %r1
nop
nop
nop
nop
nop
rsm PSW_SM_Q, %r0 /* prep to load iia queue */
mtctl %r0, %cr17 /* Clear IIASQ tail */
mtctl %r0, %cr17 /* Clear IIASQ head */
mtctl %r1, %cr18 /* IIAOQ head */
ldo 4 (%r1), %r1
mtctl %r1, %cr18 /* IIAOQ tail */
load32 KERNEL_PSW, %r1
mtctl %r1, %ipsw
rfi
nop
2 : bv %r0(%r2)
nop
ENDPROC_CFI(disable_sr_hashing_asm)
.end
Messung V0.5 in Prozent C=94 H=94 G=93
¤ Dauer der Verarbeitung: 0.17 Sekunden
(vorverarbeitet am 2026-06-06)
¤
*© Formatika GbR, Deutschland