[PATCH] fix TLB handling for 8xx on linuxppc-2.5

Benjamin Herrenschmidt benh at kernel.crashing.org
Tue Jun 1 08:00:30 EST 2004


On Tue, 2004-06-01 at 00:36, Pantelis Antoniou wrote:
> Hi
>
> The following patch fixes the problems of 8xx with the latest
> linuxppc-2.5 tree.
>
> With it user space progresses properly.
> Lots of gray areas remain and MM handling for 8xx is
> mighty inefficient IMO.
>
> Dan could you please take a look?

Ok, looks a bit weird on the edges.

>
> Pantelis
>
>
> ______________________________________________________________________
> diff -Nur --exclude=RCS --exclude=CVS --exclude=SCCS --exclude=BitKeeper --exclude=ChangeSet linuxppc_2.5/arch/ppc/kernel/head_8xx.S linuxppc_2.5-intracom/arch/ppc/kernel/head_8xx.S
> --- linuxppc_2.5/arch/ppc/kernel/head_8xx.S	Mon May 31 10:52:29 2004
> +++ linuxppc_2.5-intracom/arch/ppc/kernel/head_8xx.S	Mon May 31 17:24:05 2004
> @@ -157,6 +157,24 @@
>  	SAVE_2GPRS(7, r11)
>
>  /*
> +if ((val & (_PAGE_HWWRITE | _PAGE_RW | _PAGE_DIRTY)) == (_PAGE_RW | _PAGE_DIRTY))
> +	val |= _PAGE_HWWRITE;
> +else if ((val & (_PAGE_HWWRITE | _PAGE_RW | _PAGE_DIRTY)) == _PAGE_HWWRITE)
> +	val &= ~_PAGE_HWWRITE;
> +*/

I don't like the above. Things should be dealt with differently.

The TLB handler itself should only care about _setting_ _PAGE_HWWRITE I
think when it's missing (oh, and dirty of course). The clearing should
be done on a per-PTE basis in ptep_get_and_clear_*, ptep_clear_*, etc...
along with the necessary TLB invalidate (hrm... can we invalidate
selectively instead of the whole thing ?)

The tlbia in update_mmu_cache() doesn't look good. More like a
workaround for breakage in the implementation.

Paul, any comment ?

Ben.

> +#define LAZY_DTLB_FIX			\
> +	rlwinm  r12,r10,0,23,25;	\
> +	cmpwi   r12,0xc0;		\
> +	bne+    0f;			\
> +	ori     r10,r10,0x100;		\
> +	b	1f;			\
> + 0:	cmpwi   r12,0x100;		\
> +	bne+    1f;			\
> +	rlwinm  r10,r10,0,24,22;	\
> + 1:
> +
> +/*
>   * Note: code which follows this uses cr0.eq (set if from kernel),
>   * r11, r12 (SRR0), and r9 (SRR1).
>   *
> @@ -348,7 +366,6 @@
>  	mtspr	MD_TWC, r11	/* Load pte table base address */
>  	mfspr	r11, MD_TWC	/* ....and get the pte address */
>  	lwz	r10, 0(r11)	/* Get the pte */
> -
>  	ori	r10, r10, _PAGE_ACCESSED
>  	stw	r10, 0(r11)
>
> @@ -398,6 +415,7 @@
>  	mfcr	r10
>  	stw	r10, 0(r0)
>  	stw	r11, 4(r0)
> +	stw	r12, 16(r0)
>  	mfspr	r10, M_TWB	/* Get level 1 table entry address */
>
>  	/* If we are faulting a kernel address, we have to use the
> @@ -440,6 +458,7 @@
>  	mtspr	MD_TWC, r11
>
>  	mfspr	r11, MD_TWC	/* get the pte address again */
> +	LAZY_DTLB_FIX
>  	ori	r10, r10, _PAGE_ACCESSED
>  	stw	r10, 0(r11)
>
> @@ -463,6 +482,7 @@
>  	lwz	r11, 0(r0)
>  	mtcr	r11
>  	lwz	r11, 4(r0)
> +	lwz	r12, 16(r0)
>  #ifdef CONFIG_8xx_CPU6
>  	lwz	r3, 8(r0)
>  #endif
> @@ -472,6 +492,7 @@
>  	lwz	r11, 0(r0)
>  	mtcr	r11
>  	lwz	r11, 4(r0)
> +	lwz	r12, 16(r0)
>  #ifdef CONFIG_8xx_CPU6
>  	lwz	r3, 8(r0)
>  #endif
> @@ -505,6 +526,7 @@
>  	mfcr	r10
>  	stw	r10, 0(r0)
>  	stw	r11, 4(r0)
> +	stw	r12, 16(r0)
>
>  	/* First, make sure this was a store operation.
>  	*/
> @@ -574,6 +596,7 @@
>  	*/
>  	ori	r10, r10, _PAGE_DIRTY|_PAGE_ACCESSED|_PAGE_HWWRITE
>  	mfspr	r11, MD_TWC		/* Get pte address again */
> +	LAZY_DTLB_FIX
>  	stw	r10, 0(r11)		/* and update pte in table */
>
>  	/* The Linux PTE won't go exactly into the MMU TLB.
> @@ -596,6 +619,7 @@
>  	lwz	r11, 0(r0)
>  	mtcr	r11
>  	lwz	r11, 4(r0)
> +	lwz	r12, 16(r0)
>  #ifdef CONFIG_8xx_CPU6
>  	lwz	r3, 8(r0)
>  #endif
> @@ -605,6 +629,7 @@
>  	lwz	r11, 0(r0)
>  	mtcr	r11
>  	lwz	r11, 4(r0)
> +	lwz	r12, 16(r0)
>  #ifdef CONFIG_8xx_CPU6
>  	lwz	r3, 8(r0)
>  #endif
> diff -Nur --exclude=RCS --exclude=CVS --exclude=SCCS --exclude=BitKeeper --exclude=ChangeSet linuxppc_2.5/arch/ppc/kernel/misc.S linuxppc_2.5-intracom/arch/ppc/kernel/misc.S
> --- linuxppc_2.5/arch/ppc/kernel/misc.S	Mon May 31 10:52:30 2004
> +++ linuxppc_2.5-intracom/arch/ppc/kernel/misc.S	Mon May 31 17:24:05 2004
> @@ -565,10 +565,12 @@
>   * flush_icache_range(unsigned long start, unsigned long stop)
>   */
>  _GLOBAL(flush_icache_range)
> +#if !defined(CONFIG_8xx)
>  	mfspr	r5,PVR
>  	rlwinm	r5,r5,16,16,31
>  	cmpi	0,r5,1
>  	beqlr				/* for 601, do nothing */
> +#endif
>  	li	r5,L1_CACHE_LINE_SIZE-1
>  	andc	r3,r3,r5
>  	subf	r4,r3,r4
> @@ -683,10 +685,12 @@
>   *	void __flush_dcache_icache(void *page)
>   */
>  _GLOBAL(__flush_dcache_icache)
> +#if !defined(CONFIG_8xx)
>  	mfspr	r5,PVR
>  	rlwinm	r5,r5,16,16,31
>  	cmpi	0,r5,1
>  	beqlr					/* for 601, do nothing */
> +#endif
>  	rlwinm	r3,r3,0,0,19			/* Get page base address */
>  	li	r4,4096/L1_CACHE_LINE_SIZE	/* Number of lines in a page */
>  	mtctr	r4
> @@ -712,10 +716,12 @@
>   *	void __flush_dcache_icache_phys(unsigned long physaddr)
>   */
>  _GLOBAL(__flush_dcache_icache_phys)
> +#if !defined(CONFIG_8xx)
>  	mfspr	r5,PVR
>  	rlwinm	r5,r5,16,16,31
>  	cmpi	0,r5,1
>  	beqlr					/* for 601, do nothing */
> +#endif
>  	mfmsr	r10
>  	rlwinm	r0,r10,0,28,26			/* clear DR */
>  	mtmsr	r0
> diff -Nur --exclude=RCS --exclude=CVS --exclude=SCCS --exclude=BitKeeper --exclude=ChangeSet linuxppc_2.5/arch/ppc/mm/init.c linuxppc_2.5-intracom/arch/ppc/mm/init.c
> --- linuxppc_2.5/arch/ppc/mm/init.c	Mon May 31 10:52:30 2004
> +++ linuxppc_2.5-intracom/arch/ppc/mm/init.c	Mon May 31 17:24:05 2004
> @@ -605,7 +605,6 @@
>  	kunmap(page);
>  }
>
> -#ifndef update_mmu_cache
>  /*
>   * This is called at the end of handling a user page fault, when the
>   * fault has been handled by updating a PTE in the linux page tables.
> @@ -641,6 +640,7 @@
>  		if (!pmd_none(*pmd))
>  			add_hash_page(mm->context, address, pmd_val(*pmd));
>  	}
> +#else
> +	__tlbia();
>  #endif
>  }
> -#endif
> diff -Nur --exclude=RCS --exclude=CVS --exclude=SCCS --exclude=BitKeeper --exclude=ChangeSet linuxppc_2.5/include/asm-ppc/tlbflush.h linuxppc_2.5-intracom/include/asm-ppc/tlbflush.h
> --- linuxppc_2.5/include/asm-ppc/tlbflush.h	Mon May 31 10:53:26 2004
> +++ linuxppc_2.5-intracom/include/asm-ppc/tlbflush.h	Mon May 31 17:24:16 2004
> @@ -50,7 +50,8 @@
>  static inline void flush_tlb_kernel_range(unsigned long start,
>  				unsigned long end)
>  	{ __tlbia(); }
> -#define update_mmu_cache(vma, addr, pte)	do { } while(0)
> +/* #define update_mmu_cache(vma, addr, pte)	do { } while(0) */
> +extern void update_mmu_cache(struct vm_area_struct *, unsigned long, pte_t);
>
>  #else	/* 6xx, 7xx, 7xxx cpus */
>  struct mm_struct;
--
Benjamin Herrenschmidt <benh at kernel.crashing.org>


** Sent via the linuxppc-embedded mail list. See http://lists.linuxppc.org/




More information about the Linuxppc-embedded mailing list