[U-Boot] [PATCH] OMAP3 Move cache routines to cache.S

Dirk Behme dirk.behme at googlemail.com
Wed Aug 12 18:35:56 CEST 2009


Tom Rix wrote:
> v7_flush_dcache_all, because it depends on omap ROM code is not
> generic.  Rename the function to 'invalidate_dcache' and move it
> to the omap cpu directory.
> 
> Collect the other omap cache routines l2_cache_enable and
> l2_cache_disable with invalide_dcache into cache.S.  This
> means removing the old cache.c file that contained l2_cache_enable
> and l2_cache_disable.
> 
> The conversion from cache.c to cache.S was done most through
> disassembling the uboot binary.  The only significant change was
> to change the comparision for the return of get_cpu_rev from
> 
>    cmp	r0, #0
>    beq	earlier_than_label
> 
> Which was lost information to
> 
>    cmp	r0, #CPU_3XX_ES20
>    blt	earlier_than_label
> 
> The paths through the enable routine were verified by
> adding an infinite loop and seeing the hang.  Then
> removing the infinite loop and seeing it continue.
> 
> The disable routine is similar enough that it was not
> tested with this method.
> 
> Run tested by cold booting from nand on beagle and zoom1.
> Compile tested on MAKEALL arm.

Boot tested from SD card on BeagleBoard.

> Signed-off-by: Tom Rix <Tom.Rix at windriver.com>

Acked-by: Dirk Behme <dirk.behme at googlemail.com>

> ---
>  cpu/arm_cortexa8/cpu.c                 |    2 +-
>  cpu/arm_cortexa8/omap3/Makefile        |    2 +-
>  cpu/arm_cortexa8/omap3/board.c         |    2 +-
>  cpu/arm_cortexa8/omap3/cache.S         |  191 ++++++++++++++++++++++++++++++++
>  cpu/arm_cortexa8/omap3/cache.c         |   95 ----------------
>  cpu/arm_cortexa8/start.S               |   85 --------------
>  include/asm-arm/arch-omap3/omap3.h     |    2 +
>  include/asm-arm/arch-omap3/sys_proto.h |    2 +-
>  8 files changed, 197 insertions(+), 184 deletions(-)
>  create mode 100644 cpu/arm_cortexa8/omap3/cache.S
>  delete mode 100644 cpu/arm_cortexa8/omap3/cache.c
> 
> diff --git a/cpu/arm_cortexa8/cpu.c b/cpu/arm_cortexa8/cpu.c
> index 5a5981e..a01e0d6 100644
> --- a/cpu/arm_cortexa8/cpu.c
> +++ b/cpu/arm_cortexa8/cpu.c
> @@ -64,7 +64,7 @@ int cleanup_before_linux(void)
>  	/* turn off L2 cache */
>  	l2_cache_disable();
>  	/* invalidate L2 cache also */
> -	v7_flush_dcache_all(get_device_type());
> +	invalidate_dcache(get_device_type());
>  #endif
>  	i = 0;
>  	/* mem barrier to sync up things */
> diff --git a/cpu/arm_cortexa8/omap3/Makefile b/cpu/arm_cortexa8/omap3/Makefile
> index eef165c..136b163 100644
> --- a/cpu/arm_cortexa8/omap3/Makefile
> +++ b/cpu/arm_cortexa8/omap3/Makefile
> @@ -26,10 +26,10 @@ include $(TOPDIR)/config.mk
>  LIB	=  $(obj)lib$(SOC).a
>  
>  SOBJS	:= lowlevel_init.o
> +SOBJS	+= cache.o
>  SOBJS	+= reset.o
>  
>  COBJS	+= board.o
> -COBJS	+= cache.o
>  COBJS	+= clock.o
>  COBJS	+= gpio.o
>  COBJS	+= mem.o
> diff --git a/cpu/arm_cortexa8/omap3/board.c b/cpu/arm_cortexa8/omap3/board.c
> index 2337287..43262e7 100644
> --- a/cpu/arm_cortexa8/omap3/board.c
> +++ b/cpu/arm_cortexa8/omap3/board.c
> @@ -201,7 +201,7 @@ void s_init(void)
>  	 * Right now flushing at low MPU speed.
>  	 * Need to move after clock init
>  	 */
> -	v7_flush_dcache_all(get_device_type());
> +	invalidate_dcache(get_device_type());
>  #ifndef CONFIG_ICACHE_OFF
>  	icache_enable();
>  #endif
> diff --git a/cpu/arm_cortexa8/omap3/cache.S b/cpu/arm_cortexa8/omap3/cache.S
> new file mode 100644
> index 0000000..0f63815
> --- /dev/null
> +++ b/cpu/arm_cortexa8/omap3/cache.S
> @@ -0,0 +1,191 @@
> +/*
> + * Copyright (c) 2009 Wind River Systems, Inc.
> + * Tom Rix <Tom.Rix at windriver.com>
> + *
> + * This file is based on and replaces the existing cache.c file
> + * The copyrights for the cache.c file are:
> + *
> + * (C) Copyright 2008 Texas Insturments
> + *
> + * (C) Copyright 2002
> + * Sysgo Real-Time Solutions, GmbH <www.elinos.com>
> + * Marius Groeger <mgroeger at sysgo.de>
> + *
> + * (C) Copyright 2002
> + * Gary Jennejohn, DENX Software Engineering, <gj at denx.de>
> + *
> + * See file CREDITS for list of people who contributed to this
> + * project.
> + *
> + * This program is free software; you can redistribute it and/or
> + * modify it under the terms of the GNU General Public License as
> + * published by the Free Software Foundation; either version 2 of
> + * the License, or (at your option) any later version.
> + *
> + * This program is distributed in the hope that it will be useful,
> + * but WITHOUT ANY WARRANTY; without even the implied warranty of
> + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
> + * GNU General Public License for more details.
> + *
> + * You should have received a copy of the GNU General Public License
> + * along with this program; if not, write to the Free Software
> + * Foundation, Inc., 59 Temple Place, Suite 330, Boston,
> + * MA 02111-1307 USA
> + */
> +
> +#include <asm/arch/omap3.h>
> +
> +/*
> + * omap3 cache code
> + */
> +
> +.align 5
> +.global invalidate_dcache
> +.global l2_cache_enable
> +.global l2_cache_disable
> +
> +/*
> + *	invalidate_dcache()
> + *
> + *	Invalidate the whole D-cache.
> + *
> + *	Corrupted registers: r0-r5, r7, r9-r11
> + *
> + *	- mm	- mm_struct describing address space
> + */
> +invalidate_dcache:
> +	stmfd	r13!, {r0 - r5, r7, r9 - r12, r14}
> +
> +	mov	r7, r0				@ take a backup of device type
> +	cmp	r0, #0x3			@ check if the device type is
> +						@ GP
> +	moveq r12, #0x1				@ set up to invalide L2
> +smi:	.word 0x01600070			@ Call SMI monitor (smieq)
> +	cmp	r7, #0x3			@ compare again in case its
> +						@ lost
> +	beq	finished_inval			@ if GP device, inval done
> +						@ above
> +
> +	mrc	p15, 1, r0, c0, c0, 1		@ read clidr
> +	ands	r3, r0, #0x7000000		@ extract loc from clidr
> +	mov	r3, r3, lsr #23			@ left align loc bit field
> +	beq	finished_inval			@ if loc is 0, then no need to
> +						@ clean
> +	mov	r10, #0				@ start clean at cache level 0
> +inval_loop1:
> +	add	r2, r10, r10, lsr #1		@ work out 3x current cache
> +						@ level
> +	mov	r1, r0, lsr r2			@ extract cache type bits from
> +						@ clidr
> +	and	r1, r1, #7			@ mask of the bits for current
> +						@ cache only
> +	cmp	r1, #2				@ see what cache we have at
> +						@ this level
> +	blt	skip_inval			@ skip if no cache, or just
> +						@ i-cache
> +	mcr	p15, 2, r10, c0, c0, 0		@ select current cache level
> +						@ in cssr
> +	mov	r2, #0				@ operand for mcr SBZ
> +	mcr	p15, 0, r2, c7, c5, 4		@ flush prefetch buffer to
> +						@ sych the new cssr&csidr,
> +						@ with armv7 this is 'isb',
> +						@ but we compile with armv5
> +	mrc	p15, 1, r1, c0, c0, 0		@ read the new csidr
> +	and	r2, r1, #7			@ extract the length of the
> +						@ cache lines
> +	add	r2, r2, #4			@ add 4 (line length offset)
> +	ldr	r4, =0x3ff
> +	ands	r4, r4, r1, lsr #3		@ find maximum number on the
> +						@ way size
> +	clz	r5, r4				@ find bit position of way
> +						@ size increment
> +	ldr	r7, =0x7fff
> +	ands	r7, r7, r1, lsr #13		@ extract max number of the
> +						@ index size
> +inval_loop2:
> +	mov	r9, r4				@ create working copy of max
> +						@ way size
> +inval_loop3:
> +	orr	r11, r10, r9, lsl r5		@ factor way and cache number
> +						@ into r11
> +	orr	r11, r11, r7, lsl r2		@ factor index number into r11
> +	mcr	p15, 0, r11, c7, c6, 2		@ invalidate by set/way
> +	subs	r9, r9, #1			@ decrement the way
> +	bge	inval_loop3
> +	subs	r7, r7, #1			@ decrement the index
> +	bge	inval_loop2
> +skip_inval:
> +	add	r10, r10, #2			@ increment cache number
> +	cmp	r3, r10
> +	bgt	inval_loop1
> +finished_inval:
> +	mov	r10, #0				@ swith back to cache level 0
> +	mcr	p15, 2, r10, c0, c0, 0		@ select current cache level
> +						@ in cssr
> +	mcr	p15, 0, r10, c7, c5, 4		@ flush prefetch buffer,
> +						@ with armv7 this is 'isb',
> +						@ but we compile with armv5
> +
> +	ldmfd	r13!, {r0 - r5, r7, r9 - r12, pc}
> +
> +
> +l2_cache_enable:
> +	push	{r0, r1, r2, lr}
> +	@ ES2 onwards we can disable/enable L2 ourselves
> +	bl	get_cpu_rev
> +	cmp	r0, #CPU_3XX_ES20
> +	blt	l2_cache_disable_EARLIER_THAN_ES2
> +	mrc	15, 0, r3, cr1, cr0, 1
> +	orr	r3, r3, #2
> +	mcr	15, 0, r3, cr1, cr0, 1
> +	b	l2_cache_enable_END
> +l2_cache_enable_EARLIER_THAN_ES2:
> +	@ Save r0, r12 and restore them after usage
> +	mov	r3, ip
> +	str	r3, [sp, #4]
> +	mov	r3, r0
> +	@
> +	@ GP Device ROM code API usage here
> +	@ r12 = AUXCR Write function and r0 value
> +	@
> +	mov	ip, #3
> +	mrc	15, 0, r0, cr1, cr0, 1
> +	orr	r0, r0, #2
> +	@ SMI instruction to call ROM Code API
> +	.word	0xe1600070
> +	mov	r0, r3
> +	mov	ip, r3
> +	str	r3, [sp, #4]
> +l2_cache_enable_END:
> +	pop	{r1, r2, r3, pc}
> +
> +
> +l2_cache_disable:
> +	push	{r0, r1, r2, lr}
> +	@ ES2 onwards we can disable/enable L2 ourselves
> +	bl	get_cpu_rev
> +	cmp	r0, #CPU_3XX_ES20
> +	blt	l2_cache_disable_EARLIER_THAN_ES2
> +	mrc	15, 0, r3, cr1, cr0, 1
> +	bic	r3, r3, #2
> +	mcr	15, 0, r3, cr1, cr0, 1
> +	b	l2_cache_disable_END
> +l2_cache_disable_EARLIER_THAN_ES2:
> +	@ Save r0, r12 and restore them after usage
> +	mov	r3, ip
> +	str	r3, [sp, #4]
> +	mov	r3, r0
> +	@
> +	@ GP Device ROM code API usage here
> +	@ r12 = AUXCR Write function and r0 value
> +	@
> +	mov	ip, #3
> +	mrc	15, 0, r0, cr1, cr0, 1
> +	bic	r0, r0, #2
> +	@ SMI instruction to call ROM Code API
> +	.word	0xe1600070
> +	mov	r0, r3
> +	mov	ip, r3
> +	str	r3, [sp, #4]
> +l2_cache_disable_END:
> +	pop	{r1, r2, r3, pc}
> diff --git a/cpu/arm_cortexa8/omap3/cache.c b/cpu/arm_cortexa8/omap3/cache.c
> deleted file mode 100644
> index 0d5b444..0000000
> --- a/cpu/arm_cortexa8/omap3/cache.c
> +++ /dev/null
> @@ -1,95 +0,0 @@
> -/*
> - * (C) Copyright 2008 Texas Insturments
> - *
> - * (C) Copyright 2002
> - * Sysgo Real-Time Solutions, GmbH <www.elinos.com>
> - * Marius Groeger <mgroeger at sysgo.de>
> - *
> - * (C) Copyright 2002
> - * Gary Jennejohn, DENX Software Engineering, <gj at denx.de>
> - *
> - * See file CREDITS for list of people who contributed to this
> - * project.
> - *
> - * This program is free software; you can redistribute it and/or
> - * modify it under the terms of the GNU General Public License as
> - * published by the Free Software Foundation; either version 2 of
> - * the License, or (at your option) any later version.
> - *
> - * This program is distributed in the hope that it will be useful,
> - * but WITHOUT ANY WARRANTY; without even the implied warranty of
> - * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
> - * GNU General Public License for more details.
> - *
> - * You should have received a copy of the GNU General Public License
> - * along with this program; if not, write to the Free Software
> - * Foundation, Inc., 59 Temple Place, Suite 330, Boston,
> - * MA 02111-1307 USA
> - */
> -
> -/*
> - * omap3 L2 cache code
> - */
> -
> -#include <common.h>
> -#include <asm/arch/sys_proto.h>
> -#include <asm/cache.h>
> -
> -void l2_cache_enable(void)
> -{
> -	unsigned long i;
> -	volatile unsigned int j;
> -
> -	/* ES2 onwards we can disable/enable L2 ourselves */
> -	if (get_cpu_rev() >= CPU_3XX_ES20) {
> -		__asm__ __volatile__("mrc p15, 0, %0, c1, c0, 1":"=r"(i));
> -		__asm__ __volatile__("orr %0, %0, #0x2":"=r"(i));
> -		__asm__ __volatile__("mcr p15, 0, %0, c1, c0, 1":"=r"(i));
> -	} else {
> -		/* Save r0, r12 and restore them after usage */
> -		__asm__ __volatile__("mov %0, r12":"=r"(j));
> -		__asm__ __volatile__("mov %0, r0":"=r"(i));
> -
> -		/*
> -		 * GP Device ROM code API usage here
> -		 * r12 = AUXCR Write function and r0 value
> -		 */
> -		__asm__ __volatile__("mov r12, #0x3");
> -		__asm__ __volatile__("mrc p15, 0, r0, c1, c0, 1");
> -		__asm__ __volatile__("orr r0, r0, #0x2");
> -		/* SMI instruction to call ROM Code API */
> -		__asm__ __volatile__(".word 0xE1600070");
> -		__asm__ __volatile__("mov r0, %0":"=r"(i));
> -		__asm__ __volatile__("mov r12, %0":"=r"(j));
> -	}
> -
> -}
> -
> -void l2_cache_disable(void)
> -{
> -	unsigned long i;
> -	volatile unsigned int j;
> -
> -	/* ES2 onwards we can disable/enable L2 ourselves */
> -	if (get_cpu_rev() >= CPU_3XX_ES20) {
> -		__asm__ __volatile__("mrc p15, 0, %0, c1, c0, 1":"=r"(i));
> -		__asm__ __volatile__("bic %0, %0, #0x2":"=r"(i));
> -		__asm__ __volatile__("mcr p15, 0, %0, c1, c0, 1":"=r"(i));
> -	} else {
> -		/* Save r0, r12 and restore them after usage */
> -		__asm__ __volatile__("mov %0, r12":"=r"(j));
> -		__asm__ __volatile__("mov %0, r0":"=r"(i));
> -
> -		/*
> -		 * GP Device ROM code API usage here
> -		 * r12 = AUXCR Write function and r0 value
> -		 */
> -		__asm__ __volatile__("mov r12, #0x3");
> -		__asm__ __volatile__("mrc p15, 0, r0, c1, c0, 1");
> -		__asm__ __volatile__("bic r0, r0, #0x2");
> -		/* SMI instruction to call ROM Code API */
> -		__asm__ __volatile__(".word 0xE1600070");
> -		__asm__ __volatile__("mov r0, %0":"=r"(i));
> -		__asm__ __volatile__("mov r12, %0":"=r"(j));
> -	}
> -}
> diff --git a/cpu/arm_cortexa8/start.S b/cpu/arm_cortexa8/start.S
> index 6bd6552..14a9bd3 100644
> --- a/cpu/arm_cortexa8/start.S
> +++ b/cpu/arm_cortexa8/start.S
> @@ -415,88 +415,3 @@ fiq:
>  
>  #endif
>  
> -/*
> - *	v7_flush_dcache_all()
> - *
> - *	Flush the whole D-cache.
> - *
> - *	Corrupted registers: r0-r5, r7, r9-r11
> - *
> - *	- mm	- mm_struct describing address space
> - */
> -	.align 5
> -.global v7_flush_dcache_all
> -v7_flush_dcache_all:
> -	stmfd	r13!, {r0 - r5, r7, r9 - r12, r14}
> -
> -	mov	r7, r0				@ take a backup of device type
> -	cmp	r0, #0x3			@ check if the device type is
> -						@ GP
> -	moveq r12, #0x1				@ set up to invalide L2
> -smi:	.word 0x01600070			@ Call SMI monitor (smieq)
> -	cmp	r7, #0x3			@ compare again in case its
> -						@ lost
> -	beq	finished_inval			@ if GP device, inval done
> -						@ above
> -
> -	mrc	p15, 1, r0, c0, c0, 1		@ read clidr
> -	ands	r3, r0, #0x7000000		@ extract loc from clidr
> -	mov	r3, r3, lsr #23			@ left align loc bit field
> -	beq	finished_inval			@ if loc is 0, then no need to
> -						@ clean
> -	mov	r10, #0				@ start clean at cache level 0
> -inval_loop1:
> -	add	r2, r10, r10, lsr #1		@ work out 3x current cache
> -						@ level
> -	mov	r1, r0, lsr r2			@ extract cache type bits from
> -						@ clidr
> -	and	r1, r1, #7			@ mask of the bits for current
> -						@ cache only
> -	cmp	r1, #2				@ see what cache we have at
> -						@ this level
> -	blt	skip_inval			@ skip if no cache, or just
> -						@ i-cache
> -	mcr	p15, 2, r10, c0, c0, 0		@ select current cache level
> -						@ in cssr
> -	mov	r2, #0				@ operand for mcr SBZ
> -	mcr	p15, 0, r2, c7, c5, 4		@ flush prefetch buffer to
> -						@ sych the new cssr&csidr,
> -						@ with armv7 this is 'isb',
> -						@ but we compile with armv5
> -	mrc	p15, 1, r1, c0, c0, 0		@ read the new csidr
> -	and	r2, r1, #7			@ extract the length of the
> -						@ cache lines
> -	add	r2, r2, #4			@ add 4 (line length offset)
> -	ldr	r4, =0x3ff
> -	ands	r4, r4, r1, lsr #3		@ find maximum number on the
> -						@ way size
> -	clz	r5, r4				@ find bit position of way
> -						@ size increment
> -	ldr	r7, =0x7fff
> -	ands	r7, r7, r1, lsr #13		@ extract max number of the
> -						@ index size
> -inval_loop2:
> -	mov	r9, r4				@ create working copy of max
> -						@ way size
> -inval_loop3:
> -	orr	r11, r10, r9, lsl r5		@ factor way and cache number
> -						@ into r11
> -	orr	r11, r11, r7, lsl r2		@ factor index number into r11
> -	mcr	p15, 0, r11, c7, c6, 2		@ invalidate by set/way
> -	subs	r9, r9, #1			@ decrement the way
> -	bge	inval_loop3
> -	subs	r7, r7, #1			@ decrement the index
> -	bge	inval_loop2
> -skip_inval:
> -	add	r10, r10, #2			@ increment cache number
> -	cmp	r3, r10
> -	bgt	inval_loop1
> -finished_inval:
> -	mov	r10, #0				@ swith back to cache level 0
> -	mcr	p15, 2, r10, c0, c0, 0		@ select current cache level
> -						@ in cssr
> -	mcr	p15, 0, r10, c7, c5, 4		@ flush prefetch buffer,
> -						@ with armv7 this is 'isb',
> -						@ but we compile with armv5
> -
> -	ldmfd	r13!, {r0 - r5, r7, r9 - r12, pc}
> diff --git a/include/asm-arm/arch-omap3/omap3.h b/include/asm-arm/arch-omap3/omap3.h
> index 6459d99..12815f6 100644
> --- a/include/asm-arm/arch-omap3/omap3.h
> +++ b/include/asm-arm/arch-omap3/omap3.h
> @@ -168,6 +168,8 @@ struct gpio {
>   *  ES1     = rev 0
>   *
>   *  ES2 onwards, the value maps to contents of IDCODE register [31:28].
> + *
> + * Note : CPU_3XX_ES20 is used in cache.S.  Please review before changing.
>   */
>  #define CPU_3XX_ES10		0
>  #define CPU_3XX_ES20		1
> diff --git a/include/asm-arm/arch-omap3/sys_proto.h b/include/asm-arm/arch-omap3/sys_proto.h
> index 7361d08..2246f80 100644
> --- a/include/asm-arm/arch-omap3/sys_proto.h
> +++ b/include/asm-arm/arch-omap3/sys_proto.h
> @@ -55,7 +55,7 @@ void secureworld_exit(void);
>  void setup_auxcr(void);
>  void try_unlock_memory(void);
>  u32 get_boot_type(void);
> -void v7_flush_dcache_all(u32);
> +void invalidate_dcache(u32);
>  void sr32(void *, u32, u32, u32);
>  u32 wait_on_value(u32, u32, void *, u32);
>  void sdelay(unsigned long);



More information about the U-Boot mailing list