xref: /openbmc/u-boot/arch/nios2/cpu/start.S (revision 1a459660)
137e4dafaSPeter Tyser/*
237e4dafaSPeter Tyser * (C) Copyright 2004, Psyent Corporation <www.psyent.com>
337e4dafaSPeter Tyser * Scott McNutt <smcnutt@psyent.com>
437e4dafaSPeter Tyser *
5*1a459660SWolfgang Denk * SPDX-License-Identifier:	GPL-2.0+
637e4dafaSPeter Tyser */
737e4dafaSPeter Tyser
825ddd1fbSWolfgang Denk#include <asm-offsets.h>
937e4dafaSPeter Tyser#include <config.h>
1037e4dafaSPeter Tyser#include <version.h>
1137e4dafaSPeter Tyser
1237e4dafaSPeter Tyser/*************************************************************************
1337e4dafaSPeter Tyser * RESTART
1437e4dafaSPeter Tyser ************************************************************************/
1537e4dafaSPeter Tyser
1637e4dafaSPeter Tyser	.text
1737e4dafaSPeter Tyser	.global _start
1837e4dafaSPeter Tyser
1937e4dafaSPeter Tyser_start:
20fd2712d0SThomas Chou	wrctl	status, r0		/* Disable interrupts */
2137e4dafaSPeter Tyser	/* ICACHE INIT -- only the icache line at the reset address
2237e4dafaSPeter Tyser	 * is invalidated at reset. So the init must stay within
2337e4dafaSPeter Tyser	 * the cache line size (8 words). If GERMS is used, we'll
2437e4dafaSPeter Tyser	 * just be invalidating the cache a second time. If cache
2537e4dafaSPeter Tyser	 * is not implemented initi behaves as nop.
2637e4dafaSPeter Tyser	 */
2737e4dafaSPeter Tyser	ori	r4, r0, %lo(CONFIG_SYS_ICACHELINE_SIZE)
2837e4dafaSPeter Tyser	movhi	r5, %hi(CONFIG_SYS_ICACHE_SIZE)
2937e4dafaSPeter Tyser	ori	r5, r5, %lo(CONFIG_SYS_ICACHE_SIZE)
30fd2712d0SThomas Chou0:	initi	r5
31fd2712d0SThomas Chou	sub	r5, r5, r4
32fd2712d0SThomas Chou	bgt	r5, r0, 0b
3337e4dafaSPeter Tyser	br	_except_end	/* Skip the tramp */
3437e4dafaSPeter Tyser
3537e4dafaSPeter Tyser	/* EXCEPTION TRAMPOLINE -- the following gets copied
3637e4dafaSPeter Tyser	 * to the exception address (below), but is otherwise at the
3737e4dafaSPeter Tyser	 * default exception vector offset (0x0020).
3837e4dafaSPeter Tyser	 */
3937e4dafaSPeter Tyser_except_start:
4037e4dafaSPeter Tyser	movhi	et, %hi(_exception)
4137e4dafaSPeter Tyser	ori	et, et, %lo(_exception)
4237e4dafaSPeter Tyser	jmp	et
4337e4dafaSPeter Tyser_except_end:
4437e4dafaSPeter Tyser
4537e4dafaSPeter Tyser	/* INTERRUPTS -- for now, all interrupts masked and globally
4637e4dafaSPeter Tyser	 * disabled.
4737e4dafaSPeter Tyser	 */
4837e4dafaSPeter Tyser	wrctl	ienable, r0		/* All disabled	*/
4937e4dafaSPeter Tyser
5037e4dafaSPeter Tyser	/* DCACHE INIT -- if dcache not implemented, initd behaves as
5137e4dafaSPeter Tyser	 * nop.
5237e4dafaSPeter Tyser	 */
5337e4dafaSPeter Tyser	movhi	r4, %hi(CONFIG_SYS_DCACHELINE_SIZE)
5437e4dafaSPeter Tyser	ori	r4, r4, %lo(CONFIG_SYS_DCACHELINE_SIZE)
5537e4dafaSPeter Tyser	movhi	r5, %hi(CONFIG_SYS_DCACHE_SIZE)
5637e4dafaSPeter Tyser	ori	r5, r5, %lo(CONFIG_SYS_DCACHE_SIZE)
5737e4dafaSPeter Tyser	mov	r6, r0
5837e4dafaSPeter Tyser1:	initd	0(r6)
5937e4dafaSPeter Tyser	add	r6, r6, r4
6037e4dafaSPeter Tyser	bltu	r6, r5, 1b
6137e4dafaSPeter Tyser
6237e4dafaSPeter Tyser	/* RELOCATE CODE, DATA & COMMAND TABLE -- the following code
6337e4dafaSPeter Tyser	 * assumes code, data and the command table are all
6437e4dafaSPeter Tyser	 * contiguous. This lets us relocate everything as a single
6537e4dafaSPeter Tyser	 * block. Make sure the linker script matches this ;-)
6637e4dafaSPeter Tyser	 */
6737e4dafaSPeter Tyser	nextpc	r4
6837e4dafaSPeter Tyser_cur:	movhi	r5, %hi(_cur - _start)
6937e4dafaSPeter Tyser	ori	r5, r5, %lo(_cur - _start)
7037e4dafaSPeter Tyser	sub	r4, r4, r5		/* r4 <- cur _start */
7137e4dafaSPeter Tyser	mov	r8, r4
7237e4dafaSPeter Tyser	movhi	r5, %hi(_start)
7337e4dafaSPeter Tyser	ori	r5, r5, %lo(_start)	/* r5 <- linked _start */
7437e4dafaSPeter Tyser	beq	r4, r5, 3f
7537e4dafaSPeter Tyser
7637e4dafaSPeter Tyser	movhi	r6, %hi(_edata)
7737e4dafaSPeter Tyser	ori	r6, r6, %lo(_edata)
7837e4dafaSPeter Tyser2:	ldwio	r7, 0(r4)
7937e4dafaSPeter Tyser	addi	r4, r4, 4
8037e4dafaSPeter Tyser	stwio	r7, 0(r5)
8137e4dafaSPeter Tyser	addi	r5, r5, 4
8237e4dafaSPeter Tyser	bne	r5, r6, 2b
8337e4dafaSPeter Tyser3:
8437e4dafaSPeter Tyser
8537e4dafaSPeter Tyser	/* ZERO BSS/SBSS -- bss and sbss are assumed to be adjacent
863929fb0aSSimon Glass	 * and between __bss_start and __bss_end.
8737e4dafaSPeter Tyser	 */
8837e4dafaSPeter Tyser	 movhi	r5, %hi(__bss_start)
8937e4dafaSPeter Tyser	 ori	r5, r5, %lo(__bss_start)
903929fb0aSSimon Glass	 movhi	r6, %hi(__bss_end)
913929fb0aSSimon Glass	 ori	r6, r6, %lo(__bss_end)
9237e4dafaSPeter Tyser	 beq	r5, r6, 5f
9337e4dafaSPeter Tyser
9437e4dafaSPeter Tyser4:	stwio	r0, 0(r5)
9537e4dafaSPeter Tyser	 addi	r5, r5, 4
9637e4dafaSPeter Tyser	 bne	r5, r6, 4b
9737e4dafaSPeter Tyser5:
9837e4dafaSPeter Tyser
9937e4dafaSPeter Tyser	/* JUMP TO RELOC ADDR */
10037e4dafaSPeter Tyser	movhi	r4, %hi(_reloc)
10137e4dafaSPeter Tyser	ori	r4, r4, %lo(_reloc)
10237e4dafaSPeter Tyser	jmp	r4
10337e4dafaSPeter Tyser_reloc:
10437e4dafaSPeter Tyser
10537e4dafaSPeter Tyser	/* COPY EXCEPTION TRAMPOLINE -- copy the tramp to the
10637e4dafaSPeter Tyser	 * exception address. Define CONFIG_ROM_STUBS to prevent
10737e4dafaSPeter Tyser	 * the copy (e.g. exception in flash or in other
10837e4dafaSPeter Tyser	 * softare/firmware component).
10937e4dafaSPeter Tyser	 */
11037e4dafaSPeter Tyser#if !defined(CONFIG_ROM_STUBS)
11137e4dafaSPeter Tyser	movhi	r4, %hi(_except_start)
11237e4dafaSPeter Tyser	ori	r4, r4, %lo(_except_start)
11337e4dafaSPeter Tyser	movhi	r5, %hi(_except_end)
11437e4dafaSPeter Tyser	ori	r5, r5, %lo(_except_end)
11537e4dafaSPeter Tyser	movhi	r6, %hi(CONFIG_SYS_EXCEPTION_ADDR)
11637e4dafaSPeter Tyser	ori	r6, r6, %lo(CONFIG_SYS_EXCEPTION_ADDR)
11737e4dafaSPeter Tyser	beq	r4, r6, 7f	/* Skip if at proper addr */
11837e4dafaSPeter Tyser
11937e4dafaSPeter Tyser6:	ldwio	r7, 0(r4)
12037e4dafaSPeter Tyser	stwio	r7, 0(r6)
12137e4dafaSPeter Tyser	addi	r4, r4, 4
12237e4dafaSPeter Tyser	addi	r6, r6, 4
12337e4dafaSPeter Tyser	bne	r4, r5, 6b
12437e4dafaSPeter Tyser7:
12537e4dafaSPeter Tyser#endif
12637e4dafaSPeter Tyser
12737e4dafaSPeter Tyser	/* STACK INIT -- zero top two words for call back chain.
12837e4dafaSPeter Tyser	 */
12937e4dafaSPeter Tyser	movhi	sp, %hi(CONFIG_SYS_INIT_SP)
13037e4dafaSPeter Tyser	ori	sp, sp, %lo(CONFIG_SYS_INIT_SP)
13137e4dafaSPeter Tyser	addi	sp, sp, -8
13237e4dafaSPeter Tyser	stw	r0, 0(sp)
13337e4dafaSPeter Tyser	stw	r0, 4(sp)
13437e4dafaSPeter Tyser	mov	fp, sp
13537e4dafaSPeter Tyser
13637e4dafaSPeter Tyser	/*
13737e4dafaSPeter Tyser	 * Call board_init -- never returns
13837e4dafaSPeter Tyser	 */
13937e4dafaSPeter Tyser	movhi	r4, %hi(board_init@h)
14037e4dafaSPeter Tyser	ori	r4, r4, %lo(board_init@h)
14137e4dafaSPeter Tyser	callr	r4
14237e4dafaSPeter Tyser
14337e4dafaSPeter Tyser	/* NEVER RETURNS -- but branch to the _start just
14437e4dafaSPeter Tyser	 * in case ;-)
14537e4dafaSPeter Tyser	 */
14637e4dafaSPeter Tyser	br	_start
14737e4dafaSPeter Tyser
14837e4dafaSPeter Tyser
14937e4dafaSPeter Tyser/*
15037e4dafaSPeter Tyser * dly_clks -- Nios2 (like Nios1) doesn't have a timebase in
15137e4dafaSPeter Tyser * the core. For simple delay loops, we do our best by counting
15237e4dafaSPeter Tyser * instruction cycles.
15337e4dafaSPeter Tyser *
15437e4dafaSPeter Tyser * Instruction performance varies based on the core. For cores
15537e4dafaSPeter Tyser * with icache and static/dynamic branch prediction (II/f, II/s):
15637e4dafaSPeter Tyser *
15737e4dafaSPeter Tyser *	Normal ALU (e.g. add, cmp, etc):	1 cycle
15837e4dafaSPeter Tyser *	Branch (correctly predicted, taken):	2 cycles
15937e4dafaSPeter Tyser *	Negative offset is predicted (II/s).
16037e4dafaSPeter Tyser *
16137e4dafaSPeter Tyser * For cores without icache and no branch prediction (II/e):
16237e4dafaSPeter Tyser *
16337e4dafaSPeter Tyser *	Normal ALU (e.g. add, cmp, etc):	6 cycles
16437e4dafaSPeter Tyser *	Branch (no prediction):			6 cycles
16537e4dafaSPeter Tyser *
16637e4dafaSPeter Tyser * For simplicity, if an instruction cache is implemented we
16737e4dafaSPeter Tyser * assume II/f or II/s. Otherwise, we use the II/e.
16837e4dafaSPeter Tyser *
16937e4dafaSPeter Tyser */
17037e4dafaSPeter Tyser	.globl dly_clks
17137e4dafaSPeter Tyser
17237e4dafaSPeter Tyserdly_clks:
17337e4dafaSPeter Tyser
17437e4dafaSPeter Tyser#if (CONFIG_SYS_ICACHE_SIZE > 0)
17537e4dafaSPeter Tyser	subi	r4, r4, 3		/* 3 clocks/loop	*/
17637e4dafaSPeter Tyser#else
17737e4dafaSPeter Tyser	subi	r4, r4, 12		/* 12 clocks/loop	*/
17837e4dafaSPeter Tyser#endif
17937e4dafaSPeter Tyser	bge	r4, r0, dly_clks
18037e4dafaSPeter Tyser	ret
18137e4dafaSPeter Tyser
18237e4dafaSPeter Tyser	.data
18337e4dafaSPeter Tyser	.globl	version_string
18437e4dafaSPeter Tyser
18537e4dafaSPeter Tyserversion_string:
18609c2e90cSAndreas Bießmann	.ascii U_BOOT_VERSION_STRING, "\0"
187