xref: /rk3399_rockchip-uboot/arch/nios2/cpu/start.S (revision e900298ea4798cfb82cf89bdcf255f3614a5e1d8)
137e4dafaSPeter Tyser/*
237e4dafaSPeter Tyser * (C) Copyright 2004, Psyent Corporation <www.psyent.com>
337e4dafaSPeter Tyser * Scott McNutt <smcnutt@psyent.com>
437e4dafaSPeter Tyser *
51a459660SWolfgang Denk * SPDX-License-Identifier:	GPL-2.0+
637e4dafaSPeter Tyser */
737e4dafaSPeter Tyser
825ddd1fbSWolfgang Denk#include <asm-offsets.h>
937e4dafaSPeter Tyser#include <config.h>
1037e4dafaSPeter Tyser#include <version.h>
1137e4dafaSPeter Tyser
1237e4dafaSPeter Tyser/*************************************************************************
1337e4dafaSPeter Tyser * RESTART
1437e4dafaSPeter Tyser ************************************************************************/
1537e4dafaSPeter Tyser
1637e4dafaSPeter Tyser	.text
1737e4dafaSPeter Tyser	.global _start
1837e4dafaSPeter Tyser
1937e4dafaSPeter Tyser_start:
20fd2712d0SThomas Chou	wrctl	status, r0		/* Disable interrupts */
2137e4dafaSPeter Tyser	/* ICACHE INIT -- only the icache line at the reset address
2237e4dafaSPeter Tyser	 * is invalidated at reset. So the init must stay within
2337e4dafaSPeter Tyser	 * the cache line size (8 words). If GERMS is used, we'll
2437e4dafaSPeter Tyser	 * just be invalidating the cache a second time. If cache
2537e4dafaSPeter Tyser	 * is not implemented initi behaves as nop.
2637e4dafaSPeter Tyser	 */
2737e4dafaSPeter Tyser	ori	r4, r0, %lo(CONFIG_SYS_ICACHELINE_SIZE)
2837e4dafaSPeter Tyser	movhi	r5, %hi(CONFIG_SYS_ICACHE_SIZE)
2937e4dafaSPeter Tyser	ori	r5, r5, %lo(CONFIG_SYS_ICACHE_SIZE)
30fd2712d0SThomas Chou0:	initi	r5
31fd2712d0SThomas Chou	sub	r5, r5, r4
32fd2712d0SThomas Chou	bgt	r5, r0, 0b
3337e4dafaSPeter Tyser	br	_except_end	/* Skip the tramp */
3437e4dafaSPeter Tyser
3537e4dafaSPeter Tyser	/* EXCEPTION TRAMPOLINE -- the following gets copied
3637e4dafaSPeter Tyser	 * to the exception address (below), but is otherwise at the
3737e4dafaSPeter Tyser	 * default exception vector offset (0x0020).
3837e4dafaSPeter Tyser	 */
3937e4dafaSPeter Tyser_except_start:
4037e4dafaSPeter Tyser	movhi	et, %hi(_exception)
4137e4dafaSPeter Tyser	ori	et, et, %lo(_exception)
4237e4dafaSPeter Tyser	jmp	et
4337e4dafaSPeter Tyser_except_end:
4437e4dafaSPeter Tyser
4537e4dafaSPeter Tyser	/* INTERRUPTS -- for now, all interrupts masked and globally
4637e4dafaSPeter Tyser	 * disabled.
4737e4dafaSPeter Tyser	 */
4837e4dafaSPeter Tyser	wrctl	ienable, r0		/* All disabled	*/
4937e4dafaSPeter Tyser
5037e4dafaSPeter Tyser	/* DCACHE INIT -- if dcache not implemented, initd behaves as
5137e4dafaSPeter Tyser	 * nop.
5237e4dafaSPeter Tyser	 */
5337e4dafaSPeter Tyser	movhi	r4, %hi(CONFIG_SYS_DCACHELINE_SIZE)
5437e4dafaSPeter Tyser	ori	r4, r4, %lo(CONFIG_SYS_DCACHELINE_SIZE)
5537e4dafaSPeter Tyser	movhi	r5, %hi(CONFIG_SYS_DCACHE_SIZE)
5637e4dafaSPeter Tyser	ori	r5, r5, %lo(CONFIG_SYS_DCACHE_SIZE)
5737e4dafaSPeter Tyser	mov	r6, r0
5837e4dafaSPeter Tyser1:	initd	0(r6)
5937e4dafaSPeter Tyser	add	r6, r6, r4
6037e4dafaSPeter Tyser	bltu	r6, r5, 1b
6137e4dafaSPeter Tyser
6237e4dafaSPeter Tyser	/* RELOCATE CODE, DATA & COMMAND TABLE -- the following code
6337e4dafaSPeter Tyser	 * assumes code, data and the command table are all
6437e4dafaSPeter Tyser	 * contiguous. This lets us relocate everything as a single
6537e4dafaSPeter Tyser	 * block. Make sure the linker script matches this ;-)
6637e4dafaSPeter Tyser	 */
6737e4dafaSPeter Tyser	nextpc	r4
6837e4dafaSPeter Tyser_cur:	movhi	r5, %hi(_cur - _start)
6937e4dafaSPeter Tyser	ori	r5, r5, %lo(_cur - _start)
7037e4dafaSPeter Tyser	sub	r4, r4, r5		/* r4 <- cur _start */
7137e4dafaSPeter Tyser	mov	r8, r4
7237e4dafaSPeter Tyser	movhi	r5, %hi(_start)
7337e4dafaSPeter Tyser	ori	r5, r5, %lo(_start)	/* r5 <- linked _start */
7437e4dafaSPeter Tyser	beq	r4, r5, 3f
7537e4dafaSPeter Tyser
76*e900298eSThomas Chou	movhi	r6, %hi(CONFIG_SYS_MONITOR_LEN)
77*e900298eSThomas Chou	ori	r6, r6, %lo(CONFIG_SYS_MONITOR_LEN)
78*e900298eSThomas Chou	add	r6, r6, r5
7937e4dafaSPeter Tyser2:	ldwio	r7, 0(r4)
8037e4dafaSPeter Tyser	addi	r4, r4, 4
8137e4dafaSPeter Tyser	stwio	r7, 0(r5)
8237e4dafaSPeter Tyser	addi	r5, r5, 4
8337e4dafaSPeter Tyser	bne	r5, r6, 2b
8437e4dafaSPeter Tyser3:
8537e4dafaSPeter Tyser
8637e4dafaSPeter Tyser	/* JUMP TO RELOC ADDR */
8737e4dafaSPeter Tyser	movhi	r4, %hi(_reloc)
8837e4dafaSPeter Tyser	ori	r4, r4, %lo(_reloc)
8937e4dafaSPeter Tyser	jmp	r4
9037e4dafaSPeter Tyser_reloc:
9137e4dafaSPeter Tyser
9237e4dafaSPeter Tyser	/* COPY EXCEPTION TRAMPOLINE -- copy the tramp to the
9337e4dafaSPeter Tyser	 * exception address. Define CONFIG_ROM_STUBS to prevent
9437e4dafaSPeter Tyser	 * the copy (e.g. exception in flash or in other
9537e4dafaSPeter Tyser	 * softare/firmware component).
9637e4dafaSPeter Tyser	 */
9737e4dafaSPeter Tyser#if !defined(CONFIG_ROM_STUBS)
9837e4dafaSPeter Tyser	movhi	r4, %hi(_except_start)
9937e4dafaSPeter Tyser	ori	r4, r4, %lo(_except_start)
10037e4dafaSPeter Tyser	movhi	r5, %hi(_except_end)
10137e4dafaSPeter Tyser	ori	r5, r5, %lo(_except_end)
10237e4dafaSPeter Tyser	movhi	r6, %hi(CONFIG_SYS_EXCEPTION_ADDR)
10337e4dafaSPeter Tyser	ori	r6, r6, %lo(CONFIG_SYS_EXCEPTION_ADDR)
10437e4dafaSPeter Tyser	beq	r4, r6, 7f	/* Skip if at proper addr */
10537e4dafaSPeter Tyser
10637e4dafaSPeter Tyser6:	ldwio	r7, 0(r4)
10737e4dafaSPeter Tyser	stwio	r7, 0(r6)
10837e4dafaSPeter Tyser	addi	r4, r4, 4
10937e4dafaSPeter Tyser	addi	r6, r6, 4
11037e4dafaSPeter Tyser	bne	r4, r5, 6b
11137e4dafaSPeter Tyser7:
11237e4dafaSPeter Tyser#endif
11337e4dafaSPeter Tyser
11437e4dafaSPeter Tyser	/* STACK INIT -- zero top two words for call back chain.
11537e4dafaSPeter Tyser	 */
11637e4dafaSPeter Tyser	movhi	sp, %hi(CONFIG_SYS_INIT_SP)
11737e4dafaSPeter Tyser	ori	sp, sp, %lo(CONFIG_SYS_INIT_SP)
11837e4dafaSPeter Tyser	addi	sp, sp, -8
11937e4dafaSPeter Tyser	stw	r0, 0(sp)
12037e4dafaSPeter Tyser	stw	r0, 4(sp)
12137e4dafaSPeter Tyser	mov	fp, sp
12237e4dafaSPeter Tyser
12337e4dafaSPeter Tyser	/*
1245ff10aa7SThomas Chou	 * Call board_init_f -- never returns
12537e4dafaSPeter Tyser	 */
1265ff10aa7SThomas Chou	mov	r4, r0
1275ff10aa7SThomas Chou	movhi	r2, %hi(board_init_f@h)
1285ff10aa7SThomas Chou	ori	r2, r2, %lo(board_init_f@h)
1295ff10aa7SThomas Chou	callr	r2
13037e4dafaSPeter Tyser
13137e4dafaSPeter Tyser	/* NEVER RETURNS -- but branch to the _start just
13237e4dafaSPeter Tyser	 * in case ;-)
13337e4dafaSPeter Tyser	 */
13437e4dafaSPeter Tyser	br	_start
13537e4dafaSPeter Tyser
13637e4dafaSPeter Tyser
1375ff10aa7SThomas Chou
1385ff10aa7SThomas Chou/*
1395ff10aa7SThomas Chou * relocate_code -- Nios2 handles the relocation above. But
1405ff10aa7SThomas Chou * the generic board code monkeys with the heap, stack, etc.
1415ff10aa7SThomas Chou * (it makes some assumptions that may not be appropriate
1425ff10aa7SThomas Chou * for Nios). Nevertheless, we capitulate here.
1435ff10aa7SThomas Chou *
1445ff10aa7SThomas Chou * We'll call the board_init_r from here since this isn't
1455ff10aa7SThomas Chou * supposed to return.
1465ff10aa7SThomas Chou *
1475ff10aa7SThomas Chou * void relocate_code (ulong sp, gd_t *global_data,
1485ff10aa7SThomas Chou *			ulong reloc_addr)
1495ff10aa7SThomas Chou *			__attribute__ ((noreturn));
1505ff10aa7SThomas Chou */
1515ff10aa7SThomas Chou	.text
1525ff10aa7SThomas Chou	.global relocate_code
1535ff10aa7SThomas Chou
1545ff10aa7SThomas Chourelocate_code:
1555ff10aa7SThomas Chou	mov	sp, r4		/* Set the new sp */
1565ff10aa7SThomas Chou	mov	r4, r5
1574192b8c3SThomas Chou
1584192b8c3SThomas Chou	/*
1594192b8c3SThomas Chou	 * ZERO BSS/SBSS -- bss and sbss are assumed to be adjacent
1604192b8c3SThomas Chou	 * and between __bss_start and __bss_end.
1614192b8c3SThomas Chou	 */
1624192b8c3SThomas Chou	movhi	r5, %hi(__bss_start)
1634192b8c3SThomas Chou	ori	r5, r5, %lo(__bss_start)
1644192b8c3SThomas Chou	movhi	r6, %hi(__bss_end)
1654192b8c3SThomas Chou	ori	r6, r6, %lo(__bss_end)
1664192b8c3SThomas Chou	beq	r5, r6, 5f
1674192b8c3SThomas Chou
1684192b8c3SThomas Chou4:	stwio	r0, 0(r5)
1694192b8c3SThomas Chou	addi	r5, r5, 4
1704192b8c3SThomas Chou	bne	r5, r6, 4b
1714192b8c3SThomas Chou5:
1724192b8c3SThomas Chou
1735ff10aa7SThomas Chou	movhi	r8, %hi(board_init_r@h)
1745ff10aa7SThomas Chou	ori	r8, r8, %lo(board_init_r@h)
1755ff10aa7SThomas Chou	callr	r8
1765ff10aa7SThomas Chou	ret
1775ff10aa7SThomas Chou
17837e4dafaSPeter Tyser/*
17937e4dafaSPeter Tyser * dly_clks -- Nios2 (like Nios1) doesn't have a timebase in
18037e4dafaSPeter Tyser * the core. For simple delay loops, we do our best by counting
18137e4dafaSPeter Tyser * instruction cycles.
18237e4dafaSPeter Tyser *
18337e4dafaSPeter Tyser * Instruction performance varies based on the core. For cores
18437e4dafaSPeter Tyser * with icache and static/dynamic branch prediction (II/f, II/s):
18537e4dafaSPeter Tyser *
18637e4dafaSPeter Tyser *	Normal ALU (e.g. add, cmp, etc):	1 cycle
18737e4dafaSPeter Tyser *	Branch (correctly predicted, taken):	2 cycles
18837e4dafaSPeter Tyser *	Negative offset is predicted (II/s).
18937e4dafaSPeter Tyser *
19037e4dafaSPeter Tyser * For cores without icache and no branch prediction (II/e):
19137e4dafaSPeter Tyser *
19237e4dafaSPeter Tyser *	Normal ALU (e.g. add, cmp, etc):	6 cycles
19337e4dafaSPeter Tyser *	Branch (no prediction):			6 cycles
19437e4dafaSPeter Tyser *
19537e4dafaSPeter Tyser * For simplicity, if an instruction cache is implemented we
19637e4dafaSPeter Tyser * assume II/f or II/s. Otherwise, we use the II/e.
19737e4dafaSPeter Tyser *
19837e4dafaSPeter Tyser */
19937e4dafaSPeter Tyser	.globl dly_clks
20037e4dafaSPeter Tyser
20137e4dafaSPeter Tyserdly_clks:
20237e4dafaSPeter Tyser
20337e4dafaSPeter Tyser#if (CONFIG_SYS_ICACHE_SIZE > 0)
20437e4dafaSPeter Tyser	subi	r4, r4, 3		/* 3 clocks/loop	*/
20537e4dafaSPeter Tyser#else
20637e4dafaSPeter Tyser	subi	r4, r4, 12		/* 12 clocks/loop	*/
20737e4dafaSPeter Tyser#endif
20837e4dafaSPeter Tyser	bge	r4, r0, dly_clks
20937e4dafaSPeter Tyser	ret
21037e4dafaSPeter Tyser
21137e4dafaSPeter Tyser	.data
21237e4dafaSPeter Tyser	.globl	version_string
21337e4dafaSPeter Tyser
21437e4dafaSPeter Tyserversion_string:
21509c2e90cSAndreas Bießmann	.ascii U_BOOT_VERSION_STRING, "\0"
216