EMBARK/kinclude/boot.S

#include "csr.h"
// Kernel stack: one statically reserved 4096-byte region.
// `stack_top` is loaded into sp by both _start and trap_vector, so the kernel
// always starts from an empty stack whose first push lands just below
// `stack_top`; `stack_bottom` marks the lowest usable address.
// NOTE(review): no section flags are given for .stack - confirm that the
// linker script places this section in writable RAM.
.section    .stack

// Keep stack_top 16-byte aligned (4096 is a multiple of 16): the standard
// RISC-V calling convention expects sp to be 16-byte aligned.
.balign     16
stack_bottom:
.space      4096
stack_top:

// put the startup code in a special section so that the linker can position it at the start of the binary
.section    .text._start

// tell the linker that init is a function located elsewhere
.extern     init
.type       init, @function

.global     _start
_start:
            // ---- trap configuration ----------------------------------------
            // Select the machine-mode interrupt sources that may fire:
            //   mie[7] MTIE - machine timer interrupt
            //   mie[3] MSIE - machine software interrupt
            li      a0, (1 << 7) | (1 << 3)
            csrw    CSR_MIE, a0
            // Install trap_vector as the trap entry point.
            la      a0, trap_vector
            csrw    CSR_MTVEC, a0
            // Only mstatus[7] (MPIE) is set, so that interrupts become enabled
            // by a later mret rather than right here.
            li      a0, (1 << 7)
            csrw    CSR_MSTATUS, a0

            // ---- stack and global pointer ----------------------------------
            // Linker relaxation is disabled around these two loads (gp itself
            // is being set up here).
.option push
.option norelax
            la      sp, stack_top
            la      gp, __global_pointer$
.option pop

            // ---- zero the kernel .bss --------------------------------------
            // memset arguments: a0 = fill word, a1 = start, a2 = end
            li      a0, 0
            la      a1, _bss_start
            la      a2, _bss_end
            jal     ra, memset

            // ---- hand over to the kernel -----------------------------------
            jal     ra, init

            // init came back: request a halt by writing all ones to the halt CSR
            li      t0, -1
            csrw    CSR_HALT, t0
            // If that write does not stop the machine, park here forever.
.Lstart_park:
            j       .Lstart_park

.extern     trap_handle
.type       trap_handle, @function

// trap_vector - machine-mode trap entry point (written to mtvec by _start)
//
// Saves the interrupted context into the current PCB, decodes mcause and calls
//   trap_handle(a0 = interrupt flag, a1 = cause code, a2 = mtval)
// on a freshly reset kernel stack.
//
// On entry mscratch must hold the address of the PCB's `regs` field.
// Layout written here, relative to that address:
//     -4       pc (mepc)
//      0..116  ra, sp, gp, tp, t0-t2, s0, s1, a0-a7, s2-s11, t3-t5
//    120       t6
// mscratch holds the same address again when trap_handle is called.
.align 4
trap_vector:
            // swap t6 with mscratch: t6 = &pcb->regs, mscratch = interrupted t6
            csrrw   t6,  CSR_MSCRATCH, t6
            sw      ra,  0(t6)
            sw      sp,  4(t6)
            sw      gp,  8(t6)
            sw      tp,  12(t6)
            sw      t0,  16(t6)
            sw      t1,  20(t6)
            sw      t2,  24(t6)
            sw      s0,  28(t6)
            sw      s1,  32(t6)
            sw      a0,  36(t6)
            sw      a1,  40(t6)
            sw      a2,  44(t6)
            sw      a3,  48(t6)
            sw      a4,  52(t6)
            sw      a5,  56(t6)
            sw      a6,  60(t6)
            sw      a7,  64(t6)
            sw      s2,  68(t6)
            sw      s3,  72(t6)
            sw      s4,  76(t6)
            sw      s5,  80(t6)
            sw      s6,  84(t6)
            sw      s7,  88(t6)
            sw      s8,  92(t6)
            sw      s9,  96(t6)
            sw      s10, 100(t6)
            sw      s11, 104(t6)
            sw      t3,  108(t6)
            sw      t4,  112(t6)
            sw      t5,  116(t6)
            // a0 is already saved, so it can carry the struct address while
            // t6 is swapped back
            mv      a0,  t6
            csrrw   t6,  CSR_MSCRATCH, t6   // t6 = interrupted t6, mscratch = &pcb->regs
            sw      t6,  120(a0)            // save the interrupted t6
            // save mepc into the pc field located directly in front of regs
            csrr    t6,  CSR_MEPC
            sw      t6,  -4(a0)
            // split mcause into the arguments for trap_handle (RV32: bit 31 is
            // the interrupt flag, the remaining bits are the cause code)
            csrr    a1,  CSR_MCAUSE
            srli    a0,  a1, 31             // a0 = interrupt flag (0 or 1)
            slli    a1,  a1, 1              // a1 = cause code with the
            srli    a1,  a1, 1              //      interrupt flag cleared
            csrr    a2,  CSR_MTVAL          // a2 = mtval
            // switch to the kernel stack and the kernel global pointer; the
            // same gp symbol as in _start is used so both entry paths agree
.option push
.option norelax
            la      sp, stack_top
            la      gp, __global_pointer$
.option pop
            jal     trap_handle
            // No context-restore code follows, so trap_handle is not expected
            // to return. If it ever does, park here instead of falling
            // through into whatever code is placed next.
.Ltrap_park:
            j       .Ltrap_park


// memset - fill a word-aligned memory range with one 32-bit value
//
// NOTE(review): despite the name, the register interface differs from the
// C library memset(dest, c, n) - confirm that no C code (or compiler-generated
// call) relies on the standard signature.
//
//   in:  a0 = 32-bit value to store
//        a1 = start address (inclusive), must be 4-byte aligned
//        a2 = end address   (exclusive), must be 4-byte aligned
//   clobbers: a1 (both variants); t1, t2 (unrolled variant)
//
// Addresses are compared as unsigned values. An empty or inverted range
// (a1 >= a2) stores nothing.
.global     memset
.type       memset, @function
#ifdef __risc_no_ext
// "dumb" memset, selected when __risc_no_ext is defined: one word per
// iteration. Since memset is currently only used at startup, the performance
// implications should be minimal.
memset:
            bgeu    a1, a2, 2f      // empty range => nothing to do
1:
            sw      a0, 0(a1)
            addi    a1, a1, 4
            bltu    a1, a2, 1b
2:
            ret

#else

// "smart" memset, writing 32 (numbytes) bytes per loop iteration.
//
// To prevent overshooting the end, we first calculate how many store
// instructions of the first iteration have to be skipped. This way (a2 - a1)
// is a multiple of numbytes when the loop branch is reached for the first time.
// The math works because every store writes 4 bytes of memory and occupies
// 4 bytes of instruction memory, therefore
//     instruction bytes to skip = write bytes to skip
//                               = numbytes - ((a2 - a1) % numbytes)
// numbytes is a power of two, so the remainder is computed with a mask and no
// multiply/divide instruction is needed.
memset:
            bgeu    a1, a2, 2f      // empty range => nothing to do (the loop
                                    // below always stores at least one word)
            sub     t1, a2, a1      // t1 = a2 - a1
            andi    t1, t1, 31      // t1 = (a2 - a1) % numbytes
            beqz    t1, 1f          // skip 0 bytes? => begin loop
            li      t2, 32          // = numbytes
            sub     t2, t2, t1      // t2 = numbytes - ((a2 - a1) % numbytes)
                                    //    = bytes to skip
            sub     a1, a1, t2      // subtract the skipped bytes from a1 so
                                    // that the store offsets and the
                                    // addi a1, a1, 32 below still line up
// The computed jump relies on every instruction from the auipc to the last
// store being exactly 4 bytes long, so compressed encodings are disabled here.
.option push
.option norvc
            auipc   t1, 0           // t1 = address of this instruction
            add     t1, t1, t2      // add the calculated offset
            jalr    zero, 12(t1)    // jump forward into the store sequence;
                                    // the 12 compensates for the three
                                    // instructions auipc, add, jalr
1:
            sw      a0, 0(a1)
            sw      a0, 4(a1)
            sw      a0, 8(a1)
            sw      a0, 12(a1)
            sw      a0, 16(a1)
            sw      a0, 20(a1)
            sw      a0, 24(a1)
            sw      a0, 28(a1)
            addi    a1, a1, 32
            bltu    a1, a2, 1b
.option pop
2:
            ret
#endif

// this is where instantiated threads return to once they are finished
// thread_finalizer - landing pad that finished threads return to.
// Issues the exit system call: syscall number 5 is passed in a7.
.section    .thread_fini
.global     thread_finalizer
thread_finalizer:
            // NOTE(review): the purpose of this leading nop is not evident
            // from this file; it is kept unchanged.
            nop
            li      a7, 5           // syscall number: exit
            ecall
            // The exit syscall is not expected to return. If it does, park
            // here instead of running past the end of this section.
.Lthread_fini_park:
            j       .Lthread_fini_park
added config options to makefile - now able to build various variations 3 years ago			`#include "csr.h"`
initial commit 3 years ago			`.section .stack`

			`stack_bottom:`
			`.space 4096`
			`stack_top:`

improved scheduling code 3 years ago			`// put the startup code in a special section so that the linker can position it at the start of the binary`
using my own linker now 3 years ago			`.section .text._start`
initial commit 3 years ago
improved scheduling code 3 years ago			`// tell the linker that init is a function located elsewhere`
initial commit 3 years ago			`.extern init`
			`.type init, @function`

			`.global _start`
			`_start:`
improved scheduling code 3 years ago			`// setup mie register, enable timer and software interrupts targeting machine mode`
			`// mie[7] MTIE = 1 - enable timer interrupts`
			`// mie[3] MSIE = 1 - enable software interrupts`
			`li a0, 0x88`
			`csrw CSR_MIE, a0 // write to mie csr`
			`// load trap vector address into a0`
			`la a0, trap_vector`
			`csrw CSR_MTVEC, a0 // write to mtvec csr`
initial commit 3 years ago			`// enable interrupts in mstatus`
improved scheduling code 3 years ago			`// mstatus[07] MPIE = 1 - we want to enable interrupts with mret`
initial commit 3 years ago			`li a0, 0x80`
improved scheduling code 3 years ago			`csrw CSR_MSTATUS, a0 // write to mstatus csr`
initial commit 3 years ago			`.option push`
			`.option norelax`
			`// init sp and gp`
			`la sp, stack_top`
improved scheduling code 3 years ago			`la gp, __global_pointer$`
initial commit 3 years ago			`.option pop`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`// clear kernel bss section`
			`mv a0, zero`
switched to a real linker script 3 years ago			`la a1, _bss_start`
			`la a2, _bss_end`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`jal memset`

added comment for jump to init 3 years ago			`// jump to init`
initial commit 3 years ago			`jal init`
removed trailing whitespaces 3 years ago
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`// halt machine after returning from init`
various imrpovements and implementations on the kernel 3 years ago			`li t0, -1`
			`csrw CSR_HALT, t0`
improved scheduling code 3 years ago			`// if the halt CSR somehow didn't exit immediately trap execution in this infinite loop`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`1:`
			`j 1b`
initial commit 3 years ago
improved scheduling code 3 years ago			`.extern trap_handle`
			`.type trap_handle, @function`

initial commit 3 years ago			`.align 4`
			`trap_vector:`
			`// save all registers into the PCB struct`
			`// switch contents of t6 with contents of mscratch`
			`// mscratch holds the PCBs regs field address`
switched boot.S to use csr.h constants for csr addresses 3 years ago			`csrrw t6, CSR_MSCRATCH, t6`
initial commit 3 years ago			`sw ra, 0(t6)`
			`sw sp, 4(t6)`
			`sw gp, 8(t6)`
			`sw tp, 12(t6)`
			`sw t0, 16(t6)`
			`sw t1, 20(t6)`
			`sw t2, 24(t6)`
			`sw s0, 28(t6)`
			`sw s1, 32(t6)`
			`sw a0, 36(t6)`
			`sw a1, 40(t6)`
			`sw a2, 44(t6)`
			`sw a3, 48(t6)`
			`sw a4, 52(t6)`
			`sw a5, 56(t6)`
			`sw a6, 60(t6)`
			`sw a7, 64(t6)`
			`sw s2, 68(t6)`
			`sw s3, 72(t6)`
			`sw s4, 76(t6)`
			`sw s5, 80(t6)`
			`sw s6, 84(t6)`
			`sw s7, 88(t6)`
			`sw s8, 92(t6)`
			`sw s9, 96(t6)`
			`sw s10, 100(t6)`
			`sw s11, 104(t6)`
			`sw t3, 108(t6)`
			`sw t4, 112(t6)`
			`sw t5, 116(t6)`
			`mv a0, t6 // save struct address to already saved register`
switched boot.S to use csr.h constants for csr addresses 3 years ago			`csrrw t6, CSR_MSCRATCH, t6 // load original t6 register from mscratch`
initial commit 3 years ago			`sw t6, 120(a0) // save original t6 register`
started properly implementing syscall structure 3 years ago			`// save mepc to pc field in pcb`
switched boot.S to use csr.h constants for csr addresses 3 years ago			`csrr t6, CSR_MEPC`
started properly implementing syscall structure 3 years ago			`sw t6, -4(a0)`
			`// load mcause and mtval values in the correct registers for call to trap_handle function`
switched boot.S to use csr.h constants for csr addresses 3 years ago			`csrr a1, CSR_MCAUSE`
initial commit 3 years ago			`srli a0, a1, 31`
			`slli a1, a1, 1`
			`srli a1, a1, 1`
switched boot.S to use csr.h constants for csr addresses 3 years ago			`csrr a2, CSR_MTVAL`
initial commit 3 years ago			`// reinit sp and gp`
			`.option push`
			`.option norelax`
			`la sp, stack_top`
switched to a real linker script 3 years ago			`la gp, _gp`
initial commit 3 years ago			`.option pop`
			`jal trap_handle`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago
added memset for non-rv32m environments 3 years ago
added TextIO module for outputting text 3 years ago			`// make memset global`
			`.global memset`
			`.type memset, @function`
added memset for non-rv32m environments 3 years ago			`#ifdef __risc_no_ext`
			`// "dumb" memset, if RV32M is not present on the target`
			`// since memset is currently only used at startup, the performance implications`
			`// should be minimal.`
			`memset:`
added TextIO module for outputting text 3 years ago			`bge a1, a2, 2f`
added memset for non-rv32m environments 3 years ago			`1:`
added TextIO module for outputting text 3 years ago			`sw a0, 0(a1)`
			`addi a1, a1, 4`
			`blt a1, a2, 1b`
added memset for non-rv32m environments 3 years ago			`2:`
added TextIO module for outputting text 3 years ago			`ret`
added memset for non-rv32m environments 3 years ago
			`#else`

			`// "smart" memset, writing 32 bytes at a time. uses RV32M. If not present,`
			`// the "dumb" fallback above is used.`

implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`// write a0 to memory starting at a1, until a2 (both must be four byte aligned)`
			`// this uses a loop which writes 32 (numbytes) bytes at a time`
removed trailing whitespaces 3 years ago			`// to prevent overshooting the end, we first calulate how many instructions to`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`// skip of the first iteration of the loop. this way, (a2 - a1) is a multiple of`
removed trailing whitespaces 3 years ago			`// (numbytes) when we reach the blt instruction for the first time.`
			`// this math works so good, because we write 4 bytes of mem, in 4 bytes of`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`// instructions. Therefore instruction bytes to skip = write bytes to skip`
			`// bytes to skip = numbytes - ((a2 - a1) % numbytes)`
added config options to makefile - now able to build various variations 3 years ago			`memset:`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`sub t1, a2, a1 // t1 = a2 - a1`
			`li t2, 32 // = numbytes`
			`rem t1, t1, t2 // t1 = (a2 - a1) % numbytes`
			`beq zero, t1, 1f // skip 0 bytes? => begin loop`
			`sub t2, t2, t1 // t2 = numbytes - ((a2 - a1) % numbytes)`
			`// = bytes to skip`
			`sub a1, a1, t2 // subtract skipped bytes from a2`
			`// to account for the skipped instruction`
			`// when we reach the addi, a1, a1, 32 inst.`
added config options to makefile - now able to build various variations 3 years ago			`auipc t1, 0 // get current address`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`add t1, t2, t1 // add calulated offset`
			`jalr zero, t1, 12 // skip the instructions by forward-jumping`
removed trailing whitespaces 3 years ago			`// the 12 is added to compensate for the`
added config options to makefile - now able to build various variations 3 years ago			`// three instructions auipc, add, jalr`
implemented a smart memset routine, use it to clear bss, and halt after returning from init 3 years ago			`1:`
			`sw a0, 0(a1)`
			`sw a0, 4(a1)`
			`sw a0, 8(a1)`
			`sw a0, 12(a1)`
			`sw a0, 16(a1)`
			`sw a0, 20(a1)`
			`sw a0, 24(a1)`
			`sw a0, 28(a1)`
			`addi a1, a1, 32`
			`blt a1, a2, 1b`
added config options to makefile - now able to build various variations 3 years ago			`ret`
various imrpovements and implementations on the kernel 3 years ago			`#endif`

			`// this is where instantiated threads return to once they are finished`
			`.section .thread_fini`
			`.global thread_finalizer`
			`thread_finalizer:`
			`// just a simple exit syscall`
			`nop`
			`li a7, 5`
			`ecall`