1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
|
#include "encoding.h"
#ifdef __riscv64
# define LREG ld
# define SREG sd
#else
# define LREG lw
# define SREG sw
#endif
.text
.globl _start
_start:
li x1, 0
li x2, 0
li x3, 0
li x4, 0
li x5, 0
li x6, 0
li x7, 0
li x8, 0
li x9, 0
li x10,0
li x11,0
li x12,0
li x13,0
li x14,0
li x15,0
li x16,0
li x17,0
li x18,0
li x19,0
li x20,0
li x21,0
li x22,0
li x23,0
li x24,0
li x25,0
li x26,0
li x27,0
li x28,0
li x29,0
li x30,0
li x31,0
#ifdef __riscv64
li a0, SR_U64 | SR_S64
csrs status, a0
#endif
csrc status, SR_PS
# enable fp and accelerator
li a0, SR_EF | SR_EA
csrs status, a0
csrr t0, status
and t1, t0, SR_EA
sw t1, have_vec, t2
## if that didn't stick, we don't have an FPU, so don't initialize it
and t1, t0, SR_EF
beqz t1, 1f
fssr x0
fmv.s.x f0, x0
fmv.s.x f1, x0
fmv.s.x f2, x0
fmv.s.x f3, x0
fmv.s.x f4, x0
fmv.s.x f5, x0
fmv.s.x f6, x0
fmv.s.x f7, x0
fmv.s.x f8, x0
fmv.s.x f9, x0
fmv.s.x f10,x0
fmv.s.x f11,x0
fmv.s.x f12,x0
fmv.s.x f13,x0
fmv.s.x f14,x0
fmv.s.x f15,x0
fmv.s.x f16,x0
fmv.s.x f17,x0
fmv.s.x f18,x0
fmv.s.x f19,x0
fmv.s.x f20,x0
fmv.s.x f21,x0
fmv.s.x f22,x0
fmv.s.x f23,x0
fmv.s.x f24,x0
fmv.s.x f25,x0
fmv.s.x f26,x0
fmv.s.x f27,x0
fmv.s.x f28,x0
fmv.s.x f29,x0
fmv.s.x f30,x0
fmv.s.x f31,x0
1:
la t0, trap_entry
csrw evec, t0
la tp, _end + 63
and tp, tp, -64
# get core id and number of cores
csrr a0, hartid
lw a1, 4(zero)
# give each core 128KB of stack + TLS
#define STKSHIFT 17
sll a2, a0, STKSHIFT
add tp, tp, a2
add sp, a0, 1
sll sp, sp, STKSHIFT
add sp, sp, tp
lui t0, %tprel_hi(tls_start)
add t0, t0, %tprel_lo(tls_start)
sub tp, tp, t0
la t0, _init
csrw epc, t0
sret
trap_entry:
csrw sup0, sp
csrw sup1, t0
csrr t0, status
andi t0, t0, SR_PS
bnez t0, 1f
la sp, kstacktop
1:
addi sp, sp, -272
csrr t0, sup1
SREG x1, 8(sp)
SREG x2, 16(sp)
SREG x3, 24(sp)
SREG x4, 32(sp)
SREG x5, 40(sp)
SREG x6, 48(sp)
SREG x7, 56(sp)
SREG x8, 64(sp)
SREG x9, 72(sp)
SREG x10, 80(sp)
SREG x11, 88(sp)
SREG x12, 96(sp)
SREG x13, 104(sp)
SREG x14, 112(sp)
SREG x15, 120(sp)
SREG x16, 128(sp)
SREG x17, 136(sp)
SREG x18, 144(sp)
SREG x19, 152(sp)
SREG x20, 160(sp)
SREG x21, 168(sp)
SREG x22, 176(sp)
SREG x23, 184(sp)
SREG x24, 192(sp)
SREG x25, 200(sp)
SREG x26, 208(sp)
SREG x27, 216(sp)
SREG x28, 224(sp)
SREG x29, 232(sp)
SREG x30, 240(sp)
SREG x31, 248(sp)
csrr t0, sup0
csrr t1, status
SREG t0, 256(sp)
SREG t1, 264(sp)
csrr a0, cause
csrr a1, epc
mv a2, sp
jal handle_trap
csrw epc, v0
LREG t0, 256(sp)
LREG t1, 264(sp)
csrw sup0, t0
csrw status, t1
LREG x1, 8(sp)
LREG x2, 16(sp)
LREG x3, 24(sp)
LREG x4, 32(sp)
LREG x5, 40(sp)
LREG x6, 48(sp)
LREG x7, 56(sp)
LREG x8, 64(sp)
LREG x9, 72(sp)
LREG x10, 80(sp)
LREG x11, 88(sp)
LREG x12, 96(sp)
LREG x13, 104(sp)
LREG x14, 112(sp)
LREG x15, 120(sp)
LREG x16, 128(sp)
LREG x17, 136(sp)
LREG x18, 144(sp)
LREG x19, 152(sp)
LREG x20, 160(sp)
LREG x21, 168(sp)
LREG x22, 176(sp)
LREG x23, 184(sp)
LREG x24, 192(sp)
LREG x25, 200(sp)
LREG x26, 208(sp)
LREG x27, 216(sp)
LREG x28, 224(sp)
LREG x29, 232(sp)
LREG x30, 240(sp)
LREG x31, 248(sp)
csrr sp, sup0
sret
.bss
.align 4
.skip 4096
kstacktop:
.section .tbss
tls_start:
|