2 * IA-64 specific setjmp/longjmp routines
4 * Inspired by setjmp.s from the FreeBSD kernel.
// Constants 0x1d8 and 0x1e0; neither symbol is referenced in the visible code.
// NOTE(review): presumably jmp_buffer offsets for signal-mask state, going by
// the names and the J_* offset convention used by setjmp/longjmp -- confirm.
46 #define J_SIGMASK 0x1d8
47 #define J_SIGSET 0x1e0
50 // int setjmp(struct jmp_buffer *)
52 // Set up a non-local goto.
56 // setjmp stores the current register set in the jmp_buffer passed
57 // by the caller and returns zero (r8 = r0). Subsequent calls to longjmp will
58 // restore the registers and return non-zero to the same location.
60 // On entry, r32 contains the pointer to the jmp_buffer
//
// Register usage in the visible code:
//   r32         - base of the (re-aligned) save area; later steps to the
//                 J_NATS and J_PFS slots
//   r10, r11    - two store cursors working through alternating slots; each
//                 store post-increments its cursor by the "J_next-J_this"
//                 expression so it lands on that cursor's next slot
//   r14         - caller's ar.unat, kept so it can be put back at the end
//   r2, r3, r16 - temporaries holding the values being stored
// NOTE(review): this listing has gaps; a few instructions the code relies on
// are not visible here and are flagged individually below.
67 // Make sure the buffer is aligned on a 16-byte boundary
69 add r10 = -0x10,r0 ;; // r10 = -16: mask that clears the lower 4 bits
// NOTE(review): the instruction applying this mask to r32 is not visible here -- confirm.
71 add r32 = 0x10, r32;; // move to next 16 byte boundary
73 add r10 = J_PREDS, r32 // r10 -> predicates slot (skips Unats & pfs save area)
// NOTE(review): r11 is used below as the second cursor (presumably starting at
// the J_BSP slot, judging by the first post-increment), but its setup is not
// visible here -- confirm.
76 // save immediate context
78 mov r2 = ar.bsp // r2 = backing store pointer
79 mov r3 = pr // r3 = predicates
83 // read loop count and user Unat (before the spills below modify ar.unat)
85 mov r16 = ar.lc // r16 = loop count register
86 mov r14 = ar.unat // r14 = user Unat; written back to ar.unat at the end
88 st8 [r10] = r3, J_LC-J_PREDS // store predicates; r10 -> J_LC slot
89 st8 [r11] = r2, J_R4-J_BSP // store bsp; r11 advances by J_R4-J_BSP
91 st8 [r10] = r16, J_R5-J_LC // store loop count; r10 -> J_R5 slot
92 st8 [r32] = r14, J_NATS // store user Unat. Note: Unat at the
93 // beginning of the save area; r32 then advances by J_NATS
97 // save preserved general registers & NaT's (st8.spill also records each NaT bit in ar.unat)
99 st8.spill [r11] = r4, J_R6-J_R4
101 st8.spill [r10] = r5, J_R7-J_R5
103 st8.spill [r11] = r6, J_SP-J_R6
105 st8.spill [r10] = r7, J_F3-J_R7 // r10 moves on to the f3 slot
107 st8.spill [r11] = sp, J_F2-J_SP // stack pointer; r11 moves on to the f2 slot
110 // save spilled Unat and pfs registers
112 mov r2 = ar.unat // Unat as left by the spills above
114 st8 [r32] = r2, J_PFS-J_NATS // save unat for spilled regs; r32 advances to the pfs slot
116 st8 [r32] = r15 // save pfs
// NOTE(review): r15 is not loaded in the visible lines; presumably it holds ar.pfs -- confirm.
118 // save floating registers f2-f5 and f16-f31, alternating between the two cursors
120 stf.spill [r11] = f2, J_F4-J_F2
121 stf.spill [r10] = f3, J_F5-J_F3
123 stf.spill [r11] = f4, J_F16-J_F4
124 stf.spill [r10] = f5, J_F17-J_F5
126 stf.spill [r11] = f16, J_F18-J_F16
127 stf.spill [r10] = f17, J_F19-J_F17
129 stf.spill [r11] = f18, J_F20-J_F18
130 stf.spill [r10] = f19, J_F21-J_F19
132 stf.spill [r11] = f20, J_F22-J_F20
133 stf.spill [r10] = f21, J_F23-J_F21
135 stf.spill [r11] = f22, J_F24-J_F22
136 stf.spill [r10] = f23, J_F25-J_F23
138 stf.spill [r11] = f24, J_F26-J_F24
139 stf.spill [r10] = f25, J_F27-J_F25
141 stf.spill [r11] = f26, J_F28-J_F26
142 stf.spill [r10] = f27, J_F29-J_F27
144 stf.spill [r11] = f28, J_F30-J_F28
145 stf.spill [r10] = f29, J_F31-J_F29
147 stf.spill [r11] = f30, J_FPSR-J_F30 // r11 moves on to the fpsr slot
148 stf.spill [r10] = f31, J_B0-J_F31 // size of f31 + fpsr; r10 moves on to the b0 slot
150 // save FPSR register & branch registers
// NOTE(review): the moves that load the branch registers into r2/r3 between
// these stores are not visible here; as listed, r3 was last written from pr
// and r2 from ar.fpsr. Stores for the J_B4/J_B5 slots are also not visible -- confirm.
152 mov r2 = ar.fpsr // save fpsr register
155 st8 [r11] = r2, J_B1-J_FPSR // store fpsr; r11 -> J_B1 slot
156 st8 [r10] = r3, J_B2-J_B0 // fills the J_B0 slot; r10 -> J_B2 slot
160 st8 [r11] = r2, J_B3-J_B1 // fills the J_B1 slot; r11 -> J_B3 slot
161 st8 [r10] = r3, J_B4-J_B2 // fills the J_B2 slot; r10 -> J_B4 slot
165 st8 [r11] = r2, J_B5-J_B3 // fills the J_B3 slot; r11 -> J_B5 slot
174 mov r8 = r0 // return 0 from setjmp
175 mov ar.unat = r14 // restore the caller's Unat captured in r14 before the spills
180 // void longjmp(struct jmp_buffer *, int val)
182 // Perform a non-local goto.
186 // LongJump initializes the register set to the values saved by a
187 // previous 'SetJump' and jumps to the return location saved by that
188 // 'SetJump'. This has the effect of unwinding the stack and returning
189 // for a second time to the 'SetJump'.
197 // Make sure buffer is aligned at 16byte boundary
199 add r10 = -0x10,r0 ;; // mask the lower 4 bits
201 add r32 = 0x10, r32;; // move to next 16 byte boundary
204 // caching the return value as we do invala in the end
206 mov r8 = r33 // return value
209 // get immediate context
211 mov r14 = ar.rsc // get user RSC conf
212 add r10 = J_PFS, r32 // get address of pfs
213 add r11 = J_NATS, r32
215 ld8 r15 = [r10], J_BSP-J_PFS // get pfs
216 ld8 r2 = [r11], J_LC-J_NATS // get unat for spilled regs
220 ld8 r16 = [r10], J_PREDS-J_BSP // get backing store pointer
221 mov ar.rsc = r0 // put RSE in enforced lazy
226 // When returning from longjmp, BSPSTORE and BSP need to be the
227 // same, and all the registers allocated after we did setjmp must
228 // be discarded. Also, we need to generate the RNAT register since
229 // we did not flush the RSE on setjmp.
231 mov r17 = ar.bspstore // get current BSPSTORE
233 cmp.ltu p6,p7 = r17, r16 // is it less than BSP of
234 (p6) br.spnt.few .flush_rse
235 mov r19 = ar.rnat // get current RNAT
237 loadrs // invalidate dirty regs
238 br.sptk.many .restore_rnat // restore RNAT
243 mov r19 = ar.rnat // get current RNAT
244 mov r17 = r16 // current BSPSTORE
248 // check if RNAT is saved between saved BSP and curr BSPSTORE
252 dep r18 = r18,r16,3,6 // get RNAT address
254 cmp.ltu p8,p9 = r18, r17 // RNAT saved on RSE
256 (p8) ld8 r19 = [r18] // get RNAT from RSE
258 mov ar.bspstore = r16 // set new BSPSTORE
260 mov ar.rnat = r19 // restore RNAT
261 mov ar.rsc = r14 // restore RSC conf
264 ld8 r3 = [r11], J_R4-J_LC // get lc register
265 ld8 r2 = [r10], J_R5-J_PREDS // get predicates
270 // restore preserved general registers & NaT's
272 ld8.fill r4 = [r11], J_R6-J_R4
274 ld8.fill r5 = [r10], J_R7-J_R5
275 ld8.fill r6 = [r11], J_SP-J_R6
277 ld8.fill r7 = [r10], J_F2-J_R7
278 ld8.fill sp = [r11], J_F3-J_SP
281 // restore floating registers
283 ldf.fill f2 = [r10], J_F4-J_F2
284 ldf.fill f3 = [r11], J_F5-J_F3
286 ldf.fill f4 = [r10], J_F16-J_F4
287 ldf.fill f5 = [r11], J_F17-J_F5
289 ldf.fill f16 = [r10], J_F18-J_F16
290 ldf.fill f17 = [r11], J_F19-J_F17
292 ldf.fill f18 = [r10], J_F20-J_F18
293 ldf.fill f19 = [r11], J_F21-J_F19
295 ldf.fill f20 = [r10], J_F22-J_F20
296 ldf.fill f21 = [r11], J_F23-J_F21
298 ldf.fill f22 = [r10], J_F24-J_F22
299 ldf.fill f23 = [r11], J_F25-J_F23
301 ldf.fill f24 = [r10], J_F26-J_F24
302 ldf.fill f25 = [r11], J_F27-J_F25
304 ldf.fill f26 = [r10], J_F28-J_F26
305 ldf.fill f27 = [r11], J_F29-J_F27
307 ldf.fill f28 = [r10], J_F30-J_F28
308 ldf.fill f29 = [r11], J_F31-J_F29
310 ldf.fill f30 = [r10], J_FPSR-J_F30
311 ldf.fill f31 = [r11], J_B0-J_F31 ;;
314 // restore branch registers and fpsr
316 ld8 r16 = [r10], J_B1-J_FPSR // get fpsr
317 ld8 r17 = [r11], J_B2-J_B0 // get return pointer
321 ld8 r2 = [r10], J_B3-J_B1
322 ld8 r3 = [r11], J_B4-J_B2
326 ld8 r2 = [r10], J_B5-J_B3
332 ld8 r21 = [r32] // get user unat