3 * Register dump and debugging support
5 * (c) 2019 Straylight/Edgeware
8 /*----- Licensing notice --------------------------------------------------*
10 * This file is part of Catacomb.
12 * Catacomb is free software: you can redistribute it and/or modify it
13 * under the terms of the GNU Library General Public License as published
14 * by the Free Software Foundation; either version 2 of the License, or
15 * (at your option) any later version.
17 * Catacomb is distributed in the hope that it will be useful, but
18 * WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * Library General Public License for more details.
22 * You should have received a copy of the GNU Library General Public
23 * License along with Catacomb. If not, write to the Free Software
24 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
28 #ifndef CATACOMB_REGDUMP_H
29 #define CATACOMB_REGDUMP_H
35 /*----- Header files ------------------------------------------------------*/
39 #ifndef ENABLE_ASM_DEBUG
40 # error "Assembler-level debug disabled by `configure' script."
44 # include "asm-common.h"
47 # include <mLib/bits.h>
50 /*----- Random utilities --------------------------------------------------*/
53 _(0) _(1) _(2) _(3) _(4) _(5) _(6) _(7)
55 _(8) _(9) _(10) _(11) _(12) _(13) _(14) _(15)
57 #define DO16(_) DO8(_) DOHI8(_)
61 _(16) _(17) _(18) _(19) _(20) _(21) _(22) _(23) \
62 _(24) _(25) _(26) _(27) _(28) _(29) _(30) _(31)
64 /*----- Common data structures --------------------------------------------*/
68 /* The following are good on our assembler targets. */
69 typedef signed char int8;
72 #if LONG_MAX >> 31 > 0x7fffffff
75 typedef long long int64;
77 typedef float float32;
78 typedef double float64;
79 typedef long double float80;
81 #if CPUFAM_X86 || CPUFAM_ARMEL
82 # define PTR32 void *p;
85 #if CPUFAM_AMD64 || CPUFAM_ARM64
87 # define PTR64 void *p;
90 #define SIMD_COMMON(wd) \
102 union gp32 { uint32 u32; int32 i32; PTR32 };
103 union gp64 { uint64 u64; int64 i64; PTR64 };
107 /*----- Format word layout ------------------------------------------------*/
109 #define REGF_IXMASK 0x000000ff
110 #define REGF_IXSHIFT 0
111 /* The index into the vector indicated by `REGF_SRCMASK', if applicable. */
113 #define REGF_FMTMASK 0x0000ff00
114 #define REGF_FMTSHIFT 8
115 #define REGF_HEX 0x00000100
116 #define REGF_CHR 0x00000200
117 #define REGF_FLT 0x00000400
118 #define REGF_UNSGN 0x00000800
119 #define REGF_SGN 0x00001000
120 /* How to format the value(s) found. */
122 #define REGF_TYMASK 0x00ff0000
123 #define REGF_TYSHIFT 16
124 #define REGF_80 0x00010000
125 #define REGF_64 0x00020000
126 #define REGF_32 0x00040000
127 #define REGF_16 0x00080000
128 #define REGF_8 0x00100000
129 /* Size of the value(s) to dump. */
131 #define REGF_SRCMASK 0x0f000000
132 #define REGSRC_ABS 0x01000000 /* absolute address */
133 #define REGSRC_GP 0x02000000 /* general-purpose register */
134 #define REGSRC_FP 0x03000000 /* floating-point register */
135 #define REGSRC_SIMD 0x04000000 /* SIMD vector register */
136 #define REGSRC_STMMX 0x05000000 /* x86-specific: x87/MMX register */
137 #define REGSRC_SEG 0x06000000 /* x86-specific: segment register */
138 #define REGSRC_NONE 0x0f000000 /* just a message */
139 /* Where to find the values. */
141 #define REGF_WDMASK 0xf0000000
142 #define REGF_WDSHIFT 28
143 /* If we're to print a scalar, this is zero; otherwise, log_2 of the vector
144 * register width, in bits.
147 /*----- x86 and AMD64 -----------------------------------------------------*/
149 #if CPUFAM_X86 || CPUFAM_AMD64
151 #define REGIX_FLAGS 0
163 # define REGIX_GPLIM 11
168 # define REGIX_R10 13
169 # define REGIX_R11 14
170 # define REGIX_R12 15
171 # define REGIX_R13 16
172 # define REGIX_R14 17
173 # define REGIX_R15 18
174 # define REGIX_GPLIM 19
183 #define REGIX_SEGLIM 6
185 #define REGIX_FPFLAGS 255
190 typedef union gp32 gpreg;
193 typedef union gp64 gpreg;
197 gpreg gp[REGIX_GPLIM];
198 uint16 seg[REGIX_SEGLIM];
203 #if FLT_RADIX == 2 && LDBL_MANT_DIG == 64
206 unsigned char _pad[16];
209 union xmm { SIMD_COMMON(128); };
210 union ymm { SIMD_COMMON(256); };
211 union vreg { union xmm v128[2]; union ymm v256; };
221 unsigned short fpu_cs;
222 unsigned short _res1;
224 unsigned short fpu_ds;
225 unsigned short _res2;
228 unsigned long long fpu_ip;
229 unsigned long long fpu_dp;
232 unsigned int mxcsr_mask;
234 union stmmx stmmx[8];
238 unsigned char _pad0[8*16];
244 unsigned char _pad1[96];
250 unsigned char _pad0[8*16];
260 struct xsave_avx *avx;
265 .extern regdump_gpsave
266 .extern regdump_xtsave
267 .extern regdump_xtrstr
268 .extern regdump_gprstr
272 regmap_avx = 2*WORDSZ
273 regmap_size = 3*WORDSZ
275 #define REGDEF_GPX86_COMMON(rn, ix) \
276 regsrc.e##rn = REGSRC_GP | ix; \
277 regty.e##rn = REGF_32; \
278 regfmt.e##rn = REGF_HEX; \
279 regsrc.r##rn = REGSRC_GP | ix; \
280 regty.r##rn = REGF_64; \
281 regfmt.r##rn = REGF_HEX
283 #define REGDEF_GPX86_ABCD(rn, RN) \
284 regsrc.rn##hl = (4 << REGF_WDSHIFT) | REGSRC_GP | REGIX_##RN##X; \
285 regty.rn##hl = REGF_8; \
286 regfmt.rn##hl = REGF_HEX; \
287 regsrc.rn##l = REGSRC_GP | REGIX_##RN##X; \
288 regty.rn##l = REGF_8; \
289 regfmt.rn##l = REGF_HEX; \
290 regsrc.rn##x = REGSRC_GP | REGIX_##RN##X; \
291 regty.rn##x = REGF_16; \
292 regfmt.rn##x = REGF_HEX; \
293 REGDEF_GPX86_COMMON(rn##x, REGIX_##RN##X)
294 REGDEF_GPX86_ABCD(a, A)
295 REGDEF_GPX86_ABCD(b, B)
296 REGDEF_GPX86_ABCD(c, C)
297 REGDEF_GPX86_ABCD(d, D)
299 regsrc.eflags = REGSRC_GP | REGIX_FLAGS
300 regty.eflags = REGF_32
304 regsrc.rflags = REGSRC_GP | REGIX_FLAGS
305 regty.rflags = REGF_64
309 #define REGDEF_GPX86_XP(rn, RN) \
310 regsrc.rn##l = REGSRC_GP | REGIX_##RN; \
311 regty.rn##l = REGF_8; \
312 regfmt.rn##l = REGF_HEX; \
313 regsrc.rn = REGSRC_GP | REGIX_##RN; \
314 regty.rn = REGF_16; \
315 regfmt.rn = REGF_HEX; \
316 REGDEF_GPX86_COMMON(rn, REGIX_##RN)
317 REGDEF_GPX86_XP(ip, IP)
318 REGDEF_GPX86_XP(si, SI)
319 REGDEF_GPX86_XP(di, DI)
320 REGDEF_GPX86_XP(bp, BP)
321 REGDEF_GPX86_XP(sp, SP)
324 # define REGDEF_GPAMD64(i) \
325 regsrc.r##i##b = REGSRC_GP | REGIX_R##i; \
326 regty.r##i##b = REGF_8; \
327 regfmt.r##i##b = REGF_HEX; \
328 regsrc.r##i##w = REGSRC_GP | REGIX_R##i; \
329 regty.r##i##w = REGF_16; \
330 regfmt.r##i##w = REGF_HEX; \
331 regsrc.r##i##d = REGSRC_GP | REGIX_R##i; \
332 regty.r##i##d = REGF_32; \
333 regfmt.r##i##d = REGF_HEX; \
334 regsrc.r##i = REGSRC_GP | REGIX_R##i; \
335 regty.r##i = REGF_64; \
336 regfmt.r##i = REGF_HEX;
337 DOHI8(REGDEF_GPAMD64)
340 #define REGDEF_SEG(rn, RN) \
341 regsrc.rn = REGSRC_SEG | REGIX_##RN; \
342 regty.rn = REGF_16; \
351 #define REGDEF_STMMX(i) \
352 regsrc.st##i = REGSRC_STMMX | i; \
353 regty.st##i = REGF_80; \
354 regfmt.st##i = REGF_FLT; \
355 regsrc.mm##i = (6 << REGF_WDSHIFT) | REGSRC_STMMX | i; \
356 regty.mm##i = REGF_16; \
357 regfmt.mm##i = REGF_HEX;
360 #define REGDEF_SIMD(i) \
361 regsrc.xmm##i = (7 << REGF_WDSHIFT) | REGSRC_SIMD | i; \
362 regty.xmm##i = REGF_32; \
363 regfmt.xmm##i = REGF_HEX; \
364 regsrc.ymm##i = (8 << REGF_WDSHIFT) | REGSRC_SIMD | i; \
365 regty.ymm##i = REGF_32; \
366 regfmt.ymm##i = REGF_HEX;
372 REGDUMP_GPSIZE = REGIX_GPLIM*WORDSZ + REGIX_SEGLIM*2
374 # if CPUFAM_AMD64 && ABI_SYSV
375 REGDUMP_SPADJ = REGDUMP_GPSIZE + WORDSZ + 128
377 REGDUMP_SPADJ = REGDUMP_GPSIZE + WORDSZ
380 .macro _saveregs addr=nil
381 // Save the registers, leaving r/ebp pointing to the register map.
383 // Stash r/eax. This is bletcherous: hope we don't get a signal in
384 // the next few instructions.
385 mov [SP - REGDUMP_SPADJ + (REGIX_AX - 1)*WORDSZ], AX
387 .ifnes "\addr", "nil"
388 // Collect the effective address for the following dump, leaving it
389 // in the `addr' slot of the dump.
391 mov [SP - REGDUMP_SPADJ + (REGIX_ADDR - 1)*WORDSZ], AX
394 // Make space for the register save area. On AMD64 with System/V
395 // ABI, also skip the red zone. Use `lea' here to preserve the
397 lea SP, [SP - REGDUMP_SPADJ]
399 // Save flags and general-purpose registers. On 32-bit x86, we save
400 // ebx here and establish a GOT pointer here for the benefit of the
401 // PLT-indirect calls made later on.
404 mov [SP + 4*REGIX_BX], ebx
407 callext F(regdump_gpsave)
409 // Make space for the extended registers.
411 callext F(regdump_xtsave)
413 // Prepare for calling back into C. On 32-bit x86, leave space for
414 // the arguments and set up the GOT pointer; on AMD64 Windows, leave
415 // the `shadow space' for the called-function's arguments. Also,
416 // forcibly align the stack pointer to a 16-byte boundary.
426 // Restore registers.
428 // We assume r/ebp still points to the register map.
429 callext F(regdump_xtrstr)
431 callext F(regdump_gprstr)
433 lea SP, [SP + REGDUMP_SPADJ]
458 mov AX, [BP + regmap_gp]
460 mov eax, [eax + REGIX_ADDR*WORDSZ]
463 mov rdi, [rax + REGIX_ADDR*WORDSZ]
465 mov rcx, [rax + REGIX_ADDR*WORDSZ]
472 mov dword ptr [SP + 4], 0
480 lea eax, [INTADDR(.L$_reglbl$\@)]
483 lea rsi, [INTADDR(.L$_reglbl$\@)]
485 lea rdx, [INTADDR(.L$_reglbl$\@)]
496 mov dword ptr [SP + 8], \arg
508 /*----- ARM32 -------------------------------------------------------------*/
513 extern unsigned regdump__flags;
518 #define REGIX_CPSR 16
519 #define REGIX_ADDR 17
520 #define REGIX_GPLIM 18
522 #define REGIX_FPSCR 255
526 union neon64 { SIMD_COMMON(64); };
527 union neon128 { SIMD_COMMON(128); };
529 struct gpsave { union gp32 r[REGIX_GPLIM]; };
548 .extern regdump_gpsave
549 .extern regdump_xtsave
550 .extern regdump_xtrstr
551 .extern regdump_gprstr
557 #define REGDEF_GP(i) \
558 regsrc.r##i = REGSRC_GP | i; \
559 regty.r##i = REGF_32; \
560 regfmt.r##i = REGF_HEX;
563 regsrc.cpsr = REGSRC_GP | REGIX_CPSR
567 #define REGDEF_NEONS(i) \
568 regsrc.s##i = REGSRC_FP | i; \
569 regty.s##i = REGF_32; \
570 regfmt.s##i = REGF_FLT;
573 #define REGDEF_NEOND(i) \
574 regsrc.d##i = (6 << REGF_WDSHIFT) | REGSRC_FP | i; \
575 regty.d##i = REGF_32; \
576 regfmt.d##i = REGF_HEX;
579 #define REGDEF_NEONQ(i) \
580 regsrc.q##i = (7 << REGF_WDSHIFT) | REGSRC_FP | i; \
581 regty.q##i = REGF_32; \
582 regfmt.q##i = REGF_HEX;
585 regsrc.fpscr = REGSRC_FP | REGIX_FPSCR
586 regty.fpscr = REGF_32
589 REGDUMP_GPSIZE = 4*REGIX_GPLIM
590 REGDUMP_FPSIZE_D16 = 8 + 16*8
591 REGDUMP_FPSIZE_D32 = 8 + 32*8
593 .macro _saveregs base=nil, off=#0
594 // Save the registers, leaving r4 pointing to the register map.
596 // Stash r14. This is bletcherous: hope we don't get a signal in
597 // the next few instructions.
598 str r14, [r13, #-REGDUMP_GPSIZE + 14*4]
600 .ifnes "\base,\off", "nil,#0"
601 // Collect the effective address for the following dump, leaving it
602 // in the `addr' slot of the dump.
603 .ifeqs "\base", "nil"
608 str r14, [r13, #-REGDUMP_GPSIZE + 4*REGIX_ADDR]
611 // Make space for the register save area.
612 sub r13, r13, #REGDUMP_GPSIZE
614 // Save flags and general-purpose registers.
615 str r12, [r13, #4*12]
618 // Make space for the extended registers.
622 // Prepare for calling back into C.
630 // Restore registers.
632 // We assume r4 still points to the register map.
636 ldr r14, [r13, #14*4]
637 add r13, r13, #REGDUMP_GPSIZE
653 adrl r1, .L$_reglbl$\@
662 movw r2, #(\arg)&0xffff
663 movt r2, #((\arg) >> 16)&0xffff
670 /*----- ARM64 -------------------------------------------------------------*/
674 #define REGIX_NZCV 32
676 #define REGIX_ADDR 34
677 #define REGIX_GPLIM 36
679 #define REGIX_FPFLAGS 255
683 union v128 { SIMD_COMMON(128); };
685 struct gpsave { union gp64 r[REGIX_GPLIM]; };
699 .extern regdump_gpsave
700 .extern regdump_xtsave
701 .extern regdump_xtrstr
702 .extern regdump_gprstr
708 #define REGDEF_GP(i) \
709 regsrc.x##i = REGSRC_GP | i; \
710 regty.x##i = REGF_64; \
711 regfmt.x##i = REGF_HEX; \
712 regsrc.w##i = REGSRC_GP | i; \
713 regty.w##i = REGF_32; \
714 regfmt.w##i = REGF_HEX;
717 regsrc.sp = REGSRC_GP | 31
721 regsrc.pc = REGSRC_GP | REGIX_PC
725 regsrc.nzcv = REGSRC_GP | REGIX_NZCV
729 #define REGDEF_FP(i) \
730 regsrc.b##i = REGSRC_FP | i; \
731 regty.b##i = REGF_8; \
732 regfmt.b##i = REGF_HEX; \
733 regsrc.h##i = REGSRC_FP | i; \
734 regty.h##i = REGF_16; \
735 regfmt.h##i = REGF_HEX; \
736 regsrc.s##i = REGSRC_FP | i; \
737 regty.s##i = REGF_32; \
738 regfmt.s##i = REGF_FLT; \
739 regsrc.d##i = REGSRC_FP | i; \
740 regty.d##i = REGF_64; \
741 regfmt.d##i = REGF_FLT; \
742 regsrc.v##i = (7 << REGF_WDSHIFT) | REGSRC_FP | i; \
743 regty.v##i = REGF_32; \
744 regfmt.v##i = REGF_HEX;
747 regsrc.fpflags = REGSRC_FP | REGIX_FPFLAGS
748 regty.fpflags = REGF_32
751 REGDUMP_GPSIZE = 8*REGIX_GPLIM
752 REGDUMP_FPSIZE = 16 + 16 + 32*16
754 .macro _saveregs base=nil, off=#0
755 // Save the registers, leaving x20 pointing to the register map.
757 // Stash x30. This is bletcherous: hope we don't get a signal in
758 // the next few instructions.
759 str x30, [sp, #-REGDUMP_GPSIZE + 30*8]
761 .ifnes "\base,\off", "nil,#0"
762 // Collect the effective address for the following dump, leaving it
763 // in the `addr' slot of the dump.
764 .ifeqs "\base", "nil"
769 str x30, [sp, #-REGDUMP_GPSIZE + 8*REGIX_ADDR]
772 // Make space for the register save area.
773 sub sp, sp, #REGDUMP_GPSIZE
775 // Save flags and general-purpose registers.
776 stp x16, x17, [sp, #8*16]
779 // Make space for the extended registers.
785 // Restore registers.
787 // We assume x21 still points to the register map.
792 add sp, sp, #REGDUMP_GPSIZE
808 adr x1, .L$_reglbl$\@
817 movz w2, #(\arg)&0xffff
818 movk w2, #((\arg) >> 16)&0xffff, lsl #16
825 /*----- Functions provided ------------------------------------------------*/
827 /* --- @regdump_init@ --- *
833 * Use: Performs one-time initialization for register dumping. In
834 * particular, this performs CPU feature detection on platforms
835 * where that is a difficult task: without it, registers
836 * corresponding to optional architectural features can be
837 * neither printed nor preserved by the register-dump machinery.
841 extern void regdump_init(void);
844 /* --- @regdump@ --- *
846 * Arguments: @const void *base@ = pointer to base structure, corresponding
847 * to the @REGF_SRCMASK@ part of @f@
848 * @const char *lbl@ = label to print
849 * @uint32 f@ = format control word; see @REGF_...@
853 * Use: Dump a register value, or chunk of memory.
855 * This function is not usually called directly; instead, use
856 * the `reg' or `mem' assembler macros.
860 extern void regdump(const void *base, const char *lbl, uint32 f);
865 /* --- @regdump_gp@, @regdump_fp@, @regdump_simd@ --- *
867 * Arguments: @const struct regmap *map@ = pointer to register map
871 * Use: Dump the general-purpose/floating-point/SIMD registers.
873 * This function is not usually called directly; instead, use
874 * the `regdump' assembler macro.
878 extern void regdump_gp(const struct regmap */*map*/);
879 extern void regdump_fp(const struct regmap */*map*/);
880 extern void regdump_simd(const struct regmap */*map*/);
887 /* --- @regdump_freshline@ --- *
893 * Use: Begin a fresh line of output.
897 extern void regdump_freshline(void);
899 .extern regdump_freshline
902 /*----- Main user interface macros ----------------------------------------*/
908 callext F(regdump_freshline)
916 _regfmt REGSRC_NONE | (1 << REGF_WDSHIFT)
921 .macro reg lbl, rn, fmt=0
925 .L$reg.fmt$\@ = regsrc.\rn | \fmt | \
926 (((\fmt®F_TYMASK) == 0)®ty.\rn) | \
927 (((\fmt®F_FMTMASK) == 0)®fmt.\rn)
928 _regfmt .L$reg.fmt$\@
933 .macro mem lbl, addr, fmt=0
937 .L$mem.fmt$\@ = REGSRC_ABS | \fmt | \
938 (((\fmt®F_TYMASK) == 0)®F_32) | \
939 (((\fmt®F_FMTMASK) == 0)®F_HEX)
940 _regfmt .L$mem.fmt$\@
945 .macro regdump gp=nil, fp=nil, simd=nil
949 callext F(regdump_gp)
953 callext F(regdump_fp)
955 .ifnes "\simd", "nil"
957 callext F(regdump_simd)
964 /*----- That's all, folks -------------------------------------------------*/