diff options
| author | bhgv <bhgv.empire@gmail.com> | 2018-03-01 16:54:45 +0200 |
|---|---|---|
| committer | bhgv <bhgv.empire@gmail.com> | 2018-03-01 16:54:45 +0200 |
| commit | b786f20bbab5a59046aa78a2c6c2a11536497202 (patch) | |
| tree | 0851ecdec889eb9b7ba3751cc04d4f0b474e4a9e /utils/libmach | |
inferno-os tree was separated from the inferno-os-android (separated from the Android driver)
Diffstat (limited to 'utils/libmach')
46 files changed, 14646 insertions, 0 deletions
diff --git a/utils/libmach/4.c b/utils/libmach/4.c new file mode 100644 index 0000000..3b1f38d --- /dev/null +++ b/utils/libmach/4.c @@ -0,0 +1,139 @@ +/* + * mips definition + */ +#include <lib9.h> +#include <bio.h> +#include "ureg4.h" +#include "mach.h" + +#define FPREGBYTES 4 +#define REGOFF(x) (ulong)(&((struct Ureg *) 0)->x) + +#define SP REGOFF(u0.sp) +#define PC REGOFF(pc) +#define R1 REGOFF(hr1) +#define R31 REGOFF(hr31) +#define FP_REG(x) (R1+8+FPREGBYTES*(x)) + +#define REGSIZE sizeof(struct Ureg) +#define FPREGSIZE (FPREGBYTES*33) + +Reglist mips2reglist[] = { + {"STATUS", REGOFF(status), RINT|RRDONLY, 'X'}, + {"CAUSE", REGOFF(cause), RINT|RRDONLY, 'X'}, + {"BADVADDR", REGOFF(badvaddr), RINT|RRDONLY, 'X'}, + {"TLBVIRT", REGOFF(tlbvirt), RINT|RRDONLY, 'X'}, + {"HI", REGOFF(hhi), RINT|RRDONLY, 'Y'}, + {"LO", REGOFF(hlo), RINT|RRDONLY, 'Y'}, + {"PC", PC, RINT, 'X'}, + {"SP", SP, RINT, 'X'}, + {"R31", R31, RINT, 'Y'}, + {"R30", REGOFF(hr30), RINT, 'Y'}, + {"R28", REGOFF(hr28), RINT, 'Y'}, + {"R27", REGOFF(hr27), RINT, 'Y'}, + {"R26", REGOFF(hr26), RINT, 'Y'}, + {"R25", REGOFF(hr25), RINT, 'Y'}, + {"R24", REGOFF(hr24), RINT, 'Y'}, + {"R23", REGOFF(hr23), RINT, 'Y'}, + {"R22", REGOFF(hr22), RINT, 'Y'}, + {"R21", REGOFF(hr21), RINT, 'Y'}, + {"R20", REGOFF(hr20), RINT, 'Y'}, + {"R19", REGOFF(hr19), RINT, 'Y'}, + {"R18", REGOFF(hr18), RINT, 'Y'}, + {"R17", REGOFF(hr17), RINT, 'Y'}, + {"R16", REGOFF(hr16), RINT, 'Y'}, + {"R15", REGOFF(hr15), RINT, 'Y'}, + {"R14", REGOFF(hr14), RINT, 'Y'}, + {"R13", REGOFF(hr13), RINT, 'Y'}, + {"R12", REGOFF(hr12), RINT, 'Y'}, + {"R11", REGOFF(hr11), RINT, 'Y'}, + {"R10", REGOFF(hr10), RINT, 'Y'}, + {"R9", REGOFF(hr9), RINT, 'Y'}, + {"R8", REGOFF(hr8), RINT, 'Y'}, + {"R7", REGOFF(hr7), RINT, 'Y'}, + {"R6", REGOFF(hr6), RINT, 'Y'}, + {"R5", REGOFF(hr5), RINT, 'Y'}, + {"R4", REGOFF(hr4), RINT, 'Y'}, + {"R3", REGOFF(hr3), RINT, 'Y'}, + {"R2", REGOFF(hr2), RINT, 'Y'}, + {"R1", REGOFF(hr1), RINT, 'Y'}, + {"F0", FP_REG(0), RFLT, 'F'}, + 
{"F1", FP_REG(1), RFLT, 'f'}, + {"F2", FP_REG(2), RFLT, 'F'}, + {"F3", FP_REG(3), RFLT, 'f'}, + {"F4", FP_REG(4), RFLT, 'F'}, + {"F5", FP_REG(5), RFLT, 'f'}, + {"F6", FP_REG(6), RFLT, 'F'}, + {"F7", FP_REG(7), RFLT, 'f'}, + {"F8", FP_REG(8), RFLT, 'F'}, + {"F9", FP_REG(9), RFLT, 'f'}, + {"F10", FP_REG(10), RFLT, 'F'}, + {"F11", FP_REG(11), RFLT, 'f'}, + {"F12", FP_REG(12), RFLT, 'F'}, + {"F13", FP_REG(13), RFLT, 'f'}, + {"F14", FP_REG(14), RFLT, 'F'}, + {"F15", FP_REG(15), RFLT, 'f'}, + {"F16", FP_REG(16), RFLT, 'F'}, + {"F17", FP_REG(17), RFLT, 'f'}, + {"F18", FP_REG(18), RFLT, 'F'}, + {"F19", FP_REG(19), RFLT, 'f'}, + {"F20", FP_REG(20), RFLT, 'F'}, + {"F21", FP_REG(21), RFLT, 'f'}, + {"F22", FP_REG(22), RFLT, 'F'}, + {"F23", FP_REG(23), RFLT, 'f'}, + {"F24", FP_REG(24), RFLT, 'F'}, + {"F25", FP_REG(25), RFLT, 'f'}, + {"F26", FP_REG(26), RFLT, 'F'}, + {"F27", FP_REG(27), RFLT, 'f'}, + {"F28", FP_REG(28), RFLT, 'F'}, + {"F29", FP_REG(29), RFLT, 'f'}, + {"F30", FP_REG(30), RFLT, 'F'}, + {"F31", FP_REG(31), RFLT, 'f'}, + {"FPCR", FP_REG(32), RFLT, 'X'}, + { 0 } +}; + + /* the machine description */ +Mach mmips2be = +{ + "mips2", + MMIPS2, /* machine type */ + mips2reglist, /* register set */ + REGSIZE, /* number of bytes in reg set */ + FPREGSIZE, /* number of bytes in fp reg set */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "R31", /* name of link register */ + "setR30", /* static base register name */ + 0, /* SB value */ + 0x1000, /* page size */ + 0xC0000000, /* kernel base */ + 0x40000000, /* kernel text mask */ + 4, /* quantization of pc */ + 4, /* szaddr */ + 8, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; + +Mach mmips2le = +{ + "mips2", + NMIPS2, /* machine type */ + mips2reglist, /* register set */ + REGSIZE, /* number of bytes in reg set */ + FPREGSIZE, /* number of bytes in fp reg set */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "R31", /* name of link register */ + "setR30", /* static base register name */ + 0, /* SB value */ + 
0x1000, /* page size */ + 0xC0000000, /* kernel base */ + 0x40000000, /* kernel text mask; NOTE(review): marm and mamd64 list a "user stack top" entry after this one, this initializer does not -- confirm against Mach in mach.h */ + 4, /* quantization of pc */ + 4, /* szaddr */ + 8, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git a/utils/libmach/4db.c b/utils/libmach/4db.c new file mode 100644 index 0000000..d3fa97a --- /dev/null +++ b/utils/libmach/4db.c @@ -0,0 +1,57 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +/* + * Mips-specific debugger interface (routines declared here, defined in another file) + */ + +char *mipsexcep(Map*, Rgetter); +int mipsfoll(Map*, ulong, Rgetter, ulong*); +int mipsinst(Map*, ulong, char, char*, int); +int mipsdas(Map*, ulong, char*, int); +int mipsinstlen(Map*, ulong); +/* + * Debugger interface: MIPS table using the big-endian (be*) swap and float routines + */ +Machdata mipsmach2be = +{ + {0, 0, 0, 0xD}, /* break point */ + 4, /* break point size */ + + beswab, /* short to local byte order */ + beswal, /* long to local byte order */ + beswav, /* vlong to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + mipsexcep, /* print exception */ + 0, /* breakpoint fixup */ + beieeesftos, /* single precision float printer */ + beieeedftos, /* double precision float printer */ + mipsfoll, /* following addresses */ + mipsinst, /* print instruction */ + mipsdas, /* disassembler */ + mipsinstlen, /* instruction size */ +}; + +/* + * Debugger interface: MIPS table using the little-endian (le*) swap and float routines + */ +Machdata mipsmach2le = +{ + {0, 0, 0, 0xD}, /* break point */ + 4, /* break point size */ + + leswab, /* short to local byte order */ + leswal, /* long to local byte order */ + leswav, /* vlong to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + mipsexcep, /* print exception */ + 0, /* breakpoint fixup */ + leieeesftos, /* single precision float printer */ + leieeedftos, /* double precision float printer */ + mipsfoll, /* following addresses */ + mipsinst, /* print instruction */ + mipsdas, /* disassembler */ + mipsinstlen, /* instruction size */ +}; diff --git a/utils/libmach/5.c b/utils/libmach/5.c new file mode 100644 index 
0000000..a96f938 --- /dev/null +++ b/utils/libmach/5.c @@ -0,0 +1,64 @@ +/* + * arm definition + */ +#include <lib9.h> +#include <bio.h> +#include "ureg5.h" +#include "mach.h" + + +#define REGOFF(x) (ulong) (&((struct Ureg *) 0)->x) + +#define SP REGOFF(r13) +#define PC REGOFF(pc) + +#define REGSIZE sizeof(struct Ureg) + +Reglist armreglist[] = +{ + {"TYPE", REGOFF(type), RINT|RRDONLY, 'X'}, + {"PSR", REGOFF(psr), RINT|RRDONLY, 'X'}, + {"PC", PC, RINT, 'X'}, + {"SP", SP, RINT, 'X'}, + {"R15", PC, RINT, 'X'}, + {"R14", REGOFF(r14), RINT, 'X'}, + {"R13", REGOFF(r13), RINT, 'X'}, + {"R12", REGOFF(r12), RINT, 'X'}, + {"R11", REGOFF(r11), RINT, 'X'}, + {"R10", REGOFF(r10), RINT, 'X'}, + {"R9", REGOFF(r9), RINT, 'X'}, + {"R8", REGOFF(r8), RINT, 'X'}, + {"R7", REGOFF(r7), RINT, 'X'}, + {"R6", REGOFF(r6), RINT, 'X'}, + {"R5", REGOFF(r5), RINT, 'X'}, + {"R4", REGOFF(r4), RINT, 'X'}, + {"R3", REGOFF(r3), RINT, 'X'}, + {"R2", REGOFF(r2), RINT, 'X'}, + {"R1", REGOFF(r1), RINT, 'X'}, + {"R0", REGOFF(r0), RINT, 'X'}, + { 0 } +}; + + /* the machine description */ +Mach marm = +{ + "arm", + MARM, /* machine type */ + armreglist, /* register set */ + REGSIZE, /* register set size */ + 0, /* fp register set size */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "R14", /* name of link register */ + "setR12", /* static base register name */ + 0, /* static base register value */ + 0x1000, /* page size */ + 0xC0000000, /* kernel base */ + 0xC0000000, /* kernel text mask */ + 0x3FFFFFFF, /* user stack top */ + 4, /* quantization of pc */ + 4, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git a/utils/libmach/5db.c b/utils/libmach/5db.c new file mode 100644 index 0000000..fb6bf89 --- /dev/null +++ b/utils/libmach/5db.c @@ -0,0 +1,1121 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +static int debug = 0; + +#define BITS(a, b) ((1<<(b+1))-(1<<a)) + +#define LSR(v, s) ((ulong)(v) >> (s)) +#define ASR(v, s) ((long)(v) >> (s)) +#define ROR(v, 
s) (LSR((v), (s)) | (((v) & ((1 << (s))-1)) << (32 - (s)))) + + + +typedef struct Instr Instr; +struct Instr +{ + Map *map; + ulong w; + uvlong addr; + uchar op; /* super opcode */ + + uchar cond; /* bits 28-31 */ + uchar store; /* bit 20 */ + + uchar rd; /* bits 12-15 */ + uchar rn; /* bits 16-19 */ + uchar rs; /* bits 0-11 (shifter operand) */ + + long imm; /* rotated imm */ + char* curr; /* fill point in buffer */ + char* end; /* end of buffer */ + char* err; /* error message */ +}; + +typedef struct Opcode Opcode; +struct Opcode +{ + char* o; + void (*fmt)(Opcode*, Instr*); + uvlong (*foll)(Map*, Rgetter, Instr*, uvlong); + char* a; +}; + +static void format(char*, Instr*, char*); +static char FRAMENAME[] = ".frame"; + +/* + * Arm-specific debugger interface + */ + +static char *armexcep(Map*, Rgetter); +static int armfoll(Map*, uvlong, Rgetter, uvlong*); +static int arminst(Map*, uvlong, char, char*, int); +static int armdas(Map*, uvlong, char*, int); +static int arminstlen(Map*, uvlong); + +/* + * Debugger interface + */ +Machdata armmach = +{ + {0x70, 0x00, 0x20, 0xD1}, /* break point */ /* D1200070 */ + 4, /* break point size */ + + leswab, /* short to local byte order */ + leswal, /* long to local byte order */ + leswav, /* long to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + armexcep, /* print exception */ + 0, /* breakpoint fixup */ + 0, /* single precision float printer */ + 0, /* double precision float printer */ + armfoll, /* following addresses */ + arminst, /* print instruction */ + armdas, /* dissembler */ + arminstlen, /* instruction size */ +}; + +static char* +armexcep(Map *map, Rgetter rget) +{ + uvlong c; + + c = (*rget)(map, "TYPE"); + switch ((int)c&0x1f) { + case 0x11: + return "Fiq interrupt"; + case 0x12: + return "Mirq interrupt"; + case 0x13: + return "SVC/SWI Exception"; + case 0x17: + return "Prefetch Abort/Data Abort"; + case 0x18: + return "Data Abort"; + case 0x1b: + return "Undefined 
instruction/Breakpoint"; + case 0x1f: + return "Sys trap"; + default: + return "Undefined trap"; + } +} + +static +char* cond[16] = +{ + "EQ", "NE", "CS", "CC", + "MI", "PL", "VS", "VC", + "HI", "LS", "GE", "LT", + "GT", "LE", 0, "NV" +}; + +static +char* shtype[4] = +{ + "<<", ">>", "->", "@>" +}; + +static +char *hb[4] = +{ + "?", "HU", "B", "H" +}; + +static +char* addsub[2] = +{ + "-", "+", +}; + +int +armclass(long w) +{ + int op, done; + + op = (w >> 25) & 0x7; + switch(op) { + case 0: /* data processing r,r,r */ + op = ((w >> 4) & 0xf); + if(op == 0x9) { + op = 48+16; /* mul, swp or *rex */ + if((w & 0x0ff00fff) == 0x01900f9f) { + op = 93; /* ldrex */ + break; + } + if((w & 0x0ff00ff0) == 0x01800f90) { + op = 94; /* strex */ + break; + } + if(w & (1<<24)) { + op += 2; + if(w & (1<<22)) + op++; /* swpb */ + break; + } + if(w & (1<<23)) { /* mullu */ + op = (48+24+4+4+2+2+4); + if(w & (1<<22)) /* mull */ + op += 2; + } + if(w & (1<<21)) + op++; /* mla */ + break; + } + if((op & 0x9) == 0x9) /* ld/st byte/half s/u */ + { + op = (48+16+4) + ((w >> 22) & 0x1) + ((w >> 19) & 0x2); + break; + } + op = (w >> 21) & 0xf; + if(w & (1<<4)) + op += 32; + else + if((w & (31<<7)) || (w & (1<<5))) + op += 16; + break; + case 1: /* data processing i,r,r */ + op = (48) + ((w >> 21) & 0xf); + break; + case 2: /* load/store byte/word i(r) */ + if ((w & 0xffffff8f) == 0xf57ff00f) { /* barriers, clrex */ + done = 1; + switch ((w >> 4) & 7) { + case 1: + op = 95; /* clrex */ + break; + case 4: + op = 96; /* dsb */ + break; + case 5: + op = 97; /* dmb */ + break; + case 6: + op = 98; /* isb */ + break; + default: + done = 0; + break; + } + if (done) + break; + } + op = (48+24) + ((w >> 22) & 0x1) + ((w >> 19) & 0x2); + break; + case 3: /* load/store byte/word (r)(r) */ + op = (48+24+4) + ((w >> 22) & 0x1) + ((w >> 19) & 0x2); + break; + case 4: /* block data transfer (r)(r) */ + if ((w & 0xfe50ffff) == 0xf8100a00) { /* v7 RFE */ + op = 99; + break; + } + op = (48+24+4+4) + ((w >> 
20) & 0x1); + break; + case 5: /* branch / branch link */ + op = (48+24+4+4+2) + ((w >> 24) & 0x1); + break; + case 7: /* coprocessor crap */ + op = (48+24+4+4+2+2) + ((w >> 3) & 0x2) + ((w >> 20) & 0x1); + break; + default: + op = (48+24+4+4+2+2+4+4); + break; + } + return op; +} + +static int +decode(Map *map, uvlong pc, Instr *i) +{ + ulong w; + + if(get4(map, pc, &w) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + i->w = w; + i->addr = pc; + i->cond = (w >> 28) & 0xF; + i->op = armclass(w); + i->map = map; + return 1; +} + +#pragma varargck argpos bprint 2 + +static void +bprint(Instr *i, char *fmt, ...) +{ + va_list arg; + + va_start(arg, fmt); + i->curr = vseprint(i->curr, i->end, fmt, arg); + va_end(arg); +} + +static int +plocal(Instr *i) +{ + char *reg; + Symbol s; + char *fn; + int class; + int offset; + + if(!findsym(i->addr, CTEXT, &s)) { + if(debug)fprint(2,"fn not found @%llux: %r\n", i->addr); + return 0; + } + fn = s.name; + if (!findlocal(&s, FRAMENAME, &s)) { + if(debug)fprint(2,"%s.%s not found @%s: %r\n", fn, FRAMENAME, s.name); + return 0; + } + if(s.value > i->imm) { + class = CAUTO; + offset = s.value-i->imm; + reg = "(SP)"; + } else { + class = CPARAM; + offset = i->imm-s.value-4; + reg = "(FP)"; + } + if(!getauto(&s, offset, class, &s)) { + if(debug)fprint(2,"%s %s not found @%ux: %r\n", fn, + class == CAUTO ? " auto" : "param", offset); + return 0; + } + bprint(i, "%s%c%lld%s", s.name, class == CPARAM ? 
'+' : '-', s.value, reg); + return 1; +} + +/* + * Print value v as name[+offset] + */ +static int +gsymoff(char *buf, int n, long v, int space) +{ + Symbol s; + int r; + long delta; + + r = delta = 0; /* to shut compiler up */ + if (v) { + r = findsym(v, space, &s); + if (r) + delta = v-s.value; + if (delta < 0) + delta = -delta; + } + if (v == 0 || r == 0 || delta >= 4096) + return snprint(buf, n, "#%lux", v); + if (strcmp(s.name, ".string") == 0) + return snprint(buf, n, "#%lux", v); + if (!delta) + return snprint(buf, n, "%s", s.name); + if (s.type != 't' && s.type != 'T') + return snprint(buf, n, "%s+%llux", s.name, v-s.value); + else + return snprint(buf, n, "#%lux", v); +} + +static void +armdps(Opcode *o, Instr *i) +{ + i->store = (i->w >> 20) & 1; + i->rn = (i->w >> 16) & 0xf; + i->rd = (i->w >> 12) & 0xf; + i->rs = (i->w >> 0) & 0xf; + if(i->rn == 15 && i->rs == 0) { + if(i->op == 8) { + format("MOVW", i,"CPSR, R%d"); + return; + } else + if(i->op == 10) { + format("MOVW", i,"SPSR, R%d"); + return; + } + } else + if(i->rn == 9 && i->rd == 15) { + if(i->op == 9) { + format("MOVW", i, "R%s, CPSR"); + return; + } else + if(i->op == 11) { + format("MOVW", i, "R%s, SPSR"); + return; + } + } + format(o->o, i, o->a); +} + +static void +armdpi(Opcode *o, Instr *i) +{ + ulong v; + int c; + + v = (i->w >> 0) & 0xff; + c = (i->w >> 8) & 0xf; + while(c) { + v = (v<<30) | (v>>2); + c--; + } + i->imm = v; + i->store = (i->w >> 20) & 1; + i->rn = (i->w >> 16) & 0xf; + i->rd = (i->w >> 12) & 0xf; + i->rs = i->w&0x0f; + + /* RET is encoded as ADD #0,R14,R15 */ + if((i->w & 0x0fffffff) == 0x028ef000){ + format("RET%C", i, ""); + return; + } + if((i->w & 0x0ff0ffff) == 0x0280f000){ + format("B%C", i, "0(R%n)"); + return; + } + format(o->o, i, o->a); +} + +static void +armsdti(Opcode *o, Instr *i) +{ + ulong v; + + v = i->w & 0xfff; + if(!(i->w & (1<<23))) + v = -v; + i->store = ((i->w >> 23) & 0x2) | ((i->w >>21) & 0x1); + i->imm = v; + i->rn = (i->w >> 16) & 0xf; + i->rd = 
(i->w >> 12) & 0xf; + /* RET is encoded as LW.P x,R13,R15 */ + if ((i->w & 0x0ffff000) == 0x049df000) + { + format("RET%C%p", i, "%I"); + return; + } + format(o->o, i, o->a); +} + +/* arm V4 ld/st halfword, signed byte: unpack P/W, the split 8-bit immediate and the register fields, then format */ +static void +armhwby(Opcode *o, Instr *i) +{ + i->store = ((i->w >> 23) & 0x2) | ((i->w >>21) & 0x1); + i->imm = (i->w & 0xf) | ((i->w >> 4) & 0xf0); /* offset = immedH (bits 8-11) << 4 | immedL (bits 0-3) */ + if (!(i->w & (1 << 23))) /* U bit clear: offset is subtracted */ + i->imm = - i->imm; + i->rn = (i->w >> 16) & 0xf; + i->rd = (i->w >> 12) & 0xf; + i->rs = (i->w >> 0) & 0xf; + format(o->o, i, o->a); +} + +static void +armsdts(Opcode *o, Instr *i) +{ + i->store = ((i->w >> 23) & 0x2) | ((i->w >>21) & 0x1); + i->rs = (i->w >> 0) & 0xf; + i->rn = (i->w >> 16) & 0xf; + i->rd = (i->w >> 12) & 0xf; + format(o->o, i, o->a); +} + +static void +armbdt(Opcode *o, Instr *i) +{ + i->store = (i->w >> 21) & 0x3; /* S & W bits */ + i->rn = (i->w >> 16) & 0xf; + i->imm = i->w & 0xffff; /* register list bitmap, printed by %r */ + if(i->w == 0xe8fd8000) + format("RFE", i, ""); + else + format(o->o, i, o->a); +} + +static void +armund(Opcode *o, Instr *i) +{ + format(o->o, i, o->a); +} + +static void +armcdt(Opcode *o, Instr *i) +{ + format(o->o, i, o->a); +} + +static void +armunk(Opcode *o, Instr *i) +{ + format(o->o, i, o->a); +} + +static void +armb(Opcode *o, Instr *i) +{ + ulong v; + + v = i->w & 0xffffff; + if(v & 0x800000) /* sign-extend the 24-bit word offset */ + v |= ~0xffffff; + i->imm = (v<<2) + i->addr + 8; /* target = instruction address + 8 + offset*4 */ + format(o->o, i, o->a); +} + +static void +armco(Opcode *o, Instr *i) /* coprocessor instructions */ +{ + int op, p, cp; + + char buf[1024]; + + i->rn = (i->w >> 16) & 0xf; + i->rd = (i->w >> 12) & 0xf; + i->rs = i->w&0xf; + cp = (i->w >> 8) & 0xf; + p = (i->w >> 5) & 0x7; + if(i->w&(1<<4)) { + op = (i->w >> 21) & 0x07; + snprint(buf, sizeof(buf), "#%x, #%x, R%d, C(%d), C(%d), #%x", cp, op, i->rd, i->rn, i->rs, p); + } else { + op = (i->w >> 20) & 0x0f; + snprint(buf, sizeof(buf), "#%x, #%x, C(%d), C(%d), C(%d), #%x", cp, op, i->rd, i->rn, i->rs, p); + } + format(o->o, i, buf); +} + +static int +armcondpass(Map *map, 
Rgetter rget, uchar cond) +{ + uvlong psr; + uchar n; + uchar z; + uchar c; + uchar v; + + psr = rget(map, "PSR"); + n = (psr >> 31) & 1; + z = (psr >> 30) & 1; + c = (psr >> 29) & 1; + v = (psr >> 28) & 1; + + switch(cond) { + default: + case 0: return z; + case 1: return !z; + case 2: return c; + case 3: return !c; + case 4: return n; + case 5: return !n; + case 6: return v; + case 7: return !v; + case 8: return c && !z; + case 9: return !c || z; + case 10: return n == v; + case 11: return n != v; + case 12: return !z && (n == v); + case 13: return z && (n != v); + case 14: return 1; + case 15: return 0; + } +} + +static ulong +armshiftval(Map *map, Rgetter rget, Instr *i) +{ + if(i->w & (1 << 25)) { /* immediate */ + ulong imm = i->w & BITS(0, 7); + ulong s = (i->w & BITS(8, 11)) >> 7; /* this contains the *2 */ + return ROR(imm, s); + } else { + char buf[8]; + ulong v; + ulong s = (i->w & BITS(7,11)) >> 7; + + sprint(buf, "R%ld", i->w & 0xf); + v = rget(map, buf); + + switch((i->w & BITS(4, 6)) >> 4) { + default: + case 0: /* LSLIMM */ + return v << s; + case 1: /* LSLREG */ + sprint(buf, "R%lud", s >> 1); + s = rget(map, buf) & 0xFF; + if(s >= 32) return 0; + return v << s; + case 2: /* LSRIMM */ + return LSR(v, s); + case 3: /* LSRREG */ + sprint(buf, "R%ld", s >> 1); + s = rget(map, buf) & 0xFF; + if(s >= 32) return 0; + return LSR(v, s); + case 4: /* ASRIMM */ + if(s == 0) { + if((v & (1U<<31)) == 0) + return 0; + return 0xFFFFFFFF; + } + return ASR(v, s); + case 5: /* ASRREG */ + sprint(buf, "R%ld", s >> 1); + s = rget(map, buf) & 0xFF; + if(s >= 32) { + if((v & (1U<<31)) == 0) + return 0; + return 0xFFFFFFFF; + } + return ASR(v, s); + case 6: /* RORIMM */ + if(s == 0) { + ulong c = (rget(map, "PSR") >> 29) & 1; + + return (c << 31) | LSR(v, 1); + } + return ROR(v, s); + case 7: /* RORREG */ + sprint(buf, "R%ld", (s>>1)&0xF); + s = rget(map, buf); + if(s == 0 || (s & 0xF) == 0) + return v; + return ROR(v, s & 0xF); + } + } +} + +static int +nbits(ulong v) 
+{ + int n = 0; + int i; + + for(i=0; i < 32 ; i++) { /* count the set bits among the low 32 bits of v */ + if(v & 1) ++n; + v >>= 1; + } + + return n; +} + +static ulong +armmaddr(Map *map, Rgetter rget, Instr *i) +{ + ulong v; + ulong nb; + char buf[8]; + ulong rn; + + rn = (i->w >> 16) & 0xf; + sprint(buf,"R%ld", rn); + + v = rget(map, buf); + nb = nbits(i->w & ((1 << 15) - 1)); /* registers in the list, bit 15 excluded */ + + switch((i->w >> 23) & 3) { + default: + case 0: return (v - (nb*4)) + 4; + case 1: return v; + case 2: return v - (nb*4); + case 3: return v + 4; + } +} + +static uvlong +armaddr(Map *map, Rgetter rget, Instr *i) /* address used by a single data transfer: base Rn, adjusted by the immediate or shifted-register offset unless bit 24 is clear */ +{ + char buf[8]; + ulong rn; + + snprint(buf, sizeof(buf), "R%ld", (i->w >> 16) & 0xf); + rn = rget(map, buf); + + if((i->w & (1<<24)) == 0) /* POSTIDX */ + return rn; + + if((i->w & (1<<25)) == 0) { /* OFFSET */ + if(i->w & (1U<<23)) + return rn + (i->w & BITS(0,11)); + return rn - (i->w & BITS(0,11)); + } else { /* REGOFF */ + ulong index = 0; + ulong c; /* carry flag (PSR bit 29); ulong so that c << 31 is an unsigned shift */ + ulong rm; /* value of the index register; a uchar here would keep only its low 8 bits */ + + sprint(buf, "R%ld", i->w & 0xf); + rm = rget(map, buf); + + switch((i->w & BITS(5,6)) >> 5) { + case 0: index = rm << ((i->w & BITS(7,11)) >> 7); break; + case 1: index = LSR(rm, ((i->w & BITS(7,11)) >> 7)); break; + case 2: index = ASR(rm, ((i->w & BITS(7,11)) >> 7)); break; + case 3: + if((i->w & BITS(7,11)) == 0) { + c = (rget(map, "PSR") >> 29) & 1; + index = c << 31 | LSR(rm, 1); + } else { + index = ROR(rm, ((i->w & BITS(7,11)) >> 7)); + } + break; + } + if(i->w & (1<<23)) + return rn + index; + return rn - index; + } +} + +static uvlong +armfadd(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + char buf[8]; + int r; + + r = (i->w >> 12) & 0xf; + if(r != 15 || !armcondpass(map, rget, (i->w >> 28) & 0xf)) + return pc+4; + + r = (i->w >> 16) & 0xf; + sprint(buf, "R%d", r); + + return rget(map, buf) + armshiftval(map, rget, i); +} + +static uvlong +armfmovm(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + ulong v; + ulong addr; + + v = i->w & 1<<15; + if(!v || !armcondpass(map, rget, (i->w>>28)&0xf)) + return pc+4; + + addr = armmaddr(map, rget, i) + 
nbits(i->w & BITS(0,15)); + if(get4(map, addr, &v) < 0) { + werrstr("can't read addr: %r"); + return -1; + } + return v; +} + +static uvlong +armfbranch(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + if(!armcondpass(map, rget, (i->w >> 28) & 0xf)) + return pc+4; + + return pc + (((signed long)i->w << 8) >> 6) + 8; +} + +static uvlong +armfmov(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + ulong rd, v; + + rd = (i->w >> 12) & 0xf; + if(rd != 15 || !armcondpass(map, rget, (i->w>>28)&0xf)) + return pc+4; + + /* LDR */ + /* BUG: Needs LDH/B, too */ + if(((i->w>>26)&0x3) == 1) { + if(get4(map, armaddr(map, rget, i), &v) < 0) { + werrstr("can't read instruction: %r"); + return pc+4; + } + return v; + } + + /* MOV */ + v = armshiftval(map, rget, i); + + return v; +} + +static Opcode opcodes[] = +{ + "AND%C%S", armdps, 0, "R%s,R%n,R%d", + "EOR%C%S", armdps, 0, "R%s,R%n,R%d", + "SUB%C%S", armdps, 0, "R%s,R%n,R%d", + "RSB%C%S", armdps, 0, "R%s,R%n,R%d", + "ADD%C%S", armdps, armfadd, "R%s,R%n,R%d", + "ADC%C%S", armdps, 0, "R%s,R%n,R%d", + "SBC%C%S", armdps, 0, "R%s,R%n,R%d", + "RSC%C%S", armdps, 0, "R%s,R%n,R%d", + "TST%C%S", armdps, 0, "R%s,R%n", + "TEQ%C%S", armdps, 0, "R%s,R%n", + "CMP%C%S", armdps, 0, "R%s,R%n", + "CMN%C%S", armdps, 0, "R%s,R%n", + "ORR%C%S", armdps, 0, "R%s,R%n,R%d", + "MOVW%C%S", armdps, armfmov, "R%s,R%d", + "BIC%C%S", armdps, 0, "R%s,R%n,R%d", + "MVN%C%S", armdps, 0, "R%s,R%d", + +/* 16 */ + "AND%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "EOR%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "SUB%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "RSB%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "ADD%C%S", armdps, armfadd, "(R%s%h%m),R%n,R%d", + "ADC%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "SBC%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "RSC%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "TST%C%S", armdps, 0, "(R%s%h%m),R%n", + "TEQ%C%S", armdps, 0, "(R%s%h%m),R%n", + "CMP%C%S", armdps, 0, "(R%s%h%m),R%n", + "CMN%C%S", armdps, 0, "(R%s%h%m),R%n", + "ORR%C%S", armdps, 0, 
"(R%s%h%m),R%n,R%d", + "MOVW%C%S", armdps, armfmov, "(R%s%h%m),R%d", + "BIC%C%S", armdps, 0, "(R%s%h%m),R%n,R%d", + "MVN%C%S", armdps, 0, "(R%s%h%m),R%d", + +/* 32 */ + "AND%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "EOR%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "SUB%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "RSB%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "ADD%C%S", armdps, armfadd, "(R%s%hR%M),R%n,R%d", + "ADC%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "SBC%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "RSC%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "TST%C%S", armdps, 0, "(R%s%hR%M),R%n", + "TEQ%C%S", armdps, 0, "(R%s%hR%M),R%n", + "CMP%C%S", armdps, 0, "(R%s%hR%M),R%n", + "CMN%C%S", armdps, 0, "(R%s%hR%M),R%n", + "ORR%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "MOVW%C%S", armdps, armfmov, "(R%s%hR%M),R%d", + "BIC%C%S", armdps, 0, "(R%s%hR%M),R%n,R%d", + "MVN%C%S", armdps, 0, "(R%s%hR%M),R%d", + +/* 48 */ + "AND%C%S", armdpi, 0, "$#%i,R%n,R%d", + "EOR%C%S", armdpi, 0, "$#%i,R%n,R%d", + "SUB%C%S", armdpi, 0, "$#%i,R%n,R%d", + "RSB%C%S", armdpi, 0, "$#%i,R%n,R%d", + "ADD%C%S", armdpi, armfadd, "$#%i,R%n,R%d", + "ADC%C%S", armdpi, 0, "$#%i,R%n,R%d", + "SBC%C%S", armdpi, 0, "$#%i,R%n,R%d", + "RSC%C%S", armdpi, 0, "$#%i,R%n,R%d", + "TST%C%S", armdpi, 0, "$#%i,R%n", + "TEQ%C%S", armdpi, 0, "$#%i,R%n", + "CMP%C%S", armdpi, 0, "$#%i,R%n", + "CMN%C%S", armdpi, 0, "$#%i,R%n", + "ORR%C%S", armdpi, 0, "$#%i,R%n,R%d", + "MOVW%C%S", armdpi, armfmov, "$#%i,R%d", + "BIC%C%S", armdpi, 0, "$#%i,R%n,R%d", + "MVN%C%S", armdpi, 0, "$#%i,R%d", + +/* 48+16 */ + "MUL%C%S", armdpi, 0, "R%M,R%s,R%n", + "MULA%C%S", armdpi, 0, "R%M,R%s,R%n,R%d", + "SWPW", armdpi, 0, "R%s,(R%n),R%d", + "SWPB", armdpi, 0, "R%s,(R%n),R%d", + +/* 48+16+4 */ + "MOV%u%C%p", armhwby, 0, "R%d,(R%n%UR%M)", + "MOV%u%C%p", armhwby, 0, "R%d,%I", + "MOV%u%C%p", armhwby, armfmov, "(R%n%UR%M),R%d", + "MOV%u%C%p", armhwby, armfmov, "%I,R%d", + +/* 48+24 */ + "MOVW%C%p", armsdti, 0, "R%d,%I", + "MOVB%C%p", armsdti, 0, "R%d,%I", + 
"MOVW%C%p", armsdti, armfmov, "%I,R%d", + "MOVBU%C%p", armsdti, armfmov, "%I,R%d", + + "MOVW%C%p", armsdts, 0, "R%d,(R%s%h%m)(R%n)", + "MOVB%C%p", armsdts, 0, "R%d,(R%s%h%m)(R%n)", + "MOVW%C%p", armsdts, armfmov, "(R%s%h%m)(R%n),R%d", + "MOVBU%C%p", armsdts, armfmov, "(R%s%h%m)(R%n),R%d", + + "MOVM%C%P%a", armbdt, armfmovm, "[%r],(R%n)", + "MOVM%C%P%a", armbdt, armfmovm, "(R%n),[%r]", + + "B%C", armb, armfbranch, "%b", + "BL%C", armb, armfbranch, "%b", + + "CDP%C", armco, 0, "", + "CDP%C", armco, 0, "", + "MCR%C", armco, 0, "", + "MRC%C", armco, 0, "", + +/* 48+24+4+4+2+2+4 */ + "MULLU%C%S", armdpi, 0, "R%M,R%s,(R%n,R%d)", + "MULALU%C%S", armdpi, 0, "R%M,R%s,(R%n,R%d)", + "MULL%C%S", armdpi, 0, "R%M,R%s,(R%n,R%d)", + "MULAL%C%S", armdpi, 0, "R%M,R%s,(R%n,R%d)", + +/* 48+24+4+4+2+2+4+4 = 92 */ + "UNK", armunk, 0, "", + + /* new v7 arch instructions */ +/* 93 */ + "LDREX", armdpi, 0, "(R%n),R%d", + "STREX", armdpi, 0, "R%s,(R%n),R%d", + "CLREX", armunk, 0, "", + +/* 96 */ + "DSB", armunk, 0, "", + "DMB", armunk, 0, "", + "ISB", armunk, 0, "", + +/* 99 */ + "RFEV7%P%a", armbdt, 0, "(R%n)", +}; + +static void +gaddr(Instr *i) +{ + *i->curr++ = '$'; + i->curr += gsymoff(i->curr, i->end-i->curr, i->imm, CANY); +} + +static char *mode[] = { 0, "IA", "DB", "IB" }; +static char *pw[] = { "P", "PW", 0, "W" }; +static char *sw[] = { 0, "W", "S", "SW" }; + +static void +format(char *mnemonic, Instr *i, char *f) +{ + int j, k, m, n; + int g; + char *fmt; + + if(mnemonic) + format(0, i, mnemonic); + if(f == 0) + return; + if(mnemonic) + if(i->curr < i->end) + *i->curr++ = '\t'; + for ( ; *f && i->curr < i->end; f++) { + if(*f != '%') { + *i->curr++ = *f; + continue; + } + switch (*++f) { + + case 'C': /* .CONDITION */ + if(cond[i->cond]) + bprint(i, ".%s", cond[i->cond]); + break; + + case 'S': /* .STORE */ + if(i->store) + bprint(i, ".S"); + break; + + case 'P': /* P & U bits for block move */ + n = (i->w >>23) & 0x3; + if (mode[n]) + bprint(i, ".%s", mode[n]); + break; + + 
case 'p': /* P & W bits for single data xfer*/ + if (pw[i->store]) + bprint(i, ".%s", pw[i->store]); + break; + + case 'a': /* S & W bits for single data xfer*/ + if (sw[i->store]) + bprint(i, ".%s", sw[i->store]); + break; + + case 's': + bprint(i, "%d", i->rs & 0xf); + break; + + case 'M': + bprint(i, "%lud", (i->w>>8) & 0xf); + break; + + case 'm': + bprint(i, "%lud", (i->w>>7) & 0x1f); + break; + + case 'h': + bprint(i, shtype[(i->w>>5) & 0x3]); + break; + + case 'u': /* Signed/unsigned Byte/Halfword */ + bprint(i, hb[(i->w>>5) & 0x3]); + break; + + case 'I': + if (i->rn == 13) { + if (plocal(i)) + break; + } + g = 0; + fmt = "#%lx(R%d)"; + if (i->rn == 15) { + /* convert load of offset(PC) to a load immediate */ + if (get4(i->map, i->addr+i->imm+8, (ulong*)&i->imm) > 0) + { + g = 1; + fmt = ""; + } + } + if (mach->sb) + { + if (i->rd == 11) { + ulong nxti; + + if (get4(i->map, i->addr+4, &nxti) > 0) { + if ((nxti & 0x0e0f0fff) == 0x060c000b) { + i->imm += mach->sb; + g = 1; + fmt = "-SB"; + } + } + } + if (i->rn == 12) + { + i->imm += mach->sb; + g = 1; + fmt = "-SB(SB)"; + } + } + if (g) + { + gaddr(i); + bprint(i, fmt, i->rn); + } + else + bprint(i, fmt, i->imm, i->rn); + break; + case 'U': /* Add/subtract from base */ + bprint(i, addsub[(i->w >> 23) & 1]); + break; + + case 'n': + bprint(i, "%d", i->rn); + break; + + case 'd': + bprint(i, "%d", i->rd); + break; + + case 'i': + bprint(i, "%lux", i->imm); + break; + + case 'b': + i->curr += symoff(i->curr, i->end-i->curr, + i->imm, CTEXT); + break; + + case 'g': + i->curr += gsymoff(i->curr, i->end-i->curr, + i->imm, CANY); + break; + + case 'r': + n = i->imm&0xffff; + j = 0; + k = 0; + while(n) { + m = j; + while(n&0x1) { + j++; + n >>= 1; + } + if(j != m) { + if(k) + bprint(i, ","); + if(j == m+1) + bprint(i, "R%d", m); + else + bprint(i, "R%d-R%d", m, j-1); + k = 1; + } + j++; + n >>= 1; + } + break; + + case '\0': + *i->curr++ = '%'; + return; + + default: + bprint(i, "%%%c", *f); + break; + } + } + 
*i->curr = 0; +} + +static int +printins(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + + i.curr = buf; + i.end = buf+n-1; + if(decode(map, pc, &i) < 0) + return -1; + + (*opcodes[i.op].fmt)(&opcodes[i.op], &i); + return 4; +} + +static int +arminst(Map *map, uvlong pc, char modifier, char *buf, int n) +{ + USED(modifier); + return printins(map, pc, buf, n); +} + +static int +armdas(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + + i.curr = buf; + i.end = buf+n; + if(decode(map, pc, &i) < 0) + return -1; + if(i.end-i.curr > 8) + i.curr = _hexify(buf, i.w, 7); + *i.curr = 0; + return 4; +} + +static int +arminstlen(Map *map, uvlong pc) +{ + Instr i; + + if(decode(map, pc, &i) < 0) + return -1; + return 4; +} + +static int +armfoll(Map *map, uvlong pc, Rgetter rget, uvlong *foll) +{ + uvlong d; + Instr i; + + if(decode(map, pc, &i) < 0) + return -1; + + if(opcodes[i.op].foll) { + d = (*opcodes[i.op].foll)(map, rget, &i, pc); + if(d == -1) + return -1; + } else + d = pc+4; + + foll[0] = d; + return 1; +} diff --git a/utils/libmach/5obj.c b/utils/libmach/5obj.c new file mode 100644 index 0000000..4cf6940 --- /dev/null +++ b/utils/libmach/5obj.c @@ -0,0 +1,137 @@ +/* + * 5obj.c - identify and parse a arm object file + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "5c/5.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char type; + char sym; + char name; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + +int +_is5(char *s) +{ + return s[0] == ANAME /* ANAME */ + && s[1] == D_FILE /* type */ + && s[2] == 1 /* sym */ + && s[3] == '<'; /* name of file */ +} + +int +_read5(Biobuf *bp, Prog *p) +{ + int as, n; + Addr a; + + as = Bgetc(bp); /* as */ + if(as < 0) + return 0; + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = leswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); 
/* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n) + return 0; + return 1; + } + if(as == ATEXT) + p->kind = aText; + else if(as == AGLOBL) + p->kind = aData; + skip(bp, 6); /* scond(1), reg(1), lineno(4) */ + a = addr(bp); + addr(bp); + if(a.type != D_OREG || a.name != D_STATIC && a.name != D_EXTERN) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +static Addr +addr(Biobuf *bp) +{ + Addr a; + long off; + + a.type = Bgetc(bp); /* a.type */ + skip(bp,1); /* reg */ + a.sym = Bgetc(bp); /* sym index */ + a.name = Bgetc(bp); /* sym type */ + switch(a.type){ + default: + case D_NONE: + case D_REG: + case D_FREG: + case D_PSR: + case D_FPCR: + break; + case D_OREG: + case D_CONST: + case D_BRANCH: + case D_SHIFT: + off = Bgetc(bp); + off |= Bgetc(bp) << 8; + off |= Bgetc(bp) << 16; + off |= Bgetc(bp) << 24; + if(off < 0) + off = -off; + if(a.sym && (a.name==D_PARAM || a.name==D_AUTO)) + _offset(a.sym, off); + break; + case D_SCONST: + skip(bp, NSNAME); + break; + case D_FCONST: + skip(bp, 8); + break; + } + return a; +} + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} diff --git a/utils/libmach/6.c b/utils/libmach/6.c new file mode 100644 index 0000000..914bbdd --- /dev/null +++ b/utils/libmach/6.c @@ -0,0 +1,116 @@ +/* + * amd64 definition + */ +#include <lib9.h> +#include <bio.h> +#include "ureg6.h" +#include "mach.h" + +#define REGOFF(x) offsetof(struct Ureg, x) + +#define REGSIZE sizeof(struct Ureg) +#define FP_CTLS(x) (REGSIZE+2*(x)) +#define FP_CTL(x) (REGSIZE+4*(x)) +#define FP_REG(x) (FP_CTL(8)+16*(x)) +#define XM_REG(x) (FP_CTL(8)+8*16+16*(x)) + 
+#define FPREGSIZE 512 /* TO DO? currently only 0x1A0 used */ + +Reglist amd64reglist[] = { + {"AX", REGOFF(ax), RINT, 'Y'}, + {"BX", REGOFF(bx), RINT, 'Y'}, + {"CX", REGOFF(cx), RINT, 'Y'}, + {"DX", REGOFF(dx), RINT, 'Y'}, + {"SI", REGOFF(si), RINT, 'Y'}, + {"DI", REGOFF(di), RINT, 'Y'}, + {"BP", REGOFF(bp), RINT, 'Y'}, + {"R8", REGOFF(r8), RINT, 'Y'}, + {"R9", REGOFF(r9), RINT, 'Y'}, + {"R10", REGOFF(r10), RINT, 'Y'}, + {"R11", REGOFF(r11), RINT, 'Y'}, + {"R12", REGOFF(r12), RINT, 'Y'}, + {"R13", REGOFF(r13), RINT, 'Y'}, + {"R14", REGOFF(r14), RINT, 'Y'}, + {"R15", REGOFF(r15), RINT, 'Y'}, + {"DS", REGOFF(ds), RINT, 'x'}, + {"ES", REGOFF(es), RINT, 'x'}, + {"FS", REGOFF(fs), RINT, 'x'}, + {"GS", REGOFF(gs), RINT, 'x'}, + {"TYPE", REGOFF(type), RINT, 'Y'}, + {"TRAP", REGOFF(type), RINT, 'Y'}, /* alias for acid */ + {"ERROR", REGOFF(error), RINT, 'Y'}, + {"IP", REGOFF(ip), RINT, 'Y'}, + {"PC", REGOFF(ip), RINT, 'Y'}, /* alias for acid */ + {"CS", REGOFF(cs), RINT, 'Y'}, + {"FLAGS", REGOFF(flags), RINT, 'Y'}, + {"SP", REGOFF(sp), RINT, 'Y'}, + {"SS", REGOFF(ss), RINT, 'Y'}, + + {"FCW", FP_CTLS(0), RFLT, 'x'}, + {"FSW", FP_CTLS(1), RFLT, 'x'}, + {"FTW", FP_CTLS(2), RFLT, 'b'}, + {"FOP", FP_CTLS(3), RFLT, 'x'}, + {"RIP", FP_CTL(2), RFLT, 'Y'}, + {"RDP", FP_CTL(4), RFLT, 'Y'}, + {"MXCSR", FP_CTL(6), RFLT, 'X'}, + {"MXCSRMASK", FP_CTL(7), RFLT, 'X'}, + {"M0", FP_REG(0), RFLT, 'F'}, /* assumes double */ + {"M1", FP_REG(1), RFLT, 'F'}, + {"M2", FP_REG(2), RFLT, 'F'}, + {"M3", FP_REG(3), RFLT, 'F'}, + {"M4", FP_REG(4), RFLT, 'F'}, + {"M5", FP_REG(5), RFLT, 'F'}, + {"M6", FP_REG(6), RFLT, 'F'}, + {"M7", FP_REG(7), RFLT, 'F'}, + {"X0", XM_REG(0), RFLT, 'F'}, /* assumes double */ + {"X1", XM_REG(1), RFLT, 'F'}, + {"X2", XM_REG(2), RFLT, 'F'}, + {"X3", XM_REG(3), RFLT, 'F'}, + {"X4", XM_REG(4), RFLT, 'F'}, + {"X5", XM_REG(5), RFLT, 'F'}, + {"X6", XM_REG(6), RFLT, 'F'}, + {"X7", XM_REG(7), RFLT, 'F'}, + {"X8", XM_REG(8), RFLT, 'F'}, + {"X9", XM_REG(9), RFLT, 'F'}, + {"X10", 
XM_REG(10), RFLT, 'F'}, + {"X11", XM_REG(11), RFLT, 'F'}, + {"X12", XM_REG(12), RFLT, 'F'}, + {"X13", XM_REG(13), RFLT, 'F'}, + {"X14", XM_REG(14), RFLT, 'F'}, + {"X15", XM_REG(15), RFLT, 'F'}, + {"X16", XM_REG(16), RFLT, 'F'}, +/* + {"F0", FP_REG(7), RFLT, '3'}, + {"F1", FP_REG(6), RFLT, '3'}, + {"F2", FP_REG(5), RFLT, '3'}, + {"F3", FP_REG(4), RFLT, '3'}, + {"F4", FP_REG(3), RFLT, '3'}, + {"F5", FP_REG(2), RFLT, '3'}, + {"F6", FP_REG(1), RFLT, '3'}, + {"F7", FP_REG(0), RFLT, '3'}, +*/ + { 0 } +}; + +Mach mamd64= +{ + "amd64", + MAMD64, /* machine type */ + amd64reglist, /* register list */ + REGSIZE, /* size of registers in bytes */ + FPREGSIZE, /* size of fp registers in bytes */ + "PC", /* name of PC */ + "SP", /* name of SP */ + 0, /* link register */ + "setSB", /* static base register name (bogus anyways) */ + 0, /* static base register value */ + 0x200000, /* page size */ + 0xFFFFFFFFF0110000U, /* kernel base */ + 0xFFFF800000000000U, /* kernel text mask */ + 0x00007FFFFFFFF000U, /* user stack top */ + 1, /* quantization of pc */ + 8, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git a/utils/libmach/6obj.c b/utils/libmach/6obj.c new file mode 100644 index 0000000..24a458c --- /dev/null +++ b/utils/libmach/6obj.c @@ -0,0 +1,146 @@ +/* + * 6obj.c - identify and parse an amd64 object file + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "6c/6.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char sym; + char flags; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + +int +_is6(char *t) +{ + uchar *s = (uchar*)t; + + return s[0] == (ANAME&0xff) /* aslo = ANAME */ + && s[1] == ((ANAME>>8)&0xff) + && s[2] == D_FILE /* type */ + && s[3] == 1 /* sym */ + && s[4] == '<'; /* name of file */ +} + +int +_read6(Biobuf *bp, Prog* p) +{ + int as, n, c; + Addr a; + + as = Bgetc(bp); /* as(low) */ + if(as < 0) + return 0; + c = Bgetc(bp); /* as(high) */ + 
if(c < 0) + return 0; + as |= ((c & 0xff) << 8); + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = leswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); /* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n) + return 0; + return 1; + } + if(as == ATEXT) + p->kind = aText; + if(as == AGLOBL) + p->kind = aData; + skip(bp, 4); /* lineno(4) */ + a = addr(bp); + addr(bp); + if(!(a.flags & T_SYM)) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +static Addr +addr(Biobuf *bp) +{ + Addr a; + int t; + long l; + vlong off; + + off = 0; + a.sym = -1; + a.flags = Bgetc(bp); /* flags */ + if(a.flags & T_INDEX) + skip(bp, 2); + if(a.flags & T_OFFSET){ + l = Bgetc(bp); + l |= Bgetc(bp) << 8; + l |= Bgetc(bp) << 16; + l |= Bgetc(bp) << 24; + off = l; + if(a.flags & T_64){ + l = Bgetc(bp); + l |= Bgetc(bp) << 8; + l |= Bgetc(bp) << 16; + l |= Bgetc(bp) << 24; + off = ((vlong)l << 32) | (off & 0xFFFFFFFF); + } + if(off < 0) + off = -off; + } + if(a.flags & T_SYM) + a.sym = Bgetc(bp); + if(a.flags & T_FCONST) + skip(bp, 8); + else + if(a.flags & T_SCONST) + skip(bp, NSNAME); + if(a.flags & T_TYPE) { + t = Bgetc(bp); + if(a.sym > 0 && (t==D_PARAM || t==D_AUTO)) + _offset(a.sym, off); + } + return a; +} + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} diff --git a/utils/libmach/8.c b/utils/libmach/8.c new file mode 100644 index 0000000..c636bd0 --- /dev/null +++ b/utils/libmach/8.c @@ -0,0 +1,79 @@ +/* + * 386 definition + */ +#include <lib9.h> +#include <bio.h> +#include "ureg8.h" 
+#include "mach.h" + +#define REGOFF(x) (ulong)(&((struct Ureg *) 0)->x) + +#define PC REGOFF(pc) +#define SP REGOFF(u0.sp) +#define AX REGOFF(ax) + +#define REGSIZE sizeof(struct Ureg) +#define FP_CTL(x) (REGSIZE+4*(x)) +#define FP_REG(x) (FP_CTL(7)+10*(x)) +#define FPREGSIZE (7*4+8*10) + +Reglist i386reglist[] = { + {"DI", REGOFF(di), RINT, 'X'}, + {"SI", REGOFF(si), RINT, 'X'}, + {"BP", REGOFF(bp), RINT, 'X'}, + {"BX", REGOFF(bx), RINT, 'X'}, + {"DX", REGOFF(dx), RINT, 'X'}, + {"CX", REGOFF(cx), RINT, 'X'}, + {"AX", REGOFF(ax), RINT, 'X'}, + {"GS", REGOFF(gs), RINT, 'X'}, + {"FS", REGOFF(fs), RINT, 'X'}, + {"ES", REGOFF(es), RINT, 'X'}, + {"DS", REGOFF(ds), RINT, 'X'}, + {"TRAP", REGOFF(trap), RINT, 'X'}, + {"ECODE", REGOFF(ecode), RINT, 'X'}, + {"PC", PC, RINT, 'X'}, + {"CS", REGOFF(cs), RINT, 'X'}, + {"EFLAGS", REGOFF(flags), RINT, 'X'}, + {"SP", SP, RINT, 'X'}, + {"SS", REGOFF(ss), RINT, 'X'}, + + {"E0", FP_CTL(0), RFLT, 'X'}, + {"E1", FP_CTL(1), RFLT, 'X'}, + {"E2", FP_CTL(2), RFLT, 'X'}, + {"E3", FP_CTL(3), RFLT, 'X'}, + {"E4", FP_CTL(4), RFLT, 'X'}, + {"E5", FP_CTL(5), RFLT, 'X'}, + {"E6", FP_CTL(6), RFLT, 'X'}, + {"F0", FP_REG(0), RFLT, '3'}, + {"F1", FP_REG(1), RFLT, '3'}, + {"F2", FP_REG(2), RFLT, '3'}, + {"F3", FP_REG(3), RFLT, '3'}, + {"F4", FP_REG(4), RFLT, '3'}, + {"F5", FP_REG(5), RFLT, '3'}, + {"F6", FP_REG(6), RFLT, '3'}, + {"F7", FP_REG(7), RFLT, '3'}, + { 0 } +}; + +Mach mi386 = +{ + "386", + MI386, /* machine type */ + i386reglist, /* register list */ + REGSIZE, /* size of registers in bytes */ + FPREGSIZE, /* size of fp registers in bytes */ + "PC", /* name of PC */ + "SP", /* name of SP */ + 0, /* link register */ + "setSB", /* static base register name (bogus anyways) */ + 0, /* static base register value */ + 0x1000, /* page size */ + 0x80100000, /* kernel base */ + 0x80000000, /* kernel text mask */ + 0x7FFFFFFF, /* user stack top */ + 1, /* quantization of pc */ + 4, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ 
+}; diff --git a/utils/libmach/8db.c b/utils/libmach/8db.c new file mode 100644 index 0000000..50befdb --- /dev/null +++ b/utils/libmach/8db.c @@ -0,0 +1,2266 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +/* + * i386-specific debugger interface + * also amd64 extensions + */ + +static char *i386excep(Map*, Rgetter); + +static int i386trace(Map*, uvlong, uvlong, uvlong, Tracer); +static uvlong i386frame(Map*, uvlong, uvlong, uvlong, uvlong); +static int i386foll(Map*, uvlong, Rgetter, uvlong*); +static int i386inst(Map*, uvlong, char, char*, int); +static int i386das(Map*, uvlong, char*, int); +static int i386instlen(Map*, uvlong); + +static char STARTSYM[] = "_main"; +static char PROFSYM[] = "_mainp"; +static char FRAMENAME[] = ".frame"; +static char *excname[65] = +{ +/*[0]*/ "divide error", +/*[1]*/ "debug exception", +/*[2]*/ nil, +/*[3]*/ nil, +/*[4]*/ "overflow", +/*[5]*/ "bounds check", +/*[6]*/ "invalid opcode", +/*[7]*/ "math coprocessor emulation", +/*[8]*/ "double fault", +/*[9]*/ "math coprocessor overrun", +/*[10]*/ "invalid TSS", +/*[11]*/ "segment not present", +/*[12]*/ "stack exception", +/*[13]*/ "general protection violation", +/*[14]*/ "page fault", +/*[15]*/ nil, +/*[16]*/ "math coprocessor error", +/*[17]*/ "alignment check", +/*[18]*/ "machine check", +/*[19]*/ "floating-point exception", +/*[20]*/ nil, +/*[21]*/ nil, +/*[22]*/ nil, +/*[23]*/ nil, +/*[24]*/ "clock", +/*[25]*/ "keyboard", +/*[26]*/ nil, +/*[27]*/ "modem status", +/*[28]*/ "serial line status", +/*[29]*/ nil, +/*[30]*/ "floppy disk", +/*[31]*/ nil, +/*[32]*/ nil, +/*[33]*/ nil, +/*[34]*/ nil, +/*[35]*/ nil, +/*[36]*/ "mouse", +/*[37]*/ "math coprocessor", +/*[38]*/ "hard disk", + 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,/* 39-54 */ + 0,0,0,0,0,0,0,0,0, /* 55-63 */ +/*[64]*/ "system call", +}; + +Machdata i386mach = +{ + {0xCC, 0, 0, 0}, /* break point: INT 3 */ + 1, /* break point size */ + + leswab, /* convert short to local byte order */ + leswal, /* convert long to 
local byte order */ + leswav, /* convert vlong to local byte order */ + i386trace, /* C traceback */ + i386frame, /* frame finder */ + i386excep, /* print exception */ + 0, /* breakpoint fixup */ + leieeesftos, /* single precision float printer */ + leieeedftos, /* double precision float printer */ + i386foll, /* following addresses */ + i386inst, /* print instruction */ + i386das, /* dissembler */ + i386instlen, /* instruction size calculation */ +}; + +static char* +i386excep(Map *map, Rgetter rget) +{ + ulong c; + uvlong pc; + static char buf[16]; + + c = (*rget)(map, "TRAP"); + if(c > 64 || excname[c] == 0) { + if (c == 3) { + pc = (*rget)(map, "PC"); + if (get1(map, pc, (uchar*)buf, machdata->bpsize) > 0) + if (memcmp(buf, machdata->bpinst, machdata->bpsize) == 0) + return "breakpoint"; + } + snprint(buf, sizeof(buf), "exception %ld", c); + return buf; + } else + return excname[c]; +} + +static int +i386trace(Map *map, uvlong pc, uvlong sp, uvlong link, Tracer trace) +{ + int i; + uvlong osp; + Symbol s, f; + + USED(link); + i = 0; + osp = 0; + while(findsym(pc, CTEXT, &s)) { + if (osp == sp) + break; + osp = sp; + + if(strcmp(STARTSYM, s.name) == 0 || strcmp(PROFSYM, s.name) == 0) + break; + + if(pc != s.value) { /* not at first instruction */ + if(findlocal(&s, FRAMENAME, &f) == 0) + break; + sp += f.value-mach->szaddr; + } + + if (geta(map, sp, &pc) < 0) + break; + + if(pc == 0) + break; + + (*trace)(map, pc, sp, &s); + sp += mach->szaddr; + + if(++i > 1000) + break; + } + return i; +} + +static uvlong +i386frame(Map *map, uvlong addr, uvlong pc, uvlong sp, uvlong link) +{ + Symbol s, f; + + USED(link); + while (findsym(pc, CTEXT, &s)) { + if(strcmp(STARTSYM, s.name) == 0 || strcmp(PROFSYM, s.name) == 0) + break; + + if(pc != s.value) { /* not first instruction */ + if(findlocal(&s, FRAMENAME, &f) == 0) + break; + sp += f.value-mach->szaddr; + } + + if (s.value == addr) + return sp; + + if (geta(map, sp, &pc) < 0) + break; + sp += mach->szaddr; + } + return 
0; +} + + /* I386/486 - Disassembler and related functions */ + +/* + * an instruction + */ +typedef struct Instr Instr; +struct Instr +{ + uchar mem[1+1+1+1+2+1+1+4+4]; /* raw instruction */ + uvlong addr; /* address of start of instruction */ + int n; /* number of bytes in instruction */ + char *prefix; /* instr prefix */ + char *segment; /* segment override */ + uchar jumptype; /* set to the operand type for jump/ret/call */ + uchar amd64; + uchar rex; /* REX prefix (or zero) */ + char osize; /* 'W' or 'L' (or 'Q' on amd64) */ + char asize; /* address size 'W' or 'L' (or 'Q' or amd64) */ + uchar mod; /* bits 6-7 of mod r/m field */ + uchar reg; /* bits 3-5 of mod r/m field */ + char ss; /* bits 6-7 of SIB */ + char index; /* bits 3-5 of SIB */ + char base; /* bits 0-2 of SIB */ + char rip; /* RIP-relative in amd64 mode */ + uchar opre; /* f2/f3 could introduce media */ + short seg; /* segment of far address */ + ulong disp; /* displacement */ + ulong imm; /* immediate */ + ulong imm2; /* second immediate operand */ + uvlong imm64; /* big immediate */ + char *curr; /* fill level in output buffer */ + char *end; /* end of output buffer */ + char *err; /* error message */ +}; + + /* 386 register (ha!) 
set */ +enum{ + AX=0, + CX, + DX, + BX, + SP, + BP, + SI, + DI, + + /* amd64 */ + R8, + R9, + R10, + R11, + R12, + R13, + R14, + R15 +}; + + /* amd64 rex extension byte */ +enum{ + REXW = 1<<3, /* =1, 64-bit operand size */ + REXR = 1<<2, /* extend modrm reg */ + REXX = 1<<1, /* extend sib index */ + REXB = 1<<0 /* extend modrm r/m, sib base, or opcode reg */ +}; + + /* Operand Format codes */ +/* +%A - address size register modifier (!asize -> 'E') +%C - Control register CR0/CR1/CR2 +%D - Debug register DR0/DR1/DR2/DR3/DR6/DR7 +%I - second immediate operand +%O - Operand size register modifier (!osize -> 'E') +%T - Test register TR6/TR7 +%S - size code ('W' or 'L') +%W - Weird opcode: OSIZE == 'W' => "CBW"; else => "CWDE" +%d - displacement 16-32 bits +%e - effective address - Mod R/M value +%f - floating point register F0-F7 - from Mod R/M register +%g - segment register +%i - immediate operand 8-32 bits +%p - PC-relative - signed displacement in immediate field +%r - Reg from Mod R/M +%w - Weird opcode: OSIZE == 'W' => "CWD"; else => "CDQ" +*/ + +typedef struct Optable Optable; +struct Optable +{ + int x; + char operand[2]; + void *proto; /* actually either (char*) or (Optable*) */ +}; + /* Operand decoding codes */ +enum { + Ib = 1, /* 8-bit immediate - (no sign extension)*/ + Ibs, /* 8-bit immediate (sign extended) */ + Jbs, /* 8-bit sign-extended immediate in jump or call */ + Iw, /* 16-bit immediate -> imm */ + Iw2, /* 16-bit immediate -> imm2 */ + Iwd, /* Operand-sized immediate (no sign extension)*/ + Iwdq, /* Operand-sized immediate, possibly 64 bits */ + Awd, /* Address offset */ + Iwds, /* Operand-sized immediate (sign extended) */ + RM, /* Word or long R/M field with register (/r) */ + RMB, /* Byte R/M field with register (/r) */ + RMOP, /* Word or long R/M field with op code (/digit) */ + RMOPB, /* Byte R/M field with op code (/digit) */ + RMR, /* R/M register only (mod = 11) */ + RMM, /* R/M memory only (mod = 0/1/2) */ + R0, /* Base reg of Mod R/M 
is literal 0x00 */ + R1, /* Base reg of Mod R/M is literal 0x01 */ + FRMOP, /* Floating point R/M field with opcode */ + FRMEX, /* Extended floating point R/M field with opcode */ + JUMP, /* Jump or Call flag - no operand */ + RET, /* Return flag - no operand */ + OA, /* literal 0x0a byte */ + PTR, /* Seg:Displacement addr (ptr16:16 or ptr16:32) */ + AUX, /* Multi-byte op code - Auxiliary table */ + AUXMM, /* multi-byte op code - auxiliary table chosen by prefix */ + PRE, /* Instr Prefix */ + OPRE, /* Instr Prefix or media op extension */ + SEG, /* Segment Prefix */ + OPOVER, /* Operand size override */ + ADDOVER, /* Address size override */ +}; + +static Optable optab0F00[8]= +{ +0x00, 0,0, "MOVW LDT,%e", +0x01, 0,0, "MOVW TR,%e", +0x02, 0,0, "MOVW %e,LDT", +0x03, 0,0, "MOVW %e,TR", +0x04, 0,0, "VERR %e", +0x05, 0,0, "VERW %e", +}; + +static Optable optab0F01[8]= +{ +0x00, 0,0, "MOVL GDTR,%e", +0x01, 0,0, "MOVL IDTR,%e", +0x02, 0,0, "MOVL %e,GDTR", +0x03, 0,0, "MOVL %e,IDTR", +0x04, 0,0, "MOVW MSW,%e", /* word */ +0x06, 0,0, "MOVW %e,MSW", /* word */ +0x07, 0,0, "INVLPG %e", /* or SWAPGS */ +}; + +static Optable optab0F01F8[1]= +{ +0x00, 0,0, "SWAPGS", +}; + +/* 0F71 */ +/* 0F72 */ +/* 0F73 */ + +static Optable optab0FAE[8]= +{ +0x00, 0,0, "FXSAVE %e", +0x01, 0,0, "FXRSTOR %e", +0x02, 0,0, "LDMXCSR %e", +0x03, 0,0, "STMXCSR %e", +0x05, 0,0, "LFENCE", +0x06, 0,0, "MFENCE", +0x07, 0,0, "SFENCE", +}; + +/* 0F18 */ +/* 0F0D */ + +static Optable optab0FBA[8]= +{ +0x04, Ib,0, "BT%S %i,%e", +0x05, Ib,0, "BTS%S %i,%e", +0x06, Ib,0, "BTR%S %i,%e", +0x07, Ib,0, "BTC%S %i,%e", +}; + +static Optable optab0F0F[256]= +{ +0x0c, 0,0, "PI2FW %m,%M", +0x0d, 0,0, "PI2L %m,%M", +0x1c, 0,0, "PF2IW %m,%M", +0x1d, 0,0, "PF2IL %m,%M", +0x8a, 0,0, "PFNACC %m,%M", +0x8e, 0,0, "PFPNACC %m,%M", +0x90, 0,0, "PFCMPGE %m,%M", +0x94, 0,0, "PFMIN %m,%M", +0x96, 0,0, "PFRCP %m,%M", +0x97, 0,0, "PFRSQRT %m,%M", +0x9a, 0,0, "PFSUB %m,%M", +0x9e, 0,0, "PFADD %m,%M", +0xa0, 0,0, "PFCMPGT %m,%M", 
+0xa4, 0,0, "PFMAX %m,%M", +0xa6, 0,0, "PFRCPIT1 %m,%M", +0xa7, 0,0, "PFRSQIT1 %m,%M", +0xaa, 0,0, "PFSUBR %m,%M", +0xae, 0,0, "PFACC %m,%M", +0xb0, 0,0, "PFCMPEQ %m,%M", +0xb4, 0,0, "PFMUL %m,%M", +0xb6, 0,0, "PFRCPI2T %m,%M", +0xb7, 0,0, "PMULHRW %m,%M", +0xbb, 0,0, "PSWAPL %m,%M", +}; + +static Optable optab0FC7[8]= +{ +0x01, 0,0, "CMPXCHG8B %e", +}; + +static Optable optab660F71[8]= +{ +0x02, Ib,0, "PSRLW %i,%X", +0x04, Ib,0, "PSRAW %i,%X", +0x06, Ib,0, "PSLLW %i,%X", +}; + +static Optable optab660F72[8]= +{ +0x02, Ib,0, "PSRLL %i,%X", +0x04, Ib,0, "PSRAL %i,%X", +0x06, Ib,0, "PSLLL %i,%X", +}; + +static Optable optab660F73[8]= +{ +0x02, Ib,0, "PSRLQ %i,%X", +0x03, Ib,0, "PSRLO %i,%X", +0x06, Ib,0, "PSLLQ %i,%X", +0x07, Ib,0, "PSLLO %i,%X", +}; + +static Optable optab660F[256]= +{ +0x2B, RM,0, "MOVNTPD %x,%e", +0x2E, RM,0, "UCOMISD %x,%X", +0x2F, RM,0, "COMISD %x,%X", +0x5A, RM,0, "CVTPD2PS %x,%X", +0x5B, RM,0, "CVTPS2PL %x,%X", +0x6A, RM,0, "PUNPCKHLQ %x,%X", +0x6B, RM,0, "PACKSSLW %x,%X", +0x6C, RM,0, "PUNPCKLQDQ %x,%X", +0x6D, RM,0, "PUNPCKHQDQ %x,%X", +0x6E, RM,0, "MOV%S %e,%X", +0x6F, RM,0, "MOVO %x,%X", /* MOVDQA */ +0x70, RM,Ib, "PSHUFL %i,%x,%X", +0x71, RMOP,0, optab660F71, +0x72, RMOP,0, optab660F72, +0x73, RMOP,0, optab660F73, +0x7E, RM,0, "MOV%S %X,%e", +0x7F, RM,0, "MOVO %X,%x", +0xC4, RM,Ib, "PINSRW %i,%e,%X", +0xC5, RMR,Ib, "PEXTRW %i,%X,%e", +0xD4, RM,0, "PADDQ %x,%X", +0xD5, RM,0, "PMULLW %x,%X", +0xD6, RM,0, "MOVQ %X,%x", +0xE6, RM,0, "CVTTPD2PL %x,%X", +0xE7, RM,0, "MOVNTO %X,%e", +0xF7, RM,0, "MASKMOVOU %x,%X", +}; + +static Optable optabF20F[256]= +{ +0x10, RM,0, "MOVSD %x,%X", +0x11, RM,0, "MOVSD %X,%x", +0x2A, RM,0, "CVTS%S2SD %e,%X", +0x2C, RM,0, "CVTTSD2S%S %x,%r", +0x2D, RM,0, "CVTSD2S%S %x,%r", +0x5A, RM,0, "CVTSD2SS %x,%X", +0x6F, RM,0, "MOVOU %x,%X", +0x70, RM,Ib, "PSHUFLW %i,%x,%X", +0x7F, RM,0, "MOVOU %X,%x", +0xD6, RM,0, "MOVQOZX %M,%X", +0xE6, RM,0, "CVTPD2PL %x,%X", +}; + +static Optable optabF30F[256]= +{ +0x10, RM,0, "MOVSS 
%x,%X", +0x11, RM,0, "MOVSS %X,%x", +0x2A, RM,0, "CVTS%S2SS %e,%X", +0x2C, RM,0, "CVTTSS2S%S %x,%r", +0x2D, RM,0, "CVTSS2S%S %x,%r", +0x5A, RM,0, "CVTSS2SD %x,%X", +0x5B, RM,0, "CVTTPS2PL %x,%X", +0x6F, RM,0, "MOVOU %x,%X", +0x70, RM,Ib, "PSHUFHW %i,%x,%X", +0x7E, RM,0, "MOVQOZX %x,%X", +0x7F, RM,0, "MOVOU %X,%x", +0xD6, RM,0, "MOVQOZX %m*,%X", +0xE6, RM,0, "CVTPL2PD %x,%X", +}; + +static Optable optab0F[256]= +{ +0x00, RMOP,0, optab0F00, +0x01, RMOP,0, optab0F01, +0x02, RM,0, "LAR %e,%r", +0x03, RM,0, "LSL %e,%r", +0x05, 0,0, "SYSCALL", +0x06, 0,0, "CLTS", +0x07, 0,0, "SYSRET", +0x08, 0,0, "INVD", +0x09, 0,0, "WBINVD", +0x0B, 0,0, "UD2", +0x0F, RM,AUX, optab0F0F, /* 3DNow! */ +0x10, RM,0, "MOVU%s %x,%X", +0x11, RM,0, "MOVU%s %X,%x", +0x12, RM,0, "MOV[H]L%s %x,%X", /* TO DO: H if source is XMM */ +0x13, RM,0, "MOVL%s %X,%e", +0x14, RM,0, "UNPCKL%s %x,%X", +0x15, RM,0, "UNPCKH%s %x,%X", +0x16, RM,0, "MOV[L]H%s %x,%X", /* TO DO: L if source is XMM */ +0x17, RM,0, "MOVH%s %X,%x", +0x20, RMR,0, "MOVL %C,%e", +0x21, RMR,0, "MOVL %D,%e", +0x22, RMR,0, "MOVL %e,%C", +0x23, RMR,0, "MOVL %e,%D", +0x24, RMR,0, "MOVL %T,%e", +0x26, RMR,0, "MOVL %e,%T", +0x28, RM,0, "MOVA%s %x,%X", +0x29, RM,0, "MOVA%s %X,%x", +0x2A, RM,0, "CVTPL2%s %m*,%X", +0x2B, RM,0, "MOVNT%s %X,%e", +0x2C, RM,0, "CVTT%s2PL %x,%M", +0x2D, RM,0, "CVT%s2PL %x,%M", +0x2E, RM,0, "UCOMISS %x,%X", +0x2F, RM,0, "COMISS %x,%X", +0x30, 0,0, "WRMSR", +0x31, 0,0, "RDTSC", +0x32, 0,0, "RDMSR", +0x33, 0,0, "RDPMC", +0x42, RM,0, "CMOVC %e,%r", /* CF */ +0x43, RM,0, "CMOVNC %e,%r", /* ¬ CF */ +0x44, RM,0, "CMOVZ %e,%r", /* ZF */ +0x45, RM,0, "CMOVNZ %e,%r", /* ¬ ZF */ +0x46, RM,0, "CMOVBE %e,%r", /* CF ∨ ZF */ +0x47, RM,0, "CMOVA %e,%r", /* ¬CF ∧ ¬ZF */ +0x48, RM,0, "CMOVS %e,%r", /* SF */ +0x49, RM,0, "CMOVNS %e,%r", /* ¬ SF */ +0x4A, RM,0, "CMOVP %e,%r", /* PF */ +0x4B, RM,0, "CMOVNP %e,%r", /* ¬ PF */ +0x4C, RM,0, "CMOVLT %e,%r", /* LT ≡ OF ≠SF */ +0x4D, RM,0, "CMOVGE %e,%r", /* GE ≡ ZF ∨ SF */ +0x4E, RM,0, "CMOVLE 
%e,%r", /* LE ≡ ZF ∨ LT */ +0x4F, RM,0, "CMOVGT %e,%r", /* GT ≡ ¬ZF ∧ GE */ +0x50, RM,0, "MOVMSK%s %X,%r", /* TO DO: check */ +0x51, RM,0, "SQRT%s %x,%X", +0x52, RM,0, "RSQRT%s %x,%X", +0x53, RM,0, "RCP%s %x,%X", +0x54, RM,0, "AND%s %x,%X", +0x55, RM,0, "ANDN%s %x,%X", +0x56, RM,0, "OR%s %x,%X", /* TO DO: S/D */ +0x57, RM,0, "XOR%s %x,%X", /* S/D */ +0x58, RM,0, "ADD%s %x,%X", /* S/P S/D */ +0x59, RM,0, "MUL%s %x,%X", +0x5A, RM,0, "CVTPS2PD %x,%X", +0x5B, RM,0, "CVTPL2PS %x,%X", +0x5C, RM,0, "SUB%s %x,%X", +0x5D, RM,0, "MIN%s %x,%X", +0x5E, RM,0, "DIV%s %x,%X", /* TO DO: S/P S/D */ +0x5F, RM,0, "MAX%s %x,%X", +0x60, RM,0, "PUNPCKLBW %m,%M", +0x61, RM,0, "PUNPCKLWL %m,%M", +0x62, RM,0, "PUNPCKLLQ %m,%M", +0x63, RM,0, "PACKSSWB %m,%M", +0x64, RM,0, "PCMPGTB %m,%M", +0x65, RM,0, "PCMPGTW %m,%M", +0x66, RM,0, "PCMPGTL %m,%M", +0x67, RM,0, "PACKUSWB %m,%M", +0x68, RM,0, "PUNPCKHBW %m,%M", +0x69, RM,0, "PUNPCKHWL %m,%M", +0x6A, RM,0, "PUNPCKHLQ %m,%M", +0x6B, RM,0, "PACKSSLW %m,%M", +0x6E, RM,0, "MOV%S %e,%M", +0x6F, RM,0, "MOVQ %m,%M", +0x70, RM,Ib, "PSHUFW %i,%m,%M", +0x74, RM,0, "PCMPEQB %m,%M", +0x75, RM,0, "PCMPEQW %m,%M", +0x76, RM,0, "PCMPEQL %m,%M", +0x7E, RM,0, "MOV%S %M,%e", +0x7F, RM,0, "MOVQ %M,%m", +0xAE, RMOP,0, optab0FAE, +0xAA, 0,0, "RSM", +0xB0, RM,0, "CMPXCHGB %r,%e", +0xB1, RM,0, "CMPXCHG%S %r,%e", +0xC0, RMB,0, "XADDB %r,%e", +0xC1, RM,0, "XADD%S %r,%e", +0xC2, RM,Ib, "CMP%s %i,%x,%X", +0xC3, RM,0, "MOVNTI%S %r,%e", +0xC6, RM,Ib, "SHUF%s %i,%x,%X", +0xC8, 0,0, "BSWAP AX", +0xC9, 0,0, "BSWAP CX", +0xCA, 0,0, "BSWAP DX", +0xCB, 0,0, "BSWAP BX", +0xCC, 0,0, "BSWAP SP", +0xCD, 0,0, "BSWAP BP", +0xCE, 0,0, "BSWAP SI", +0xCF, 0,0, "BSWAP DI", +0xD1, RM,0, "PSRLW %m,%M", +0xD2, RM,0, "PSRLL %m,%M", +0xD3, RM,0, "PSRLQ %m,%M", +0xD5, RM,0, "PMULLW %m,%M", +0xD6, RM,0, "MOVQOZX %m*,%X", +0xD7, RM,0, "PMOVMSKB %m,%r", +0xD8, RM,0, "PSUBUSB %m,%M", +0xD9, RM,0, "PSUBUSW %m,%M", +0xDA, RM,0, "PMINUB %m,%M", +0xDB, RM,0, "PAND %m,%M", +0xDC, RM,0, "PADDUSB %m,%M", 
+0xDD, RM,0, "PADDUSW %m,%M", +0xDE, RM,0, "PMAXUB %m,%M", +0xDF, RM,0, "PANDN %m,%M", +0xE0, RM,0, "PAVGB %m,%M", +0xE1, RM,0, "PSRAW %m,%M", +0xE2, RM,0, "PSRAL %m,%M", +0xE3, RM,0, "PAVGW %m,%M", +0xE4, RM,0, "PMULHUW %m,%M", +0xE5, RM,0, "PMULHW %m,%M", +0xE7, RM,0, "MOVNTQ %M,%e", +0xE8, RM,0, "PSUBSB %m,%M", +0xE9, RM,0, "PSUBSW %m,%M", +0xEA, RM,0, "PMINSW %m,%M", +0xEB, RM,0, "POR %m,%M", +0xEC, RM,0, "PADDSB %m,%M", +0xED, RM,0, "PADDSW %m,%M", +0xEE, RM,0, "PMAXSW %m,%M", +0xEF, RM,0, "PXOR %m,%M", +0xF1, RM,0, "PSLLW %m,%M", +0xF2, RM,0, "PSLLL %m,%M", +0xF3, RM,0, "PSLLQ %m,%M", +0xF4, RM,0, "PMULULQ %m,%M", +0xF5, RM,0, "PMADDWL %m,%M", +0xF6, RM,0, "PSADBW %m,%M", +0xF7, RMR,0, "MASKMOVQ %m,%M", +0xF8, RM,0, "PSUBB %m,%M", +0xF9, RM,0, "PSUBW %m,%M", +0xFA, RM,0, "PSUBL %m,%M", +0xFC, RM,0, "PADDB %m,%M", +0xFD, RM,0, "PADDW %m,%M", +0xFE, RM,0, "PADDL %m,%M", + +0x80, Iwds,0, "JOS %p", +0x81, Iwds,0, "JOC %p", +0x82, Iwds,0, "JCS %p", +0x83, Iwds,0, "JCC %p", +0x84, Iwds,0, "JEQ %p", +0x85, Iwds,0, "JNE %p", +0x86, Iwds,0, "JLS %p", +0x87, Iwds,0, "JHI %p", +0x88, Iwds,0, "JMI %p", +0x89, Iwds,0, "JPL %p", +0x8a, Iwds,0, "JPS %p", +0x8b, Iwds,0, "JPC %p", +0x8c, Iwds,0, "JLT %p", +0x8d, Iwds,0, "JGE %p", +0x8e, Iwds,0, "JLE %p", +0x8f, Iwds,0, "JGT %p", +0x90, RMB,0, "SETOS %e", +0x91, RMB,0, "SETOC %e", +0x92, RMB,0, "SETCS %e", +0x93, RMB,0, "SETCC %e", +0x94, RMB,0, "SETEQ %e", +0x95, RMB,0, "SETNE %e", +0x96, RMB,0, "SETLS %e", +0x97, RMB,0, "SETHI %e", +0x98, RMB,0, "SETMI %e", +0x99, RMB,0, "SETPL %e", +0x9a, RMB,0, "SETPS %e", +0x9b, RMB,0, "SETPC %e", +0x9c, RMB,0, "SETLT %e", +0x9d, RMB,0, "SETGE %e", +0x9e, RMB,0, "SETLE %e", +0x9f, RMB,0, "SETGT %e", +0xa0, 0,0, "PUSHL FS", +0xa1, 0,0, "POPL FS", +0xa2, 0,0, "CPUID", +0xa3, RM,0, "BT%S %r,%e", +0xa4, RM,Ib, "SHLD%S %r,%i,%e", +0xa5, RM,0, "SHLD%S %r,CL,%e", +0xa8, 0,0, "PUSHL GS", +0xa9, 0,0, "POPL GS", +0xab, RM,0, "BTS%S %r,%e", +0xac, RM,Ib, "SHRD%S %r,%i,%e", +0xad, RM,0, "SHRD%S 
%r,CL,%e", +0xaf, RM,0, "IMUL%S %e,%r", +0xb2, RMM,0, "LSS %e,%r", +0xb3, RM,0, "BTR%S %r,%e", +0xb4, RMM,0, "LFS %e,%r", +0xb5, RMM,0, "LGS %e,%r", +0xb6, RMB,0, "MOVBZX %e,%R", +0xb7, RM,0, "MOVWZX %e,%R", +0xba, RMOP,0, optab0FBA, +0xbb, RM,0, "BTC%S %e,%r", +0xbc, RM,0, "BSF%S %e,%r", +0xbd, RM,0, "BSR%S %e,%r", +0xbe, RMB,0, "MOVBSX %e,%R", +0xbf, RM,0, "MOVWSX %e,%R", +0xc7, RMOP,0, optab0FC7, +}; + +static Optable optab80[8]= +{ +0x00, Ib,0, "ADDB %i,%e", +0x01, Ib,0, "ORB %i,%e", +0x02, Ib,0, "ADCB %i,%e", +0x03, Ib,0, "SBBB %i,%e", +0x04, Ib,0, "ANDB %i,%e", +0x05, Ib,0, "SUBB %i,%e", +0x06, Ib,0, "XORB %i,%e", +0x07, Ib,0, "CMPB %e,%i", +}; + +static Optable optab81[8]= +{ +0x00, Iwd,0, "ADD%S %i,%e", +0x01, Iwd,0, "OR%S %i,%e", +0x02, Iwd,0, "ADC%S %i,%e", +0x03, Iwd,0, "SBB%S %i,%e", +0x04, Iwd,0, "AND%S %i,%e", +0x05, Iwd,0, "SUB%S %i,%e", +0x06, Iwd,0, "XOR%S %i,%e", +0x07, Iwd,0, "CMP%S %e,%i", +}; + +static Optable optab83[8]= +{ +0x00, Ibs,0, "ADD%S %i,%e", +0x01, Ibs,0, "OR%S %i,%e", +0x02, Ibs,0, "ADC%S %i,%e", +0x03, Ibs,0, "SBB%S %i,%e", +0x04, Ibs,0, "AND%S %i,%e", +0x05, Ibs,0, "SUB%S %i,%e", +0x06, Ibs,0, "XOR%S %i,%e", +0x07, Ibs,0, "CMP%S %e,%i", +}; + +static Optable optabC0[8] = +{ +0x00, Ib,0, "ROLB %i,%e", +0x01, Ib,0, "RORB %i,%e", +0x02, Ib,0, "RCLB %i,%e", +0x03, Ib,0, "RCRB %i,%e", +0x04, Ib,0, "SHLB %i,%e", +0x05, Ib,0, "SHRB %i,%e", +0x07, Ib,0, "SARB %i,%e", +}; + +static Optable optabC1[8] = +{ +0x00, Ib,0, "ROL%S %i,%e", +0x01, Ib,0, "ROR%S %i,%e", +0x02, Ib,0, "RCL%S %i,%e", +0x03, Ib,0, "RCR%S %i,%e", +0x04, Ib,0, "SHL%S %i,%e", +0x05, Ib,0, "SHR%S %i,%e", +0x07, Ib,0, "SAR%S %i,%e", +}; + +static Optable optabD0[8] = +{ +0x00, 0,0, "ROLB %e", +0x01, 0,0, "RORB %e", +0x02, 0,0, "RCLB %e", +0x03, 0,0, "RCRB %e", +0x04, 0,0, "SHLB %e", +0x05, 0,0, "SHRB %e", +0x07, 0,0, "SARB %e", +}; + +static Optable optabD1[8] = +{ +0x00, 0,0, "ROL%S %e", +0x01, 0,0, "ROR%S %e", +0x02, 0,0, "RCL%S %e", +0x03, 0,0, "RCR%S %e", +0x04, 0,0, 
"SHL%S %e", +0x05, 0,0, "SHR%S %e", +0x07, 0,0, "SAR%S %e", +}; + +static Optable optabD2[8] = +{ +0x00, 0,0, "ROLB CL,%e", +0x01, 0,0, "RORB CL,%e", +0x02, 0,0, "RCLB CL,%e", +0x03, 0,0, "RCRB CL,%e", +0x04, 0,0, "SHLB CL,%e", +0x05, 0,0, "SHRB CL,%e", +0x07, 0,0, "SARB CL,%e", +}; + +static Optable optabD3[8] = +{ +0x00, 0,0, "ROL%S CL,%e", +0x01, 0,0, "ROR%S CL,%e", +0x02, 0,0, "RCL%S CL,%e", +0x03, 0,0, "RCR%S CL,%e", +0x04, 0,0, "SHL%S CL,%e", +0x05, 0,0, "SHR%S CL,%e", +0x07, 0,0, "SAR%S CL,%e", +}; + +static Optable optabD8[8+8] = +{ +0x00, 0,0, "FADDF %e,F0", +0x01, 0,0, "FMULF %e,F0", +0x02, 0,0, "FCOMF %e,F0", +0x03, 0,0, "FCOMFP %e,F0", +0x04, 0,0, "FSUBF %e,F0", +0x05, 0,0, "FSUBRF %e,F0", +0x06, 0,0, "FDIVF %e,F0", +0x07, 0,0, "FDIVRF %e,F0", +0x08, 0,0, "FADDD %f,F0", +0x09, 0,0, "FMULD %f,F0", +0x0a, 0,0, "FCOMD %f,F0", +0x0b, 0,0, "FCOMPD %f,F0", +0x0c, 0,0, "FSUBD %f,F0", +0x0d, 0,0, "FSUBRD %f,F0", +0x0e, 0,0, "FDIVD %f,F0", +0x0f, 0,0, "FDIVRD %f,F0", +}; +/* + * optabD9 and optabDB use the following encoding: + * if (0 <= modrm <= 2) instruction = optabDx[modrm&0x07]; + * else instruction = optabDx[(modrm&0x3f)+8]; + * + * the instructions for MOD == 3, follow the 8 instructions + * for the other MOD values stored at the front of the table. 
+ */ +static Optable optabD9[64+8] = +{ +0x00, 0,0, "FMOVF %e,F0", +0x02, 0,0, "FMOVF F0,%e", +0x03, 0,0, "FMOVFP F0,%e", +0x04, 0,0, "FLDENV%S %e", +0x05, 0,0, "FLDCW %e", +0x06, 0,0, "FSTENV%S %e", +0x07, 0,0, "FSTCW %e", +0x08, 0,0, "FMOVD F0,F0", /* Mod R/M = 11xx xxxx*/ +0x09, 0,0, "FMOVD F1,F0", +0x0a, 0,0, "FMOVD F2,F0", +0x0b, 0,0, "FMOVD F3,F0", +0x0c, 0,0, "FMOVD F4,F0", +0x0d, 0,0, "FMOVD F5,F0", +0x0e, 0,0, "FMOVD F6,F0", +0x0f, 0,0, "FMOVD F7,F0", +0x10, 0,0, "FXCHD F0,F0", +0x11, 0,0, "FXCHD F1,F0", +0x12, 0,0, "FXCHD F2,F0", +0x13, 0,0, "FXCHD F3,F0", +0x14, 0,0, "FXCHD F4,F0", +0x15, 0,0, "FXCHD F5,F0", +0x16, 0,0, "FXCHD F6,F0", +0x17, 0,0, "FXCHD F7,F0", +0x18, 0,0, "FNOP", +0x28, 0,0, "FCHS", +0x29, 0,0, "FABS", +0x2c, 0,0, "FTST", +0x2d, 0,0, "FXAM", +0x30, 0,0, "FLD1", +0x31, 0,0, "FLDL2T", +0x32, 0,0, "FLDL2E", +0x33, 0,0, "FLDPI", +0x34, 0,0, "FLDLG2", +0x35, 0,0, "FLDLN2", +0x36, 0,0, "FLDZ", +0x38, 0,0, "F2XM1", +0x39, 0,0, "FYL2X", +0x3a, 0,0, "FPTAN", +0x3b, 0,0, "FPATAN", +0x3c, 0,0, "FXTRACT", +0x3d, 0,0, "FPREM1", +0x3e, 0,0, "FDECSTP", +0x3f, 0,0, "FNCSTP", +0x40, 0,0, "FPREM", +0x41, 0,0, "FYL2XP1", +0x42, 0,0, "FSQRT", +0x43, 0,0, "FSINCOS", +0x44, 0,0, "FRNDINT", +0x45, 0,0, "FSCALE", +0x46, 0,0, "FSIN", +0x47, 0,0, "FCOS", +}; + +static Optable optabDA[8+8] = +{ +0x00, 0,0, "FADDL %e,F0", +0x01, 0,0, "FMULL %e,F0", +0x02, 0,0, "FCOML %e,F0", +0x03, 0,0, "FCOMLP %e,F0", +0x04, 0,0, "FSUBL %e,F0", +0x05, 0,0, "FSUBRL %e,F0", +0x06, 0,0, "FDIVL %e,F0", +0x07, 0,0, "FDIVRL %e,F0", +0x0d, R1,0, "FUCOMPP", +}; + +static Optable optabDB[8+64] = +{ +0x00, 0,0, "FMOVL %e,F0", +0x02, 0,0, "FMOVL F0,%e", +0x03, 0,0, "FMOVLP F0,%e", +0x05, 0,0, "FMOVX %e,F0", +0x07, 0,0, "FMOVXP F0,%e", +0x2a, 0,0, "FCLEX", +0x2b, 0,0, "FINIT", +}; + +static Optable optabDC[8+8] = +{ +0x00, 0,0, "FADDD %e,F0", +0x01, 0,0, "FMULD %e,F0", +0x02, 0,0, "FCOMD %e,F0", +0x03, 0,0, "FCOMDP %e,F0", +0x04, 0,0, "FSUBD %e,F0", +0x05, 0,0, "FSUBRD %e,F0", +0x06, 0,0, 
"FDIVD %e,F0", +0x07, 0,0, "FDIVRD %e,F0", +0x08, 0,0, "FADDD F0,%f", +0x09, 0,0, "FMULD F0,%f", +0x0c, 0,0, "FSUBRD F0,%f", +0x0d, 0,0, "FSUBD F0,%f", +0x0e, 0,0, "FDIVRD F0,%f", +0x0f, 0,0, "FDIVD F0,%f", +}; + +static Optable optabDD[8+8] = +{ +0x00, 0,0, "FMOVD %e,F0", +0x02, 0,0, "FMOVD F0,%e", +0x03, 0,0, "FMOVDP F0,%e", +0x04, 0,0, "FRSTOR%S %e", +0x06, 0,0, "FSAVE%S %e", +0x07, 0,0, "FSTSW %e", +0x08, 0,0, "FFREED %f", +0x0a, 0,0, "FMOVD %f,F0", +0x0b, 0,0, "FMOVDP %f,F0", +0x0c, 0,0, "FUCOMD %f,F0", +0x0d, 0,0, "FUCOMDP %f,F0", +}; + +static Optable optabDE[8+8] = +{ +0x00, 0,0, "FADDW %e,F0", +0x01, 0,0, "FMULW %e,F0", +0x02, 0,0, "FCOMW %e,F0", +0x03, 0,0, "FCOMWP %e,F0", +0x04, 0,0, "FSUBW %e,F0", +0x05, 0,0, "FSUBRW %e,F0", +0x06, 0,0, "FDIVW %e,F0", +0x07, 0,0, "FDIVRW %e,F0", +0x08, 0,0, "FADDDP F0,%f", +0x09, 0,0, "FMULDP F0,%f", +0x0b, R1,0, "FCOMPDP", +0x0c, 0,0, "FSUBRDP F0,%f", +0x0d, 0,0, "FSUBDP F0,%f", +0x0e, 0,0, "FDIVRDP F0,%f", +0x0f, 0,0, "FDIVDP F0,%f", +}; + +static Optable optabDF[8+8] = +{ +0x00, 0,0, "FMOVW %e,F0", +0x02, 0,0, "FMOVW F0,%e", +0x03, 0,0, "FMOVWP F0,%e", +0x04, 0,0, "FBLD %e", +0x05, 0,0, "FMOVL %e,F0", +0x06, 0,0, "FBSTP %e", +0x07, 0,0, "FMOVLP F0,%e", +0x0c, R0,0, "FSTSW %OAX", +}; + +static Optable optabF6[8] = +{ +0x00, Ib,0, "TESTB %i,%e", +0x02, 0,0, "NOTB %e", +0x03, 0,0, "NEGB %e", +0x04, 0,0, "MULB AL,%e", +0x05, 0,0, "IMULB AL,%e", +0x06, 0,0, "DIVB AL,%e", +0x07, 0,0, "IDIVB AL,%e", +}; + +static Optable optabF7[8] = +{ +0x00, Iwd,0, "TEST%S %i,%e", +0x02, 0,0, "NOT%S %e", +0x03, 0,0, "NEG%S %e", +0x04, 0,0, "MUL%S %OAX,%e", +0x05, 0,0, "IMUL%S %OAX,%e", +0x06, 0,0, "DIV%S %OAX,%e", +0x07, 0,0, "IDIV%S %OAX,%e", +}; + +static Optable optabFE[8] = +{ +0x00, 0,0, "INCB %e", +0x01, 0,0, "DECB %e", +}; + +static Optable optabFF[8] = +{ +0x00, 0,0, "INC%S %e", +0x01, 0,0, "DEC%S %e", +0x02, JUMP,0, "CALL* %e", +0x03, JUMP,0, "CALLF* %e", +0x04, JUMP,0, "JMP* %e", +0x05, JUMP,0, "JMPF* %e", +0x06, 0,0, "PUSHL 
%e", +}; + +static Optable optable[256+1] = +{ +0x00, RMB,0, "ADDB %r,%e", +0x01, RM,0, "ADD%S %r,%e", +0x02, RMB,0, "ADDB %e,%r", +0x03, RM,0, "ADD%S %e,%r", +0x04, Ib,0, "ADDB %i,AL", +0x05, Iwd,0, "ADD%S %i,%OAX", +0x06, 0,0, "PUSHL ES", +0x07, 0,0, "POPL ES", +0x08, RMB,0, "ORB %r,%e", +0x09, RM,0, "OR%S %r,%e", +0x0a, RMB,0, "ORB %e,%r", +0x0b, RM,0, "OR%S %e,%r", +0x0c, Ib,0, "ORB %i,AL", +0x0d, Iwd,0, "OR%S %i,%OAX", +0x0e, 0,0, "PUSHL CS", +0x0f, AUXMM,0, optab0F, +0x10, RMB,0, "ADCB %r,%e", +0x11, RM,0, "ADC%S %r,%e", +0x12, RMB,0, "ADCB %e,%r", +0x13, RM,0, "ADC%S %e,%r", +0x14, Ib,0, "ADCB %i,AL", +0x15, Iwd,0, "ADC%S %i,%OAX", +0x16, 0,0, "PUSHL SS", +0x17, 0,0, "POPL SS", +0x18, RMB,0, "SBBB %r,%e", +0x19, RM,0, "SBB%S %r,%e", +0x1a, RMB,0, "SBBB %e,%r", +0x1b, RM,0, "SBB%S %e,%r", +0x1c, Ib,0, "SBBB %i,AL", +0x1d, Iwd,0, "SBB%S %i,%OAX", +0x1e, 0,0, "PUSHL DS", +0x1f, 0,0, "POPL DS", +0x20, RMB,0, "ANDB %r,%e", +0x21, RM,0, "AND%S %r,%e", +0x22, RMB,0, "ANDB %e,%r", +0x23, RM,0, "AND%S %e,%r", +0x24, Ib,0, "ANDB %i,AL", +0x25, Iwd,0, "AND%S %i,%OAX", +0x26, SEG,0, "ES:", +0x27, 0,0, "DAA", +0x28, RMB,0, "SUBB %r,%e", +0x29, RM,0, "SUB%S %r,%e", +0x2a, RMB,0, "SUBB %e,%r", +0x2b, RM,0, "SUB%S %e,%r", +0x2c, Ib,0, "SUBB %i,AL", +0x2d, Iwd,0, "SUB%S %i,%OAX", +0x2e, SEG,0, "CS:", +0x2f, 0,0, "DAS", +0x30, RMB,0, "XORB %r,%e", +0x31, RM,0, "XOR%S %r,%e", +0x32, RMB,0, "XORB %e,%r", +0x33, RM,0, "XOR%S %e,%r", +0x34, Ib,0, "XORB %i,AL", +0x35, Iwd,0, "XOR%S %i,%OAX", +0x36, SEG,0, "SS:", +0x37, 0,0, "AAA", +0x38, RMB,0, "CMPB %r,%e", +0x39, RM,0, "CMP%S %r,%e", +0x3a, RMB,0, "CMPB %e,%r", +0x3b, RM,0, "CMP%S %e,%r", +0x3c, Ib,0, "CMPB %i,AL", +0x3d, Iwd,0, "CMP%S %i,%OAX", +0x3e, SEG,0, "DS:", +0x3f, 0,0, "AAS", +0x40, 0,0, "INC%S %OAX", +0x41, 0,0, "INC%S %OCX", +0x42, 0,0, "INC%S %ODX", +0x43, 0,0, "INC%S %OBX", +0x44, 0,0, "INC%S %OSP", +0x45, 0,0, "INC%S %OBP", +0x46, 0,0, "INC%S %OSI", +0x47, 0,0, "INC%S %ODI", +0x48, 0,0, "DEC%S %OAX", +0x49, 0,0, 
"DEC%S %OCX", +0x4a, 0,0, "DEC%S %ODX", +0x4b, 0,0, "DEC%S %OBX", +0x4c, 0,0, "DEC%S %OSP", +0x4d, 0,0, "DEC%S %OBP", +0x4e, 0,0, "DEC%S %OSI", +0x4f, 0,0, "DEC%S %ODI", +0x50, 0,0, "PUSH%S %OAX", +0x51, 0,0, "PUSH%S %OCX", +0x52, 0,0, "PUSH%S %ODX", +0x53, 0,0, "PUSH%S %OBX", +0x54, 0,0, "PUSH%S %OSP", +0x55, 0,0, "PUSH%S %OBP", +0x56, 0,0, "PUSH%S %OSI", +0x57, 0,0, "PUSH%S %ODI", +0x58, 0,0, "POP%S %OAX", +0x59, 0,0, "POP%S %OCX", +0x5a, 0,0, "POP%S %ODX", +0x5b, 0,0, "POP%S %OBX", +0x5c, 0,0, "POP%S %OSP", +0x5d, 0,0, "POP%S %OBP", +0x5e, 0,0, "POP%S %OSI", +0x5f, 0,0, "POP%S %ODI", +0x60, 0,0, "PUSHA%S", +0x61, 0,0, "POPA%S", +0x62, RMM,0, "BOUND %e,%r", +0x63, RM,0, "ARPL %r,%e", +0x64, SEG,0, "FS:", +0x65, SEG,0, "GS:", +0x66, OPOVER,0, "", +0x67, ADDOVER,0, "", +0x68, Iwd,0, "PUSH%S %i", +0x69, RM,Iwd, "IMUL%S %e,%i,%r", +0x6a, Ib,0, "PUSH%S %i", +0x6b, RM,Ibs, "IMUL%S %e,%i,%r", +0x6c, 0,0, "INSB DX,(%ODI)", +0x6d, 0,0, "INS%S DX,(%ODI)", +0x6e, 0,0, "OUTSB (%ASI),DX", +0x6f, 0,0, "OUTS%S (%ASI),DX", +0x70, Jbs,0, "JOS %p", +0x71, Jbs,0, "JOC %p", +0x72, Jbs,0, "JCS %p", +0x73, Jbs,0, "JCC %p", +0x74, Jbs,0, "JEQ %p", +0x75, Jbs,0, "JNE %p", +0x76, Jbs,0, "JLS %p", +0x77, Jbs,0, "JHI %p", +0x78, Jbs,0, "JMI %p", +0x79, Jbs,0, "JPL %p", +0x7a, Jbs,0, "JPS %p", +0x7b, Jbs,0, "JPC %p", +0x7c, Jbs,0, "JLT %p", +0x7d, Jbs,0, "JGE %p", +0x7e, Jbs,0, "JLE %p", +0x7f, Jbs,0, "JGT %p", +0x80, RMOPB,0, optab80, +0x81, RMOP,0, optab81, +0x83, RMOP,0, optab83, +0x84, RMB,0, "TESTB %r,%e", +0x85, RM,0, "TEST%S %r,%e", +0x86, RMB,0, "XCHGB %r,%e", +0x87, RM,0, "XCHG%S %r,%e", +0x88, RMB,0, "MOVB %r,%e", +0x89, RM,0, "MOV%S %r,%e", +0x8a, RMB,0, "MOVB %e,%r", +0x8b, RM,0, "MOV%S %e,%r", +0x8c, RM,0, "MOVW %g,%e", +0x8d, RM,0, "LEA%S %e,%r", +0x8e, RM,0, "MOVW %e,%g", +0x8f, RM,0, "POP%S %e", +0x90, 0,0, "NOP", +0x91, 0,0, "XCHG %OCX,%OAX", +0x92, 0,0, "XCHG %ODX,%OAX", +0x93, 0,0, "XCHG %OBX,%OAX", +0x94, 0,0, "XCHG %OSP,%OAX", +0x95, 0,0, "XCHG %OBP,%OAX", +0x96, 0,0, 
"XCHG %OSI,%OAX", +0x97, 0,0, "XCHG %ODI,%OAX", +0x98, 0,0, "%W", /* miserable CBW or CWDE */ +0x99, 0,0, "%w", /* idiotic CWD or CDQ */ +0x9a, PTR,0, "CALL%S %d", +0x9b, 0,0, "WAIT", +0x9c, 0,0, "PUSHF", +0x9d, 0,0, "POPF", +0x9e, 0,0, "SAHF", +0x9f, 0,0, "LAHF", +0xa0, Awd,0, "MOVB %i,AL", +0xa1, Awd,0, "MOV%S %i,%OAX", +0xa2, Awd,0, "MOVB AL,%i", +0xa3, Awd,0, "MOV%S %OAX,%i", +0xa4, 0,0, "MOVSB (%ASI),(%ADI)", +0xa5, 0,0, "MOVS%S (%ASI),(%ADI)", +0xa6, 0,0, "CMPSB (%ASI),(%ADI)", +0xa7, 0,0, "CMPS%S (%ASI),(%ADI)", +0xa8, Ib,0, "TESTB %i,AL", +0xa9, Iwd,0, "TEST%S %i,%OAX", +0xaa, 0,0, "STOSB AL,(%ADI)", +0xab, 0,0, "STOS%S %OAX,(%ADI)", +0xac, 0,0, "LODSB (%ASI),AL", +0xad, 0,0, "LODS%S (%ASI),%OAX", +0xae, 0,0, "SCASB (%ADI),AL", +0xaf, 0,0, "SCAS%S (%ADI),%OAX", +0xb0, Ib,0, "MOVB %i,AL", +0xb1, Ib,0, "MOVB %i,CL", +0xb2, Ib,0, "MOVB %i,DL", +0xb3, Ib,0, "MOVB %i,BL", +0xb4, Ib,0, "MOVB %i,AH", +0xb5, Ib,0, "MOVB %i,CH", +0xb6, Ib,0, "MOVB %i,DH", +0xb7, Ib,0, "MOVB %i,BH", +0xb8, Iwdq,0, "MOV%S %i,%OAX", +0xb9, Iwdq,0, "MOV%S %i,%OCX", +0xba, Iwdq,0, "MOV%S %i,%ODX", +0xbb, Iwdq,0, "MOV%S %i,%OBX", +0xbc, Iwdq,0, "MOV%S %i,%OSP", +0xbd, Iwdq,0, "MOV%S %i,%OBP", +0xbe, Iwdq,0, "MOV%S %i,%OSI", +0xbf, Iwdq,0, "MOV%S %i,%ODI", +0xc0, RMOPB,0, optabC0, +0xc1, RMOP,0, optabC1, +0xc2, Iw,0, "RET %i", +0xc3, RET,0, "RET", +0xc4, RM,0, "LES %e,%r", +0xc5, RM,0, "LDS %e,%r", +0xc6, RMB,Ib, "MOVB %i,%e", +0xc7, RM,Iwd, "MOV%S %i,%e", +0xc8, Iw2,Ib, "ENTER %i,%I", /* loony ENTER */ +0xc9, RET,0, "LEAVE", /* bizarre LEAVE */ +0xca, Iw,0, "RETF %i", +0xcb, RET,0, "RETF", +0xcc, 0,0, "INT 3", +0xcd, Ib,0, "INTB %i", +0xce, 0,0, "INTO", +0xcf, 0,0, "IRET", +0xd0, RMOPB,0, optabD0, +0xd1, RMOP,0, optabD1, +0xd2, RMOPB,0, optabD2, +0xd3, RMOP,0, optabD3, +0xd4, OA,0, "AAM", +0xd5, OA,0, "AAD", +0xd7, 0,0, "XLAT", +0xd8, FRMOP,0, optabD8, +0xd9, FRMEX,0, optabD9, +0xda, FRMOP,0, optabDA, +0xdb, FRMEX,0, optabDB, +0xdc, FRMOP,0, optabDC, +0xdd, FRMOP,0, optabDD, +0xde, 
FRMOP,0, optabDE, +0xdf, FRMOP,0, optabDF, +0xe0, Jbs,0, "LOOPNE %p", +0xe1, Jbs,0, "LOOPE %p", +0xe2, Jbs,0, "LOOP %p", +0xe3, Jbs,0, "JCXZ %p", +0xe4, Ib,0, "INB %i,AL", +0xe5, Ib,0, "IN%S %i,%OAX", +0xe6, Ib,0, "OUTB AL,%i", +0xe7, Ib,0, "OUT%S %OAX,%i", +0xe8, Iwds,0, "CALL %p", +0xe9, Iwds,0, "JMP %p", +0xea, PTR,0, "JMP %d", +0xeb, Jbs,0, "JMP %p", +0xec, 0,0, "INB DX,AL", +0xed, 0,0, "IN%S DX,%OAX", +0xee, 0,0, "OUTB AL,DX", +0xef, 0,0, "OUT%S %OAX,DX", +0xf0, PRE,0, "LOCK", +0xf2, OPRE,0, "REPNE", +0xf3, OPRE,0, "REP", +0xf4, 0,0, "HLT", +0xf5, 0,0, "CMC", +0xf6, RMOPB,0, optabF6, +0xf7, RMOP,0, optabF7, +0xf8, 0,0, "CLC", +0xf9, 0,0, "STC", +0xfa, 0,0, "CLI", +0xfb, 0,0, "STI", +0xfc, 0,0, "CLD", +0xfd, 0,0, "STD", +0xfe, RMOPB,0, optabFE, +0xff, RMOP,0, optabFF, +0x100, RM,0, "MOVLQSX %r,%e", +}; + +static struct { + Optable *tab; + uint nel; +} optabtab[] = { + optab0F00, nelem(optab0F00), + optab0F01, nelem(optab0F01), + optab0F01F8, nelem(optab0F01F8), + optab0FAE, nelem(optab0FAE), + optab0FBA, nelem(optab0FBA), + optab0F0F, nelem(optab0F0F), + optab0FC7, nelem(optab0FC7), + optab660F71, nelem(optab660F71), + optab660F72, nelem(optab660F72), + optab660F73, nelem(optab660F73), + optab660F, nelem(optab660F), + optabF20F, nelem(optabF20F), + optabF30F, nelem(optabF30F), + optab0F, nelem(optab0F), + optab80, nelem(optab80), + optab81, nelem(optab81), + optab83, nelem(optab83), + optabC0, nelem(optabC0), + optabC1, nelem(optabC1), + optabD0, nelem(optabD0), + optabD1, nelem(optabD1), + optabD2, nelem(optabD2), + optabD3, nelem(optabD3), + optabD8, nelem(optabD8), + optabD9, nelem(optabD9), + optabDA, nelem(optabDA), + optabDB, nelem(optabDB), + optabDC, nelem(optabDC), + optabDD, nelem(optabDD), + optabDE, nelem(optabDE), + optabDF, nelem(optabDF), + optabF6, nelem(optabF6), + optabF7, nelem(optabF7), + optabFE, nelem(optabFE), + optabFF, nelem(optabFF), + optable, nelem(optable), +}; + +/* + * compensate for Microsoft's ageing compilers + */ +static void 
+ordertab(Optable *tab, int nel) +{ + int i, x; + static Optable empty; + + for(i = nel; --i >= 0;){ + x = tab[i].x; + if(x != i){ + tab[x] = tab[i]; + tab[i] = empty; + } + } +} + +static void +soptoms(void) +{ + int i; + static int reordered; /* assumes non-concurrent use */ + + if(reordered) + return; + reordered = 1; + for(i = 0; i < nelem(optabtab); i++) + ordertab(optabtab[i].tab, optabtab[i].nel); +} + +/* + * get a byte of the instruction + */ +static int +igetc(Map *map, Instr *ip, uchar *c) +{ + if(ip->n+1 > sizeof(ip->mem)){ + werrstr("instruction too long"); + return -1; + } + if (get1(map, ip->addr+ip->n, c, 1) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + ip->mem[ip->n++] = *c; + return 1; +} + +/* + * get two bytes of the instruction + */ +static int +igets(Map *map, Instr *ip, ushort *sp) +{ + uchar c; + ushort s; + + if (igetc(map, ip, &c) < 0) + return -1; + s = c; + if (igetc(map, ip, &c) < 0) + return -1; + s |= (c<<8); + *sp = s; + return 1; +} + +/* + * get 4 bytes of the instruction + */ +static int +igetl(Map *map, Instr *ip, ulong *lp) +{ + ushort s; + long l; + + if (igets(map, ip, &s) < 0) + return -1; + l = s; + if (igets(map, ip, &s) < 0) + return -1; + l |= (s<<16); + *lp = l; + return 1; +} + +/* + * get 8 bytes of the instruction + */ +static int +igetq(Map *map, Instr *ip, vlong *qp) +{ + ulong l; + uvlong q; + + if (igetl(map, ip, &l) < 0) + return -1; + q = l; + if (igetl(map, ip, &l) < 0) + return -1; + q |= ((uvlong)l<<32); + *qp = q; + return 1; +} + +static int +getdisp(Map *map, Instr *ip, int mod, int rm, int code, int pcrel) +{ + uchar c; + ushort s; + + if (mod > 2) + return 1; + if (mod == 1) { + if (igetc(map, ip, &c) < 0) + return -1; + if (c&0x80) + ip->disp = c|0xffffff00; + else + ip->disp = c&0xff; + } else if (mod == 2 || rm == code) { + if (ip->asize == 'E') { + if (igetl(map, ip, &ip->disp) < 0) + return -1; + if (mod == 0) + ip->rip = pcrel; + } else { + if (igets(map, ip, &s) < 0) + return 
-1; + if (s&0x8000) + ip->disp = s|0xffff0000; + else + ip->disp = s; + } + if (mod == 0) + ip->base = -1; + } + return 1; +} + +static int +modrm(Map *map, Instr *ip, uchar c) +{ + uchar rm, mod; + + mod = (c>>6)&3; + rm = c&7; + ip->mod = mod; + ip->base = rm; + ip->reg = (c>>3)&7; + ip->rip = 0; + if (mod == 3) /* register */ + return 1; + if (ip->asize == 0) { /* 16-bit mode */ + switch(rm) { + case 0: + ip->base = BX; ip->index = SI; + break; + case 1: + ip->base = BX; ip->index = DI; + break; + case 2: + ip->base = BP; ip->index = SI; + break; + case 3: + ip->base = BP; ip->index = DI; + break; + case 4: + ip->base = SI; + break; + case 5: + ip->base = DI; + break; + case 6: + ip->base = BP; + break; + case 7: + ip->base = BX; + break; + default: + break; + } + return getdisp(map, ip, mod, rm, 6, 0); + } + if (rm == 4) { /* scummy sib byte */ + if (igetc(map, ip, &c) < 0) + return -1; + ip->ss = (c>>6)&0x03; + ip->index = (c>>3)&0x07; + if (ip->index == 4) + ip->index = -1; + ip->base = c&0x07; + return getdisp(map, ip, mod, ip->base, 5, 0); + } + return getdisp(map, ip, mod, rm, 5, ip->amd64); +} + +static Optable * +mkinstr(Map *map, Instr *ip, uvlong pc) +{ + int i, n, norex; + uchar c; + ushort s; + Optable *op, *obase; + char buf[128]; + + soptoms(); + memset(ip, 0, sizeof(*ip)); + norex = 1; + ip->base = -1; + ip->index = -1; + if(asstype == AI8086) + ip->osize = 'W'; + else { + ip->osize = 'L'; + ip->asize = 'E'; + ip->amd64 = asstype != AI386; + norex = 0; + } + ip->addr = pc; + if (igetc(map, ip, &c) < 0) + return 0; + obase = optable; +newop: + if(ip->amd64 && !norex){ + if(c >= 0x40 && c <= 0x4f) { + ip->rex = c; + if(igetc(map, ip, &c) < 0) + return 0; + } + if(c == 0x63){ + op = &obase[0x100]; /* MOVLQSX */ + goto hack; + } + } + op = &obase[c]; +hack: + if (op->proto == 0) { +badop: + n = snprint(buf, sizeof(buf), "opcode: ??"); + for (i = 0; i < ip->n && n < sizeof(buf)-3; i++, n+=2) + _hexify(buf+n, ip->mem[i], 1); + strcpy(buf+n, "??"); + 
werrstr(buf); + return 0; + } + for(i = 0; i < 2 && op->operand[i]; i++) { + switch(op->operand[i]) { + case Ib: /* 8-bit immediate - (no sign extension)*/ + if (igetc(map, ip, &c) < 0) + return 0; + ip->imm = c&0xff; + ip->imm64 = ip->imm; + break; + case Jbs: /* 8-bit jump immediate (sign extended) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (c&0x80) + ip->imm = c|0xffffff00; + else + ip->imm = c&0xff; + ip->imm64 = (long)ip->imm; + ip->jumptype = Jbs; + break; + case Ibs: /* 8-bit immediate (sign extended) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (c&0x80) + if (ip->osize == 'L') + ip->imm = c|0xffffff00; + else + ip->imm = c|0xff00; + else + ip->imm = c&0xff; + ip->imm64 = (long)ip->imm; + break; + case Iw: /* 16-bit immediate -> imm */ + if (igets(map, ip, &s) < 0) + return 0; + ip->imm = s&0xffff; + ip->imm64 = ip->imm; + ip->jumptype = Iw; + break; + case Iw2: /* 16-bit immediate -> in imm2*/ + if (igets(map, ip, &s) < 0) + return 0; + ip->imm2 = s&0xffff; + break; + case Iwd: /* Operand-sized immediate (no sign extension unless 64 bits)*/ + if (ip->osize == 'L') { + if (igetl(map, ip, &ip->imm) < 0) + return 0; + ip->imm64 = ip->imm; + if(ip->rex&REXW && (ip->imm & (1<<31)) != 0) + ip->imm64 |= (vlong)~0 << 32; + } else { + if (igets(map, ip, &s)< 0) + return 0; + ip->imm = s&0xffff; + ip->imm64 = ip->imm; + } + break; + case Iwdq: /* Operand-sized immediate, possibly big */ + if (ip->osize == 'L') { + if (igetl(map, ip, &ip->imm) < 0) + return 0; + ip->imm64 = ip->imm; + if (ip->rex & REXW) { + ulong l; + if (igetl(map, ip, &l) < 0) + return 0; + ip->imm64 |= (uvlong)l << 32; + } + } else { + if (igets(map, ip, &s)< 0) + return 0; + ip->imm = s&0xffff; + } + break; + case Awd: /* Address-sized immediate (no sign extension)*/ + if (ip->asize == 'E') { + if (igetl(map, ip, &ip->imm) < 0) + return 0; + /* TO DO: REX */ + } else { + if (igets(map, ip, &s)< 0) + return 0; + ip->imm = s&0xffff; + } + break; + case Iwds: /* Operand-sized immediate 
(sign extended) */ + if (ip->osize == 'L') { + if (igetl(map, ip, &ip->imm) < 0) + return 0; + } else { + if (igets(map, ip, &s)< 0) + return 0; + if (s&0x8000) + ip->imm = s|0xffff0000; + else + ip->imm = s&0xffff; + } + ip->jumptype = Iwds; + break; + case OA: /* literal 0x0a byte */ + if (igetc(map, ip, &c) < 0) + return 0; + if (c != 0x0a) + goto badop; + break; + case R0: /* base register must be R0 */ + if (ip->base != 0) + goto badop; + break; + case R1: /* base register must be R1 */ + if (ip->base != 1) + goto badop; + break; + case RMB: /* R/M field with byte register (/r)*/ + if (igetc(map, ip, &c) < 0) + return 0; + if (modrm(map, ip, c) < 0) + return 0; + ip->osize = 'B'; + break; + case RM: /* R/M field with register (/r) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (modrm(map, ip, c) < 0) + return 0; + break; + case RMOPB: /* R/M field with op code (/digit) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (modrm(map, ip, c) < 0) + return 0; + c = ip->reg; /* secondary op code */ + obase = (Optable*)op->proto; + ip->osize = 'B'; + goto newop; + case RMOP: /* R/M field with op code (/digit) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (modrm(map, ip, c) < 0) + return 0; + obase = (Optable*)op->proto; + if(ip->amd64 && obase == optab0F01 && c == 0xF8) + return optab0F01F8; + c = ip->reg; + goto newop; + case FRMOP: /* FP R/M field with op code (/digit) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (modrm(map, ip, c) < 0) + return 0; + if ((c&0xc0) == 0xc0) + c = ip->reg+8; /* 16 entry table */ + else + c = ip->reg; + obase = (Optable*)op->proto; + goto newop; + case FRMEX: /* Extended FP R/M field with op code (/digit) */ + if (igetc(map, ip, &c) < 0) + return 0; + if (modrm(map, ip, c) < 0) + return 0; + if ((c&0xc0) == 0xc0) + c = (c&0x3f)+8; /* 64-entry table */ + else + c = ip->reg; + obase = (Optable*)op->proto; + goto newop; + case RMR: /* R/M register only (mod = 11) */ + if (igetc(map, ip, &c) < 0) + return 0; + if ((c&0xc0) != 
0xc0) { + werrstr("invalid R/M register: %x", c); + return 0; + } + if (modrm(map, ip, c) < 0) + return 0; + break; + case RMM: /* R/M register only (mod = 11) */ + if (igetc(map, ip, &c) < 0) + return 0; + if ((c&0xc0) == 0xc0) { + werrstr("invalid R/M memory mode: %x", c); + return 0; + } + if (modrm(map, ip, c) < 0) + return 0; + break; + case PTR: /* Seg:Displacement addr (ptr16:16 or ptr16:32) */ + if (ip->osize == 'L') { + if (igetl(map, ip, &ip->disp) < 0) + return 0; + } else { + if (igets(map, ip, &s)< 0) + return 0; + ip->disp = s&0xffff; + } + if (igets(map, ip, (ushort*)&ip->seg) < 0) + return 0; + ip->jumptype = PTR; + break; + case AUXMM: /* Multi-byte op code; prefix determines table selection */ + if (igetc(map, ip, &c) < 0) + return 0; + obase = (Optable*)op->proto; + switch (ip->opre) { + case 0x66: op = optab660F; break; + case 0xF2: op = optabF20F; break; + case 0xF3: op = optabF30F; break; + default: op = nil; break; + } + if(op != nil && op[c].proto != nil) + obase = op; + norex = 1; /* no more rex prefixes */ + /* otherwise the optab entry captures it */ + goto newop; + case AUX: /* Multi-byte op code - Auxiliary table */ + obase = (Optable*)op->proto; + if (igetc(map, ip, &c) < 0) + return 0; + goto newop; + case OPRE: /* Instr Prefix or media op */ + ip->opre = c; + /* fall through */ + case PRE: /* Instr Prefix */ + ip->prefix = (char*)op->proto; + if (igetc(map, ip, &c) < 0) + return 0; + if (ip->opre && c == 0x0F) + ip->prefix = 0; + goto newop; + case SEG: /* Segment Prefix */ + ip->segment = (char*)op->proto; + if (igetc(map, ip, &c) < 0) + return 0; + goto newop; + case OPOVER: /* Operand size override */ + ip->opre = c; + ip->osize = 'W'; + if (igetc(map, ip, &c) < 0) + return 0; + if (c == 0x0F) + ip->osize = 'L'; + else if (ip->amd64 && (c&0xF0) == 0x40) + ip->osize = 'Q'; + goto newop; + case ADDOVER: /* Address size override */ + ip->asize = 0; + if (igetc(map, ip, &c) < 0) + return 0; + goto newop; + case JUMP: /* mark 
instruction as JUMP or RET */ + case RET: + ip->jumptype = op->operand[i]; + break; + default: + werrstr("bad operand type %d", op->operand[i]); + return 0; + } + } + return op; +} + +#pragma varargck argpos bprint 2 + +static void +bprint(Instr *ip, char *fmt, ...) +{ + va_list arg; + + va_start(arg, fmt); + ip->curr = vseprint(ip->curr, ip->end, fmt, arg); + va_end(arg); +} + +/* + * if we want to call 16 bit regs AX,BX,CX,... + * and 32 bit regs EAX,EBX,ECX,... then + * change the defs of ANAME and ONAME to: + * #define ANAME(ip) ((ip->asize == 'E' ? "E" : "") + * #define ONAME(ip) ((ip)->osize == 'L' ? "E" : "") + */ +#define ANAME(ip) "" +#define ONAME(ip) "" + +static char *reg[] = { + "AX", + "CX", + "DX", + "BX", + "SP", + "BP", + "SI", + "DI", + + /* amd64 */ + "R8", + "R9", + "R10", + "R11", + "R12", + "R13", + "R14", + "R15", +}; + +static char *breg[] = { "AL", "CL", "DL", "BL", "AH", "CH", "DH", "BH" }; +static char *breg64[] = { "AL", "CL", "DL", "BL", "SPB", "BPB", "SIB", "DIB", + "R8B", "R9B", "R10B", "R11B", "R12B", "R13B", "R14B", "R15B" }; +static char *sreg[] = { "ES", "CS", "SS", "DS", "FS", "GS" }; + +static void +plocal(Instr *ip) +{ + int ret; + long offset; + Symbol s; + char *reg; + + offset = ip->disp; + if (!findsym(ip->addr, CTEXT, &s) || !findlocal(&s, FRAMENAME, &s)) { + bprint(ip, "%lux(SP)", offset); + return; + } + + if (s.value > ip->disp) { + ret = getauto(&s, s.value-ip->disp-mach->szaddr, CAUTO, &s); + reg = "(SP)"; + } else { + offset -= s.value; + ret = getauto(&s, offset, CPARAM, &s); + reg = "(FP)"; + } + if (ret) + bprint(ip, "%s+", s.name); + else + offset = ip->disp; + bprint(ip, "%lux%s", offset, reg); +} + +static int +isjmp(Instr *ip) +{ + switch(ip->jumptype){ + case Iwds: + case Jbs: + case JUMP: + return 1; + default: + return 0; + } +} + +/* + * This is too smart for its own good, but it really is nice + * to have accurate translations when debugging, and it + * helps us identify which code is different in 
binaries that + * are changed on sources. + */ +static int +issymref(Instr *ip, Symbol *s, long w, long val) +{ + Symbol next, tmp; + long isstring, size; + + if (isjmp(ip)) + return 1; + if (s->class==CTEXT && w==0) + return 1; + if (s->class==CDATA) { + /* use first bss symbol (or "end") rather than edata */ + if (s->name[0]=='e' && strcmp(s->name, "edata") == 0){ + if((s ->index >= 0 && globalsym(&tmp, s->index+1) && tmp.value==s->value) + || (s->index > 0 && globalsym(&tmp, s->index-1) && tmp.value==s->value)) + *s = tmp; + } + if (w == 0) + return 1; + for (next=*s; next.value==s->value; next=tmp) + if (!globalsym(&tmp, next.index+1)) + break; + size = next.value - s->value; + if (w >= size) + return 0; + if (w > size-w) + w = size-w; + /* huge distances are usually wrong except in .string */ + isstring = (s->name[0]=='.' && strcmp(s->name, ".string") == 0); + if (w > 8192 && !isstring) + return 0; + /* medium distances are tricky - look for constants */ + /* near powers of two */ + if ((val&(val-1)) == 0 || (val&(val+1)) == 0) + return 0; + return 1; + } + return 0; +} + +static void +immediate(Instr *ip, vlong val) +{ + Symbol s; + long w; + + if (findsym(val, CANY, &s)) { /* TO DO */ + w = val - s.value; + if (w < 0) + w = -w; + if (issymref(ip, &s, w, val)) { + if (w) + bprint(ip, "%s+%lux(SB)", s.name, w); + else + bprint(ip, "%s(SB)", s.name); + return; + } +/* + if (s.class==CDATA && globalsym(&s, s.index+1)) { + w = s.value - val; + if (w < 0) + w = -w; + if (w < 4096) { + bprint(ip, "%s-%lux(SB)", s.name, w); + return; + } + } +*/ + } + if((ip->rex & REXW) == 0) + bprint(ip, "%lux", (long)val); + else + bprint(ip, "%llux", val); +} + +/* + * print the r/m operand of the decoded instruction: a register name when + * mod == 3, otherwise an optional segment prefix followed by the memory + * operand (via plocal when base is SP in 'E' address mode, via immediate + * when there is no base register, else disp(base)), then (index*scale) + * when an index register is present. + */ +static void +pea(Instr *ip) +{ + if (ip->mod == 3) { + if (ip->osize == 'B') + /* any REX prefix selects the breg64 names; REX.B selects R8B-R15B (same rule as the %r case in prinstr) */ + bprint(ip, "%s", (ip->rex? 
breg64: breg)[ip->rex&REXB? ip->base+8: ip->base]); + else if(ip->rex & REXB) + bprint(ip, "%s%s", ANAME(ip), reg[ip->base+8]); + else + bprint(ip, "%s%s", ANAME(ip), reg[ip->base]); + return; + } + if (ip->segment) + bprint(ip, "%s", ip->segment); /* never pass a non-literal as the format */ + if (ip->asize == 'E' && ip->base == SP) + plocal(ip); + else { + if (ip->base < 0) + immediate(ip, ip->disp); + else { + bprint(ip, "%lux", ip->disp); + if(ip->rip) + bprint(ip, "(RIP)"); + bprint(ip,"(%s%s)", ANAME(ip), reg[ip->rex&REXB? ip->base+8: ip->base]); + } + } + if (ip->index >= 0) + bprint(ip,"(%s%s*%d)", ANAME(ip), reg[ip->rex&REXX? ip->index+8: ip->index], 1<<ip->ss); +} + +static void +prinstr(Instr *ip, char *fmt) +{ + vlong v; + + if (ip->prefix) + bprint(ip, "%s ", ip->prefix); + for (; *fmt && ip->curr < ip->end; fmt++) { + if (*fmt != '%'){ + *ip->curr++ = *fmt; + continue; + } + switch(*++fmt){ + case '%': + *ip->curr++ = '%'; + break; + case 'A': + bprint(ip, "%s", ANAME(ip)); + break; + case 'C': + bprint(ip, "CR%d", ip->reg); + break; + case 'D': + if (ip->reg < 4 || ip->reg == 6 || ip->reg == 7) + bprint(ip, "DR%d",ip->reg); + else + bprint(ip, "?"); + break; + case 'I': + bprint(ip, "$"); + immediate(ip, ip->imm2); + break; + case 'O': + bprint(ip,"%s", ONAME(ip)); + break; + case 'i': + bprint(ip, "$"); + v = ip->imm; + if(ip->rex & REXW) + v = ip->imm64; + immediate(ip, v); + break; + case 'R': + bprint(ip, "%s%s", ONAME(ip), reg[ip->rex&REXR? 
ip->reg+8: ip->reg]); + break; + case 'S': + if(ip->osize == 'Q' || ip->osize == 'L' && ip->rex & REXW) + bprint(ip, "Q"); + else + bprint(ip, "%c", ip->osize); + break; + case 's': + if(ip->opre == 0 || ip->opre == 0x66) + bprint(ip, "P"); + else + bprint(ip, "S"); + if(ip->opre == 0xf2 || ip->opre == 0x66) + bprint(ip, "D"); + else + bprint(ip, "S"); + break; + case 'T': + if (ip->reg == 6 || ip->reg == 7) + bprint(ip, "TR%d",ip->reg); + else + bprint(ip, "?"); + break; + case 'W': + if (ip->osize == 'Q' || ip->osize == 'L' && ip->rex & REXW) + bprint(ip, "CDQE"); + else if (ip->osize == 'L') + bprint(ip,"CWDE"); + else + bprint(ip, "CBW"); + break; + case 'd': + bprint(ip,"%ux:%lux",ip->seg,ip->disp); + break; + case 'm': + if (ip->mod == 3 && ip->osize != 'B') { + if(fmt[1] != '*'){ + if(ip->opre != 0) { + bprint(ip, "X%d", ip->rex&REXB? ip->base+8: ip->base); + break; + } + } else + fmt++; + bprint(ip, "M%d", ip->base); + break; + } + pea(ip); + break; + case 'e': + pea(ip); + break; + case 'f': + bprint(ip, "F%d", ip->base); + break; + case 'g': + if (ip->reg < 6) + bprint(ip,"%s",sreg[ip->reg]); + else + bprint(ip,"?"); + break; + case 'p': + /* + * signed immediate in the ulong ip->imm. + */ + v = (long)ip->imm; + immediate(ip, v+ip->addr+ip->n); + break; + case 'r': + if (ip->osize == 'B') + bprint(ip,"%s", (ip->rex? breg64: breg)[ip->rex&REXR? ip->reg+8: ip->reg]); + else + bprint(ip, reg[ip->rex&REXR? ip->reg+8: ip->reg]); + break; + case 'w': + if (ip->osize == 'Q' || ip->rex & REXW) + bprint(ip, "CQO"); + else if (ip->osize == 'L') + bprint(ip,"CDQ"); + else + bprint(ip, "CWD"); + break; + case 'M': + if(ip->opre != 0) + bprint(ip, "X%d", ip->rex&REXR? ip->reg+8: ip->reg); + else + bprint(ip, "M%d", ip->reg); + break; + case 'x': + if (ip->mod == 3 && ip->osize != 'B') { + bprint(ip, "X%d", ip->rex&REXB? ip->base+8: ip->base); + break; + } + pea(ip); + break; + case 'X': + bprint(ip, "X%d", ip->rex&REXR? 
ip->reg+8: ip->reg); + break; + default: + bprint(ip, "%%%c", *fmt); + break; + } + } + *ip->curr = 0; /* there's always room for 1 byte */ +} + +static int +i386inst(Map *map, uvlong pc, char modifier, char *buf, int n) +{ + Instr instr; + Optable *op; + + USED(modifier); + op = mkinstr(map, &instr, pc); + if (op == 0) { + errstr(buf, n); + return -1; + } + instr.curr = buf; + instr.end = buf+n-1; + prinstr(&instr, op->proto); + return instr.n; +} + +static int +i386das(Map *map, uvlong pc, char *buf, int n) +{ + Instr instr; + int i; + + if (mkinstr(map, &instr, pc) == 0) { + errstr(buf, n); + return -1; + } + for(i = 0; i < instr.n && n > 2; i++) { + _hexify(buf, instr.mem[i], 1); + buf += 2; + n -= 2; + } + *buf = 0; + return instr.n; +} + +static int +i386instlen(Map *map, uvlong pc) +{ + Instr i; + + if (mkinstr(map, &i, pc)) + return i.n; + return -1; +} + +static int +i386foll(Map *map, uvlong pc, Rgetter rget, uvlong *foll) +{ + Instr i; + Optable *op; + ushort s; + uvlong l, addr; + vlong v; + int n; + + op = mkinstr(map, &i, pc); + if (!op) + return -1; + + n = 0; + + switch(i.jumptype) { + case RET: /* RETURN or LEAVE */ + case Iw: /* RETURN */ + if (strcmp(op->proto, "LEAVE") == 0) { + if (geta(map, (*rget)(map, "BP"), &l) < 0) + return -1; + } else if (geta(map, (*rget)(map, mach->sp), &l) < 0) + return -1; + foll[0] = l; + return 1; + case Iwds: /* pc relative JUMP or CALL*/ + case Jbs: /* pc relative JUMP or CALL */ + v = (long)i.imm; + foll[0] = pc+v+i.n; + n = 1; + break; + case PTR: /* seg:displacement JUMP or CALL */ + foll[0] = (i.seg<<4)+i.disp; + return 1; + case JUMP: /* JUMP or CALL EA */ + + if(i.mod == 3) { + foll[0] = (*rget)(map, reg[i.rex&REXB? i.base+8: i.base]); + return 1; + } + /* calculate the effective address */ + addr = i.disp; + if (i.base >= 0) { + if (geta(map, (*rget)(map, reg[i.rex&REXB? i.base+8: i.base]), &l) < 0) + return -1; + addr += l; + } + if (i.index >= 0) { + if (geta(map, (*rget)(map, reg[i.rex&REXX? 
i.index+8: i.index]), &l) < 0) + return -1; + addr += l*(1<<i.ss); + } + /* now retrieve a seg:disp value at that address */ + if (get2(map, addr, &s) < 0) /* seg */ + return -1; + foll[0] = s<<4; + addr += 2; + if (i.asize == 'L') { + if (geta(map, addr, &l) < 0) /* disp32 */ + return -1; + foll[0] += l; + } else { /* disp16 */ + if (get2(map, addr, &s) < 0) + return -1; + foll[0] += s; + } + return 1; + default: + break; + } + if (strncmp(op->proto,"JMP", 3) == 0 || strncmp(op->proto,"CALL", 4) == 0) + return 1; + foll[n++] = pc+i.n; + return n; +} diff --git a/utils/libmach/8obj.c b/utils/libmach/8obj.c new file mode 100644 index 0000000..11e6911 --- /dev/null +++ b/utils/libmach/8obj.c @@ -0,0 +1,137 @@ +/* + * 8obj.c - identify and parse a 386 object file + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "8c/8.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char sym; + char flags; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + +int +_is8(char *t) +{ + uchar *s = (uchar*)t; + + return s[0] == (ANAME&0xff) /* aslo = ANAME */ + && s[1] == ((ANAME>>8)&0xff) + && s[2] == D_FILE /* type */ + && s[3] == 1 /* sym */ + && s[4] == '<'; /* name of file */ +} + +int +_read8(Biobuf *bp, Prog* p) +{ + int as, n, c; + Addr a; + + as = Bgetc(bp); /* as(low) */ + if(as < 0) + return 0; + c = Bgetc(bp); /* as(high) */ + if(c < 0) + return 0; + as |= ((c & 0xff) << 8); + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = leswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); /* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n) + return 0; + return 1; + } + if(as == ATEXT) + p->kind = aText; + if(as == AGLOBL) 
+ p->kind = aData; + skip(bp, 4); /* lineno(4) */ + a = addr(bp); + addr(bp); + if(!(a.flags & T_SYM)) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +static Addr +addr(Biobuf *bp) +{ + Addr a; + int t; + long off; + + off = 0; + a.sym = -1; + a.flags = Bgetc(bp); /* flags */ + if(a.flags & T_INDEX) + skip(bp, 2); + if(a.flags & T_OFFSET){ + off = Bgetc(bp); + off |= Bgetc(bp) << 8; + off |= Bgetc(bp) << 16; + off |= Bgetc(bp) << 24; + if(off < 0) + off = -off; + } + if(a.flags & T_SYM) + a.sym = Bgetc(bp); + if(a.flags & T_FCONST) + skip(bp, 8); + else + if(a.flags & T_SCONST) + skip(bp, NSNAME); + if(a.flags & T_TYPE) { + t = Bgetc(bp); + if(a.sym > 0 && (t==D_PARAM || t==D_AUTO)) + _offset(a.sym, off); + } + return a; +} + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} diff --git a/utils/libmach/9.c b/utils/libmach/9.c new file mode 100644 index 0000000..6a46a00 --- /dev/null +++ b/utils/libmach/9.c @@ -0,0 +1,120 @@ +/* + * PowerPC 64 definition + * forsyth@vitanuova.com + */ +#include <lib9.h> +#include <bio.h> +#include "ureg9.h" +#include "mach.h" + + +#define REGOFF(x) offsetof(struct Ureg, x) + +#define R31 REGOFF(r31) +#define FP_REG(x) (R31+4+8*(x)) + +#define REGSIZE sizeof(struct Ureg) +#define FPREGSIZE (8*33) + +Reglist power64reglist[] = { + {"CAUSE", REGOFF(cause), RINT|RRDONLY, 'Y'}, + {"TRAP", REGOFF(cause), RINT|RRDONLY, 'Y'}, /* alias for acid */ + {"MSR", REGOFF(msr), RINT|RRDONLY, 'Y'}, + {"PC", REGOFF(pc), RINT, 'Y'}, + {"LR", REGOFF(lr), RINT, 'Y'}, + {"CR", REGOFF(cr), RINT, 'X'}, + {"XER", REGOFF(xer), RINT, 'Y'}, + {"CTR", REGOFF(ctr), RINT, 'Y'}, + {"PC", REGOFF(pc), RINT, 'Y'}, + {"SP", REGOFF(sp), RINT, 'Y'}, + {"R0", REGOFF(r0), RINT, 'Y'}, + /* R1 is SP */ + {"R2", REGOFF(r2), RINT, 'Y'}, + {"R3", 
REGOFF(r3), RINT, 'Y'}, + {"R4", REGOFF(r4), RINT, 'Y'}, + {"R5", REGOFF(r5), RINT, 'Y'}, + {"R6", REGOFF(r6), RINT, 'Y'}, + {"R7", REGOFF(r7), RINT, 'Y'}, + {"R8", REGOFF(r8), RINT, 'Y'}, + {"R9", REGOFF(r9), RINT, 'Y'}, + {"R10", REGOFF(r10), RINT, 'Y'}, + {"R11", REGOFF(r11), RINT, 'Y'}, + {"R12", REGOFF(r12), RINT, 'Y'}, + {"R13", REGOFF(r13), RINT, 'Y'}, + {"R14", REGOFF(r14), RINT, 'Y'}, + {"R15", REGOFF(r15), RINT, 'Y'}, + {"R16", REGOFF(r16), RINT, 'Y'}, + {"R17", REGOFF(r17), RINT, 'Y'}, + {"R18", REGOFF(r18), RINT, 'Y'}, + {"R19", REGOFF(r19), RINT, 'Y'}, + {"R20", REGOFF(r20), RINT, 'Y'}, + {"R21", REGOFF(r21), RINT, 'Y'}, + {"R22", REGOFF(r22), RINT, 'Y'}, + {"R23", REGOFF(r23), RINT, 'Y'}, + {"R24", REGOFF(r24), RINT, 'Y'}, + {"R25", REGOFF(r25), RINT, 'Y'}, + {"R26", REGOFF(r26), RINT, 'Y'}, + {"R27", REGOFF(r27), RINT, 'Y'}, + {"R28", REGOFF(r28), RINT, 'Y'}, + {"R29", REGOFF(r29), RINT, 'Y'}, + {"R30", REGOFF(r30), RINT, 'Y'}, + {"R31", REGOFF(r31), RINT, 'Y'}, + {"F0", FP_REG(0), RFLT, 'F'}, + {"F1", FP_REG(1), RFLT, 'F'}, + {"F2", FP_REG(2), RFLT, 'F'}, + {"F3", FP_REG(3), RFLT, 'F'}, + {"F4", FP_REG(4), RFLT, 'F'}, + {"F5", FP_REG(5), RFLT, 'F'}, + {"F6", FP_REG(6), RFLT, 'F'}, + {"F7", FP_REG(7), RFLT, 'F'}, + {"F8", FP_REG(8), RFLT, 'F'}, + {"F9", FP_REG(9), RFLT, 'F'}, + {"F10", FP_REG(10), RFLT, 'F'}, + {"F11", FP_REG(11), RFLT, 'F'}, + {"F12", FP_REG(12), RFLT, 'F'}, + {"F13", FP_REG(13), RFLT, 'F'}, + {"F14", FP_REG(14), RFLT, 'F'}, + {"F15", FP_REG(15), RFLT, 'F'}, + {"F16", FP_REG(16), RFLT, 'F'}, + {"F17", FP_REG(17), RFLT, 'F'}, + {"F18", FP_REG(18), RFLT, 'F'}, + {"F19", FP_REG(19), RFLT, 'F'}, + {"F20", FP_REG(20), RFLT, 'F'}, + {"F21", FP_REG(21), RFLT, 'F'}, + {"F22", FP_REG(22), RFLT, 'F'}, + {"F23", FP_REG(23), RFLT, 'F'}, + {"F24", FP_REG(24), RFLT, 'F'}, + {"F25", FP_REG(25), RFLT, 'F'}, + {"F26", FP_REG(26), RFLT, 'F'}, + {"F27", FP_REG(27), RFLT, 'F'}, + {"F28", FP_REG(28), RFLT, 'F'}, + {"F29", FP_REG(29), RFLT, 'F'}, + 
{"F30", FP_REG(30), RFLT, 'F'}, + {"F31", FP_REG(31), RFLT, 'F'}, + {"FPSCR", FP_REG(32)+4, RFLT, 'X'}, + { 0 } +}; + + /* the machine description */ +Mach mpower64 = +{ + "power64", + MPOWER64, /* machine type */ + power64reglist, /* register set */ + REGSIZE, /* number of bytes in register set */ + FPREGSIZE, /* number of bytes in FP register set */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "LR", /* name of link register */ + "setSB", /* static base register name */ + 0, /* value */ + 0x1000, /* page size */ + 0x80000000U, /* kernel base */ + 0, /* kernel text mask */ + 0x7FFFFFFFU, /* user stack top */ + 4, /* quantization of pc */ + 8, /* szaddr */ + 8, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git a/utils/libmach/9obj.c b/utils/libmach/9obj.c new file mode 100644 index 0000000..4ec76b9 --- /dev/null +++ b/utils/libmach/9obj.c @@ -0,0 +1,155 @@ +/* + * 9obj.c - identify and parse a PowerPC-64 object file + * forsyth@terzarima.net + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "9c/9.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char type; + char sym; + char name; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + +int +_is9(char *s) +{ + return (s[0]&0377) == ANAME /* ANAME */ + && (s[1]&0377) == ANAME>>8 + && s[2] == D_FILE /* type */ + && s[3] == 1 /* sym */ + && s[4] == '<'; /* name of file */ +} + +int +_read9(Biobuf *bp, Prog *p) +{ + int as, n, c; + Addr a; + + as = Bgetc(bp); /* as(low) */ + if(as < 0) + return 0; + c = Bgetc(bp); /* as(high) */ + if(c < 0) + return 0; + as |= ((c & 0xff) << 8); + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = beswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); /* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + 
p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n){ + free(p->id); /* short read: release the name buffer instead of leaking it */ + p->id = 0; + return 0; + } + return 1; + } + if(as == ATEXT) + p->kind = aText; + else if(as == AGLOBL) + p->kind = aData; + n = Bgetc(bp); /* reg and flag */ + skip(bp, 4); /* lineno(4) */ + a = addr(bp); + if(n & 0x40) + addr(bp); + addr(bp); + if(a.type != D_OREG || a.name != D_STATIC && a.name != D_EXTERN) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +/* + * read one operand from the object stream; for D_PARAM/D_AUTO names + * the magnitude of the offset is handed to _offset() + */ +static Addr +addr(Biobuf *bp) +{ + Addr a; + vlong off; + long l; + + a.type = Bgetc(bp); /* a.type */ + skip(bp,1); /* reg */ + a.sym = Bgetc(bp); /* sym index */ + a.name = Bgetc(bp); /* sym type */ + switch(a.type){ + default: + case D_NONE: case D_REG: case D_FREG: case D_CREG: + case D_FPSCR: case D_MSR: + break; + case D_SPR: + case D_OREG: + case D_CONST: + case D_BRANCH: + case D_DCONST: + case D_DCR: + l = Bgetc(bp); + l |= Bgetc(bp) << 8; + l |= Bgetc(bp) << 16; + l |= Bgetc(bp) << 24; + off = l; + if(a.type == D_DCONST){ + l = Bgetc(bp); + l |= Bgetc(bp) << 8; + l |= Bgetc(bp) << 16; + l |= Bgetc(bp) << 24; + off = ((vlong)l << 32) | (off & 0xFFFFFFFF); + a.type = D_CONST; /* perhaps */ + } + if(off < 0) + off = -off; + if(a.sym && (a.name==D_PARAM || a.name==D_AUTO)) + _offset(a.sym, off); + break; + case D_SCONST: + skip(bp, NSNAME); + break; + case D_FCONST: + skip(bp, 8); + break; + } + return a; +} + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +/* discard the next n bytes of the stream */ +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} diff --git a/utils/libmach/NOTICE b/utils/libmach/NOTICE new file mode 100644 index 0000000..c708cf0 --- /dev/null +++ b/utils/libmach/NOTICE @@ -0,0 +1,31 @@ +This copyright NOTICE applies to all files in this directory and +subdirectories, unless another copyright notice appears in a given +file or subdirectory. 
If you take substantial code from this software to use in +other programs, you must somehow include with it an appropriate +copyright notice that includes the copyright notice and the other +notices below. It is fine (and often tidier) to do that in a separate +file such as NOTICE, LICENCE or COPYING. + + Copyright © 1994-1999 Lucent Technologies Inc. + Power PC support Copyright © 1995-2004 C H Forsyth (forsyth@terzarima.net). + Portions Copyright © 1997-1999 Vita Nuova Limited. + Portions Copyright © 2000-2007 Vita Nuova Holdings Limited (www.vitanuova.com). + Revisions Copyright © 2000-2004 Lucent Technologies Inc. and others. + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in +all copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN +THE SOFTWARE. 
diff --git a/utils/libmach/access.c b/utils/libmach/access.c new file mode 100644 index 0000000..e054839 --- /dev/null +++ b/utils/libmach/access.c @@ -0,0 +1,275 @@ +/* + * functions to read and write an executable or file image + */ + +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +static int mget(Map*, uvlong, void*, int); +static int mput(Map*, uvlong, void*, int); +static struct segment* reloc(Map*, uvlong, vlong*); + +/* + * routines to get/put various types + */ +int +geta(Map *map, uvlong addr, uvlong *x) +{ + ulong l; + uvlong vl; + + if (mach->szaddr == 8){ + if (get8(map, addr, &vl) < 0) + return -1; + *x = vl; + return 1; + } + + if (get4(map, addr, &l) < 0) + return -1; + *x = l; + + return 1; +} + +int +get8(Map *map, uvlong addr, uvlong *x) +{ + if (!map) { + werrstr("get8: invalid map"); + return -1; + } + + if (map->nsegs == 1 && map->seg[0].fd < 0) { + *x = addr; + return 1; + } + if (mget(map, addr, x, 8) < 0) + return -1; + *x = machdata->swav(*x); + return 1; +} + +int +get4(Map *map, uvlong addr, ulong *x) +{ + if (!map) { + werrstr("get4: invalid map"); + return -1; + } + + if (map->nsegs == 1 && map->seg[0].fd < 0) { + *x = addr; + return 1; + } + if (mget(map, addr, x, 4) < 0) + return -1; + *x = machdata->swal(*x); + return 1; +} + +int +get2(Map *map, uvlong addr, ushort *x) +{ + if (!map) { + werrstr("get2: invalid map"); + return -1; + } + + if (map->nsegs == 1 && map->seg[0].fd < 0) { + *x = addr; + return 1; + } + if (mget(map, addr, x, 2) < 0) + return -1; + *x = machdata->swab(*x); + return 1; +} + +int +get1(Map *map, uvlong addr, uchar *x, int size) +{ + uchar *cp; + + if (!map) { + werrstr("get1: invalid map"); + return -1; + } + + if (map->nsegs == 1 && map->seg[0].fd < 0) { + cp = (uchar*)&addr; + while (cp < (uchar*)(&addr+1) && size-- > 0) + *x++ = *cp++; + while (size-- > 0) + *x++ = 0; + } else + return mget(map, addr, x, size); + return 1; +} + +int +puta(Map *map, uvlong addr, uvlong v) +{ + if (mach->szaddr == 
8) + return put8(map, addr, v); + + return put4(map, addr, v); +} + +int +put8(Map *map, uvlong addr, uvlong v) +{ + if (!map) { + werrstr("put8: invalid map"); + return -1; + } + v = machdata->swav(v); + return mput(map, addr, &v, 8); +} + +int +put4(Map *map, uvlong addr, ulong v) +{ + if (!map) { + werrstr("put4: invalid map"); + return -1; + } + v = machdata->swal(v); + return mput(map, addr, &v, 4); +} + +int +put2(Map *map, uvlong addr, ushort v) +{ + if (!map) { + werrstr("put2: invalid map"); + return -1; + } + v = machdata->swab(v); + return mput(map, addr, &v, 2); +} + +int +put1(Map *map, uvlong addr, uchar *v, int size) +{ + if (!map) { + werrstr("put1: invalid map"); + return -1; + } + return mput(map, addr, v, size); +} + +static int +spread(struct segment *s, void *buf, int n, uvlong off) +{ + uvlong base; + + static struct { + struct segment *s; + char a[8192]; + uvlong off; + } cache; + + if(s->cache){ + base = off&~(sizeof cache.a-1); + if(cache.s != s || cache.off != base){ + cache.off = ~0; + if(seek(s->fd, base, 0) >= 0 + && readn(s->fd, cache.a, sizeof cache.a) == sizeof cache.a){ + cache.s = s; + cache.off = base; + } + } + if(cache.s == s && cache.off == base){ + off &= sizeof cache.a-1; + if(off+n > sizeof cache.a) + n = sizeof cache.a - off; + memmove(buf, cache.a+off, n); + return n; + } + } + + return pread(s->fd, buf, n, off); +} + +static int +mget(Map *map, uvlong addr, void *buf, int size) +{ + uvlong off; + int i, j, k; + struct segment *s; + + s = reloc(map, addr, (vlong*)&off); + if (!s) + return -1; + if (s->fd < 0) { + werrstr("unreadable map"); + return -1; + } + if (s->mget) + return s->mget(s, addr, off, buf, size); + for (i = j = 0; i < 2; i++) { /* in case read crosses page */ + k = spread(s, (void*)((uchar *)buf+j), size-j, off+j); + if (k < 0) { + werrstr("can't read address %llux: %r", addr); + return -1; + } + j += k; + if (j == size) + return j; + } + werrstr("partial read at address %llux (size %d j %d)", addr, size, 
j); + return -1; +} + +/* + * write size bytes from buf at the file offset that addr maps to; + * returns size on success, -1 with errstr set on failure + */ +static int +mput(Map *map, uvlong addr, void *buf, int size) +{ + vlong off; + int i, j, k; + struct segment *s; + + s = reloc(map, addr, &off); + if (!s) + return -1; + if (s->fd < 0) { + werrstr("unwritable map"); + return -1; + } + if (s->mput) + return s->mput(s, addr, off, buf, size); + + seek(s->fd, off, 0); + for (i = j = 0; i < 2; i++) { /* in case write crosses page */ + /* resume after the j bytes already written, as mget does for reads */ + k = write(s->fd, (uchar*)buf+j, size-j); + if (k < 0) { + werrstr("can't write address %llux: %r", addr); + return -1; + } + j += k; + if (j == size) + return j; + } + werrstr("partial write at address %llux", addr); + return -1; +} + +/* + * convert address to file offset; returns nonzero if ok + */ +static struct segment* +reloc(Map *map, uvlong addr, vlong *offp) +{ + int i; + + for (i = 0; i < map->nsegs; i++) { + if (map->seg[i].inuse) + if (map->seg[i].b <= addr && addr < map->seg[i].e) { + *offp = addr + map->seg[i].f - map->seg[i].b; + return &map->seg[i]; + } + } + werrstr("can't translate address %llux", addr); + return 0; +} diff --git a/utils/libmach/bootexec.h b/utils/libmach/bootexec.h new file mode 100644 index 0000000..b401d39 --- /dev/null +++ b/utils/libmach/bootexec.h @@ -0,0 +1,136 @@ +struct coffsect +{ + char name[8]; + ulong phys; + ulong virt; + ulong size; + ulong fptr; + ulong fptrreloc; + ulong fptrlineno; + ulong nrelocnlineno; + ulong flags; +}; + +/* + * proprietary exec headers, needed to bootstrap various machines + */ +struct mipsexec +{ + short mmagic; /* (0x160) mips magic number */ + short nscns; /* (unused) number of sections */ + long timdat; /* (unused) time & date stamp */ + long symptr; /* offset to symbol table */ + long nsyms; /* size of symbol table */ + short opthdr; /* (0x38) sizeof(optional hdr) */ + short pcszs; /* flags */ + short amagic; /* see above */ + short vstamp; /* version stamp */ + long tsize; /* text size in bytes */ + long dsize; /* initialized data */ + long bsize; /* uninitialized data */ + long mentry; /* entry pt. 
*/ + long text_start; /* base of text used for this file */ + long data_start; /* base of data used for this file */ + long bss_start; /* base of bss used for this file */ + long gprmask; /* general purpose register mask */ + long cprmask[4]; /* co-processor register masks */ + long gp_value; /* the gp value used for this object */ +}; +#define pcsize cprmask[0] + +struct mips4kexec +{ + struct mipsexec h; + struct coffsect itexts; + struct coffsect idatas; + struct coffsect ibsss; +}; + +struct sparcexec +{ + short sjunk; /* dynamic bit and version number */ + short smagic; /* 0407 */ + ulong stext; + ulong sdata; + ulong sbss; + ulong ssyms; + ulong sentry; + ulong strsize; + ulong sdrsize; +}; + +struct nextexec +{ + struct nexthdr{ + ulong nmagic; + ulong ncputype; + ulong ncpusubtype; + ulong nfiletype; + ulong ncmds; + ulong nsizeofcmds; + ulong nflags; + }texth; + + struct nextcmd{ + ulong cmd; + ulong cmdsize; + uchar segname[16]; + ulong vmaddr; + ulong vmsize; + ulong fileoff; + ulong filesize; + ulong maxprot; + ulong initprot; + ulong nsects; + ulong flags; + }textc; + struct nextsect{ + char sectname[16]; + char segname[16]; + ulong addr; + ulong size; + ulong offset; + ulong align; + ulong reloff; + ulong nreloc; + ulong flags; + ulong reserved1; + ulong reserved2; + }texts; + struct nextcmd datac; + struct nextsect datas; + struct nextsect bsss; + struct nextsym{ + ulong cmd; + ulong cmdsize; + ulong symoff; + ulong nsyms; + ulong spoff; + ulong pcoff; + }symc; +}; + +struct i386exec +{ + struct i386coff{ + ulong isectmagic; + ulong itime; + ulong isyms; + ulong insyms; + ulong iflags; + } icoff; + struct i386hdr{ + ulong imagic; + ulong itextsize; + ulong idatasize; + ulong ibsssize; + ulong ientry; + ulong itextstart; + ulong idatastart; + } ihdr; + struct coffsect itexts; + struct coffsect idatas; + struct coffsect ibsss; + struct coffsect icomments; +}; + diff --git a/utils/libmach/elf.h b/utils/libmach/elf.h new file mode 100644 index 
0000000..6bd483d --- /dev/null +++ b/utils/libmach/elf.h @@ -0,0 +1,114 @@ +/* + * Definitions needed for accessing Irix ELF headers + */ +typedef struct { + uchar ident[16]; /* ident bytes */ + ushort type; /* file type */ + ushort machine; /* target machine */ + int version; /* file version */ + ulong elfentry; /* start address */ + ulong phoff; /* phdr file offset */ + ulong shoff; /* shdr file offset */ + int flags; /* file flags */ + ushort ehsize; /* sizeof ehdr */ + ushort phentsize; /* sizeof phdr */ + ushort phnum; /* number phdrs */ + ushort shentsize; /* sizeof shdr */ + ushort shnum; /* number shdrs */ + ushort shstrndx; /* shdr string index */ +} Ehdr; + +typedef struct { + int type; /* entry type */ + ulong offset; /* file offset */ + ulong vaddr; /* virtual address */ + ulong paddr; /* physical address */ + int filesz; /* file size */ + ulong memsz; /* memory size */ + int flags; /* entry flags */ + int align; /* memory/file alignment */ +} Phdr; + +typedef struct { + ulong name; /* section name */ + ulong type; /* SHT_... */ + ulong flags; /* SHF_... 
*/ + ulong addr; /* virtual address */ + ulong offset; /* file offset */ + ulong size; /* section size */ + ulong link; /* misc info */ + ulong info; /* misc info */ + ulong addralign; /* memory alignment */ + ulong entsize; /* entry size if table */ +} Shdr; + +enum { + /* Ehdr codes */ + MAG0 = 0, /* ident[] indexes */ + MAG1 = 1, + MAG2 = 2, + MAG3 = 3, + CLASS = 4, + DATA = 5, + VERSION = 6, + + ELFCLASSNONE = 0, /* ident[CLASS] */ + ELFCLASS32 = 1, + ELFCLASS64 = 2, + ELFCLASSNUM = 3, + + ELFDATANONE = 0, /* ident[DATA] */ + ELFDATA2LSB = 1, + ELFDATA2MSB = 2, + ELFDATANUM = 3, + + NOETYPE = 0, /* type */ + REL = 1, + EXEC = 2, + DYN = 3, + CORE = 4, + + NONE = 0, /* machine */ + M32 = 1, /* AT&T WE 32100 */ + SPARC = 2, /* Sun SPARC */ + I386 = 3, /* Intel 80386 */ + M68K = 4, /* Motorola 68000 */ + M88K = 5, /* Motorola 88000 */ + I486 = 6, /* Intel 80486 */ + I860 = 7, /* Intel i860 */ + MIPS = 8, /* Mips R2000 */ + S370 = 9, /* Amdahl */ + SPARC64 = 18, /* Sun SPARC v9 */ + POWER = 20, /* PowerPC */ + POWER64 = 21, /* PowerPC64 */ + ARM = 40, /* ARM */ + AMD64 = 62, /* Amd64 */ + ARM64 = 183, /* ARM64 */ + + NO_VERSION = 0, /* version, ident[VERSION] */ + CURRENT = 1, + + /* Phdr Codes */ + NOPTYPE = 0, /* type */ + LOAD = 1, + DYNAMIC = 2, + INTERP = 3, + NOTE = 4, + SHLIB = 5, + PHDR = 6, + + R = 0x4, /* flags */ + W = 0x2, + X = 0x1, + + /* Shdr Codes */ + Progbits = 1, /* section types */ + Strtab = 3, + Nobits = 8, + + Swrite = 1, /* section attributes */ + Salloc = 2, + Sexec = 4, +}; + +#define ELF_MAG ((0x7f<<24) | ('E'<<16) | ('L'<<8) | 'F') diff --git a/utils/libmach/executable.c b/utils/libmach/executable.c new file mode 100644 index 0000000..b9954f0 --- /dev/null +++ b/utils/libmach/executable.c @@ -0,0 +1,713 @@ +#include <lib9.h> +#include <bio.h> +#include "bootexec.h" +#include "mach.h" +#include "elf.h" + +/* + * All a.out header types. 
The dummy entry allows canonical + * processing of the union as a sequence of longs + */ + +typedef struct { + union{ + Exec exec; + struct { + u32int ohdr[8]; /* Exec */ + uvlong hdr[1]; + } exechdr64; + Ehdr elfhdr32; /* elf.h */ + struct mipsexec mips; /* bootexec.h */ + struct mips4kexec mips4k; /* bootexec.h */ + struct sparcexec sparc; /* bootexec.h */ + struct nextexec next; /* bootexec.h */ + } e; + u32int dummy; /* padding to ensure extra u32int */ +} ExecHdr; + +static int nextboot(int, Fhdr*, ExecHdr*); +static int sparcboot(int, Fhdr*, ExecHdr*); +static int mipsboot(int, Fhdr*, ExecHdr*); +static int mips4kboot(int, Fhdr*, ExecHdr*); +static int common(int, Fhdr*, ExecHdr*); +static int commonllp64(int, Fhdr*, ExecHdr*); +static int adotout(int, Fhdr*, ExecHdr*); +static int elfdotout(int, Fhdr*, ExecHdr*); +static int armdotout(int, Fhdr*, ExecHdr*); +static void setsym(Fhdr*, long, long, long, vlong); +static void setdata(Fhdr*, uvlong, long, vlong, long); +static void settext(Fhdr*, uvlong, uvlong, long, vlong); +static void hswal(void*, int, ulong(*)(ulong)); +static uvlong _round(uvlong, ulong); + +/* + * definition of per-executable file type structures + */ + +typedef struct Exectable{ + long magic; /* big-endian magic number of file */ + char *name; /* executable identifier */ + char *dlmname; /* dynamically loadable module identifier */ + uchar type; /* Internal code */ + uchar _magic; /* _MAGIC() magic */ + Mach *mach; /* Per-machine data */ + long hsize; /* header size */ + ulong (*swal)(ulong); /* beswal or leswal */ + int (*hparse)(int, Fhdr*, ExecHdr*); +} ExecTable; + +extern Mach mmips; +extern Mach mmips2le; +extern Mach mmips2be; +extern Mach msparc; +extern Mach mi386; +extern Mach mamd64; +extern Mach marm; +extern Mach mpower; +extern Mach mpower64; + +ExecTable exectab[] = +{ + { V_MAGIC, /* Mips v.out */ + "mips plan 9 executable BE", + "mips plan 9 dlm BE", + FMIPS, + 1, + &mmips, + sizeof(Exec), + beswal, + adotout }, + { 
P_MAGIC, /* Mips 0.out (r3k le) */ + "mips plan 9 executable LE", + "mips plan 9 dlm LE", + FMIPSLE, + 1, + &mmips, + sizeof(Exec), + beswal, + adotout }, + { M_MAGIC, /* Mips 4.out */ + "mips 4k plan 9 executable BE", + "mips 4k plan 9 dlm BE", + FMIPS2BE, + 1, + &mmips2be, + sizeof(Exec), + beswal, + adotout }, + { N_MAGIC, /* Mips 0.out */ + "mips 4k plan 9 executable LE", + "mips 4k plan 9 dlm LE", + FMIPS2LE, + 1, + &mmips2le, + sizeof(Exec), + beswal, + adotout }, + { 0x160<<16, /* Mips boot image */ + "mips plan 9 boot image", + nil, + FMIPSB, + 0, + &mmips, + sizeof(struct mipsexec), + beswal, + mipsboot }, + { (0x160<<16)|3, /* Mips boot image */ + "mips 4k plan 9 boot image", + nil, + FMIPSB, + 0, + &mmips2be, + sizeof(struct mips4kexec), + beswal, + mips4kboot }, + { K_MAGIC, /* Sparc k.out */ + "sparc plan 9 executable", + "sparc plan 9 dlm", + FSPARC, + 1, + &msparc, + sizeof(Exec), + beswal, + adotout }, + { 0x01030107, /* Sparc boot image */ + "sparc plan 9 boot image", + nil, + FSPARCB, + 0, + &msparc, + sizeof(struct sparcexec), + beswal, + sparcboot }, + { I_MAGIC, /* I386 8.out & boot image */ + "386 plan 9 executable", + "386 plan 9 dlm", + FI386, + 1, + &mi386, + sizeof(Exec), + beswal, + common }, + { S_MAGIC, /* amd64 6.out & boot image */ + "amd64 plan 9 executable", + "amd64 plan 9 dlm", + FAMD64, + 1, + &mamd64, + sizeof(Exec)+8, + nil, + commonllp64 }, + { Q_MAGIC, /* PowerPC q.out & boot image */ + "power plan 9 executable", + "power plan 9 dlm", + FPOWER, + 1, + &mpower, + sizeof(Exec), + beswal, + common }, + { T_MAGIC, /* power64 9.out & boot image */ + "power64 plan 9 executable", + "power64 plan 9 dlm", + FPOWER64, + 1, + &mpower64, + sizeof(Exec)+8, + nil, + commonllp64 }, + { ELF_MAG, /* any elf32 */ + "elf executable", + nil, + FNONE, + 0, + &mi386, + sizeof(Ehdr), + nil, + elfdotout }, + { E_MAGIC, /* Arm 5.out and boot image */ + "arm plan 9 executable", + "arm plan 9 dlm", + FARM, + 1, + &marm, + sizeof(Exec), + beswal, + 
common }, + { (143<<16)|0413, /* (Free|Net)BSD Arm */ + "arm *bsd executable", + nil, + FARM, + 0, + &marm, + sizeof(Exec), + leswal, + armdotout }, + { 0 }, +}; + +Mach *mach = &mi386; /* Global current machine table */ + +static ExecTable* +couldbe4k(ExecTable *mp) +{ + Dir *d; + ExecTable *f; + + if((d=dirstat("/proc/1/regs")) == nil) + return mp; + if(d->length < 32*8){ /* R3000 */ + free(d); + return mp; + } + free(d); + for (f = exectab; f->magic; f++) + if(f->magic == M_MAGIC) { + f->name = "mips plan 9 executable on mips2 kernel"; + return f; + } + return mp; +} + +int +crackhdr(int fd, Fhdr *fp) +{ + ExecTable *mp; + ExecHdr d; + int nb, ret; + ulong magic; + + fp->type = FNONE; + nb = read(fd, (char *)&d.e, sizeof(d.e)); + if (nb <= 0) + return 0; + + ret = 0; + magic = beswal(d.e.exec.magic); /* big-endian */ + for (mp = exectab; mp->magic; mp++) { + if (nb < mp->hsize) + continue; + + /* + * The.exec.magic number has morphed into something + * with fields (the straw was DYN_MAGIC) so now + * a flag is needed in Fhdr to distinguish _MAGIC() + * magic numbers from foreign magic numbers. + * + * This code is creaking a bit and if it has to + * be modified/extended much more it's probably + * time to step back and redo it all. 
+ */ + if(mp->_magic){ + if(mp->magic != (magic & ~DYN_MAGIC)) + continue; + + if(mp->magic == V_MAGIC) + mp = couldbe4k(mp); + + if ((magic & DYN_MAGIC) && mp->dlmname != nil) + fp->name = mp->dlmname; + else + fp->name = mp->name; + } + else{ + if(mp->magic != magic) + continue; + fp->name = mp->name; + } + fp->type = mp->type; + fp->hdrsz = mp->hsize; /* will be zero on bootables */ + fp->_magic = mp->_magic; + fp->magic = magic; + + mach = mp->mach; + if(mp->swal != nil) + hswal(&d, sizeof(d.e)/sizeof(ulong), mp->swal); + ret = mp->hparse(fd, fp, &d); + seek(fd, mp->hsize, 0); /* seek to end of header */ + break; + } + if(mp->magic == 0) + werrstr("unknown header type"); + return ret; +} + +/* + * Convert header to canonical form + */ +static void +hswal(void *v, int n, ulong (*swap)(ulong)) +{ + ulong *ulp; + + for(ulp = v; n--; ulp++) + *ulp = (*swap)(*ulp); +} + +/* + * Crack a normal a.out-type header + */ +static int +adotout(int fd, Fhdr *fp, ExecHdr *hp) +{ + long pgsize; + + USED(fd); + pgsize = mach->pgsize; + settext(fp, hp->e.exec.entry, pgsize+sizeof(Exec), + hp->e.exec.text, sizeof(Exec)); + setdata(fp, _round(pgsize+fp->txtsz+sizeof(Exec), pgsize), + hp->e.exec.data, fp->txtsz+sizeof(Exec), hp->e.exec.bss); + setsym(fp, hp->e.exec.syms, hp->e.exec.spsz, hp->e.exec.pcsz, fp->datoff+fp->datsz); + return 1; +} + +static void +commonboot(Fhdr *fp) +{ + if (!(fp->entry & mach->ktmask)) + return; + + switch(fp->type) { /* boot image */ + case F68020: + fp->type = F68020B; + fp->name = "68020 plan 9 boot image"; + break; + case FI386: + fp->type = FI386B; + fp->txtaddr = (u32int)fp->entry; + fp->name = "386 plan 9 boot image"; + fp->dataddr = _round(fp->txtaddr+fp->txtsz, mach->pgsize); + break; + case FARM: + fp->type = FARMB; + fp->txtaddr = (u32int)fp->entry; + fp->name = "ARM plan 9 boot image"; + fp->dataddr = _round(fp->txtaddr+fp->txtsz, mach->pgsize); + return; + case FPOWER: + fp->type = FPOWERB; + fp->txtaddr = (u32int)fp->entry; + fp->name = 
"power plan 9 boot image"; + fp->dataddr = fp->txtaddr+fp->txtsz; + break; + case FAMD64: + fp->type = FAMD64B; + fp->txtaddr = fp->entry; + fp->name = "amd64 plan 9 boot image"; + fp->dataddr = _round(fp->txtaddr+fp->txtsz, mach->pgsize); + break; + default: + return; + } + fp->hdrsz = 0; /* header stripped */ +} + +/* + * _MAGIC() style headers and + * alpha plan9-style bootable images for axp "headerless" boot + * + */ +static int +common(int fd, Fhdr *fp, ExecHdr *hp) +{ + adotout(fd, fp, hp); + if(hp->e.exec.magic & DYN_MAGIC) { + fp->txtaddr = 0; + fp->dataddr = fp->txtsz; + return 1; + } + commonboot(fp); + return 1; +} + +static int +commonllp64(int fd, Fhdr *fp, ExecHdr *hp) +{ + long pgsize; + uvlong entry; + + USED(fd); + hswal(&hp->e, sizeof(Exec)/sizeof(long), beswal); + if(!(hp->e.exec.magic & HDR_MAGIC)) + return 0; + + /* + * There can be more.exec.magic here if the + * header ever needs more expansion. + * For now just catch use of any of the + * unused bits. + */ + if((hp->e.exec.magic & ~DYN_MAGIC)>>16) + return 0; + entry = beswav(hp->e.exechdr64.hdr[0]); + + pgsize = mach->pgsize; + settext(fp, entry, pgsize+fp->hdrsz, hp->e.exec.text, fp->hdrsz); + setdata(fp, _round(pgsize+fp->txtsz+fp->hdrsz, pgsize), + hp->e.exec.data, fp->txtsz+fp->hdrsz, hp->e.exec.bss); + setsym(fp, hp->e.exec.syms, hp->e.exec.spsz, hp->e.exec.pcsz, fp->datoff+fp->datsz); + + if(hp->e.exec.magic & DYN_MAGIC) { + fp->txtaddr = 0; + fp->dataddr = fp->txtsz; + return 1; + } + commonboot(fp); + return 1; +} + +/* + * mips bootable image. 
+ */ +static int +mipsboot(int fd, Fhdr *fp, ExecHdr *hp) +{ + USED(fd); + fp->type = FMIPSB; + switch(hp->e.mips.amagic) { + default: + case 0407: /* some kind of mips */ + settext(fp, (u32int)hp->e.mips.mentry, (u32int)hp->e.mips.text_start, + hp->e.mips.tsize, sizeof(struct mipsexec)+4); + setdata(fp, (u32int)hp->e.mips.data_start, hp->e.mips.dsize, + fp->txtoff+hp->e.mips.tsize, hp->e.mips.bsize); + break; + case 0413: /* some kind of mips */ + settext(fp, (u32int)hp->e.mips.mentry, (u32int)hp->e.mips.text_start, + hp->e.mips.tsize, 0); + setdata(fp, (u32int)hp->e.mips.data_start, hp->e.mips.dsize, + hp->e.mips.tsize, hp->e.mips.bsize); + break; + } + setsym(fp, hp->e.mips.nsyms, 0, hp->e.mips.pcsize, hp->e.mips.symptr); + fp->hdrsz = 0; /* header stripped */ + return 1; +} + +/* + * mips4k bootable image. + */ +static int +mips4kboot(int fd, Fhdr *fp, ExecHdr *hp) +{ + USED(fd); + fp->type = FMIPSB; + switch(hp->e.mips4k.h.amagic) { + default: + case 0407: /* some kind of mips */ + settext(fp, (u32int)hp->e.mips4k.h.mentry, (u32int)hp->e.mips4k.h.text_start, + hp->e.mips4k.h.tsize, sizeof(struct mips4kexec)); + setdata(fp, (u32int)hp->e.mips4k.h.data_start, hp->e.mips4k.h.dsize, + fp->txtoff+hp->e.mips4k.h.tsize, hp->e.mips4k.h.bsize); + break; + case 0413: /* some kind of mips */ + settext(fp, (u32int)hp->e.mips4k.h.mentry, (u32int)hp->e.mips4k.h.text_start, + hp->e.mips4k.h.tsize, 0); + setdata(fp, (u32int)hp->e.mips4k.h.data_start, hp->e.mips4k.h.dsize, + hp->e.mips4k.h.tsize, hp->e.mips4k.h.bsize); + break; + } + setsym(fp, hp->e.mips4k.h.nsyms, 0, hp->e.mips4k.h.pcsize, hp->e.mips4k.h.symptr); + fp->hdrsz = 0; /* header stripped */ + return 1; +} + +/* + * sparc bootable image + */ +static int +sparcboot(int fd, Fhdr *fp, ExecHdr *hp) +{ + USED(fd); + fp->type = FSPARCB; + settext(fp, hp->e.sparc.sentry, hp->e.sparc.sentry, hp->e.sparc.stext, + sizeof(struct sparcexec)); + setdata(fp, hp->e.sparc.sentry+hp->e.sparc.stext, hp->e.sparc.sdata, + 
fp->txtoff+hp->e.sparc.stext, hp->e.sparc.sbss); + setsym(fp, hp->e.sparc.ssyms, 0, hp->e.sparc.sdrsize, fp->datoff+hp->e.sparc.sdata); + fp->hdrsz = 0; /* header stripped */ + return 1; +} + +/* + * next bootable image + */ +static int +nextboot(int fd, Fhdr *fp, ExecHdr *hp) +{ + USED(fd); + fp->type = FNEXTB; + settext(fp, hp->e.next.textc.vmaddr, hp->e.next.textc.vmaddr, + hp->e.next.texts.size, hp->e.next.texts.offset); + setdata(fp, hp->e.next.datac.vmaddr, hp->e.next.datas.size, + hp->e.next.datas.offset, hp->e.next.bsss.size); + setsym(fp, hp->e.next.symc.nsyms, hp->e.next.symc.spoff, hp->e.next.symc.pcoff, + hp->e.next.symc.symoff); + fp->hdrsz = 0; /* header stripped */ + return 1; +} + +/* + * Elf32 binaries. + */ +static int +elfdotout(int fd, Fhdr *fp, ExecHdr *hp) +{ + + ulong (*swal)(ulong); + ushort (*swab)(ushort); + Ehdr *ep; + Phdr *ph; + int i, it, id, is, phsz; + + /* bitswap the header according to the DATA format */ + ep = &hp->e.elfhdr32; + if(ep->ident[CLASS] != ELFCLASS32) { + werrstr("bad ELF class - not 32 bit"); + return 0; + } + if(ep->ident[DATA] == ELFDATA2LSB) { + swab = leswab; + swal = leswal; + } else if(ep->ident[DATA] == ELFDATA2MSB) { + swab = beswab; + swal = beswal; + } else { + werrstr("bad ELF encoding - not big or little endian"); + return 0; + } + + ep->type = swab(ep->type); + ep->machine = swab(ep->machine); + ep->version = swal(ep->version); + ep->elfentry = swal(ep->elfentry); + ep->phoff = swal(ep->phoff); + ep->shoff = swal(ep->shoff); + ep->flags = swal(ep->flags); + ep->ehsize = swab(ep->ehsize); + ep->phentsize = swab(ep->phentsize); + ep->phnum = swab(ep->phnum); + ep->shentsize = swab(ep->shentsize); + ep->shnum = swab(ep->shnum); + ep->shstrndx = swab(ep->shstrndx); + if(ep->type != EXEC || ep->version != CURRENT) + return 0; + + /* we could definitely support a lot more machines here */ + fp->magic = ELF_MAG; + fp->hdrsz = (ep->ehsize+ep->phnum*ep->phentsize+16)&~15; + switch(ep->machine) { + case I386: + 
mach = &mi386; + fp->type = FI386; + break; + case MIPS: + mach = &mmips; + fp->type = FMIPS; + break; + case SPARC64: + return 0; + case POWER: + mach = &mpower; + fp->type = FPOWER; + break; + case AMD64: + mach = &mamd64; + fp->type = FAMD64; + break; + case ARM: + mach = &marm; + fp->type = FARM; + break; + default: + return 0; + } + + if(ep->phentsize != sizeof(Phdr)) { + werrstr("bad ELF header size"); + return 0; + } + phsz = sizeof(Phdr)*ep->phnum; + ph = malloc(phsz); + if(!ph) + return 0; + seek(fd, ep->phoff, 0); + if(read(fd, ph, phsz) < 0) { + free(ph); + return 0; + } + hswal(ph, phsz/sizeof(ulong), swal); + + /* find text, data and symbols and install them */ + it = id = is = -1; + for(i = 0; i < ep->phnum; i++) { + if(ph[i].type == LOAD + && (ph[i].flags & (R|X)) == (R|X) && it == -1) + it = i; + else if(ph[i].type == LOAD + && (ph[i].flags & (R|W)) == (R|W) && id == -1) + id = i; + else if(ph[i].type == NOPTYPE && is == -1) + is = i; + } + if(it == -1 || id == -1) { + /* + * The SPARC64 boot image is something of an ELF hack. + * Text+Data+BSS are represented by ph[0]. 
Symbols + * are represented by ph[1]: + * + * filesz, memsz, vaddr, paddr, off + * ph[0] : txtsz+datsz, txtsz+datsz+bsssz, txtaddr-KZERO, datasize, txtoff + * ph[1] : symsz, lcsz, 0, 0, symoff + */ + if(ep->machine == SPARC64 && ep->phnum == 2) { + ulong txtaddr, txtsz, dataddr, bsssz; + + txtaddr = ph[0].vaddr | 0x80000000; + txtsz = ph[0].filesz - ph[0].paddr; + dataddr = txtaddr + txtsz; + bsssz = ph[0].memsz - ph[0].filesz; + settext(fp, ep->elfentry | 0x80000000, txtaddr, txtsz, ph[0].offset); + setdata(fp, dataddr, ph[0].paddr, ph[0].offset + txtsz, bsssz); + setsym(fp, ph[1].filesz, 0, ph[1].memsz, ph[1].offset); + free(ph); + return 1; + } + + werrstr("No TEXT or DATA sections"); + free(ph); + return 0; + } + + settext(fp, ep->elfentry, ph[it].vaddr, ph[it].memsz, ph[it].offset); + setdata(fp, ph[id].vaddr, ph[id].filesz, ph[id].offset, ph[id].memsz - ph[id].filesz); + if(is != -1) + setsym(fp, ph[is].filesz, 0, ph[is].memsz, ph[is].offset); + free(ph); + return 1; +} + +/* + * (Free|Net)BSD ARM header. 
+ */ +static int +armdotout(int fd, Fhdr *fp, ExecHdr *hp) +{ + uvlong kbase; + + USED(fd); + settext(fp, hp->e.exec.entry, sizeof(Exec), hp->e.exec.text, sizeof(Exec)); + setdata(fp, fp->txtsz, hp->e.exec.data, fp->txtsz, hp->e.exec.bss); + setsym(fp, hp->e.exec.syms, hp->e.exec.spsz, hp->e.exec.pcsz, fp->datoff+fp->datsz); + + kbase = 0xF0000000; + if ((fp->entry & kbase) == kbase) { /* Boot image */ + fp->txtaddr = kbase+sizeof(Exec); + fp->name = "ARM *BSD boot image"; + fp->hdrsz = 0; /* header stripped */ + fp->dataddr = kbase+fp->txtsz; + } + return 1; +} + +static void +settext(Fhdr *fp, uvlong e, uvlong a, long s, vlong off) +{ + fp->txtaddr = a; + fp->entry = e; + fp->txtsz = s; + fp->txtoff = off; +} + +static void +setdata(Fhdr *fp, uvlong a, long s, vlong off, long bss) +{ + fp->dataddr = a; + fp->datsz = s; + fp->datoff = off; + fp->bsssz = bss; +} + +static void +setsym(Fhdr *fp, long symsz, long sppcsz, long lnpcsz, vlong symoff) +{ + fp->symsz = symsz; + fp->symoff = symoff; + fp->sppcsz = sppcsz; + fp->sppcoff = fp->symoff+fp->symsz; + fp->lnpcsz = lnpcsz; + fp->lnpcoff = fp->sppcoff+fp->sppcsz; +} + + +static uvlong +_round(uvlong a, ulong b) +{ + uvlong w; + + w = (a/b)*b; + if (a!=w) + w += b; + return(w); +} diff --git a/utils/libmach/k.c b/utils/libmach/k.c new file mode 100644 index 0000000..9b0a45e --- /dev/null +++ b/utils/libmach/k.c @@ -0,0 +1,118 @@ +/* + * sparc definition + */ +#include <lib9.h> +#include <bio.h> +#include "uregk.h" +#include "mach.h" + +#define REGOFF(x) (ulong)(&((struct Ureg *) 0)->x) + +#define R1 REGOFF(u0.r1) +#define R7 REGOFF(r7) +#define PC REGOFF(pc) +#define R15 REGOFF(r15) + +#define REGSIZE sizeof(struct Ureg) +#define FP_REG(x) (REGSIZE+4*(x)) +#define FPREGSIZE (33*4) + +Reglist sparcreglist[] = { + {"Y", REGOFF(y), RINT|RRDONLY, 'X'}, + {"TBR", REGOFF(tbr), RINT|RRDONLY, 'X'}, + {"PSR", REGOFF(psr), RINT|RRDONLY, 'X'}, + {"PC", REGOFF(pc), RINT, 'X'}, + {"R1", REGOFF(u0.r1), RINT, 'X'}, + {"R2", 
REGOFF(r2), RINT, 'X'}, + {"R3", REGOFF(r3), RINT, 'X'}, + {"R4", REGOFF(r4), RINT, 'X'}, + {"R5", REGOFF(r5), RINT, 'X'}, + {"R6", REGOFF(r6), RINT, 'X'}, + {"R7", REGOFF(r7), RINT, 'X'}, + {"R8", REGOFF(r8), RINT, 'X'}, + {"R9", REGOFF(r9), RINT, 'X'}, + {"R10", REGOFF(r10), RINT, 'X'}, + {"R11", REGOFF(r11), RINT, 'X'}, + {"R12", REGOFF(r12), RINT, 'X'}, + {"R13", REGOFF(r13), RINT, 'X'}, + {"R14", REGOFF(r14), RINT, 'X'}, + {"R15", REGOFF(r15), RINT, 'X'}, + {"R16", REGOFF(r16), RINT, 'X'}, + {"R17", REGOFF(r17), RINT, 'X'}, + {"R18", REGOFF(r18), RINT, 'X'}, + {"R19", REGOFF(r19), RINT, 'X'}, + {"R20", REGOFF(r20), RINT, 'X'}, + {"R21", REGOFF(r21), RINT, 'X'}, + {"R22", REGOFF(r22), RINT, 'X'}, + {"R23", REGOFF(r23), RINT, 'X'}, + {"R24", REGOFF(r24), RINT, 'X'}, + {"R25", REGOFF(r25), RINT, 'X'}, + {"R26", REGOFF(r26), RINT, 'X'}, + {"R27", REGOFF(r27), RINT, 'X'}, + {"R28", REGOFF(r28), RINT, 'X'}, + {"R29", REGOFF(r29), RINT, 'X'}, + {"R30", REGOFF(r30), RINT, 'X'}, + {"R31", REGOFF(r31), RINT, 'X'}, + {"NPC", REGOFF(npc), RINT, 'X'}, + + {"FSR", FP_REG(0), RINT, 'X'}, + {"F0", FP_REG(1), RFLT, 'F'}, + {"F1", FP_REG(2), RFLT, 'f'}, + {"F2", FP_REG(3), RFLT, 'F'}, + {"F3", FP_REG(4), RFLT, 'f'}, + {"F4", FP_REG(5), RFLT, 'F'}, + {"F5", FP_REG(6), RFLT, 'f'}, + {"F6", FP_REG(7), RFLT, 'F'}, + {"F7", FP_REG(8), RFLT, 'f'}, + {"F8", FP_REG(9), RFLT, 'F'}, + {"F9", FP_REG(10), RFLT, 'f'}, + {"F10", FP_REG(11), RFLT, 'F'}, + {"F11", FP_REG(12), RFLT, 'f'}, + {"F12", FP_REG(13), RFLT, 'F'}, + {"F13", FP_REG(14), RFLT, 'f'}, + {"F14", FP_REG(15), RFLT, 'F'}, + {"F15", FP_REG(16), RFLT, 'f'}, + {"F16", FP_REG(17), RFLT, 'F'}, + {"F17", FP_REG(18), RFLT, 'f'}, + {"F18", FP_REG(19), RFLT, 'F'}, + {"F19", FP_REG(20), RFLT, 'f'}, + {"F20", FP_REG(21), RFLT, 'F'}, + {"F21", FP_REG(22), RFLT, 'f'}, + {"F22", FP_REG(23), RFLT, 'F'}, + {"F23", FP_REG(24), RFLT, 'f'}, + {"F24", FP_REG(25), RFLT, 'F'}, + {"F25", FP_REG(26), RFLT, 'f'}, + {"F26", FP_REG(27), RFLT, 'F'}, + 
{"F27", FP_REG(28), RFLT, 'f'}, + {"F28", FP_REG(29), RFLT, 'F'}, + {"F29", FP_REG(30), RFLT, 'f'}, + {"F30", FP_REG(31), RFLT, 'F'}, + {"F31", FP_REG(32), RFLT, 'f'}, + { 0 } +}; + +/* + * sparc has same stack format as mips + */ +Mach msparc = +{ + "sparc", + MSPARC, /* machine type */ + sparcreglist, /* register list */ + REGSIZE, /* register set size in bytes */ + FPREGSIZE, /* floating point register size in bytes */ + "PC", /* name of PC */ + "R1", /* name of SP */ + "R15", /* name of link register */ + "setSB", /* static base register name */ + 0, /* value */ + 0x1000, /* page size */ + 0xE0000000, /* kernel base */ + 0xE0000000, /* kernel text mask */ + 0x7FFFFFFF, /* user stack top */ + 4, /* quantization of pc */ + 4, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git a/utils/libmach/kdb.c b/utils/libmach/kdb.c new file mode 100644 index 0000000..68a25ed --- /dev/null +++ b/utils/libmach/kdb.c @@ -0,0 +1,1058 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +/* + * Sparc-specific debugger interface + */ + +static char *sparcexcep(Map*, Rgetter); +static int sparcfoll(Map*, uvlong, Rgetter, uvlong*); +static int sparcinst(Map*, uvlong, char, char*, int); +static int sparcdas(Map*, uvlong, char*, int); +static int sparcinstlen(Map*, uvlong); + +Machdata sparcmach = +{ + {0x91, 0xd0, 0x20, 0x01}, /* breakpoint: TA $1 */ + 4, /* break point size */ + + beswab, /* convert short to local byte order */ + beswal, /* convert long to local byte order */ + beswav, /* convert vlong to local byte order */ + risctrace, /* C traceback */ + riscframe, /* frame finder */ + sparcexcep, /* print exception */ + 0, /* breakpoint fixup */ + beieeesftos, /* single precision float printer */ + beieeedftos, /* double precision float printer */ + sparcfoll, /* following addresses */ + sparcinst, /* print instruction */ + sparcdas, /* dissembler */ + sparcinstlen, /* instruction size */ +}; + +static char *trapname[] = +{ + "reset", + 
"instruction access exception", + "illegal instruction", + "privileged instruction", + "fp disabled", + "window overflow", + "window underflow", + "unaligned address", + "fp exception", + "data access exception", + "tag overflow", +}; + +static char* +excname(ulong tbr) +{ + static char buf[32]; + + if(tbr < sizeof trapname/sizeof(char*)) + return trapname[tbr]; + if(tbr >= 130) + sprint(buf, "trap instruction %ld", tbr-128); + else if(17<=tbr && tbr<=31) + sprint(buf, "interrupt level %ld", tbr-16); + else switch(tbr){ + case 36: + return "cp disabled"; + case 40: + return "cp exception"; + case 128: + return "syscall"; + case 129: + return "breakpoint"; + default: + sprint(buf, "unknown trap %ld", tbr); + } + return buf; +} + +static char* +sparcexcep(Map *map, Rgetter rget) +{ + long tbr; + + tbr = (*rget)(map, "TBR"); + tbr = (tbr&0xFFF)>>4; + return excname(tbr); +} + + /* Sparc disassembler and related functions */ +typedef struct instr Instr; + +struct opcode { + char *mnemonic; + void (*f)(Instr*, char*); + int flag; +}; + +static char FRAMENAME[] = ".frame"; + + +struct instr { + uchar op; /* bits 31-30 */ + uchar rd; /* bits 29-25 */ + uchar op2; /* bits 24-22 */ + uchar a; /* bit 29 */ + uchar cond; /* bits 28-25 */ + uchar op3; /* bits 24-19 */ + uchar rs1; /* bits 18-14 */ + uchar i; /* bit 13 */ + uchar asi; /* bits 12-05 */ + uchar rs2; /* bits 04-00 */ + short simm13; /* bits 12-00, signed */ + ushort opf; /* bits 13-05 */ + ulong immdisp22; /* bits 21-00 */ + ulong simmdisp22; /* bits 21-00, signed */ + ulong disp30; /* bits 30-00 */ + ulong imm32; /* SETHI+ADD constant */ + int target; /* SETHI+ADD dest reg */ + long w0; + long w1; + uvlong addr; /* pc of instruction */ + char *curr; /* current fill level in output buffer */ + char *end; /* end of buffer */ + int size; /* number of longs in instr */ + char *err; /* errmsg */ +}; + +static Map *mymap; /* disassembler context */ +static int dascase; + +static int mkinstr(uvlong, Instr*); +static 
void bra1(Instr*, char*, char*[]); +static void bra(Instr*, char*); +static void fbra(Instr*, char*); +static void cbra(Instr*, char*); +static void unimp(Instr*, char*); +static void fpop(Instr*, char*); +static void shift(Instr*, char*); +static void sethi(Instr*, char*); +static void load(Instr*, char*); +static void loada(Instr*, char*); +static void store(Instr*, char*); +static void storea(Instr*, char*); +static void add(Instr*, char*); +static void cmp(Instr*, char*); +static void wr(Instr*, char*); +static void jmpl(Instr*, char*); +static void rd(Instr*, char*); +static void loadf(Instr*, char*); +static void storef(Instr*, char*); +static void loadc(Instr*, char*); +static void loadcsr(Instr*, char*); +static void trap(Instr*, char*); + +static struct opcode sparcop0[8] = { + "UNIMP", unimp, 0, /* page 137 */ /* 0 */ + "", 0, 0, /* 1 */ + "B", bra, 0, /* page 119 */ /* 2 */ + "", 0, 0, /* 3 */ + "SETHI", sethi, 0, /* page 104 */ /* 4 */ + "", 0, 0, /* 5 */ + "FB", fbra, 0, /* page 121 */ /* 6 */ + "CB", cbra, 0, /* page 123 */ /* 7 */ +}; + +static struct opcode sparcop2[64] = { + "ADD", add, 0, /* page 108 */ /* 0x00 */ + "AND", add, 0, /* page 106 */ /* 0x01 */ + "OR", add, 0, /* 0x02 */ + "XOR", add, 0, /* 0x03 */ + "SUB", add, 0, /* page 110 */ /* 0x04 */ + "ANDN", add, 0, /* 0x05 */ + "ORN", add, 0, /* 0x06 */ + "XORN", add, 0, /* 0x07 */ + "ADDX", add, 0, /* 0x08 */ + "", 0, 0, /* 0x09 */ + "UMUL", add, 0, /* page 113 */ /* 0x0a */ + "SMUL", add, 0, /* 0x0b */ + "SUBX", add, 0, /* 0x0c */ + "", 0, 0, /* 0x0d */ + "UDIV", add, 0, /* page 115 */ /* 0x0e */ + "SDIV", add, 0, /* 0x0f */ + "ADDCC", add, 0, /* 0x10 */ + "ANDCC", add, 0, /* 0x11 */ + "ORCC", add, 0, /* 0x12 */ + "XORCC", add, 0, /* 0x13 */ + "SUBCC", cmp, 0, /* 0x14 */ + "ANDNCC", add, 0, /* 0x15 */ + "ORNCC", add, 0, /* 0x16 */ + "XORNCC", add, 0, /* 0x17 */ + "ADDXCC", add, 0, /* 0x18 */ + "", 0, 0, /* 0x19 */ + "UMULCC", add, 0, /* 0x1a */ + "SMULCC", add, 0, /* 0x1b */ + "SUBXCC", 
add, 0, /* 0x1c */ + "", 0, 0, /* 0x1d */ + "UDIVCC", add, 0, /* 0x1e */ + "SDIVCC", add, 0, /* 0x1f */ + "TADD", add, 0, /* page 109 */ /* 0x20 */ + "TSUB", add, 0, /* page 111 */ /* 0x21 */ + "TADDCCTV", add, 0, /* 0x22 */ + "TSUBCCTV", add, 0, /* 0x23 */ + "MULSCC", add, 0, /* page 112 */ /* 0x24 */ + "SLL", shift, 0, /* page 107 */ /* 0x25 */ + "SRL", shift, 0, /* 0x26 */ + "SRA", shift, 0, /* 0x27 */ + "rdy", rd, 0, /* page 131 */ /* 0x28 */ + "rdpsr", rd, 0, /* 0x29 */ + "rdwim", rd, 0, /* 0x2a */ + "rdtbr", rd, 0, /* 0x2b */ + "", 0, 0, /* 0x2c */ + "", 0, 0, /* 0x2d */ + "", 0, 0, /* 0x2e */ + "", 0, 0, /* 0x2f */ + "wry", wr, 0, /* page 133 */ /* 0x30 */ + "wrpsr", wr, 0, /* 0x31 */ + "wrwim", wr, 0, /* 0x32 */ + "wrtbr", wr, 0, /* 0x33 */ + "FPOP", fpop, 0, /* page 140 */ /* 0x34 */ + "FPOP", fpop, 0, /* 0x35 */ + "", 0, 0, /* 0x36 */ + "", 0, 0, /* 0x37 */ + "JMPL", jmpl, 0, /* page 126 */ /* 0x38 */ + "RETT", add, 0, /* page 127 */ /* 0x39 */ + "T", trap, 0, /* page 129 */ /* 0x3a */ + "flush", add, 0, /* page 138 */ /* 0x3b */ + "SAVE", add, 0, /* page 117 */ /* 0x3c */ + "RESTORE", add, 0, /* 0x3d */ +}; + +static struct opcode sparcop3[64]={ + "ld", load, 0, /* 0x00 */ + "ldub", load, 0, /* 0x01 */ + "lduh", load, 0, /* 0x02 */ + "ldd", load, 0, /* 0x03 */ + "st", store, 0, /* 0x04 */ + "stb", store, 0, /* page 95 */ /* 0x05 */ + "sth", store, 0, /* 0x06 */ + "std", store, 0, /* 0x07 */ + "", 0, 0, /* 0x08 */ + "ldsb", load, 0, /* page 90 */ /* 0x09 */ + "ldsh", load, 0, /* 0x0a */ + "", 0, 0, /* 0x0b */ + "", 0, 0, /* 0x0c */ + "ldstub", store, 0, /* page 101 */ /* 0x0d */ + "", 0, 0, /* 0x0e */ + "swap", load, 0, /* page 102 */ /* 0x0f */ + "lda", loada, 0, /* 0x10 */ + "lduba", loada, 0, /* 0x11 */ + "lduha", loada, 0, /* 0x12 */ + "ldda", loada, 0, /* 0x13 */ + "sta", storea, 0, /* 0x14 */ + "stba", storea, 0, /* 0x15 */ + "stha", storea, 0, /* 0x16 */ + "stda", storea, 0, /* 0x17 */ + "", 0, 0, /* 0x18 */ + "ldsba", loada, 0, /* 0x19 */ + 
"ldsha", loada, 0, /* 0x1a */ + "", 0, 0, /* 0x1b */ + "", 0, 0, /* 0x1c */ + "ldstuba", storea, 0, /* 0x1d */ + "", 0, 0, /* 0x1e */ + "swapa", loada, 0, /* 0x1f */ + "ldf", loadf, 0, /* page 92 */ /* 0x20 */ + "ldfsr", loadf,0, /* 0x21 */ + "", 0, 0, /* 0x22 */ + "lddf", loadf, 0, /* 0x23 */ + "stf", storef, 0, /* page 97 */ /* 0x24 */ + "stfsr", storef,0, /* 0x25 */ + "stdfq", storef,0, /* 0x26 */ + "stdf", storef, 0, /* 0x27 */ + "", 0, 0, /* 0x28 */ + "", 0, 0, /* 0x29 */ + "", 0, 0, /* 0x2a */ + "", 0, 0, /* 0x2b */ + "", 0, 0, /* 0x2c */ + "", 0, 0, /* 0x2d */ + "", 0, 0, /* 0x2e */ + "", 0, 0, /* 0x2f */ + "ldc", loadc, 0, /* page 94 */ /* 0x30 */ + "ldcsr", loadcsr,0, /* 0x31 */ + "", 0, 0, /* 0x32 */ + "lddc", loadc, 0, /* 0x33 */ + "stc", loadc, 0, /* page 99 */ /* 0x34 */ + "stcsr", loadcsr,0, /* 0x35 */ + "stdcq", loadcsr,0, /* 0x36 */ + "stdc", loadc, 0, /* 0x37 */ +}; + +#pragma varargck argpos bprint 2 +#pragma varargck type "T" char* + +/* convert to lower case from upper, according to dascase */ +static int +Tfmt(Fmt *f) +{ + char buf[128]; + char *s, *t, *oa; + + oa = va_arg(f->args, char*); + if(dascase){ + for(s=oa,t=buf; *t = *s; s++,t++) + if('A'<=*t && *t<='Z') + *t += 'a'-'A'; + return fmtstrcpy(f, buf); + } + return fmtstrcpy(f, oa); +} + +static void +bprint(Instr *i, char *fmt, ...) 
+{ + va_list arg; + + va_start(arg, fmt); + i->curr = vseprint(i->curr, i->end, fmt, arg); + va_end(arg); +} + +static int +decode(uvlong pc, Instr *i) +{ + ulong w; + + if (get4(mymap, pc, &w) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + i->op = (w >> 30) & 0x03; + i->rd = (w >> 25) & 0x1F; + i->op2 = (w >> 22) & 0x07; + i->a = (w >> 29) & 0x01; + i->cond = (w >> 25) & 0x0F; + i->op3 = (w >> 19) & 0x3F; + i->rs1 = (w >> 14) & 0x1F; + i->i = (w >> 13) & 0x01; + i->asi = (w >> 5) & 0xFF; + i->rs2 = (w >> 0) & 0x1F; + i->simm13 = (w >> 0) & 0x1FFF; + if(i->simm13 & (1<<12)) + i->simm13 |= ~((1<<13)-1); + i->opf = (w >> 5) & 0x1FF; + i->immdisp22 = (w >> 0) & 0x3FFFFF; + i->simmdisp22 = i->immdisp22; + if(i->simmdisp22 & (1<<21)) + i->simmdisp22 |= ~((1<<22)-1); + i->disp30 = (w >> 0) & 0x3FFFFFFF; + i->w0 = w; + i->target = -1; + i->addr = pc; + i->size = 1; + return 1; +} + +static int +mkinstr(uvlong pc, Instr *i) +{ + Instr xi; + + if (decode(pc, i) < 0) + return -1; + if(i->op==0 && i->op2==4 && !dascase){ /* SETHI */ + if (decode(pc+4, &xi) < 0) + return -1; + if(xi.op==2 && xi.op3==0) /* ADD */ + if(xi.i == 1 && xi.rs1 == i->rd){ /* immediate to same reg */ + i->imm32 = xi.simm13 + (i->immdisp22<<10); + i->target = xi.rd; + i->w1 = xi.w0; + i->size++; + return 1; + } + } + if(i->op==2 && i->opf==1 && !dascase){ /* FMOVS */ + if (decode(pc+4, &xi) < 0) + return -1; + if(i->op==2 && i->opf==1) /* FMOVS */ + if(xi.rd==i->rd+1 && xi.rs2==i->rs2+1){ /* next pair */ + i->w1 = xi.w0; + i->size++; + } + } + return 1; +} + +static int +printins(Map *map, uvlong pc, char *buf, int n) +{ + Instr instr; + void (*f)(Instr*, char*); + + mymap = map; + memset(&instr, 0, sizeof(instr)); + instr.curr = buf; + instr.end = buf+n-1; + if (mkinstr(pc, &instr) < 0) + return -1; + switch(instr.op){ + case 0: + f = sparcop0[instr.op2].f; + if(f) + (*f)(&instr, sparcop0[instr.op2].mnemonic); + else + bprint(&instr, "unknown %lux", instr.w0); + break; + + case 1: + 
bprint(&instr, "%T", "CALL\t"); + instr.curr += symoff(instr.curr, instr.end-instr.curr, + pc+instr.disp30*4, CTEXT); + if (!dascase) + bprint(&instr, "(SB)"); + break; + + case 2: + f = sparcop2[instr.op3].f; + if(f) + (*f)(&instr, sparcop2[instr.op3].mnemonic); + else + bprint(&instr, "unknown %lux", instr.w0); + break; + + case 3: + f = sparcop3[instr.op3].f; + if(f) + (*f)(&instr, sparcop3[instr.op3].mnemonic); + else + bprint(&instr, "unknown %lux", instr.w0); + break; + } + if (instr.err) { + if (instr.curr != buf) + bprint(&instr, "\t\t;"); + bprint(&instr, instr.err); + } + return instr.size*4; +} + +static int +sparcinst(Map *map, uvlong pc, char modifier, char *buf, int n) +{ + static int fmtinstalled = 0; + + /* a modifier of 'I' toggles the dissassembler type */ + if (!fmtinstalled) { + fmtinstalled = 1; + fmtinstall('T', Tfmt); + } + if ((asstype == ASUNSPARC && modifier == 'i') + || (asstype == ASPARC && modifier == 'I')) + dascase = 'a'-'A'; + else + dascase = 0; + return printins(map, pc, buf, n); +} + +static int +sparcdas(Map *map, uvlong pc, char *buf, int n) +{ + Instr instr; + + mymap = map; + memset(&instr, 0, sizeof(instr)); + instr.curr = buf; + instr.end = buf+n-1; + if (mkinstr(pc, &instr) < 0) + return -1; + if (instr.end-instr.curr > 8) + instr.curr = _hexify(instr.curr, instr.w0, 7); + if (instr.end-instr.curr > 9 && instr.size == 2) { + *instr.curr++ = ' '; + instr.curr = _hexify(instr.curr, instr.w1, 7); + } + *instr.curr = 0; + return instr.size*4; +} + +static int +sparcinstlen(Map *map, uvlong pc) +{ + Instr i; + + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + return i.size*4; +} + +static int +plocal(Instr *i) +{ + int offset; + Symbol s; + + if (!findsym(i->addr, CTEXT, &s) || !findlocal(&s, FRAMENAME, &s)) + return -1; + if (s.value > i->simm13) { + if(getauto(&s, s.value-i->simm13, CAUTO, &s)) { + bprint(i, "%s+%lld(SP)", s.name, s.value); + return 1; + } + } else { + offset = i->simm13-s.value; + if (getauto(&s, 
offset-4, CPARAM, &s)) { + bprint(i, "%s+%d(FP)", s.name, offset); + return 1; + } + } + return -1; +} + +static void +address(Instr *i) +{ + Symbol s, s2; + uvlong off, off1; + + if (i->rs1 == 1 && plocal(i) >= 0) + return; + off = mach->sb+i->simm13; + if(i->rs1 == 2 && findsym(off, CANY, &s) + && s.value-off < 4096 + && (s.class == CDATA || s.class == CTEXT)) { + if(off==s.value && s.name[0]=='$'){ + off1 = 0; + geta(mymap, s.value, &off1); + if(off1 && findsym(off1, CANY, &s2) && s2.value == off1){ + bprint(i, "$%s(SB)", s2.name); + return; + } + } + bprint(i, "%s", s.name); + if (s.value != off) + bprint(i, "+%llux", s.value-off); + bprint(i, "(SB)"); + return; + } + bprint(i, "%ux(R%d)", i->simm13, i->rs1); +} + +static void +unimp(Instr *i, char *m) +{ + bprint(i, "%T", m); +} + +static char *bratab[16] = { /* page 91 */ + "N", /* 0x0 */ + "E", /* 0x1 */ + "LE", /* 0x2 */ + "L", /* 0x3 */ + "LEU", /* 0x4 */ + "CS", /* 0x5 */ + "NEG", /* 0x6 */ + "VS", /* 0x7 */ + "A", /* 0x8 */ + "NE", /* 0x9 */ + "G", /* 0xa */ + "GE", /* 0xb */ + "GU", /* 0xc */ + "CC", /* 0xd */ + "POS", /* 0xe */ + "VC", /* 0xf */ +}; + +static char *fbratab[16] = { /* page 91 */ + "N", /* 0x0 */ + "NE", /* 0x1 */ + "LG", /* 0x2 */ + "UL", /* 0x3 */ + "L", /* 0x4 */ + "UG", /* 0x5 */ + "G", /* 0x6 */ + "U", /* 0x7 */ + "A", /* 0x8 */ + "E", /* 0x9 */ + "UE", /* 0xa */ + "GE", /* 0xb */ + "UGE", /* 0xc */ + "LE", /* 0xd */ + "ULE", /* 0xe */ + "O", /* 0xf */ +}; + +static char *cbratab[16] = { /* page 91 */ + "N", /* 0x0 */ + "123", /* 0x1 */ + "12", /* 0x2 */ + "13", /* 0x3 */ + "1", /* 0x4 */ + "23", /* 0x5 */ + "2", /* 0x6 */ + "3", /* 0x7 */ + "A", /* 0x8 */ + "0", /* 0x9 */ + "03", /* 0xa */ + "02", /* 0xb */ + "023", /* 0xc */ + "01", /* 0xd */ + "013", /* 0xe */ + "012", /* 0xf */ +}; + +static void +bra1(Instr *i, char *m, char *tab[]) +{ + long imm; + + imm = i->simmdisp22; + if(i->a) + bprint(i, "%T%T.%c\t", m, tab[i->cond], 'A'+dascase); + else + bprint(i, "%T%T\t", m, 
tab[i->cond]); + i->curr += symoff(i->curr, i->end-i->curr, i->addr+4*imm, CTEXT); + if (!dascase) + bprint(i, "(SB)"); +} + +static void +bra(Instr *i, char *m) /* page 91 */ +{ + bra1(i, m, bratab); +} + +static void +fbra(Instr *i, char *m) /* page 93 */ +{ + bra1(i, m, fbratab); +} + +static void +cbra(Instr *i, char *m) /* page 95 */ +{ + bra1(i, m, cbratab); +} + +static void +trap(Instr *i, char *m) /* page 101 */ +{ + if(i->i == 0) + bprint(i, "%T%T\tR%d+R%d", m, bratab[i->cond], i->rs2, i->rs1); + else + bprint(i, "%T%T\t$%ux+R%d", m, bratab[i->cond], i->simm13, i->rs1); +} + +static void +sethi(Instr *i, char *m) /* page 89 */ +{ + ulong imm; + + imm = i->immdisp22<<10; + if(dascase){ + bprint(i, "%T\t%lux, R%d", m, imm, i->rd); + return; + } + if(imm==0 && i->rd==0){ + bprint(i, "NOP"); + return; + } + if(i->target < 0){ + bprint(i, "MOVW\t$%lux, R%d", imm, i->rd); + return; + } + bprint(i, "MOVW\t$%lux, R%d", i->imm32, i->target); +} + +static char ldtab[] = { + 'W', + 'B', + 'H', + 'D', +}; + +static char* +moveinstr(int op3, char *m) +{ + char *s; + int c; + static char buf[8]; + + if(!dascase){ + /* batshit cases */ + if(op3 == 0xF || op3 == 0x1F) + return "SWAP"; + if(op3 == 0xD || op3 == 0x1D) + return "TAS"; /* really LDSTUB */ + c = ldtab[op3&3]; + s = ""; + if((op3&11)==1 || (op3&11)==2) + s="U"; + sprint(buf, "MOV%c%s", c, s); + return buf; + } + return m; +} + +static void +load(Instr *i, char *m) /* page 68 */ +{ + m = moveinstr(i->op3, m); + if(i->i == 0) + bprint(i, "%s\t(R%d+R%d), R%d", m, i->rs1, i->rs2, i->rd); + else{ + bprint(i, "%s\t", m); + address(i); + bprint(i, ", R%d", i->rd); + } +} + +static void +loada(Instr *i, char *m) /* page 68 */ +{ + m = moveinstr(i->op3, m); + if(i->i == 0) + bprint(i, "%s\t(R%d+R%d, %d), R%d", m, i->rs1, i->rs2, i->asi, i->rd); + else + bprint(i, "unknown ld asi %lux", i->w0); +} + +static void +store(Instr *i, char *m) /* page 74 */ +{ + m = moveinstr(i->op3, m); + if(i->i == 0) + bprint(i, "%s\tR%d, 
(R%d+R%d)", + m, i->rd, i->rs1, i->rs2); + else{ + bprint(i, "%s\tR%d, ", m, i->rd); + address(i); + } +} + +static void +storea(Instr *i, char *m) /* page 74 */ +{ + m = moveinstr(i->op3, m); + if(i->i == 0) + bprint(i, "%s\tR%d, (R%d+R%d, %d)", m, i->rd, i->rs1, i->rs2, i->asi); + else + bprint(i, "%s\tR%d, %d(R%d, %d), ?", m, i->rd, i->simm13, i->rs1, i->asi); +} + +static void +shift(Instr *i, char *m) /* page 88 */ +{ + if(i->i == 0){ + if(i->rs1 == i->rd) + if(dascase) + bprint(i, "%T\tR%d, R%d", m, i->rs1, i->rs2); + else + bprint(i, "%T\tR%d, R%d", m, i->rs2, i->rs1); + else + if(dascase) + bprint(i, "%T\tR%d, R%d, R%d", m, i->rs1, i->rs2, i->rd); + else + bprint(i, "%T\tR%d, R%d, R%d", m, i->rs2, i->rs1, i->rd); + }else{ + if(i->rs1 == i->rd) + if(dascase) + bprint(i, "%T\t$%d,R%d", m, i->simm13&0x1F, i->rs1); + else + bprint(i, "%T\tR%d, $%d", m, i->rs1, i->simm13&0x1F); + else + if(dascase) + bprint(i, "%T\tR%d, $%d, R%d",m,i->rs1,i->simm13&0x1F,i->rd); + else + bprint(i, "%T\t$%d, R%d, R%d",m,i->simm13&0x1F,i->rs1,i->rd); + } +} + +static void +add(Instr *i, char *m) /* page 82 */ +{ + if(i->i == 0){ + if(dascase) + bprint(i, "%T\tR%d, R%d", m, i->rs1, i->rs2); + else + if(i->op3==2 && i->rs1==0 && i->rd) /* OR R2, R0, R1 */ + bprint(i, "MOVW\tR%d", i->rs2); + else + bprint(i, "%T\tR%d, R%d", m, i->rs2, i->rs1); + }else{ + if(dascase) + bprint(i, "%T\tR%d, $%ux", m, i->rs1, i->simm13); + else + if(i->op3==0 && i->rd && i->rs1==0) /* ADD $x, R0, R1 */ + bprint(i, "MOVW\t$%ux", i->simm13); + else if(i->op3==0 && i->rd && i->rs1==2){ + /* ADD $x, R2, R1 -> MOVW $x(SB), R1 */ + bprint(i, "MOVW\t$"); + address(i); + } else + bprint(i, "%T\t$%ux, R%d", m, i->simm13, i->rs1); + } + if(i->rs1 != i->rd) + bprint(i, ", R%d", i->rd); +} + +static void +cmp(Instr *i, char *m) +{ + if(dascase || i->rd){ + add(i, m); + return; + } + if(i->i == 0) + bprint(i, "CMP\tR%d, R%d", i->rs1, i->rs2); + else + bprint(i, "CMP\tR%d, $%ux", i->rs1, i->simm13); +} + +static char 
*regtab[4] = { + "Y", + "PSR", + "WIM", + "TBR", +}; + +static void +wr(Instr *i, char *m) /* page 82 */ +{ + if(dascase){ + if(i->i == 0) + bprint(i, "%s\tR%d, R%d", m, i->rs1, i->rs2); + else + bprint(i, "%s\tR%d, $%ux", m, i->rs1, i->simm13); + }else{ + if(i->i && i->simm13==0) + bprint(i, "MOVW\tR%d", i->rs1); + else if(i->i == 0) + bprint(i, "wr\tR%d, R%d", i->rs2, i->rs1); + else + bprint(i, "wr\t$%ux, R%d", i->simm13, i->rs1); + } + bprint(i, ", %s", regtab[i->op3&3]); +} + +static void +rd(Instr *i, char *m) /* page 103 */ +{ + if(i->rs1==15 && i->rd==0){ + m = "stbar"; + if(!dascase) + m = "STBAR"; + bprint(i, "%s", m); + }else{ + if(!dascase) + m = "MOVW"; + bprint(i, "%s\t%s, R%d", m, regtab[i->op3&3], i->rd); + } +} + +static void +jmpl(Instr *i, char *m) /* page 82 */ +{ + if(i->i == 0){ + if(i->rd == 15) + bprint(i, "%T\t(R%d+R%d)", "CALL", i->rs2, i->rs1); + else + bprint(i, "%T\t(R%d+R%d), R%d", m, i->rs2, i->rs1, i->rd); + }else{ + if(!dascase && i->simm13==8 && i->rs1==15 && i->rd==0) + bprint(i, "RETURN"); + else{ + bprint(i, "%T\t", m); + address(i); + bprint(i, ", R%d", i->rd); + } + } +} + +static void +loadf(Instr *i, char *m) /* page 70 */ +{ + if(!dascase){ + m = "FMOVD"; + if(i->op3 == 0x20) + m = "FMOVF"; + else if(i->op3 == 0x21) + m = "MOVW"; + } + if(i->i == 0) + bprint(i, "%s\t(R%d+R%d)", m, i->rs1, i->rs2); + else{ + bprint(i, "%s\t", m); + address(i); + } + if(i->op3 == 0x21) + bprint(i, ", FSR"); + else + bprint(i, ", R%d", i->rd); +} + +static void +storef(Instr *i, char *m) /* page 70 */ +{ + if(!dascase){ + m = "FMOVD"; + if(i->op3 == 0x25 || i->op3 == 0x26) + m = "MOVW"; + else if(i->op3 == 0x20) + m = "FMOVF"; + } + bprint(i, "%s\t", m); + if(i->op3 == 0x25) + bprint(i, "FSR, "); + else if(i->op3 == 0x26) + bprint(i, "FQ, "); + else + bprint(i, "R%d, ", i->rd); + if(i->i == 0) + bprint(i, "(R%d+R%d)", i->rs1, i->rs2); + else + address(i); +} + +static void +loadc(Instr *i, char *m) /* page 72 */ +{ + if(i->i == 0) + bprint(i, 
"%s\t(R%d+R%d), C%d", m, i->rs1, i->rs2, i->rd); + else{ + bprint(i, "%s\t", m); + address(i); + bprint(i, ", C%d", i->rd); + } +} + +static void +loadcsr(Instr *i, char *m) /* page 72 */ +{ + if(i->i == 0) + bprint(i, "%s\t(R%d+R%d), CSR", m, i->rs1, i->rs2); + else{ + bprint(i, "%s\t", m); + address(i); + bprint(i, ", CSR"); + } +} + +static struct{ + int opf; + char *name; +} fptab1[] = { /* ignores rs1 */ + 0xC4, "FITOS", /* page 109 */ + 0xC8, "FITOD", + 0xCC, "FITOX", + + 0xD1, "FSTOI", /* page 110 */ + 0xD2, "FDTOI", + 0xD3, "FXTOI", + + 0xC9, "FSTOD", /* page 111 */ + 0xCD, "FSTOX", + 0xC6, "FDTOS", + 0xCE, "FDTOX", + 0xC7, "FXTOS", + 0xCB, "FXTOD", + + 0x01, "FMOVS", /* page 112 */ + 0x05, "FNEGS", + 0x09, "FABSS", + + 0x29, "FSQRTS", /* page 113 */ + 0x2A, "FSQRTD", + 0x2B, "FSQRTX", + + 0, 0, +}; + +static struct{ + int opf; + char *name; +} fptab2[] = { /* uses rs1 */ + + 0x41, "FADDS", /* page 114 */ + 0x42, "FADDD", + 0x43, "FADDX", + 0x45, "FSUBS", + 0x46, "FSUBD", + 0x47, "FSUBX", + + 0x49, "FMULS", /* page 115 */ + 0x4A, "FMULD", + 0x4B, "FMULX", + 0x4D, "FDIVS", + 0x4E, "FDIVD", + 0x4F, "FDIVX", + + 0x51, "FCMPS", /* page 116 */ + 0x52, "FCMPD", + 0x53, "FCMPX", + 0x55, "FCMPES", + 0x56, "FCMPED", + 0x57, "FCMPEX", + + 0, 0 +}; + +static void +fpop(Instr *i, char *m) /* page 108-116 */ +{ + int j; + + if(dascase==0 && i->size==2){ + bprint(i, "FMOVD\tF%d, F%d", i->rs2, i->rd); + return; + } + for(j=0; fptab1[j].name; j++) + if(fptab1[j].opf == i->opf){ + bprint(i, "%T\tF%d, F%d", fptab1[j].name, i->rs2, i->rd); + return; + } + for(j=0; fptab2[j].name; j++) + if(fptab2[j].opf == i->opf){ + bprint(i, "%T\tF%d, F%d, F%d", fptab2[j].name, i->rs1, i->rs2, i->rd); + return; + } + bprint(i, "%T%ux\tF%d, F%d, F%d", m, i->opf, i->rs1, i->rs2, i->rd); +} + +static int +sparcfoll(Map *map, uvlong pc, Rgetter rget, uvlong *foll) +{ + ulong w, r1, r2; + char buf[8]; + Instr i; + + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + w = i.w0; + switch(w & 
0xC1C00000){ + case 0x00800000: /* branch on int cond */ + case 0x01800000: /* branch on fp cond */ + case 0x01C00000: /* branch on copr cond */ + foll[0] = pc+8; + foll[1] = pc + (i.simmdisp22<<2); + return 2; + } + + if((w&0xC0000000) == 0x40000000){ /* CALL */ + foll[0] = pc + (i.disp30<<2); + return 1; + } + + if((w&0xC1F80000) == 0x81C00000){ /* JMPL */ + sprint(buf, "R%ld", (w>>14)&0xF); + r1 = (*rget)(map, buf); + if(w & 0x2000) /* JMPL R1+simm13 */ + r2 = i.simm13; + else{ /* JMPL R1+R2 */ + sprint(buf, "R%ld", w&0xF); + r2 = (*rget)(map, buf); + } + foll[0] = r1 + r2; + return 1; + } + foll[0] = pc+i.size*4; + return 1; +} diff --git a/utils/libmach/kobj.c b/utils/libmach/kobj.c new file mode 100644 index 0000000..51dccbd --- /dev/null +++ b/utils/libmach/kobj.c @@ -0,0 +1,136 @@ +/* + * kobj.c - identify and parse a sparc object file + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "kc/k.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char type; + char sym; + char name; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + + +int +_isk(char *s) +{ + return s[0] == ANAME /* ANAME */ + && s[1] == D_FILE /* type */ + && s[2] == 1 /* sym */ + && s[3] == '<'; /* name of file */ +} + + +int +_readk(Biobuf *bp, Prog *p) +{ + int as, n; + Addr a; + + as = Bgetc(bp); /* as */ + if(as < 0) + return 0; + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = beswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); /* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n) + return 0; + return 1; + } + if(as == ATEXT) + p->kind = aText; + else if(as == AGLOBL) + p->kind = aData; + skip(bp, 5); /* reg (1 byte); 
lineno (4 bytes) */ + a = addr(bp); + addr(bp); + if(a.type != D_OREG || a.name != D_STATIC && a.name != D_EXTERN) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +static Addr +addr(Biobuf *bp) +{ + Addr a; + long off; + + a.type = Bgetc(bp); /* a.type */ + skip(bp, 1); /* reg */ + a.sym = Bgetc(bp); /* sym index */ + a.name = Bgetc(bp); /* sym type */ + switch(a.type) { + default: + case D_NONE: case D_REG: case D_FREG: case D_CREG: case D_PREG: + break; + case D_BRANCH: + case D_OREG: + case D_ASI: + case D_CONST: + off = Bgetc(bp); + off |= Bgetc(bp) << 8; + off |= Bgetc(bp) << 16; + off |= Bgetc(bp) << 24; + if(off < 0) + off = -off; + if(a.sym!=0 && (a.name==D_PARAM || a.name==D_AUTO)) + _offset(a.sym, off); + break; + case D_SCONST: + skip(bp, NSNAME); + break; + case D_FCONST: + skip(bp, 8); + break; + } + return a; +} + + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} diff --git a/utils/libmach/machdata.c b/utils/libmach/machdata.c new file mode 100644 index 0000000..425173e --- /dev/null +++ b/utils/libmach/machdata.c @@ -0,0 +1,450 @@ +/* + * Debugger utilities shared by at least two architectures + */ + +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +#define STARTSYM "_main" +#define PROFSYM "_mainp" +#define FRAMENAME ".frame" + +extern Machdata mipsmach; + +int asstype = AMIPS; /* disassembler type */ +Machdata *machdata; /* machine-dependent functions */ + +int +localaddr(Map *map, char *fn, char *var, uvlong *r, Rgetter rget) +{ + Symbol s; + uvlong fp, pc, sp, link; + + if (!lookup(fn, 0, &s)) { + werrstr("function not found"); + return -1; + } + pc = rget(map, mach->pc); + sp = rget(map, mach->sp); + if(mach->link) + link = rget(map, mach->link); + else + link = 0; + fp = machdata->findframe(map, s.value, pc, 
sp, link); + if (fp == 0) { + werrstr("stack frame not found"); + return -1; + } + + if (!var || !var[0]) { + *r = fp; + return 1; + } + + if (findlocal(&s, var, &s) == 0) { + werrstr("local variable not found"); + return -1; + } + + switch (s.class) { + case CAUTO: + *r = fp - s.value; + break; + case CPARAM: /* assume address size is stack width */ + *r = fp + s.value + mach->szaddr; + break; + default: + werrstr("local variable not found: %d", s.class); + return -1; + } + return 1; +} + +/* + * Print value v as s.name[+offset] if possible, or just v. + */ +int +symoff(char *buf, int n, uvlong v, int space) +{ + Symbol s; + int r; + long delta; + + r = delta = 0; /* to shut compiler up */ + if (v) { + r = findsym(v, space, &s); + if (r) + delta = v-s.value; + if (delta < 0) + delta = -delta; + } + if (v == 0 || r == 0) + return snprint(buf, n, "%llux", v); + if (s.type != 't' && s.type != 'T' && delta >= 4096) + return snprint(buf, n, "%llux", v); + else if (strcmp(s.name, ".string") == 0) + return snprint(buf, n, "%llux", v); + else if (delta) + return snprint(buf, n, "%s+%lux", s.name, delta); + else + return snprint(buf, n, "%s", s.name); +} + +/* + * Format floating point registers + * + * Register codes in format field: + * 'X' - print as 32-bit hexadecimal value + * 'F' - 64-bit double register when modif == 'F'; else 32-bit single reg + * 'f' - 32-bit ieee float + * '8' - big endian 80-bit ieee extended float + * '3' - little endian 80-bit ieee extended float with hole in bytes 8&9 + */ +int +fpformat(Map *map, Reglist *rp, char *buf, int n, int modif) +{ + char reg[12]; + ulong r; + + switch(rp->rformat) + { + case 'X': + if (get4(map, rp->roffs, &r) < 0) + return -1; + snprint(buf, n, "%lux", r); + break; + case 'F': /* first reg of double reg pair */ + if (modif == 'F') + if ((rp->rformat=='F') || (((rp+1)->rflags&RFLT) && (rp+1)->rformat == 'f')) { + if (get1(map, rp->roffs, (uchar *)reg, 8) < 0) + return -1; + machdata->dftos(buf, n, reg); + if 
(rp->rformat == 'F') + return 1; + return 2; + } + /* treat it like 'f' */ + if (get1(map, rp->roffs, (uchar *)reg, 4) < 0) + return -1; + machdata->sftos(buf, n, reg); + break; + case 'f': /* 32 bit float */ + if (get1(map, rp->roffs, (uchar *)reg, 4) < 0) + return -1; + machdata->sftos(buf, n, reg); + break; + case '3': /* little endian ieee 80 with hole in bytes 8&9 */ + if (get1(map, rp->roffs, (uchar *)reg, 10) < 0) + return -1; + memmove(reg+10, reg+8, 2); /* open hole */ + memset(reg+8, 0, 2); /* fill it */ + leieee80ftos(buf, n, reg); + break; + case '8': /* big-endian ieee 80 */ + if (get1(map, rp->roffs, (uchar *)reg, 10) < 0) + return -1; + beieee80ftos(buf, n, reg); + break; + default: /* unknown */ + break; + } + return 1; +} + +char * +_hexify(char *buf, ulong p, int zeros) +{ + ulong d; + + d = p/16; + if(d) + buf = _hexify(buf, d, zeros-1); + else + while(zeros--) + *buf++ = '0'; + *buf++ = "0123456789abcdef"[p&0x0f]; + return buf; +} + +/* + * These routines assume that if the number is representable + * in IEEE floating point, it will be representable in the native + * double format. Naive but workable, probably. 
+ */ +int +ieeedftos(char *buf, int n, ulong h, ulong l) +{ + double fr; + int exp; + + if (n <= 0) + return 0; + + + if(h & (1L<<31)){ + *buf++ = '-'; + h &= ~(1L<<31); + }else + *buf++ = ' '; + n--; + if(l == 0 && h == 0) + return snprint(buf, n, "0."); + exp = (h>>20) & ((1L<<11)-1L); + if(exp == 0) + return snprint(buf, n, "DeN(%.8lux%.8lux)", h, l); + if(exp == ((1L<<11)-1L)){ + if(l==0 && (h&((1L<<20)-1L)) == 0) + return snprint(buf, n, "Inf"); + else + return snprint(buf, n, "NaN(%.8lux%.8lux)", h&((1L<<20)-1L), l); + } + exp -= (1L<<10) - 2L; + fr = l & ((1L<<16)-1L); + fr /= 1L<<16; + fr += (l>>16) & ((1L<<16)-1L); + fr /= 1L<<16; + fr += (h & (1L<<20)-1L) | (1L<<20); + fr /= 1L<<21; + fr = ldexp(fr, exp); + return snprint(buf, n, "%.18g", fr); +} + +int +ieeesftos(char *buf, int n, ulong h) +{ + double fr; + int exp; + + if (n <= 0) + return 0; + + if(h & (1L<<31)){ + *buf++ = '-'; + h &= ~(1L<<31); + }else + *buf++ = ' '; + n--; + if(h == 0) + return snprint(buf, n, "0."); + exp = (h>>23) & ((1L<<8)-1L); + if(exp == 0) + return snprint(buf, n, "DeN(%.8lux)", h); + if(exp == ((1L<<8)-1L)){ + if((h&((1L<<23)-1L)) == 0) + return snprint(buf, n, "Inf"); + else + return snprint(buf, n, "NaN(%.8lux)", h&((1L<<23)-1L)); + } + exp -= (1L<<7) - 2L; + fr = (h & ((1L<<23)-1L)) | (1L<<23); + fr /= 1L<<24; + fr = ldexp(fr, exp); + return snprint(buf, n, "%.9g", fr); +} + +int +beieeesftos(char *buf, int n, void *s) +{ + return ieeesftos(buf, n, beswal(*(ulong*)s)); +} + +int +beieeedftos(char *buf, int n, void *s) +{ + return ieeedftos(buf, n, beswal(*(ulong*)s), beswal(((ulong*)(s))[1])); +} + +int +leieeesftos(char *buf, int n, void *s) +{ + return ieeesftos(buf, n, leswal(*(ulong*)s)); +} + +int +leieeedftos(char *buf, int n, void *s) +{ + return ieeedftos(buf, n, leswal(((ulong*)(s))[1]), leswal(*(ulong*)s)); +} + +/* packed in 12 bytes, with s[2]==s[3]==0; mantissa starts at s[4]*/ +int +beieee80ftos(char *buf, int n, void *s) +{ + uchar *reg = (uchar*)s; + int 
i; + ulong x; + uchar ieee[8+8]; /* room for slop */ + uchar *p, *q; + + memset(ieee, 0, sizeof(ieee)); + /* sign */ + if(reg[0] & 0x80) + ieee[0] |= 0x80; + + /* exponent */ + x = ((reg[0]&0x7F)<<8) | reg[1]; + if(x == 0) /* number is ±0 */ + goto done; + if(x == 0x7FFF){ + if(memcmp(reg+4, ieee+1, 8) == 0){ /* infinity */ + x = 2047; + }else{ /* NaN */ + x = 2047; + ieee[7] = 0x1; /* make sure */ + } + ieee[0] |= x>>4; + ieee[1] |= (x&0xF)<<4; + goto done; + } + x -= 0x3FFF; /* exponent bias */ + x += 1023; + if(x >= (1<<11) || ((reg[4]&0x80)==0 && x!=0)) + return snprint(buf, n, "not in range"); + ieee[0] |= x>>4; + ieee[1] |= (x&0xF)<<4; + + /* mantissa */ + p = reg+4; + q = ieee+1; + for(i=0; i<56; i+=8, p++, q++){ /* move one byte */ + x = (p[0]&0x7F) << 1; + if(p[1] & 0x80) + x |= 1; + q[0] |= x>>4; + q[1] |= (x&0xF)<<4; + } + done: + return beieeedftos(buf, n, (void*)ieee); +} + +int +leieee80ftos(char *buf, int n, void *s) +{ + int i; + char *cp; + char b[12]; + + cp = (char*) s; + for(i=0; i<12; i++) + b[11-i] = *cp++; + return beieee80ftos(buf, n, b); +} + +int +cisctrace(Map *map, uvlong pc, uvlong sp, uvlong link, Tracer trace) +{ + Symbol s; + int found, i; + uvlong opc, moved; + + USED(link); + i = 0; + opc = 0; + while(pc && opc != pc) { + moved = pc2sp(pc); + if (moved == ~0) + break; + found = findsym(pc, CTEXT, &s); + if (!found) + break; + if(strcmp(STARTSYM, s.name) == 0 || strcmp(PROFSYM, s.name) == 0) + break; + + sp += moved; + opc = pc; + if (geta(map, sp, &pc) < 0) + break; + (*trace)(map, pc, sp, &s); + sp += mach->szaddr; /*assumes address size = stack width*/ + if(++i > 40) + break; + } + return i; +} + +int +risctrace(Map *map, uvlong pc, uvlong sp, uvlong link, Tracer trace) +{ + int i; + Symbol s, f; + uvlong oldpc; + + i = 0; + while(findsym(pc, CTEXT, &s)) { + if(strcmp(STARTSYM, s.name) == 0 || strcmp(PROFSYM, s.name) == 0) + break; + + if(pc == s.value) /* at first instruction */ + f.value = 0; + else if(findlocal(&s, FRAMENAME, 
&f) == 0) + break; + + oldpc = pc; + if(s.type == 'L' || s.type == 'l' || pc <= s.value+mach->pcquant) + pc = link; + else + if (geta(map, sp, &pc) < 0) + break; + + if(pc == 0 || (pc == oldpc && f.value == 0)) + break; + + sp += f.value; + (*trace)(map, pc-8, sp, &s); + + if(++i > 40) + break; + } + return i; +} + +uvlong +ciscframe(Map *map, uvlong addr, uvlong pc, uvlong sp, uvlong link) +{ + Symbol s; + uvlong moved; + + USED(link); + for(;;) { + moved = pc2sp(pc); + if (moved == ~0) + break; + sp += moved; + findsym(pc, CTEXT, &s); + if (addr == s.value) + return sp; + if (geta(map, sp, &pc) < 0) + break; + sp += mach->szaddr; /*assumes sizeof(addr) = stack width*/ + } + return 0; +} + +uvlong +riscframe(Map *map, uvlong addr, uvlong pc, uvlong sp, uvlong link) +{ + Symbol s, f; + + while (findsym(pc, CTEXT, &s)) { + if(strcmp(STARTSYM, s.name) == 0 || strcmp(PROFSYM, s.name) == 0) + break; + + if(pc == s.value) /* at first instruction */ + f.value = 0; + else + if(findlocal(&s, FRAMENAME, &f) == 0) + break; + + sp += f.value; + if (s.value == addr) + return sp; + + if (s.type == 'L' || s.type == 'l' || pc-s.value <= mach->szaddr*2) + pc = link; + else + if (geta(map, sp-f.value, &pc) < 0) + break; + } + return 0; +} diff --git a/utils/libmach/map.c b/utils/libmach/map.c new file mode 100644 index 0000000..12bee1b --- /dev/null +++ b/utils/libmach/map.c @@ -0,0 +1,203 @@ +/* + * file map routines + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +Map * +newmap(Map *map, int n) +{ + int size; + + size = sizeof(Map)+(n-1)*sizeof(struct segment); + if (map == 0) + map = malloc(size); + else + map = realloc(map, size); + if (map == 0) { + werrstr("out of memory: %r"); + return 0; + } + memset(map, 0, size); + map->nsegs = n; + return map; +} + +int +setmap(Map *map, int fd, uvlong b, uvlong e, vlong f, char *name) +{ + int i; + + if (map == 0) + return 0; + for (i = 0; i < map->nsegs; i++) + if (!map->seg[i].inuse) + break; + if (i >= map->nsegs) + 
return 0; + map->seg[i].b = b; + map->seg[i].e = e; + map->seg[i].f = f; + map->seg[i].inuse = 1; + map->seg[i].name = name; + map->seg[i].fd = fd; + return 1; +} + +static uvlong +stacktop(int pid) +{ + char buf[64]; + int fd; + int n; + char *cp; + + snprint(buf, sizeof(buf), "/proc/%d/segment", pid); + fd = open(buf, 0); + if (fd < 0) + return 0; + n = read(fd, buf, sizeof(buf)-1); + close(fd); + buf[n] = 0; + if (strncmp(buf, "Stack", 5)) + return 0; + for (cp = buf+5; *cp && *cp == ' '; cp++) + ; + if (!*cp) + return 0; + cp = strchr(cp, ' '); + if (!cp) + return 0; + while (*cp && *cp == ' ') + cp++; + if (!*cp) + return 0; + return strtoull(cp, 0, 16); +} + +Map* +attachproc(int pid, int kflag, int corefd, Fhdr *fp) +{ + char buf[64], *regs; + int fd; + Map *map; + uvlong n; + + map = newmap(0, 4); + if (!map) + return 0; + if(kflag) + regs = "kregs"; + else + regs = "regs"; + if (mach->regsize) { + sprint(buf, "/proc/%d/%s", pid, regs); + fd = open(buf, ORDWR); + if(fd < 0) + fd = open(buf, OREAD); + if(fd < 0) { + free(map); + return 0; + } + setmap(map, fd, 0, mach->regsize, 0, "regs"); + } + if (mach->fpregsize) { + sprint(buf, "/proc/%d/fpregs", pid); + fd = open(buf, ORDWR); + if(fd < 0) + fd = open(buf, OREAD); + if(fd < 0) { + close(map->seg[0].fd); + free(map); + return 0; + } + setmap(map, fd, mach->regsize, mach->regsize+mach->fpregsize, 0, "fpregs"); + } + setmap(map, corefd, fp->txtaddr, fp->txtaddr+fp->txtsz, fp->txtaddr, "text"); + if(kflag || fp->dataddr >= mach->utop) { + setmap(map, corefd, fp->dataddr, ~0, fp->dataddr, "data"); + return map; + } + n = stacktop(pid); + if (n == 0) { + setmap(map, corefd, fp->dataddr, mach->utop, fp->dataddr, "data"); + return map; + } + setmap(map, corefd, fp->dataddr, n, fp->dataddr, "data"); + return map; +} + +int +findseg(Map *map, char *name) +{ + int i; + + if (!map) + return -1; + for (i = 0; i < map->nsegs; i++) + if (map->seg[i].inuse && !strcmp(map->seg[i].name, name)) + return i; + return -1; +} 
+ +void +unusemap(Map *map, int i) +{ + if (map != 0 && 0 <= i && i < map->nsegs) + map->seg[i].inuse = 0; +} + +Map* +loadmap(Map *map, int fd, Fhdr *fp) +{ + map = newmap(map, 2); + if (map == 0) + return 0; + + map->seg[0].b = fp->txtaddr; + map->seg[0].e = fp->txtaddr+fp->txtsz; + map->seg[0].f = fp->txtoff; + map->seg[0].fd = fd; + map->seg[0].inuse = 1; + map->seg[0].name = "text"; + map->seg[1].b = fp->dataddr; + map->seg[1].e = fp->dataddr+fp->datsz; + map->seg[1].f = fp->datoff; + map->seg[1].fd = fd; + map->seg[1].inuse = 1; + map->seg[1].name = "data"; + return map; +} + +Map* +attachremt(int fd, Fhdr *f) +{ + Map *m; + ulong txt; + + m = newmap(0, 3); + if (m == 0) + return 0; + + /* Space for mach structures */ + txt = f->txtaddr; + if(txt > 8*4096) + txt -= 8*4096; + + setmap(m, fd, txt, f->txtaddr+f->txtsz, txt, "*text"); + /*setmap(m, fd, f->dataddr, 0xffffffff, f->dataddr, "*data");*/ /* pc heap is < KTZERO */ + setmap(m, fd, 4096, 0xffffffff, 4096, "*data"); + setmap(m, fd, 0x0, mach->regsize, 0, "kreg"); + + return m; +} + +void +setmapio(Map *map, int i, Rsegio get, Rsegio put) +{ + if (map != 0 && 0 <= i && i < map->nsegs) { + map->seg[i].mget = get; + map->seg[i].mput = put; + } +} diff --git a/utils/libmach/mkfile b/utils/libmach/mkfile new file mode 100644 index 0000000..9114ed6 --- /dev/null +++ b/utils/libmach/mkfile @@ -0,0 +1,43 @@ +<../../mkconfig + +LIB=libmach.a +OFILES=\ + 4.$O\ + 5.$O\ + 6.$O\ + 8.$O\ + 9.$O\ + k.$O\ + q.$O\ + t.$O\ + v.$O\ + 5db.$O\ + 8db.$O\ + kdb.$O\ + qdb.$O\ + tdb.$O\ + vdb.$O\ + 5obj.$O\ + 6obj.$O\ + 8obj.$O\ + 9obj.$O\ + kobj.$O\ + qobj.$O\ + vobj.$O\ + obj.$O\ + map.$O\ + swap.$O\ + sym.$O\ + access.$O\ + machdata.$O\ + setmach.$O\ + executable.$O\ + vcodas.$O\ + +HFILES=../include/mach.h ../include/a.out.h bootexec.h elf.h ureg4.h ureg6.h ureg8.h uregk.h uregv.h ureg5.h + +<$ROOT/mkfiles/mksyslib-$SHELLTYPE +CFLAGS= $CFLAGS -I../include -I.. 
+ +package:QV: + $TRUE diff --git a/utils/libmach/obj.c b/utils/libmach/obj.c new file mode 100644 index 0000000..7b1f1b6 --- /dev/null +++ b/utils/libmach/obj.c @@ -0,0 +1,329 @@ +/* + * obj.c + * routines universal to all object files + */ +#include <lib9.h> +#include <ctype.h> +#include <bio.h> +#include <ar.h> +#include "mach.h" +#include "obj.h" + +#define islocal(t) ((t)=='a' || (t)=='p') + +enum +{ + NNAMES = 50, + MAXIS = 8, /* max length to determine if a file is a .? file */ + MAXOFF = 0x7fffffff, /* larger than any possible local offset */ + NHASH = 1024, /* must be power of two */ + HASHMUL = 79L, +}; + +/* in [$OS].c */ +int _is5(char*), + _is6(char*), + _is8(char*), + _is9(char*), + _isk(char*), + _isq(char*), + _isv(char*), + _read5(Biobuf*, Prog*), + _read6(Biobuf*, Prog*), + _read8(Biobuf*, Prog*), + _read9(Biobuf*, Prog*), + _readk(Biobuf*, Prog*), + _readq(Biobuf*, Prog*), + _readv(Biobuf*, Prog*); + +typedef struct Obj Obj; +typedef struct Symtab Symtab; + +struct Obj /* functions to handle each intermediate (.$O) file */ +{ + char *name; /* name of each $O file */ + int (*is)(char*); /* test for each type of $O file */ + int (*read)(Biobuf*, Prog*); /* read for each type of $O file*/ +}; + +static Obj obj[] = +{ /* functions to identify and parse each type of obj */ + /*[Obj68020]*/ {0, 0,}, + /*[ObjSparc]*/ "sparc .k", _isk, _readk, + /*[ObjMips]*/ "mips .v", _isv, _readv, + /*[Obj386]*/ "386 .8", _is8, _read8, + /*[Obj960]*/ {0, 0,}, + /*[Obj3210]*/ {0, 0,}, + /*[ObjMips2]*/ {0, 0,}, + /*[Obj29000]*/ {0, 0,}, + /*[ObjArm]*/ "arm .5", _is5, _read5, + /*[ObjPower]*/ "power .q", _isq, _readq, + /*[ObjMips2le]*/ {0, 0,}, + /*[ObjAlpha]*/ {0, 0,}, + /*[ObjSparc64]*/ {0, 0,}, + /*[ObjAmd64]*/ "amd64 .6", _is6, _read6, + /*[ObjSpim]*/ {0, 0,}, + /*[ObjPower64]*/ "power64 .9", _is9, _read9, + /*[Maxobjtype]*/ 0, 0 +}; + +struct Symtab +{ + struct Sym s; + struct Symtab *next; +}; + +static Symtab *hash[NHASH]; +static Sym *names[NNAMES]; /* working 
set of active names */ + +static int processprog(Prog*,int); /* decode each symbol reference */ +static void objreset(void); +static void objlookup(int, char *, int, uint); +static void objupdate(int, int); + +int +objtype(Biobuf *bp, char **name) +{ + int i; + char buf[MAXIS]; + + if(Bread(bp, buf, MAXIS) < MAXIS) + return -1; + Bseek(bp, -MAXIS, 1); + for (i = 0; i < Maxobjtype; i++) { + if (obj[i].is && (*obj[i].is)(buf)) { + if (name) + *name = obj[i].name; + return i; + } + } + return -1; +} + +int +isar(Biobuf *bp) +{ + int n; + char magbuf[SARMAG]; + + n = Bread(bp, magbuf, SARMAG); + if(n == SARMAG && strncmp(magbuf, ARMAG, SARMAG) == 0) + return 1; + return 0; +} + +/* + * determine what kind of object file this is and process it. + * return whether or not this was a recognized intermediate file. + */ +int +readobj(Biobuf *bp, int objtype) +{ + Prog p; + + if (objtype < 0 || objtype >= Maxobjtype || obj[objtype].is == 0) + return 1; + objreset(); + while ((*obj[objtype].read)(bp, &p)) + if (!processprog(&p, 1)) + return 0; + return 1; +} + +int +readar(Biobuf *bp, int objtype, vlong end, int doautos) +{ + Prog p; + + if (objtype < 0 || objtype >= Maxobjtype || obj[objtype].is == 0) + return 1; + objreset(); + while ((*obj[objtype].read)(bp, &p) && Boffset(bp) < end) + if (!processprog(&p, doautos)) + return 0; + return 1; +} + +/* + * decode a symbol reference or definition + */ +static int +processprog(Prog *p, int doautos) +{ + if(p->kind == aNone) + return 1; + if(p->sym < 0 || p->sym >= NNAMES) + return 0; + switch(p->kind) + { + case aName: + if (!doautos) + if(p->type != 'U' && p->type != 'b') + break; + objlookup(p->sym, p->id, p->type, p->sig); + break; + case aText: + objupdate(p->sym, 'T'); + break; + case aData: + objupdate(p->sym, 'D'); + break; + default: + break; + } + return 1; +} + +/* + * find the entry for s in the symbol array. + * make a new entry if it is not already there. 
+ */ +static void +objlookup(int id, char *name, int type, uint sig) +{ + long h; + char *cp; + Sym *s; + Symtab *sp; + + s = names[id]; + if(s && strcmp(s->name, name) == 0) { + s->type = type; + s->sig = sig; + return; + } + + h = *name; + for(cp = name+1; *cp; h += *cp++) + h *= HASHMUL; + if(h < 0) + h = ~h; + h &= (NHASH-1); + if (type == 'U' || type == 'b' || islocal(type)) { + for(sp = hash[h]; sp; sp = sp->next) + if(strcmp(sp->s.name, name) == 0) { + switch(sp->s.type) { + case 'T': + case 'D': + case 'U': + if (type == 'U') { + names[id] = &sp->s; + return; + } + break; + case 't': + case 'd': + case 'b': + if (type == 'b') { + names[id] = &sp->s; + return; + } + break; + case 'a': + case 'p': + if (islocal(type)) { + names[id] = &sp->s; + return; + } + break; + default: + break; + } + } + } + sp = malloc(sizeof(Symtab)); + sp->s.name = name; + sp->s.type = type; + sp->s.sig = sig; + sp->s.value = islocal(type) ? MAXOFF : 0; + names[id] = &sp->s; + sp->next = hash[h]; + hash[h] = sp; + return; +} +/* + * traverse the symbol lists + */ +void +objtraverse(void (*fn)(Sym*, void*), void *pointer) +{ + int i; + Symtab *s; + + for(i = 0; i < NHASH; i++) + for(s = hash[i]; s; s = s->next) + (*fn)(&s->s, pointer); +} + +/* + * update the offset information for a 'a' or 'p' symbol in an intermediate file + */ +void +_offset(int id, vlong off) +{ + Sym *s; + + s = names[id]; + if (s && s->name[0] && islocal(s->type) && s->value > off) + s->value = off; +} + +/* + * update the type of a global text or data symbol + */ +static void +objupdate(int id, int type) +{ + Sym *s; + + s = names[id]; + if (s && s->name[0]) + if (s->type == 'U') + s->type = type; + else if (s->type == 'b') + s->type = tolower(type); +} + +/* + * look for the next file in an archive + */ +int +nextar(Biobuf *bp, int offset, char *buf) +{ + struct ar_hdr a; + int i, r; + long arsize; + + if (offset&01) + offset++; + Bseek(bp, offset, 0); + r = Bread(bp, &a, SAR_HDR); + if(r != SAR_HDR) + return 
0; + if(strncmp(a.fmag, ARFMAG, sizeof(a.fmag))) + return -1; + for(i=0; i<sizeof(a.name) && i<SARNAME && a.name[i] != ' '; i++) + buf[i] = a.name[i]; + buf[i] = 0; + arsize = strtol(a.size, 0, 0); + if (arsize&1) + arsize++; + return arsize + SAR_HDR; +} + +static void +objreset(void) +{ + int i; + Symtab *s, *n; + + for(i = 0; i < NHASH; i++) { + for(s = hash[i]; s; s = n) { + n = s->next; + free(s->s.name); + free(s); + } + hash[i] = 0; + } + memset(names, 0, sizeof names); +} diff --git a/utils/libmach/obj.h b/utils/libmach/obj.h new file mode 100644 index 0000000..d8c507a --- /dev/null +++ b/utils/libmach/obj.h @@ -0,0 +1,25 @@ +/* + * obj.h -- defs for dealing with object files + */ + +typedef enum Kind /* variable defs and references in obj */ +{ + aNone, /* we don't care about this prog */ + aName, /* introduces a name */ + aText, /* starts a function */ + aData, /* references to a global object */ +} Kind; + +typedef struct Prog Prog; + +struct Prog /* info from .$O files */ +{ + Kind kind; /* what kind of symbol */ + char type; /* type of the symbol: ie, 'T', 'a', etc. */ + char sym; /* index of symbol's name */ + char *id; /* name for the symbol, if it introduces one */ + uint sig; /* type signature for symbol */ +}; + +#define UNKNOWN '?' 
+void _offset(int, vlong); diff --git a/utils/libmach/q.c b/utils/libmach/q.c new file mode 100644 index 0000000..2e8f66f --- /dev/null +++ b/utils/libmach/q.c @@ -0,0 +1,123 @@ +/* + * PowerPC definition + * forsyth@terzarima.net + */ +#include <lib9.h> +#include <bio.h> +#include "uregq.h" +#include "mach.h" + + +#define REGOFF(x) (ulong) (&((struct Ureg *) 0)->x) + +#define SP REGOFF(sp) +#define PC REGOFF(pc) +#define R3 REGOFF(r3) /* return reg */ +#define LR REGOFF(lr) +#define R31 REGOFF(r31) +#define FP_REG(x) (R31+4+8*(x)) + +#define REGSIZE sizeof(struct Ureg) +#define FPREGSIZE (8*33) + +Reglist powerreglist[] = { + {"CAUSE", REGOFF(cause), RINT|RRDONLY, 'X'}, + {"SRR1", REGOFF(srr1), RINT|RRDONLY, 'X'}, + {"PC", REGOFF(pc), RINT, 'X'}, + {"LR", REGOFF(lr), RINT, 'X'}, + {"CR", REGOFF(cr), RINT, 'X'}, + {"XER", REGOFF(xer), RINT, 'X'}, + {"CTR", REGOFF(ctr), RINT, 'X'}, + {"PC", PC, RINT, 'X'}, + {"SP", SP, RINT, 'X'}, + {"R0", REGOFF(r0), RINT, 'X'}, + /* R1 is SP */ + {"R2", REGOFF(r2), RINT, 'X'}, + {"R3", REGOFF(r3), RINT, 'X'}, + {"R4", REGOFF(r4), RINT, 'X'}, + {"R5", REGOFF(r5), RINT, 'X'}, + {"R6", REGOFF(r6), RINT, 'X'}, + {"R7", REGOFF(r7), RINT, 'X'}, + {"R8", REGOFF(r8), RINT, 'X'}, + {"R9", REGOFF(r9), RINT, 'X'}, + {"R10", REGOFF(r10), RINT, 'X'}, + {"R11", REGOFF(r11), RINT, 'X'}, + {"R12", REGOFF(r12), RINT, 'X'}, + {"R13", REGOFF(r13), RINT, 'X'}, + {"R14", REGOFF(r14), RINT, 'X'}, + {"R15", REGOFF(r15), RINT, 'X'}, + {"R16", REGOFF(r16), RINT, 'X'}, + {"R17", REGOFF(r17), RINT, 'X'}, + {"R18", REGOFF(r18), RINT, 'X'}, + {"R19", REGOFF(r19), RINT, 'X'}, + {"R20", REGOFF(r20), RINT, 'X'}, + {"R21", REGOFF(r21), RINT, 'X'}, + {"R22", REGOFF(r22), RINT, 'X'}, + {"R23", REGOFF(r23), RINT, 'X'}, + {"R24", REGOFF(r24), RINT, 'X'}, + {"R25", REGOFF(r25), RINT, 'X'}, + {"R26", REGOFF(r26), RINT, 'X'}, + {"R27", REGOFF(r27), RINT, 'X'}, + {"R28", REGOFF(r28), RINT, 'X'}, + {"R29", REGOFF(r29), RINT, 'X'}, + {"R30", REGOFF(r30), RINT, 'X'}, + 
{"R31", REGOFF(r31), RINT, 'X'}, + {"F0", FP_REG(0), RFLT, 'F'}, + {"F1", FP_REG(1), RFLT, 'F'}, + {"F2", FP_REG(2), RFLT, 'F'}, + {"F3", FP_REG(3), RFLT, 'F'}, + {"F4", FP_REG(4), RFLT, 'F'}, + {"F5", FP_REG(5), RFLT, 'F'}, + {"F6", FP_REG(6), RFLT, 'F'}, + {"F7", FP_REG(7), RFLT, 'F'}, + {"F8", FP_REG(8), RFLT, 'F'}, + {"F9", FP_REG(9), RFLT, 'F'}, + {"F10", FP_REG(10), RFLT, 'F'}, + {"F11", FP_REG(11), RFLT, 'F'}, + {"F12", FP_REG(12), RFLT, 'F'}, + {"F13", FP_REG(13), RFLT, 'F'}, + {"F14", FP_REG(14), RFLT, 'F'}, + {"F15", FP_REG(15), RFLT, 'F'}, + {"F16", FP_REG(16), RFLT, 'F'}, + {"F17", FP_REG(17), RFLT, 'F'}, + {"F18", FP_REG(18), RFLT, 'F'}, + {"F19", FP_REG(19), RFLT, 'F'}, + {"F20", FP_REG(20), RFLT, 'F'}, + {"F21", FP_REG(21), RFLT, 'F'}, + {"F22", FP_REG(22), RFLT, 'F'}, + {"F23", FP_REG(23), RFLT, 'F'}, + {"F24", FP_REG(24), RFLT, 'F'}, + {"F25", FP_REG(25), RFLT, 'F'}, + {"F26", FP_REG(26), RFLT, 'F'}, + {"F27", FP_REG(27), RFLT, 'F'}, + {"F28", FP_REG(28), RFLT, 'F'}, + {"F29", FP_REG(29), RFLT, 'F'}, + {"F30", FP_REG(30), RFLT, 'F'}, + {"F31", FP_REG(31), RFLT, 'F'}, + {"FPSCR", FP_REG(32)+4, RFLT, 'X'}, + { 0 } +}; + + /* the machine description */ +Mach mpower = +{ + "power", + MPOWER, /* machine type */ + powerreglist, /* register set */ + REGSIZE, /* number of bytes in register set */ + FPREGSIZE, /* number of bytes in FP register set */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "LR", /* name of link register */ + "setSB", /* static base register name */ + 0, /* value */ + 0x1000, /* page size */ + 0x80000000U, /* kernel base */ + 0xF0000000U, /* kernel text mask */ + 0x7FFFFFFFU, /* user stack top */ + 4, /* quantization of pc */ + 4, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git a/utils/libmach/qdb.c b/utils/libmach/qdb.c new file mode 100644 index 0000000..636b551 --- /dev/null +++ b/utils/libmach/qdb.c @@ -0,0 +1,1363 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +/* + * 
PowerPC-specific debugger interface, + * including 64-bit modes + * forsyth@terzarima.net + */ + +static char *powerexcep(Map*, Rgetter); +static int powerfoll(Map*, uvlong, Rgetter, uvlong*); +static int powerinst(Map*, uvlong, char, char*, int); +static int powerinstlen(Map*, uvlong); +static int powerdas(Map*, uvlong, char*, int); + +/* + * Machine description + */ +Machdata powermach = +{ + {0x07f, 0xe0, 0x00, 0x08}, /* breakpoint (tw 31,r0,r0) */ + 4, /* break point size */ + + beswab, /* short to local byte order */ + beswal, /* long to local byte order */ + beswav, /* vlong to local byte order */ + risctrace, /* print C traceback */ + riscframe, /* frame finder */ + powerexcep, /* print exception */ + 0, /* breakpoint fixup */ + beieeesftos, /* single precision float printer */ + beieeedftos, /* double precisioin float printer */ + powerfoll, /* following addresses */ + powerinst, /* print instruction */ + powerdas, /* dissembler */ + powerinstlen, /* instruction size */ +}; + +static char *excname[] = +{ + "reserved 0", + "system reset", + "machine check", + "data access", + "instruction access", + "external interrupt", + "alignment", + "program exception", + "floating-point unavailable", + "decrementer", + "i/o controller interface error", + "reserved B", + "system call", + "trace trap", + "floating point assist", + "reserved", + "ITLB miss", + "DTLB load miss", + "DTLB store miss", + "instruction address breakpoint" + "SMI interrupt" + "reserved 15", + "reserved 16", + "reserved 17", + "reserved 18", + "reserved 19", + "reserved 1A", + /* the following are made up on a program exception */ + "floating point exception", /* FPEXC */ + "illegal instruction", + "privileged instruction", + "trap", + "illegal operation", + "breakpoint", /* 20 */ +}; + +static char* +powerexcep(Map *map, Rgetter rget) +{ + long c; + static char buf[32]; + + c = (*rget)(map, "CAUSE") >> 8; + if(c < nelem(excname)) + return excname[c]; + sprint(buf, "unknown trap #%lx", c); + 
return buf; +} + +/* + * disassemble PowerPC opcodes + */ + +#define REGSP 1 /* should come from q.out.h, but there's a clash */ +#define REGSB 2 + +static char FRAMENAME[] = ".frame"; + +static Map *mymap; + +/* + * ibm conventions for these: bit 0 is top bit + * from table 10-1 + */ +typedef struct { + uchar aa; /* bit 30 */ + uchar crba; /* bits 11-15 */ + uchar crbb; /* bits 16-20 */ + long bd; /* bits 16-29 */ + uchar crfd; /* bits 6-8 */ + uchar crfs; /* bits 11-13 */ + uchar bi; /* bits 11-15 */ + uchar bo; /* bits 6-10 */ + uchar crbd; /* bits 6-10 */ + /* union { */ + short d; /* bits 16-31 */ + short simm; + ushort uimm; + /*}; */ + uchar fm; /* bits 7-14 */ + uchar fra; /* bits 11-15 */ + uchar frb; /* bits 16-20 */ + uchar frc; /* bits 21-25 */ + uchar frs; /* bits 6-10 */ + uchar frd; /* bits 6-10 */ + uchar crm; /* bits 12-19 */ + long li; /* bits 6-29 || b'00' */ + uchar lk; /* bit 31 */ + uchar mb; /* bits 21-25 */ + uchar me; /* bits 26-30 */ + uchar xmbe; /* bits 26,21-25: mb[5] || mb[0:4], also xme */ + uchar xsh; /* bits 30,16-20: sh[5] || sh[0:4] */ + uchar nb; /* bits 16-20 */ + uchar op; /* bits 0-5 */ + uchar oe; /* bit 21 */ + uchar ra; /* bits 11-15 */ + uchar rb; /* bits 16-20 */ + uchar rc; /* bit 31 */ + /* union { */ + uchar rs; /* bits 6-10 */ + uchar rd; + /*};*/ + uchar sh; /* bits 16-20 */ + ushort spr; /* bits 11-20 */ + uchar to; /* bits 6-10 */ + uchar imm; /* bits 16-19 */ + ushort xo; /* bits 21-30, 22-30, 26-30, or 30 (beware) */ + uvlong imm64; + long w0; + long w1; + uvlong addr; /* pc of instruction */ + short target; + short m64; /* 64-bit mode */ + char *curr; /* current fill level in output buffer */ + char *end; /* end of buffer */ + int size; /* number of longs in instr */ + char *err; /* errmsg */ +} Instr; + +#define IBF(v,a,b) (((ulong)(v)>>(32-(b)-1)) & ~(~0L<<(((b)-(a)+1)))) +#define IB(v,b) IBF((v),(b),(b)) + +#pragma varargck argpos bprint 2 + +static void +bprint(Instr *i, char *fmt, ...) 
+{ + va_list arg; + + va_start(arg, fmt); + i->curr = vseprint(i->curr, i->end, fmt, arg); + va_end(arg); +} + +static int +decode(uvlong pc, Instr *i) +{ + ulong w; + + if (get4(mymap, pc, &w) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + i->m64 = asstype == APOWER64; + i->aa = IB(w, 30); + i->crba = IBF(w, 11, 15); + i->crbb = IBF(w, 16, 20); + i->bd = IBF(w, 16, 29)<<2; + if(i->bd & 0x8000) + i->bd |= ~0L<<16; + i->crfd = IBF(w, 6, 8); + i->crfs = IBF(w, 11, 13); + i->bi = IBF(w, 11, 15); + i->bo = IBF(w, 6, 10); + i->crbd = IBF(w, 6, 10); + i->uimm = IBF(w, 16, 31); /* also d, simm */ + i->fm = IBF(w, 7, 14); + i->fra = IBF(w, 11, 15); + i->frb = IBF(w, 16, 20); + i->frc = IBF(w, 21, 25); + i->frs = IBF(w, 6, 10); + i->frd = IBF(w, 6, 10); + i->crm = IBF(w, 12, 19); + i->li = IBF(w, 6, 29)<<2; + if(IB(w, 6)) + i->li |= ~0<<25; + i->lk = IB(w, 31); + i->mb = IBF(w, 21, 25); + i->me = IBF(w, 26, 30); + i->xmbe = (IB(w,26)<<5) | i->mb; + i->nb = IBF(w, 16, 20); + i->op = IBF(w, 0, 5); + i->oe = IB(w, 21); + i->ra = IBF(w, 11, 15); + i->rb = IBF(w, 16, 20); + i->rc = IB(w, 31); + i->rs = IBF(w, 6, 10); /* also rd */ + i->sh = IBF(w, 16, 20); + i->xsh = (IB(w, 30)<<5) | i->sh; + i->spr = IBF(w, 11, 20); + i->to = IBF(w, 6, 10); + i->imm = IBF(w, 16, 19); + i->xo = IBF(w, 21, 30); /* bits 21-30, 22-30, 26-30, or 30 (beware) */ + if(i->op == 58){ /* class of 64-bit loads */ + i->xo = i->simm & 3; + i->simm &= ~3; + } + i->imm64 = i->simm; + if(i->op == 15) + i->imm64 <<= 16; + else if(i->op == 25 || i->op == 27 || i->op == 29) + i->imm64 = (uvlong)(i->uimm<<16); + i->w0 = w; + i->target = -1; + i->addr = pc; + i->size = 1; + return 1; +} + +static int +mkinstr(uvlong pc, Instr *i) +{ + Instr x; + + if(decode(pc, i) < 0) + return -1; + /* + * combine ADDIS/ORI (CAU/ORIL) into MOVW + * also ORIS/ORIL for unsigned in 64-bit mode + */ + if ((i->op == 15 || i->op == 25) && i->ra==0) { + if(decode(pc+4, &x) < 0) + return -1; + if (x.op == 24 && x.rs == 
x.ra && x.ra == i->rd) { + i->imm64 |= (x.imm64 & 0xFFFF); + if(i->op != 15) + i->imm64 &= 0xFFFFFFFFUL; + i->w1 = x.w0; + i->target = x.rd; + i->size++; + return 1; + } + } + return 1; +} + +static int +plocal(Instr *i) +{ + long offset; + Symbol s; + + if (!findsym(i->addr, CTEXT, &s) || !findlocal(&s, FRAMENAME, &s)) + return -1; + offset = s.value - i->imm64; + if (offset > 0) { + if(getauto(&s, offset, CAUTO, &s)) { + bprint(i, "%s+%lld(SP)", s.name, s.value); + return 1; + } + } else { + if (getauto(&s, -offset-4, CPARAM, &s)) { + bprint(i, "%s+%ld(FP)", s.name, -offset); + return 1; + } + } + return -1; +} + +static int +pglobal(Instr *i, uvlong off, int anyoff, char *reg) +{ + Symbol s, s2; + uvlong off1; + + if(findsym(off, CANY, &s) && + s.value-off < 4096 && + (s.class == CDATA || s.class == CTEXT)) { + if(off==s.value && s.name[0]=='$'){ + off1 = 0; + geta(mymap, s.value, &off1); + if(off1 && findsym(off1, CANY, &s2) && s2.value == off1){ + bprint(i, "$%s%s", s2.name, reg); + return 1; + } + } + bprint(i, "%s", s.name); + if (s.value != off) + bprint(i, "+%llux", off-s.value); + bprint(i, reg); + return 1; + } + if(!anyoff) + return 0; + bprint(i, "%llux%s", off, reg); + return 1; +} + +static void +address(Instr *i) +{ + if (i->ra == REGSP && plocal(i) >= 0) + return; + if (i->ra == REGSB && mach->sb && pglobal(i, mach->sb+i->imm64, 0, "(SB)") >= 0) + return; + if(i->simm < 0) + bprint(i, "-%x(R%d)", -i->simm, i->ra); + else + bprint(i, "%llux(R%d)", i->imm64, i->ra); +} + +static char *tcrbits[] = {"LT", "GT", "EQ", "VS"}; +static char *fcrbits[] = {"GE", "LE", "NE", "VC"}; + +typedef struct Opcode Opcode; + +struct Opcode { + uchar op; + ushort xo; + ushort xomask; + char *mnemonic; + void (*f)(Opcode *, Instr *); + char *ken; + int flags; +}; + +static void format(char *, Instr *, char *); + +static void +branch(Opcode *o, Instr *i) +{ + char buf[8]; + int bo, bi; + + bo = i->bo & ~1; /* ignore prediction bit */ + if(bo==4 || bo==12 || bo==20) { /* 
simple forms */ + if(bo != 20) { + bi = i->bi&3; + sprint(buf, "B%s%%L", bo==12? tcrbits[bi]: fcrbits[bi]); + format(buf, i, nil); + bprint(i, "\t"); + if(i->bi > 4) + bprint(i, "CR(%d),", i->bi/4); + } else + format("BR%L\t", i, nil); + if(i->op == 16) + format(0, i, "%J"); + else if(i->op == 19 && i->xo == 528) + format(0, i, "(CTR)"); + else if(i->op == 19 && i->xo == 16) + format(0, i, "(LR)"); + } else + format(o->mnemonic, i, o->ken); +} + +static void +addi(Opcode *o, Instr *i) +{ + if (i->op==14 && i->ra == 0) + format("MOVW", i, "%i,R%d"); + else if (i->ra == REGSB) { + bprint(i, "MOVW\t$"); + address(i); + bprint(i, ",R%d", i->rd); + } else if(i->op==14 && i->simm < 0) { + bprint(i, "SUB\t$%d,R%d", -i->simm, i->ra); + if(i->rd != i->ra) + bprint(i, ",R%d", i->rd); + } else if(i->ra == i->rd) { + format(o->mnemonic, i, "%i"); + bprint(i, ",R%d", i->rd); + } else + format(o->mnemonic, i, o->ken); +} + +static void +addis(Opcode *o, Instr *i) +{ + long v; + + v = i->imm64; + if (i->op==15 && i->ra == 0) + bprint(i, "MOVW\t$%lux,R%d", v, i->rd); + else if (i->op==15 && i->ra == REGSB) { + bprint(i, "MOVW\t$"); + address(i); + bprint(i, ",R%d", i->rd); + } else if(i->op==15 && v < 0) { + bprint(i, "SUB\t$%ld,R%d", -v, i->ra); + if(i->rd != i->ra) + bprint(i, ",R%d", i->rd); + } else { + format(o->mnemonic, i, nil); + bprint(i, "\t$%ld,R%d", v, i->ra); + if(i->rd != i->ra) + bprint(i, ",R%d", i->rd); + } +} + +static void +andi(Opcode *o, Instr *i) +{ + if (i->ra == i->rs) + format(o->mnemonic, i, "%I,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +gencc(Opcode *o, Instr *i) +{ + format(o->mnemonic, i, o->ken); +} + +static void +gen(Opcode *o, Instr *i) +{ + format(o->mnemonic, i, o->ken); + if (i->rc) + bprint(i, " [illegal Rc]"); +} + +static void +ldx(Opcode *o, Instr *i) +{ + if(i->ra == 0) + format(o->mnemonic, i, "(R%b),R%d"); + else + format(o->mnemonic, i, "(R%b+R%a),R%d"); + if(i->rc) + bprint(i, " [illegal Rc]"); +} + +static void 
+stx(Opcode *o, Instr *i) +{ + if(i->ra == 0) + format(o->mnemonic, i, "R%d,(R%b)"); + else + format(o->mnemonic, i, "R%d,(R%b+R%a)"); + if(i->rc && i->xo != 150) + bprint(i, " [illegal Rc]"); +} + +static void +fldx(Opcode *o, Instr *i) +{ + if(i->ra == 0) + format(o->mnemonic, i, "(R%b),F%d"); + else + format(o->mnemonic, i, "(R%b+R%a),F%d"); + if(i->rc) + bprint(i, " [illegal Rc]"); +} + +static void +fstx(Opcode *o, Instr *i) +{ + if(i->ra == 0) + format(o->mnemonic, i, "F%d,(R%b)"); + else + format(o->mnemonic, i, "F%d,(R%b+R%a)"); + if(i->rc) + bprint(i, " [illegal Rc]"); +} + +static void +dcb(Opcode *o, Instr *i) +{ + if(i->ra == 0) + format(o->mnemonic, i, "(R%b)"); + else + format(o->mnemonic, i, "(R%b+R%a)"); + if(i->rd) + bprint(i, " [illegal Rd]"); + if(i->rc) + bprint(i, " [illegal Rc]"); +} + +static void +lw(Opcode *o, Instr *i, char r) +{ + format(o->mnemonic, i, nil); + bprint(i, "\t"); + address(i); + bprint(i, ",%c%d", r, i->rd); +} + +static void +load(Opcode *o, Instr *i) +{ + lw(o, i, 'R'); +} + +static void +fload(Opcode *o, Instr *i) +{ + lw(o, i, 'F'); +} + +static void +sw(Opcode *o, Instr *i, char r) +{ + int offset; + Symbol s; + + if (i->rs == REGSP) { + if (findsym(i->addr, CTEXT, &s) && findlocal(&s, FRAMENAME, &s)) { + offset = s.value-i->imm64; + if (offset > 0 && getauto(&s, offset, CAUTO, &s)) { + format(o->mnemonic, i, nil); + bprint(i, "\t%c%d,%s-%d(SP)", r, i->rd, s.name, offset); + return; + } + } + } + if (i->rs == REGSB && mach->sb) { + format(o->mnemonic, i, nil); + bprint(i, "\t%c%d,", r, i->rd); + address(i); + return; + } + if (r == 'F') + format(o->mnemonic, i, "F%d,%l"); + else + format(o->mnemonic, i, o->ken); +} + +static void +store(Opcode *o, Instr *i) +{ + sw(o, i, 'R'); +} + +static void +fstore(Opcode *o, Instr *i) +{ + sw(o, i, 'F'); +} + +static void +shifti(Opcode *o, Instr *i) +{ + if (i->ra == i->rs) + format(o->mnemonic, i, "$%k,R%a"); + else + format(o->mnemonic, i, o->ken); +} + +static void 
+shift(Opcode *o, Instr *i) +{ + if (i->ra == i->rs) + format(o->mnemonic, i, "R%b,R%a"); + else + format(o->mnemonic, i, o->ken); +} + +static void +add(Opcode *o, Instr *i) +{ + if (i->rd == i->ra) + format(o->mnemonic, i, "R%b,R%d"); + else if (i->rd == i->rb) + format(o->mnemonic, i, "R%a,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +sub(Opcode *o, Instr *i) +{ + format(o->mnemonic, i, nil); + bprint(i, "\t"); + if(i->op == 31) { + bprint(i, "\tR%d,R%d", i->ra, i->rb); /* subtract Ra from Rb */ + if(i->rd != i->rb) + bprint(i, ",R%d", i->rd); + } else + bprint(i, "\tR%d,$%d,R%d", i->ra, i->simm, i->rd); +} + +static void +qmuldiv(Opcode *o, Instr *i) +{ + format(o->mnemonic, i, nil); + if(i->op == 31) + bprint(i, "\tR%d,R%d", i->rb, i->ra); + else + bprint(i, "\t$%d,R%d", i->simm, i->ra); + if(i->ra != i->rd) + bprint(i, ",R%d", i->rd); +} + +static void +and(Opcode *o, Instr *i) +{ + if (i->op == 31) { + /* Rb,Rs,Ra */ + if (i->ra == i->rs) + format(o->mnemonic, i, "R%b,R%a"); + else if (i->ra == i->rb) + format(o->mnemonic, i, "R%s,R%a"); + else + format(o->mnemonic, i, o->ken); + } else { + /* imm,Rs,Ra */ + if (i->ra == i->rs) + format(o->mnemonic, i, "%I,R%a"); + else + format(o->mnemonic, i, o->ken); + } +} + +static void +or(Opcode *o, Instr *i) +{ + if (i->op == 31) { + /* Rb,Rs,Ra */ + if (i->rs == 0 && i->ra == 0 && i->rb == 0) + format("NOP", i, nil); + else if (i->rs == i->rb) + format("MOVW", i, "R%b,R%a"); + else + and(o, i); + } else + and(o, i); +} + +static void +shifted(Opcode *o, Instr *i) +{ + format(o->mnemonic, i, nil); + bprint(i, "\t$%lux,", (ulong)i->uimm<<16); + if (i->rs == i->ra) + bprint(i, "R%d", i->ra); + else + bprint(i, "R%d,R%d", i->rs, i->ra); +} + +static void +neg(Opcode *o, Instr *i) +{ + if (i->rd == i->ra) + format(o->mnemonic, i, "R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static char ir2[] = "R%a,R%d"; /* reverse of IBM order */ +static char ir3[] = "R%b,R%a,R%d"; +static char ir3r[] = 
"R%a,R%b,R%d"; +static char il3[] = "R%b,R%s,R%a"; +static char il2u[] = "%I,R%d,R%a"; +static char il3s[] = "$%k,R%s,R%a"; +static char il2[] = "R%s,R%a"; +static char icmp3[] = "R%a,R%b,%D"; +static char cr3op[] = "%b,%a,%d"; +static char ir2i[] = "%i,R%a,R%d"; +static char fp2[] = "F%b,F%d"; +static char fp3[] = "F%b,F%a,F%d"; +static char fp3c[] = "F%c,F%a,F%d"; +static char fp4[] = "F%a,F%c,F%b,F%d"; +static char fpcmp[] = "F%a,F%b,%D"; +static char ldop[] = "%l,R%d"; +static char stop[] = "R%d,%l"; +static char fldop[] = "%l,F%d"; +static char fstop[] = "F%d,%l"; +static char rldc[] = "R%b,R%s,$%E,R%a"; +static char rlim[] = "R%b,R%s,$%z,R%a"; +static char rlimi[] = "$%k,R%s,$%z,R%a"; +static char rldi[] = "$%e,R%s,$%E,R%a"; + +#define OEM IBF(~0,22,30) +#define FP4 IBF(~0,26,30) +#define ALL (~0) +#define RLDC 0xF +#define RLDI 0xE +/* +notes: + 10-26: crfD = rD>>2; rD&3 mbz + also, L bit (bit 10) mbz or selects 64-bit operands +*/ + +static Opcode opcodes[] = { + {31, 266, OEM, "ADD%V%C", add, ir3}, + {31, 10, OEM, "ADDC%V%C", add, ir3}, + {31, 138, OEM, "ADDE%V%C", add, ir3}, + {14, 0, 0, "ADD", addi, ir2i}, + {12, 0, 0, "ADDC", addi, ir2i}, + {13, 0, 0, "ADDCCC", addi, ir2i}, + {15, 0, 0, "ADD", addis, 0}, + {31, 234, OEM, "ADDME%V%C", gencc, ir2}, + {31, 202, OEM, "ADDZE%V%C", gencc, ir2}, + + {31, 28, ALL, "AND%C", and, il3}, + {31, 60, ALL, "ANDN%C", and, il3}, + {28, 0, 0, "ANDCC", andi, il2u}, + {29, 0, 0, "ANDCC", shifted, 0}, + + {18, 0, 0, "B%L", gencc, "%j"}, + {16, 0, 0, "BC%L", branch, "%d,%a,%J"}, + {19, 528, ALL, "BC%L", branch, "%d,%a,(CTR)"}, + {19, 16, ALL, "BC%L", branch, "%d,%a,(LR)"}, + + {31, 0, ALL, "CMP", 0, icmp3}, + {11, 0, 0, "CMP", 0, "R%a,%i,%D"}, + {31, 32, ALL, "CMPU", 0, icmp3}, + {10, 0, 0, "CMPU", 0, "R%a,%I,%D"}, + + {31, 58, ALL, "CNTLZD%C", gencc, ir2}, /* 64 */ + {31, 26, ALL, "CNTLZ%W%C", gencc, ir2}, + + {19, 257, ALL, "CRAND", gen, cr3op}, + {19, 129, ALL, "CRANDN", gen, cr3op}, + {19, 289, ALL, "CREQV", gen, cr3op}, 
+ {19, 225, ALL, "CRNAND", gen, cr3op}, + {19, 33, ALL, "CRNOR", gen, cr3op}, + {19, 449, ALL, "CROR", gen, cr3op}, + {19, 417, ALL, "CRORN", gen, cr3op}, + {19, 193, ALL, "CRXOR", gen, cr3op}, + + {31, 86, ALL, "DCBF", dcb, 0}, + {31, 470, ALL, "DCBI", dcb, 0}, + {31, 54, ALL, "DCBST", dcb, 0}, + {31, 278, ALL, "DCBT", dcb, 0}, + {31, 246, ALL, "DCBTST", dcb, 0}, + {31, 1014, ALL, "DCBZ", dcb, 0}, + {31, 454, ALL, "DCCCI", dcb, 0}, + {31, 966, ALL, "ICCCI", dcb, 0}, + + {31, 489, OEM, "DIVD%V%C", qmuldiv, ir3}, /* 64 */ + {31, 457, OEM, "DIVDU%V%C", qmuldiv, ir3}, /* 64 */ + {31, 491, OEM, "DIVW%V%C", qmuldiv, ir3}, + {31, 459, OEM, "DIVWU%V%C", qmuldiv, ir3}, + + {31, 310, ALL, "ECIWX", ldx, 0}, + {31, 438, ALL, "ECOWX", stx, 0}, + {31, 854, ALL, "EIEIO", gen, 0}, + + {31, 284, ALL, "EQV%C", gencc, il3}, + + {31, 954, ALL, "EXTSB%C", gencc, il2}, + {31, 922, ALL, "EXTSH%C", gencc, il2}, + {31, 986, ALL, "EXTSW%C", gencc, il2}, /* 64 */ + + {63, 264, ALL, "FABS%C", gencc, fp2}, + {63, 21, ALL, "FADD%C", gencc, fp3}, + {59, 21, ALL, "FADDS%C", gencc, fp3}, + {63, 32, ALL, "FCMPO", gen, fpcmp}, + {63, 0, ALL, "FCMPU", gen, fpcmp}, + {63, 846, ALL, "FCFID%C", gencc, fp2}, /* 64 */ + {63, 814, ALL, "FCTID%C", gencc, fp2}, /* 64 */ + {63, 815, ALL, "FCTIDZ%C", gencc, fp2}, /* 64 */ + {63, 14, ALL, "FCTIW%C", gencc, fp2}, + {63, 15, ALL, "FCTIWZ%C", gencc, fp2}, + {63, 18, ALL, "FDIV%C", gencc, fp3}, + {59, 18, ALL, "FDIVS%C", gencc, fp3}, + {63, 29, FP4, "FMADD%C", gencc, fp4}, + {59, 29, FP4, "FMADDS%C", gencc, fp4}, + {63, 72, ALL, "FMOVD%C", gencc, fp2}, + {63, 28, FP4, "FMSUB%C", gencc, fp4}, + {59, 28, FP4, "FMSUBS%C", gencc, fp4}, + {63, 25, FP4, "FMUL%C", gencc, fp3c}, + {59, 25, FP4, "FMULS%C", gencc, fp3c}, + {63, 136, ALL, "FNABS%C", gencc, fp2}, + {63, 40, ALL, "FNEG%C", gencc, fp2}, + {63, 31, FP4, "FNMADD%C", gencc, fp4}, + {59, 31, FP4, "FNMADDS%C", gencc, fp4}, + {63, 30, FP4, "FNMSUB%C", gencc, fp4}, + {59, 30, FP4, "FNMSUBS%C", gencc, fp4}, + {59, 24, 
ALL, "FRES%C", gencc, fp2}, /* optional */ + {63, 12, ALL, "FRSP%C", gencc, fp2}, + {63, 26, ALL, "FRSQRTE%C", gencc, fp2}, /* optional */ + {63, 23, FP4, "FSEL%CC", gencc, fp4}, /* optional */ + {63, 22, ALL, "FSQRT%C", gencc, fp2}, /* optional */ + {59, 22, ALL, "FSQRTS%C", gencc, fp2}, /* optional */ + {63, 20, FP4, "FSUB%C", gencc, fp3}, + {59, 20, FP4, "FSUBS%C", gencc, fp3}, + + {31, 982, ALL, "ICBI", dcb, 0}, /* optional */ + {19, 150, ALL, "ISYNC", gen, 0}, + + {34, 0, 0, "MOVBZ", load, ldop}, + {35, 0, 0, "MOVBZU", load, ldop}, + {31, 119, ALL, "MOVBZU", ldx, 0}, + {31, 87, ALL, "MOVBZ", ldx, 0}, + {50, 0, 0, "FMOVD", fload, fldop}, + {51, 0, 0, "FMOVDU", fload, fldop}, + {31, 631, ALL, "FMOVDU", fldx, 0}, + {31, 599, ALL, "FMOVD", fldx, 0}, + {48, 0, 0, "FMOVS", load, fldop}, + {49, 0, 0, "FMOVSU", load, fldop}, + {31, 567, ALL, "FMOVSU", fldx, 0}, + {31, 535, ALL, "FMOVS", fldx, 0}, + {42, 0, 0, "MOVH", load, ldop}, + {43, 0, 0, "MOVHU", load, ldop}, + {31, 375, ALL, "MOVHU", ldx, 0}, + {31, 343, ALL, "MOVH", ldx, 0}, + {31, 790, ALL, "MOVHBR", ldx, 0}, + {40, 0, 0, "MOVHZ", load, ldop}, + {41, 0, 0, "MOVHZU", load, ldop}, + {31, 311, ALL, "MOVHZU", ldx, 0}, + {31, 279, ALL, "MOVHZ", ldx, 0}, + {46, 0, 0, "MOVMW", load, ldop}, + {31, 597, ALL, "LSW", gen, "(R%a),$%n,R%d"}, + {31, 533, ALL, "LSW", ldx, 0}, + {31, 20, ALL, "LWAR", ldx, 0}, + {31, 84, ALL, "LWARD", ldx, 0}, /* 64 */ + + {58, 0, ALL, "MOVD", load, ldop}, /* 64 */ + {58, 1, ALL, "MOVDU", load, ldop}, /* 64 */ + {31, 53, ALL, "MOVDU", ldx, 0}, /* 64 */ + {31, 21, ALL, "MOVD", ldx, 0}, /* 64 */ + + {31, 534, ALL, "MOVWBR", ldx, 0}, + + {58, 2, ALL, "MOVW", load, ldop}, /* 64 (lwa) */ + {31, 373, ALL, "MOVWU", ldx, 0}, /* 64 */ + {31, 341, ALL, "MOVW", ldx, 0}, /* 64 */ + + {32, 0, 0, "MOVW%Z", load, ldop}, + {33, 0, 0, "MOVW%ZU", load, ldop}, + {31, 55, ALL, "MOVW%ZU", ldx, 0}, + {31, 23, ALL, "MOVW%Z", ldx, 0}, + + {19, 0, ALL, "MOVFL", gen, "%S,%D"}, + {63, 64, ALL, "MOVCRFS", gen, "%S,%D"}, 
+ {31, 512, ALL, "MOVW", gen, "XER,%D"}, + {31, 19, ALL, "MOVW", gen, "CR,R%d"}, + + {63, 583, ALL, "MOVW%C", gen, "FPSCR, F%d"}, /* mffs */ + {31, 83, ALL, "MOVW", gen, "MSR,R%d"}, + {31, 339, ALL, "MOVW", gen, "%P,R%d"}, + {31, 595, ALL, "MOVW", gen, "SEG(%a),R%d"}, + {31, 659, ALL, "MOVW", gen, "SEG(R%b),R%d"}, + {31, 323, ALL, "MOVW", gen, "DCR(%Q),R%d"}, + {31, 451, ALL, "MOVW", gen, "R%s,DCR(%Q)"}, + {31, 259, ALL, "MOVW", gen, "DCR(R%a),R%d"}, + {31, 387, ALL, "MOVW", gen, "R%s,DCR(R%a)"}, + {31, 144, ALL, "MOVFL", gen, "R%s,%m,CR"}, + {63, 70, ALL, "MTFSB0%C", gencc, "%D"}, + {63, 38, ALL, "MTFSB1%C", gencc, "%D"}, + {63, 711, ALL, "MOVFL%C", gencc, "F%b,%M,FPSCR"}, /* mtfsf */ + {63, 134, ALL, "MOVFL%C", gencc, "%K,%D"}, + {31, 146, ALL, "MOVW", gen, "R%s,MSR"}, + {31, 178, ALL, "MOVD", gen, "R%s,MSR"}, + {31, 467, ALL, "MOVW", gen, "R%s,%P"}, + {31, 210, ALL, "MOVW", gen, "R%s,SEG(%a)"}, + {31, 242, ALL, "MOVW", gen, "R%s,SEG(R%b)"}, + + {31, 73, ALL, "MULHD%C", gencc, ir3}, + {31, 9, ALL, "MULHDU%C", gencc, ir3}, + {31, 233, OEM, "MULLD%V%C", gencc, ir3}, + + {31, 75, ALL, "MULHW%C", gencc, ir3}, + {31, 11, ALL, "MULHWU%C", gencc, ir3}, + {31, 235, OEM, "MULLW%V%C", gencc, ir3}, + + {7, 0, 0, "MULLW", qmuldiv, "%i,R%a,R%d"}, + + {31, 476, ALL, "NAND%C", gencc, il3}, + {31, 104, OEM, "NEG%V%C", neg, ir2}, + {31, 124, ALL, "NOR%C", gencc, il3}, + {31, 444, ALL, "OR%C", or, il3}, + {31, 412, ALL, "ORN%C", or, il3}, + {24, 0, 0, "OR", and, "%I,R%d,R%a"}, + {25, 0, 0, "OR", shifted, 0}, + + {19, 50, ALL, "RFI", gen, 0}, + {19, 51, ALL, "RFCI", gen, 0}, + + {30, 8, RLDC, "RLDCL%C", gencc, rldc}, /* 64 */ + {30, 9, RLDC, "RLDCR%C", gencc, rldc}, /* 64 */ + {30, 0, RLDI, "RLDCL%C", gencc, rldi}, /* 64 */ + {30, 1<<1, RLDI, "RLDCR%C", gencc, rldi}, /* 64 */ + {30, 2<<1, RLDI, "RLDC%C", gencc, rldi}, /* 64 */ + {30, 3<<1, RLDI, "RLDMI%C", gencc, rldi}, /* 64 */ + + {20, 0, 0, "RLWMI%C", gencc, rlimi}, + {21, 0, 0, "RLWNM%C", gencc, rlimi}, + {23, 0, 0, "RLWNM%C", 
gencc, rlim}, + + {17, 1, ALL, "SYSCALL", gen, 0}, + + {31, 27, ALL, "SLD%C", shift, il3}, /* 64 */ + {31, 24, ALL, "SLW%C", shift, il3}, + + {31, 794, ALL, "SRAD%C", shift, il3}, /* 64 */ + {31, (413<<1)|0, ALL, "SRAD%C", shifti, il3s}, /* 64 */ + {31, (413<<1)|1, ALL, "SRAD%C", shifti, il3s}, /* 64 */ + {31, 792, ALL, "SRAW%C", shift, il3}, + {31, 824, ALL, "SRAW%C", shifti, il3s}, + + {31, 539, ALL, "SRD%C", shift, il3}, /* 64 */ + {31, 536, ALL, "SRW%C", shift, il3}, + + {38, 0, 0, "MOVB", store, stop}, + {39, 0, 0, "MOVBU", store, stop}, + {31, 247, ALL, "MOVBU", stx, 0}, + {31, 215, ALL, "MOVB", stx, 0}, + {54, 0, 0, "FMOVD", fstore, fstop}, + {55, 0, 0, "FMOVDU", fstore, fstop}, + {31, 759, ALL, "FMOVDU", fstx, 0}, + {31, 727, ALL, "FMOVD", fstx, 0}, + {52, 0, 0, "FMOVS", fstore, fstop}, + {53, 0, 0, "FMOVSU", fstore, fstop}, + {31, 695, ALL, "FMOVSU", fstx, 0}, + {31, 663, ALL, "FMOVS", fstx, 0}, + {44, 0, 0, "MOVH", store, stop}, + {31, 918, ALL, "MOVHBR", stx, 0}, + {45, 0, 0, "MOVHU", store, stop}, + {31, 439, ALL, "MOVHU", stx, 0}, + {31, 407, ALL, "MOVH", stx, 0}, + {47, 0, 0, "MOVMW", store, stop}, + {31, 725, ALL, "STSW", gen, "R%d,$%n,(R%a)"}, + {31, 661, ALL, "STSW", stx, 0}, + {36, 0, 0, "MOVW", store, stop}, + {31, 662, ALL, "MOVWBR", stx, 0}, + {31, 150, ALL, "STWCCC", stx, 0}, + {31, 214, ALL, "STDCCC", stx, 0}, /* 64 */ + {37, 0, 0, "MOVWU", store, stop}, + {31, 183, ALL, "MOVWU", stx, 0}, + {31, 151, ALL, "MOVW", stx, 0}, + + {62, 0, 0, "MOVD%U", store, stop}, /* 64 */ + {31, 149, ALL, "MOVD", stx, 0,}, /* 64 */ + {31, 181, ALL, "MOVDU", stx, 0}, /* 64 */ + + {31, 498, ALL, "SLBIA", gen, 0}, /* 64 */ + {31, 434, ALL, "SLBIE", gen, "R%b"}, /* 64 */ + {31, 466, ALL, "SLBIEX", gen, "R%b"}, /* 64 */ + {31, 915, ALL, "SLBMFEE", gen, "R%b,R%d"}, /* 64 */ + {31, 851, ALL, "SLBMFEV", gen, "R%b,R%d"}, /* 64 */ + {31, 402, ALL, "SLBMTE", gen, "R%s,R%b"}, /* 64 */ + + {31, 40, OEM, "SUB%V%C", sub, ir3}, + {31, 8, OEM, "SUBC%V%C", sub, ir3}, + {31, 136, 
OEM, "SUBE%V%C", sub, ir3}, + {8, 0, 0, "SUBC", gen, "R%a,%i,R%d"}, + {31, 232, OEM, "SUBME%V%C", sub, ir2}, + {31, 200, OEM, "SUBZE%V%C", sub, ir2}, + + {31, 598, ALL, "SYNC", gen, 0}, /* TO DO: there's a parameter buried in there */ + {2, 0, 0, "TD", gen, "%d,R%a,%i"}, /* 64 */ + {31, 370, ALL, "TLBIA", gen, 0}, /* optional */ + {31, 306, ALL, "TLBIE", gen, "R%b"}, /* optional */ + {31, 274, ALL, "TLBIEL", gen, "R%b"}, /* optional */ + {31, 1010, ALL, "TLBLI", gen, "R%b"}, /* optional */ + {31, 978, ALL, "TLBLD", gen, "R%b"}, /* optional */ + {31, 566, ALL, "TLBSYNC", gen, 0}, /* optional */ + {31, 68, ALL, "TD", gen, "%d,R%a,R%b"}, /* 64 */ + {31, 4, ALL, "TW", gen, "%d,R%a,R%b"}, + {3, 0, 0, "TW", gen, "%d,R%a,%i"}, + + {31, 316, ALL, "XOR", and, il3}, + {26, 0, 0, "XOR", and, il2u}, + {27, 0, 0, "XOR", shifted, 0}, + + {0}, +}; + +typedef struct Spr Spr; +struct Spr { + int n; + char *name; +}; + +static Spr sprname[] = { + {0, "MQ"}, + {1, "XER"}, + {268, "TBL"}, + {269, "TBU"}, + {8, "LR"}, + {9, "CTR"}, + {528, "IBAT0U"}, + {529, "IBAT0L"}, + {530, "IBAT1U"}, + {531, "IBAT1L"}, + {532, "IBAT2U"}, + {533, "IBAT2L"}, + {534, "IBAT3U"}, + {535, "IBAT3L"}, + {536, "DBAT0U"}, + {537, "DBAT0L"}, + {538, "DBAT1U"}, + {539, "DBAT1L"}, + {540, "DBAT2U"}, + {541, "DBAT2L"}, + {542, "DBAT3U"}, + {543, "DBAT3L"}, + {25, "SDR1"}, + {19, "DAR"}, + {272, "SPRG0"}, + {273, "SPRG1"}, + {274, "SPRG2"}, + {275, "SPRG3"}, + {18, "DSISR"}, + {26, "SRR0"}, + {27, "SRR1"}, + {284, "TBLW"}, + {285, "TBUW"}, + {22, "DEC"}, + {282, "EAR"}, + {1008, "HID0"}, + {1009, "HID1"}, + {976, "DMISS"}, + {977, "DCMP"}, + {978, "HASH1"}, + {979, "HASH2"}, + {980, "IMISS"}, + {981, "ICMP"}, + {982, "RPA"}, + {1010, "IABR"}, + {1013, "DABR"}, + {0,0}, +}; + +static int +shmask(uvlong *m) +{ + int i; + + for(i=0; i<63; i++) + if(*m & ((uvlong)1<<i)) + break; + if(i > 63) + return 0; + if(*m & ~((uvlong)1<<i)){ /* more than one bit: do multiples of bytes */ + i = (i/8)*8; + if(i == 0) + return 0; 
+ } + *m >>= i; + return i; +} + +static void +format(char *mnemonic, Instr *i, char *f) +{ + int n, s; + ulong mask; + uvlong vmask; + + if (mnemonic) + format(0, i, mnemonic); + if (f == 0) + return; + if (mnemonic) + bprint(i, "\t"); + for ( ; *f; f++) { + if (*f != '%') { + bprint(i, "%c", *f); + continue; + } + switch (*++f) { + + case 'a': + bprint(i, "%d", i->ra); + break; + + case 'b': + bprint(i, "%d", i->rb); + break; + + case 'c': + bprint(i, "%d", i->frc); + break; + + case 'd': + case 's': + bprint(i, "%d", i->rd); + break; + + case 'C': + if(i->rc) + bprint(i, "CC"); + break; + + case 'D': + if(i->rd & 3) + bprint(i, "CR(INVAL:%d)", i->rd); + else if(i->op == 63) + bprint(i, "FPSCR(%d)", i->crfd); + else + bprint(i, "CR(%d)", i->crfd); + break; + + case 'e': + bprint(i, "%d", i->xsh); + break; + + case 'E': + switch(IBF(i->w0,27,30)){ /* low bit is top bit of shift in rldiX cases */ + case 8: i->mb = i->xmbe; i->me = 63; break; /* rldcl */ + case 9: i->mb = 0; i->me = i->xmbe; break; /* rldcr */ + case 4: case 5: + i->mb = i->xmbe; i->me = 63-i->xsh; break; /* rldic */ + case 0: case 1: + i->mb = i->xmbe; i->me = 63; break; /* rldicl */ + case 2: case 3: + i->mb = 0; i->me = i->xmbe; break; /* rldicr */ + case 6: case 7: + i->mb = i->xmbe; i->me = 63-i->xsh; break; /* rldimi */ + } + vmask = (~(uvlong)0>>i->mb) & (~(uvlong)0<<(63-i->me)); + s = shmask(&vmask); + if(s) + bprint(i, "(%llux<<%d)", vmask, s); + else + bprint(i, "%llux", vmask); + break; + + case 'i': + bprint(i, "$%d", i->simm); + break; + + case 'I': + bprint(i, "$%ux", i->uimm); + break; + + case 'j': + if(i->aa) + pglobal(i, i->li, 1, "(SB)"); + else + pglobal(i, i->addr+i->li, 1, ""); + break; + + case 'J': + if(i->aa) + pglobal(i, i->bd, 1, "(SB)"); + else + pglobal(i, i->addr+i->bd, 1, ""); + break; + + case 'k': + bprint(i, "%d", i->sh); + break; + + case 'K': + bprint(i, "$%x", i->imm); + break; + + case 'L': + if(i->lk) + bprint(i, "L"); + break; + + case 'l': + if(i->simm < 0) + 
bprint(i, "-%x(R%d)", -i->simm, i->ra); + else + bprint(i, "%x(R%d)", i->simm, i->ra); + break; + + case 'm': + bprint(i, "%ux", i->crm); + break; + + case 'M': + bprint(i, "%ux", i->fm); + break; + + case 'n': + bprint(i, "%d", i->nb==0? 32: i->nb); /* eg, pg 10-103 */ + break; + + case 'P': + n = ((i->spr&0x1f)<<5)|((i->spr>>5)&0x1f); + for(s=0; sprname[s].name; s++) + if(sprname[s].n == n) + break; + if(sprname[s].name) { + if(s < 10) + bprint(i, sprname[s].name); + else + bprint(i, "SPR(%s)", sprname[s].name); + } else + bprint(i, "SPR(%d)", n); + break; + + case 'Q': + n = ((i->spr&0x1f)<<5)|((i->spr>>5)&0x1f); + bprint(i, "%d", n); + break; + + case 'S': + if(i->ra & 3) + bprint(i, "CR(INVAL:%d)", i->ra); + else if(i->op == 63) + bprint(i, "FPSCR(%d)", i->crfs); + else + bprint(i, "CR(%d)", i->crfs); + break; + + case 'U': + if(i->rc) + bprint(i, "U"); + break; + + case 'V': + if(i->oe) + bprint(i, "V"); + break; + + case 'w': + bprint(i, "[%lux]", i->w0); + break; + + case 'W': + if(i->m64) + bprint(i, "W"); + break; + + case 'Z': + if(i->m64) + bprint(i, "Z"); + break; + + case 'z': + if(i->mb <= i->me) + mask = ((ulong)~0L>>i->mb) & (~0L<<(31-i->me)); + else + mask = ~(((ulong)~0L>>(i->me+1)) & (~0L<<(31-(i->mb-1)))); + bprint(i, "%lux", mask); + break; + + case '\0': + bprint(i, "%%"); + return; + + default: + bprint(i, "%%%c", *f); + break; + } + } +} + +static int +printins(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + Opcode *o; + + mymap = map; + memset(&i, 0, sizeof(i)); + i.curr = buf; + i.end = buf+n-1; + if(mkinstr(pc, &i) < 0) + return -1; + for(o = opcodes; o->mnemonic != 0; o++) + if(i.op == o->op && (i.xo & o->xomask) == o->xo) { + if (o->f) + (*o->f)(o, &i); + else + format(o->mnemonic, &i, o->ken); + return i.size*4; + } + bprint(&i, "unknown %lux", i.w0); + return i.size*4; +} + +static int +powerinst(Map *map, uvlong pc, char modifier, char *buf, int n) +{ + USED(modifier); + return printins(map, pc, buf, n); +} + +static int 
+powerdas(Map *map, uvlong pc, char *buf, int n) +{ + Instr instr; + + mymap = map; + memset(&instr, 0, sizeof(instr)); + instr.curr = buf; + instr.end = buf+n-1; + if (mkinstr(pc, &instr) < 0) + return -1; + if (instr.end-instr.curr > 8) + instr.curr = _hexify(instr.curr, instr.w0, 7); + if (instr.end-instr.curr > 9 && instr.size == 2) { + *instr.curr++ = ' '; + instr.curr = _hexify(instr.curr, instr.w1, 7); + } + *instr.curr = 0; + return instr.size*4; +} + +static int +powerinstlen(Map *map, uvlong pc) +{ + Instr i; + + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + return i.size*4; +} + +static int +powerfoll(Map *map, uvlong pc, Rgetter rget, uvlong *foll) +{ + char *reg; + Instr i; + + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + foll[0] = pc+4; + foll[1] = pc+4; + switch(i.op) { + default: + return 1; + + case 18: /* branch */ + foll[0] = i.li; + if(!i.aa) + foll[0] += pc; + break; + + case 16: /* conditional branch */ + foll[0] = i.bd; + if(!i.aa) + foll[0] += pc; + break; + + case 19: /* conditional branch to register */ + if(i.xo == 528) + reg = "CTR"; + else if(i.xo == 16) + reg = "LR"; + else + return 1; /* not a branch */ + foll[0] = (*rget)(map, reg); + break; + } + if(i.lk) + return 2; + return 1; +} diff --git a/utils/libmach/qobj.c b/utils/libmach/qobj.c new file mode 100644 index 0000000..79d1c64 --- /dev/null +++ b/utils/libmach/qobj.c @@ -0,0 +1,144 @@ +/* + * qobj.c - identify and parse a PowerPC object file + * forsyth@terzarima.net + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "qc/q.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char type; + char sym; + char name; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + +int +_isq(char *s) +{ + return (s[0]&0377) == ANAME /* ANAME */ + && (s[1]&0377) == ANAME>>8 + && s[2] == D_FILE /* type */ + && s[3] == 1 /* sym */ + && s[4] == '<'; /* name of file */ +} + +int +_readq(Biobuf *bp, Prog 
*p) +{ + int as, n, c; + Addr a; + + as = Bgetc(bp); /* as(low) */ + if(as < 0) + return 0; + c = Bgetc(bp); /* as(high) */ + if(c < 0) + return 0; + as |= ((c & 0xff) << 8); + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = beswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); /* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n) + return 0; + return 1; + } + if(as == ATEXT) + p->kind = aText; + else if(as == AGLOBL) + p->kind = aData; + n = Bgetc(bp); /* reg and flag */ + skip(bp, 4); /* lineno(4) */ + a = addr(bp); + if(n & 0x40) + addr(bp); + addr(bp); + if(a.type != D_OREG || a.name != D_STATIC && a.name != D_EXTERN) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +static Addr +addr(Biobuf *bp) +{ + Addr a; + long off; + + a.type = Bgetc(bp); /* a.type */ + skip(bp,1); /* reg */ + a.sym = Bgetc(bp); /* sym index */ + a.name = Bgetc(bp); /* sym type */ + switch(a.type){ + default: + case D_NONE: case D_REG: case D_FREG: case D_CREG: + case D_FPSCR: case D_MSR: case D_SREG: + break; + case D_SPR: + case D_OREG: + case D_DCR: + case D_CONST: + case D_BRANCH: + off = Bgetc(bp); + off |= Bgetc(bp) << 8; + off |= Bgetc(bp) << 16; + off |= Bgetc(bp) << 24; + if(off < 0) + off = -off; + if(a.sym && (a.name==D_PARAM || a.name==D_AUTO)) + _offset(a.sym, off); + break; + case D_SCONST: + skip(bp, NSNAME); + break; + case D_FCONST: + skip(bp, 8); + break; + } + return a; +} + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} diff --git a/utils/libmach/setmach.c 
b/utils/libmach/setmach.c new file mode 100644 index 0000000..7247881 --- /dev/null +++ b/utils/libmach/setmach.c @@ -0,0 +1,144 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + /* table for selecting machine-dependent parameters */ + +typedef struct machtab Machtab; + +struct machtab +{ + char *name; /* machine name */ + short type; /* executable type */ + short boottype; /* bootable type */ + int asstype; /* disassembler code */ + Mach *mach; /* machine description */ + Machdata *machdata; /* machine functions */ +}; + +extern Mach mmips, msparc, mi386, mamd64, + marm, mmips2be, mmips2le, mpower, mpower64; +extern Machdata mipsmach, sparcmach, i386mach, + armmach, mipsmach2le, powermach; + +/* + * machine selection table. machines with native disassemblers should + * follow the plan 9 variant in the table; native modes are selectable + * only by name. + */ +Machtab machines[] = +{ + { "mips2LE", /*plan 9 mips2 little endian*/ + FMIPS2LE, + 0, + AMIPS, + &mmips2le, + &mipsmach2le, }, + { "mips", /*plan 9 mips*/ + FMIPS, + FMIPSB, + AMIPS, + &mmips, + &mipsmach, }, + { "mips2", /*plan 9 mips2*/ + FMIPS2BE, + FMIPSB, + AMIPS, + &mmips2be, + &mipsmach, }, /* shares debuggers with native mips */ + { "mipsco", /*native mips - must follow plan 9*/ + FMIPS, + FMIPSB, + AMIPSCO, + &mmips, + &mipsmach, }, + { "sparc", /*plan 9 sparc */ + FSPARC, + FSPARCB, + ASPARC, + &msparc, + &sparcmach, }, + { "sunsparc", /*native sparc - must follow plan 9*/ + FSPARC, + FSPARCB, + ASUNSPARC, + &msparc, + &sparcmach, }, + { "386", /*plan 9 386*/ + FI386, + FI386B, + AI386, + &mi386, + &i386mach, }, + { "86", /*8086 - a peach of a machine*/ + FI386, + FI386B, + AI8086, + &mi386, + &i386mach, }, + { "amd64", /*amd64*/ + FAMD64, + FAMD64B, + AAMD64, + &mamd64, + &i386mach, }, + { "arm", /*ARM*/ + FARM, + FARMB, + AARM, + &marm, + &armmach, }, + { "power", /*PowerPC*/ + FPOWER, + FPOWERB, + APOWER, + &mpower, + &powermach, }, + { "power64", /*PowerPC*/ + FPOWER64, + FPOWER64B, 
+ APOWER64, + &mpower64, + &powermach, }, + { 0 }, /*the terminator*/ +}; + +/* + * select a machine by executable file type + */ +void +machbytype(int type) +{ + Machtab *mp; + + for (mp = machines; mp->name; mp++){ + if (mp->type == type || mp->boottype == type) { + asstype = mp->asstype; + machdata = mp->machdata; + break; + } + } +} +/* + * select a machine by name + */ +int +machbyname(char *name) +{ + Machtab *mp; + + if (!name) { + asstype = AMIPS; + machdata = &mipsmach; + mach = &mmips; + return 1; + } + for (mp = machines; mp->name; mp++){ + if (strcmp(mp->name, name) == 0) { + asstype = mp->asstype; + machdata = mp->machdata; + mach = mp->mach; + return 1; + } + } + return 0; +} diff --git a/utils/libmach/swap.c b/utils/libmach/swap.c new file mode 100644 index 0000000..63f7629 --- /dev/null +++ b/utils/libmach/swap.c @@ -0,0 +1,81 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +/* + * big-endian short + */ +ushort +beswab(ushort s) +{ + uchar *p; + + p = (uchar*)&s; + return (p[0]<<8) | p[1]; +} + +/* + * big-endian long + */ +ulong +beswal(ulong l) +{ + uchar *p; + + p = (uchar*)&l; + return (p[0]<<24) | (p[1]<<16) | (p[2]<<8) | p[3]; +} + +/* + * big-endian vlong + */ +uvlong +beswav(uvlong v) +{ + uchar *p; + + p = (uchar*)&v; + return ((uvlong)p[0]<<56) | ((uvlong)p[1]<<48) | ((uvlong)p[2]<<40) + | ((uvlong)p[3]<<32) | ((uvlong)p[4]<<24) + | ((uvlong)p[5]<<16) | ((uvlong)p[6]<<8) + | (uvlong)p[7]; +} + +/* + * little-endian short + */ +ushort +leswab(ushort s) +{ + uchar *p; + + p = (uchar*)&s; + return (p[1]<<8) | p[0]; +} + +/* + * little-endian long + */ +ulong +leswal(ulong l) +{ + uchar *p; + + p = (uchar*)&l; + return (p[3]<<24) | (p[2]<<16) | (p[1]<<8) | p[0]; +} + +/* + * little-endian vlong + */ +uvlong +leswav(uvlong v) +{ + uchar *p; + + p = (uchar*)&v; + return ((uvlong)p[7]<<56) | ((uvlong)p[6]<<48) | ((uvlong)p[5]<<40) + | ((uvlong)p[4]<<32) | ((uvlong)p[3]<<24) + | ((uvlong)p[2]<<16) | ((uvlong)p[1]<<8) + | (uvlong)p[0]; 
+} diff --git a/utils/libmach/sym.c b/utils/libmach/sym.c new file mode 100644 index 0000000..5651d4e --- /dev/null +++ b/utils/libmach/sym.c @@ -0,0 +1,1373 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +#define HUGEINT 0x7fffffff +#define NNAME 20 /* a relic of the past */ + +typedef struct txtsym Txtsym; +typedef struct file File; +typedef struct hist Hist; + +struct txtsym { /* Text Symbol table */ + int n; /* number of local vars */ + Sym **locals; /* array of ptrs to autos */ + Sym *sym; /* function symbol entry */ +}; + +struct hist { /* Stack of include files & #line directives */ + char *name; /* Assumes names Null terminated in file */ + long line; /* line # where it was included */ + long offset; /* line # of #line directive */ +}; + +struct file { /* Per input file header to history stack */ + uvlong addr; /* address of first text sym */ + /* union { */ + Txtsym *txt; /* first text symbol */ + Sym *sym; /* only during initilization */ + /* }; */ + int n; /* size of history stack */ + Hist *hist; /* history stack */ +}; + +static int debug = 0; + +static Sym **autos; /* Base of auto variables */ +static File *files; /* Base of file arena */ +static int fpmax; /* largest file path index */ +static Sym **fnames; /* file names path component table */ +static Sym **globals; /* globals by addr table */ +static Hist *hist; /* base of history stack */ +static int isbuilt; /* internal table init flag */ +static long nauto; /* number of automatics */ +static long nfiles; /* number of files */ +static long nglob; /* number of globals */ +static long nhist; /* number of history stack entries */ +static long nsym; /* number of symbols */ +static int ntxt; /* number of text symbols */ +static uchar *pcline; /* start of pc-line state table */ +static uchar *pclineend; /* end of pc-line table */ +static uchar *spoff; /* start of pc-sp state table */ +static uchar *spoffend; /* end of pc-sp offset table */ +static Sym *symbols; /* symbol table */ +static 
Txtsym *txt; /* Base of text symbol table */ +static uvlong txtstart; /* start of text segment */ +static uvlong txtend; /* end of text segment */ + +static void cleansyms(void); +static long decodename(Biobuf*, Sym*); +static short *encfname(char*); +static int fline(char*, int, long, Hist*, Hist**); +static void fillsym(Sym*, Symbol*); +static int findglobal(char*, Symbol*); +static int findlocvar(Symbol*, char *, Symbol*); +static int findtext(char*, Symbol*); +static int hcomp(Hist*, short*); +static int hline(File*, short*, long*); +static void printhist(char*, Hist*, int); +static int buildtbls(void); +static int symcomp(void*, void*); +static int symerrmsg(int, char*); +static int txtcomp(void*, void*); +static int filecomp(void*, void*); + +/* + * initialize the symbol tables + */ +int +syminit(int fd, Fhdr *fp) +{ + Sym *p; + long i, l, size; + vlong vl; + Biobuf b; + int svalsz; + + if(fp->symsz == 0) + return 0; + if(fp->type == FNONE) + return 0; + + cleansyms(); + textseg(fp->txtaddr, fp); + /* minimum symbol record size = 4+1+2 bytes */ + symbols = malloc((fp->symsz/(4+1+2)+1)*sizeof(Sym)); + if(symbols == 0) { + werrstr("can't malloc %ld bytes", fp->symsz); + return -1; + } + Binit(&b, fd, OREAD); + Bseek(&b, fp->symoff, 0); + nsym = 0; + size = 0; + for(p = symbols; size < fp->symsz; p++, nsym++) { + if(fp->_magic && (fp->magic & HDR_MAGIC)){ + svalsz = 8; + if(Bread(&b, &vl, 8) != 8) + return symerrmsg(8, "symbol"); + p->value = beswav(vl); + } + else{ + svalsz = 4; + if(Bread(&b, &l, 4) != 4) + return symerrmsg(4, "symbol"); + p->value = (u32int)beswal(l); + } + if(Bread(&b, &p->type, sizeof(p->type)) != sizeof(p->type)) + return symerrmsg(sizeof(p->value), "symbol"); + + i = decodename(&b, p); + if(i < 0) + return -1; + size += i+svalsz+sizeof(p->type); + + /* count global & auto vars, text symbols, and file names */ + switch (p->type) { + case 'l': + case 'L': + case 't': + case 'T': + ntxt++; + break; + case 'd': + case 'D': + case 'b': + case 
'B': + nglob++; + break; + case 'f': + if(strcmp(p->name, ".frame") == 0) { + p->type = 'm'; + nauto++; + } + else if(p->value > fpmax) + fpmax = p->value; /* highest path index */ + break; + case 'a': + case 'p': + case 'm': + nauto++; + break; + case 'z': + if(p->value == 1) { /* one extra per file */ + nhist++; + nfiles++; + } + nhist++; + break; + default: + break; + } + } + if (debug) + print("NG: %ld NT: %d NF: %d\n", nglob, ntxt, fpmax); + if (fp->sppcsz) { /* pc-sp offset table */ + spoff = (uchar *)malloc(fp->sppcsz); + if(spoff == 0) { + werrstr("can't malloc %ld bytes", fp->sppcsz); + return -1; + } + Bseek(&b, fp->sppcoff, 0); + if(Bread(&b, spoff, fp->sppcsz) != fp->sppcsz){ + spoff = 0; + return symerrmsg(fp->sppcsz, "sp-pc"); + } + spoffend = spoff+fp->sppcsz; + } + if (fp->lnpcsz) { /* pc-line number table */ + pcline = (uchar *)malloc(fp->lnpcsz); + if(pcline == 0) { + werrstr("can't malloc %ld bytes", fp->lnpcsz); + return -1; + } + Bseek(&b, fp->lnpcoff, 0); + if(Bread(&b, pcline, fp->lnpcsz) != fp->lnpcsz){ + pcline = 0; + return symerrmsg(fp->lnpcsz, "pc-line"); + } + pclineend = pcline+fp->lnpcsz; + } + return nsym; +} + +static int +symerrmsg(int n, char *table) +{ + werrstr("can't read %d bytes of %s table", n, table); + return -1; +} + +static long +decodename(Biobuf *bp, Sym *p) +{ + char *cp; + int c1, c2; + long n; + vlong o; + + if((p->type & 0x80) == 0) { /* old-style, fixed length names */ + p->name = malloc(NNAME); + if(p->name == 0) { + werrstr("can't malloc %d bytes", NNAME); + return -1; + } + if(Bread(bp, p->name, NNAME) != NNAME) + return symerrmsg(NNAME, "symbol"); + Bseek(bp, 3, 1); + return NNAME+3; + } + + p->type &= ~0x80; + if(p->type == 'z' || p->type == 'Z') { + o = Bseek(bp, 0, 1); + if(Bgetc(bp) < 0) { + werrstr("can't read symbol name"); + return -1; + } + for(;;) { + c1 = Bgetc(bp); + c2 = Bgetc(bp); + if(c1 < 0 || c2 < 0) { + werrstr("can't read symbol name"); + return -1; + } + if(c1 == 0 && c2 == 0) + break; + } + 
n = Bseek(bp, 0, 1)-o; + p->name = malloc(n); + if(p->name == 0) { + werrstr("can't malloc %ld bytes", n); + return -1; + } + Bseek(bp, -n, 1); + if(Bread(bp, p->name, n) != n) { + werrstr("can't read %ld bytes of symbol name", n); + return -1; + } + } else { + cp = Brdline(bp, '\0'); + if(cp == 0) { + werrstr("can't read symbol name"); + return -1; + } + n = Blinelen(bp); + p->name = malloc(n); + if(p->name == 0) { + werrstr("can't malloc %ld bytes", n); + return -1; + } + strcpy(p->name, cp); + } + return n; +} + +/* + * free any previously loaded symbol tables + */ +static void +cleansyms(void) +{ + if(globals) + free(globals); + globals = 0; + nglob = 0; + if(txt) + free(txt); + txt = 0; + ntxt = 0; + if(fnames) + free(fnames); + fnames = 0; + fpmax = 0; + + if(files) + free(files); + files = 0; + nfiles = 0; + if(hist) + free(hist); + hist = 0; + nhist = 0; + if(autos) + free(autos); + autos = 0; + nauto = 0; + isbuilt = 0; + if(symbols) + free(symbols); + symbols = 0; + nsym = 0; + if(spoff) + free(spoff); + spoff = 0; + if(pcline) + free(pcline); + pcline = 0; +} + +/* + * delimit the text segment + */ +void +textseg(uvlong base, Fhdr *fp) +{ + txtstart = base; + txtend = base+fp->txtsz; +} + +/* + * symbase: return base and size of raw symbol table + * (special hack for high access rate operations) + */ +Sym * +symbase(long *n) +{ + *n = nsym; + return symbols; +} + +/* + * Get the ith symbol table entry + */ +Sym * +getsym(int index) +{ + if(index >= 0 && index < nsym) + return &symbols[index]; + return 0; +} + +/* + * initialize internal symbol tables + */ +static int +buildtbls(void) +{ + long i; + int j, nh, ng, nt; + File *f; + Txtsym *tp; + Hist *hp; + Sym *p, **ap; + + if(isbuilt) + return 1; + isbuilt = 1; + /* allocate the tables */ + if(nglob) { + globals = malloc(nglob*sizeof(*globals)); + if(!globals) { + werrstr("can't malloc global symbol table"); + return 0; + } + } + if(ntxt) { + txt = malloc(ntxt*sizeof(*txt)); + if (!txt) { + 
werrstr("can't malloc text symbol table"); + return 0; + } + } + fnames = malloc((fpmax+1)*sizeof(*fnames)); + if (!fnames) { + werrstr("can't malloc file name table"); + return 0; + } + memset(fnames, 0, (fpmax+1)*sizeof(*fnames)); + files = malloc(nfiles*sizeof(*files)); + if(!files) { + werrstr("can't malloc file table"); + return 0; + } + hist = malloc(nhist*sizeof(Hist)); + if(hist == 0) { + werrstr("can't malloc history stack"); + return 0; + } + autos = malloc(nauto*sizeof(Sym*)); + if(autos == 0) { + werrstr("can't malloc auto symbol table"); + return 0; + } + /* load the tables */ + ng = nt = nh = 0; + f = 0; + tp = 0; + i = nsym; + hp = hist; + ap = autos; + for(p = symbols; i-- > 0; p++) { + switch(p->type) { + case 'D': + case 'd': + case 'B': + case 'b': + if(debug) + print("Global: %s %llux\n", p->name, p->value); + globals[ng++] = p; + break; + case 'z': + if(p->value == 1) { /* New file */ + if(f) { + f->n = nh; + f->hist[nh].name = 0; /* one extra */ + hp += nh+1; + f++; + } + else + f = files; + f->hist = hp; + f->sym = 0; + f->addr = 0; + nh = 0; + } + /* alloc one slot extra as terminator */ + f->hist[nh].name = p->name; + f->hist[nh].line = p->value; + f->hist[nh].offset = 0; + if(debug) + printhist("-> ", &f->hist[nh], 1); + nh++; + break; + case 'Z': + if(f && nh > 0) + f->hist[nh-1].offset = p->value; + break; + case 'T': + case 't': /* Text: terminate history if first in file */ + case 'L': + case 'l': + tp = &txt[nt++]; + tp->n = 0; + tp->sym = p; + tp->locals = ap; + if(debug) + print("TEXT: %s at %llux\n", p->name, p->value); + if(f && !f->sym) { /* first */ + f->sym = p; + f->addr = p->value; + } + break; + case 'a': + case 'p': + case 'm': /* Local Vars */ + if(!tp) + print("Warning: Free floating local var: %s\n", + p->name); + else { + if(debug) + print("Local: %s %llux\n", p->name, p->value); + tp->locals[tp->n] = p; + tp->n++; + ap++; + } + break; + case 'f': /* File names */ + if(debug) + print("Fname: %s\n", p->name); + 
fnames[p->value] = p; + break; + default: + break; + } + } + /* sort global and text tables into ascending address order */ + qsort(globals, nglob, sizeof(Sym*), symcomp); + qsort(txt, ntxt, sizeof(Txtsym), txtcomp); + qsort(files, nfiles, sizeof(File), filecomp); + tp = txt; + for(i = 0, f = files; i < nfiles; i++, f++) { + for(j = 0; j < ntxt; j++) { + if(f->sym == tp->sym) { + if(debug) { + print("LINK: %s to at %llux", f->sym->name, f->addr); + printhist("... ", f->hist, 1); + } + f->txt = tp++; + break; + } + if(++tp >= txt+ntxt) /* wrap around */ + tp = txt; + } + } + return 1; +} + +/* + * find symbol function.var by name. + * fn != 0 && var != 0 => look for fn in text, var in data + * fn != 0 && var == 0 => look for fn in text + * fn == 0 && var != 0 => look for var first in text then in data space. + */ +int +lookup(char *fn, char *var, Symbol *s) +{ + int found; + + if(buildtbls() == 0) + return 0; + if(fn) { + found = findtext(fn, s); + if(var == 0) /* case 2: fn not in text */ + return found; + else if(!found) /* case 1: fn not found */ + return 0; + } else if(var) { + found = findtext(var, s); + if(found) + return 1; /* case 3: var found in text */ + } else return 0; /* case 4: fn & var == zero */ + + if(found) + return findlocal(s, var, s); /* case 1: fn found */ + return findglobal(var, s); /* case 3: var not found */ + +} + +/* + * find a function by name + */ +static int +findtext(char *name, Symbol *s) +{ + int i; + + for(i = 0; i < ntxt; i++) { + if(strcmp(txt[i].sym->name, name) == 0) { + fillsym(txt[i].sym, s); + s->handle = (void *) &txt[i]; + s->index = i; + return 1; + } + } + return 0; +} +/* + * find global variable by name + */ +static int +findglobal(char *name, Symbol *s) +{ + long i; + + for(i = 0; i < nglob; i++) { + if(strcmp(globals[i]->name, name) == 0) { + fillsym(globals[i], s); + s->index = i; + return 1; + } + } + return 0; +} + +/* + * find the local variable by name within a given function + */ +int +findlocal(Symbol *s1, 
char *name, Symbol *s2) +{ + if(s1 == 0) + return 0; + if(buildtbls() == 0) + return 0; + return findlocvar(s1, name, s2); +} + +/* + * find the local variable by name within a given function + * (internal function - does no parameter validation) + */ +static int +findlocvar(Symbol *s1, char *name, Symbol *s2) +{ + Txtsym *tp; + int i; + + tp = (Txtsym *)s1->handle; + if(tp && tp->locals) { + for(i = 0; i < tp->n; i++) + if (strcmp(tp->locals[i]->name, name) == 0) { + fillsym(tp->locals[i], s2); + s2->handle = (void *)tp; + s2->index = tp->n-1 - i; + return 1; + } + } + return 0; +} + +/* + * Get ith text symbol + */ +int +textsym(Symbol *s, int index) +{ + + if(buildtbls() == 0) + return 0; + if(index < 0 || index >= ntxt) + return 0; + fillsym(txt[index].sym, s); + s->handle = (void *)&txt[index]; + s->index = index; + return 1; +} + +/* + * Get ith file name + */ +int +filesym(int index, char *buf, int n) +{ + Hist *hp; + + if(buildtbls() == 0) + return 0; + if(index < 0 || index >= nfiles) + return 0; + hp = files[index].hist; + if(!hp || !hp->name) + return 0; + return fileelem(fnames, (uchar*)hp->name, buf, n); +} + +/* + * Lookup name of local variable located at an offset into the frame. + * The type selects either a parameter or automatic. 
+ */ +int +getauto(Symbol *s1, int off, int type, Symbol *s2) +{ + Txtsym *tp; + Sym *p; + int i, t; + + if(s1 == 0) + return 0; + if(type == CPARAM) + t = 'p'; + else if(type == CAUTO) + t = 'a'; + else + return 0; + if(buildtbls() == 0) + return 0; + tp = (Txtsym *)s1->handle; + if(tp == 0) + return 0; + for(i = 0; i < tp->n; i++) { + p = tp->locals[i]; + if(p->type == t && p->value == off) { + fillsym(p, s2); + s2->handle = s1->handle; + s2->index = tp->n-1 - i; + return 1; + } + } + return 0; +} + +/* + * Find text symbol containing addr; binary search assumes text array is sorted by addr + */ +static int +srchtext(uvlong addr) +{ + uvlong val; + int top, bot, mid; + Sym *sp; + + val = addr; + bot = 0; + top = ntxt; + for (mid = (bot+top)/2; mid < top; mid = (bot+top)/2) { + sp = txt[mid].sym; + if(val < sp->value) + top = mid; + else if(mid != ntxt-1 && val >= txt[mid+1].sym->value) + bot = mid; + else + return mid; + } + return -1; +} + +/* + * Find data symbol containing addr; binary search assumes data array is sorted by addr + */ +static int +srchdata(uvlong addr) +{ + uvlong val; + int top, bot, mid; + Sym *sp; + + bot = 0; + top = nglob; + val = addr; + for(mid = (bot+top)/2; mid < top; mid = (bot+top)/2) { + sp = globals[mid]; + if(val < sp->value) + top = mid; + else if(mid < nglob-1 && val >= globals[mid+1]->value) + bot = mid; + else + return mid; + } + return -1; +} + +/* + * Find symbol containing val in specified search space + * There is a special case when a value falls beyond the end + * of the text segment; if the search space is CTEXT, that value + * (usually etext) is returned. If the search space is CANY, symbols in the + * data space are searched for a match. 
+ */ +int +findsym(uvlong val, int type, Symbol *s) +{ + int i; + + if(buildtbls() == 0) + return 0; + + if(type == CTEXT || type == CANY) { + i = srchtext(val); + if(i >= 0) { + if(type == CTEXT || i != ntxt-1) { + fillsym(txt[i].sym, s); + s->handle = (void *) &txt[i]; + s->index = i; + return 1; + } + } + } + if(type == CDATA || type == CANY) { + i = srchdata(val); + if(i >= 0) { + fillsym(globals[i], s); + s->index = i; + return 1; + } + } + return 0; +} + +/* + * Find the start and end address of the function containing addr + */ +int +fnbound(uvlong addr, uvlong *bounds) +{ + int i; + + if(buildtbls() == 0) + return 0; + + i = srchtext(addr); + if(0 <= i && i < ntxt-1) { + bounds[0] = txt[i].sym->value; + bounds[1] = txt[i+1].sym->value; + return 1; + } + return 0; +} + +/* + * get the ith local symbol for a function + * the input symbol table is reverse ordered, so we reverse + * accesses here to maintain approx. parameter ordering in a stack trace. + */ +int +localsym(Symbol *s, int index) +{ + Txtsym *tp; + + if(s == 0 || index < 0) + return 0; + if(buildtbls() == 0) + return 0; + + tp = (Txtsym *)s->handle; + if(tp && tp->locals && index < tp->n) { + fillsym(tp->locals[tp->n-index-1], s); /* reverse */ + s->handle = (void *)tp; + s->index = index; + return 1; + } + return 0; +} + +/* + * get the ith global symbol + */ +int +globalsym(Symbol *s, int index) +{ + if(s == 0) + return 0; + if(buildtbls() == 0) + return 0; + + if(index >=0 && index < nglob) { + fillsym(globals[index], s); + s->index = index; + return 1; + } + return 0; +} + +/* + * find the pc given a file name and line offset into it. 
+ */ +uvlong +file2pc(char *file, long line) +{ + File *fp; + long i; + uvlong pc, start, end; + short *name; + + if(buildtbls() == 0 || files == 0) + return ~0; + name = encfname(file); + if(name == 0) { /* encode the file name */ + werrstr("file %s not found", file); + return ~0; + } + /* find this history stack */ + for(i = 0, fp = files; i < nfiles; i++, fp++) + if (hline(fp, name, &line)) + break; + free(name); + if(i >= nfiles) { + werrstr("line %ld in file %s not found", line, file); + return ~0; + } + start = fp->addr; /* first text addr this file */ + if(i < nfiles-1) + end = (fp+1)->addr; /* first text addr next file */ + else + end = 0; /* last file in load module */ + /* + * At this point, line contains the offset into the file. + * run the state machine to locate the pc closest to that value. + */ + if(debug) + print("find pc for %ld - between: %llux and %llux\n", line, start, end); + pc = line2addr(line, start, end); + if(pc == ~0) { + werrstr("line %ld not in file %s", line, file); + return ~0; + } + return pc; +} + +/* + * search for a path component index + */ +static int +pathcomp(char *s, int n) +{ + int i; + + for(i = 0; i <= fpmax; i++) + if(fnames[i] && strncmp(s, fnames[i]->name, n) == 0) + return i; + return -1; +} + +/* + * Encode a char file name as a sequence of short indices + * into the file name dictionary. 
+ */ +static short* +encfname(char *file) +{ + int i, j; + char *cp, *cp2; + short *dest; + + if(*file == '/') /* always check first '/' */ + cp2 = file+1; + else { + cp2 = strchr(file, '/'); + if(!cp2) + cp2 = strchr(file, 0); + } + cp = file; + dest = 0; + for(i = 0; *cp; i++) { + j = pathcomp(cp, cp2-cp); + if(j < 0) + return 0; /* not found */ + dest = realloc(dest, (i+1)*sizeof(short)); + dest[i] = j; + cp = cp2; + while(*cp == '/') /* skip embedded '/'s */ + cp++; + cp2 = strchr(cp, '/'); + if(!cp2) + cp2 = strchr(cp, 0); + } + dest = realloc(dest, (i+1)*sizeof(short)); + dest[i] = 0; + return dest; +} + +/* + * Search a history stack for a matching file name accumulating + * the size of intervening files in the stack. + */ +static int +hline(File *fp, short *name, long *line) +{ + Hist *hp; + int offset, depth; + long ln; + + for(hp = fp->hist; hp->name; hp++) /* find name in stack */ + if(hp->name[1] || hp->name[2]) { + if(hcomp(hp, name)) + break; + } + if(!hp->name) /* match not found */ + return 0; + if(debug) + printhist("hline found ... ", hp, 1); + /* + * unwind the stack until empty or we hit an entry beyond our line + */ + ln = *line; + offset = hp->line-1; + depth = 1; + for(hp++; depth && hp->name; hp++) { + if(debug) + printhist("hline inspect ... 
", hp, 1); + if(hp->name[1] || hp->name[2]) { + if(hp->offset){ /* Z record */ + offset = 0; + if(hcomp(hp, name)) { + if(*line <= hp->offset) + break; + ln = *line+hp->line-hp->offset; + depth = 1; /* implicit pop */ + } else + depth = 2; /* implicit push */ + } else if(depth == 1 && ln < hp->line-offset) + break; /* Beyond our line */ + else if(depth++ == 1) /* push */ + offset -= hp->line; + } else if(--depth == 1) /* pop */ + offset += hp->line; + } + *line = ln+offset; + return 1; +} + +/* + * compare two encoded file names + */ +static int +hcomp(Hist *hp, short *sp) +{ + uchar *cp; + int i, j; + short *s; + + cp = (uchar *)hp->name; + s = sp; + if (*s == 0) + return 0; + for (i = 1; j = (cp[i]<<8)|cp[i+1]; i += 2) { + if(j == 0) + break; + if(*s == j) + s++; + else + s = sp; + } + return *s == 0; +} + +/* + * Convert a pc to a "file:line {file:line}" string. + */ +long +fileline(char *str, int n, uvlong dot) +{ + long line, top, bot, mid; + File *f; + + *str = 0; + if(buildtbls() == 0) + return 0; + /* binary search assumes file list is sorted by addr */ + bot = 0; + top = nfiles; + for (mid = (bot+top)/2; mid < top; mid = (bot+top)/2) { + f = &files[mid]; + if(dot < f->addr) + top = mid; + else if(mid < nfiles-1 && dot >= (f+1)->addr) + bot = mid; + else { + line = pc2line(dot); + if(line > 0 && fline(str, n, line, f->hist, 0) >= 0) + return 1; + break; + } + } + return 0; +} + +/* + * Convert a line number within a composite file to relative line + * number in a source file. A composite file is the source + * file with included files inserted in line. 
+ */ +static int +fline(char *str, int n, long line, Hist *base, Hist **ret) +{ + Hist *start; /* start of current level */ + Hist *h; /* current entry */ + long delta; /* sum of size of files this level */ + int k; + + start = base; + h = base; + delta = h->line; + while(h && h->name && line > h->line) { + if(h->name[1] || h->name[2]) { + if(h->offset != 0) { /* #line Directive */ + delta = h->line-h->offset+1; + start = h; + base = h++; + } else { /* beginning of File */ + if(start == base) + start = h++; + else { + k = fline(str, n, line, start, &h); + if(k <= 0) + return k; + } + } + } else { + if(start == base && ret) { /* end of recursion level */ + *ret = h; + return 1; + } else { /* end of included file */ + delta += h->line-start->line; + h++; + start = base; + } + } + } + if(!h) + return -1; + if(start != base) + line = line-start->line+1; + else + line = line-delta+1; + if(!h->name) + strncpy(str, "<eof>", n); + else { + k = fileelem(fnames, (uchar*)start->name, str, n); + if(k+8 < n) + sprint(str+k, ":%ld", line); + } +/**********Remove comments for complete back-trace of include sequence + * if(start != base) { + * k = strlen(str); + * if(k+2 < n) { + * str[k++] = ' '; + * str[k++] = '{'; + * } + * k += fileelem(fnames, (uchar*) base->name, str+k, n-k); + * if(k+10 < n) + * sprint(str+k, ":%ld}", start->line-delta); + * } + ********************/ + return 0; +} + +/* + * convert an encoded file name to a string. + */ +int +fileelem(Sym **fp, uchar *cp, char *buf, int n) +{ + int i, j; + char *c, *bp, *end; + + bp = buf; + end = buf+n-1; + for(i = 1; j = (cp[i]<<8)|cp[i+1]; i+=2){ + c = fp[j]->name; + if(bp != buf && bp[-1] != '/' && bp < end) + *bp++ = '/'; + while(bp < end && *c) + *bp++ = *c++; + } + *bp = 0; + i = bp-buf; + if(i > 1) { + cleanname(buf); + i = strlen(buf); + } + return i; +} + +/* + * compare the values of two symbol table entries. 
+ */ +static int +symcomp(void *a, void *b) +{ + int i; + + i = (*(Sym**)a)->value - (*(Sym**)b)->value; + if (i) + return i; + return strcmp((*(Sym**)a)->name, (*(Sym**)b)->name); +} + +/* + * compare the values of the symbols referenced by two text table entries + */ +static int +txtcomp(void *a, void *b) +{ + return ((Txtsym*)a)->sym->value - ((Txtsym*)b)->sym->value; +} + +/* + * compare the values of the symbols referenced by two file table entries + */ +static int +filecomp(void *a, void *b) +{ + return ((File*)a)->addr - ((File*)b)->addr; +} + +/* + * fill an interface Symbol structure from a symbol table entry + */ +static void +fillsym(Sym *sp, Symbol *s) +{ + s->type = sp->type; + s->value = sp->value; + s->name = sp->name; + s->index = 0; + switch(sp->type) { + case 'b': + case 'B': + case 'D': + case 'd': + s->class = CDATA; + break; + case 't': + case 'T': + case 'l': + case 'L': + s->class = CTEXT; + break; + case 'a': + s->class = CAUTO; + break; + case 'p': + s->class = CPARAM; + break; + case 'm': + s->class = CSTAB; + break; + default: + s->class = CNONE; + break; + } + s->handle = 0; +} + +/* + * find the stack frame, given the pc + */ +uvlong +pc2sp(uvlong pc) +{ + uchar *c, u; + uvlong currpc, currsp; + + if(spoff == 0) + return ~0; + currsp = 0; + currpc = txtstart - mach->pcquant; + + if(pc<currpc || pc>txtend) + return ~0; + for(c = spoff; c < spoffend; c++) { + if (currpc >= pc) + return currsp; + u = *c; + if (u == 0) { + currsp += (c[1]<<24)|(c[2]<<16)|(c[3]<<8)|c[4]; + c += 4; + } + else if (u < 65) + currsp += 4*u; + else if (u < 129) + currsp -= 4*(u-64); + else + currpc += mach->pcquant*(u-129); + currpc += mach->pcquant; + } + return ~0; +} + +/* + * find the source file line number for a given value of the pc + */ +long +pc2line(uvlong pc) +{ + uchar *c, u; + uvlong currpc; + long currline; + + if(pcline == 0) + return -1; + currline = 0; + currpc = txtstart-mach->pcquant; + if(pc<currpc || pc>txtend) + return ~0; + + for(c = 
pcline; c < pclineend; c++) { + if(currpc >= pc) + return currline; + u = *c; + if(u == 0) { + currline += (c[1]<<24)|(c[2]<<16)|(c[3]<<8)|c[4]; + c += 4; + } + else if(u < 65) + currline += u; + else if(u < 129) + currline -= (u-64); + else + currpc += mach->pcquant*(u-129); + currpc += mach->pcquant; + } + return ~0; +} + +/* + * find the pc associated with a line number + * basepc and endpc are text addresses bounding the search. + * if endpc == 0, the end of the table is used (i.e., no upper bound). + * usually, basepc and endpc contain the first text address in + * a file and the first text address in the following file, respectively. + */ +uvlong +line2addr(long line, uvlong basepc, uvlong endpc) +{ + uchar *c, u; + uvlong currpc, pc; + long currline; + long delta, d; + int found; + + if(pcline == 0 || line == 0) + return ~0; + + currline = 0; + currpc = txtstart-mach->pcquant; + pc = ~0; + found = 0; + delta = HUGEINT; + + for(c = pcline; c < pclineend; c++) { + if(endpc && currpc >= endpc) /* end of file of interest */ + break; + if(currpc >= basepc) { /* proper file */ + if(currline >= line) { + d = currline-line; + found = 1; + } else + d = line-currline; + if(d < delta) { + delta = d; + pc = currpc; + } + } + u = *c; + if(u == 0) { + currline += (c[1]<<24)|(c[2]<<16)|(c[3]<<8)|c[4]; + c += 4; + } + else if(u < 65) + currline += u; + else if(u < 129) + currline -= (u-64); + else + currpc += mach->pcquant*(u-129); + currpc += mach->pcquant; + } + if(found) + return pc; + return ~0; +} + +/* + * Print a history stack (debug). 
if count is 0, prints the whole stack + */ +static void +printhist(char *msg, Hist *hp, int count) +{ + int i; + uchar *cp; + char buf[128]; + + i = 0; + while(hp->name) { + if(count && ++i > count) + break; + print("%s Line: %lx (%ld) Offset: %lx (%ld) Name: ", msg, + hp->line, hp->line, hp->offset, hp->offset); + for(cp = (uchar *)hp->name+1; (*cp<<8)|cp[1]; cp += 2) { + if (cp != (uchar *)hp->name+1) + print("/"); + print("%x", (*cp<<8)|cp[1]); + } + fileelem(fnames, (uchar *) hp->name, buf, sizeof(buf)); + print(" (%s)\n", buf); + hp++; + } +} + +#ifdef DEBUG +/* + * print the history stack for a file. (debug only) + * if (name == 0) => print all history stacks. + */ +void +dumphist(char *name) +{ + int i; + File *f; + short *fname; + + if(buildtbls() == 0) + return; + if(name) + fname = encfname(name); + for(i = 0, f = files; i < nfiles; i++, f++) + if(fname == 0 || hcomp(f->hist, fname)) + printhist("> ", f->hist, f->n); + + if(fname) + free(fname); +} +#endif diff --git a/utils/libmach/t.c b/utils/libmach/t.c new file mode 100644 index 0000000..809168e --- /dev/null +++ b/utils/libmach/t.c @@ -0,0 +1,122 @@ +/* + * thumb definition + */ +#include <lib9.h> +#include <bio.h> +#include "uregt.h" +#include "mach.h" + + +#define REGOFF(x) (ulong) (&((struct Ureg *) 0)->x) + +#define SP REGOFF(r13) +#define PC REGOFF(pc) + +#define REGSIZE sizeof(struct Ureg) + +Reglist thumbreglist[] = +{ + {"LINK", REGOFF(link), RINT|RRDONLY, 'X'}, + {"TYPE", REGOFF(type), RINT|RRDONLY, 'X'}, + {"PSR", REGOFF(psr), RINT|RRDONLY, 'X'}, + {"PC", PC, RINT, 'X'}, + {"SP", SP, RINT, 'X'}, + {"R15", PC, RINT, 'X'}, + {"R14", REGOFF(r14), RINT, 'X'}, + {"R13", REGOFF(r13), RINT, 'X'}, + {"R12", REGOFF(r12), RINT, 'X'}, + {"R11", REGOFF(r11), RINT, 'X'}, + {"R10", REGOFF(r10), RINT, 'X'}, + {"R9", REGOFF(r9), RINT, 'X'}, + {"R8", REGOFF(r8), RINT, 'X'}, + {"R7", REGOFF(r7), RINT, 'X'}, + {"R6", REGOFF(r6), RINT, 'X'}, + {"R5", REGOFF(r5), RINT, 'X'}, + {"R4", REGOFF(r4), RINT, 'X'}, + 
{"R3", REGOFF(r3), RINT, 'X'}, + {"R2", REGOFF(r2), RINT, 'X'}, + {"R1", REGOFF(r1), RINT, 'X'}, + {"R0", REGOFF(r0), RINT, 'X'}, + { 0 } +}; + + /* the machine description */ +Mach mthumb = +{ + "thumb", + MARM, /*MTHUMB,*/ /* machine type */ + thumbreglist, /* register set */ + REGSIZE, /* register set size */ + 0, /* fp register set size */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "R15", /* name of link register */ + "setR12", /* static base register name */ + 0, /* static base register value */ + 0x1000, /* page size */ + 0x80000000, /* kernel base */ + 0, /* kernel text mask */ + 0x7FFFFFFF, /* stack top */ + 2, /* quantization of pc */ + 4, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; + +typedef struct pcentry pcentry; + +struct pcentry{ + long start; + long stop; +}; + +static pcentry *pctab; +static int npctab; + +void +thumbpctab(Biobuf *b, Fhdr *fp) +{ + int n, o, ta; + uchar c[8]; + pcentry *tab; + + Bseek(b, fp->lnpcoff+fp->lnpcsz, 0); + o = (int)Boffset(b); + Bseek(b, 0, 2); + n = (int)Boffset(b)-o; + pctab = (pcentry*)malloc(n); + if(pctab == 0) + return; + ta = fp->txtaddr; + tab = pctab; + Bseek(b, fp->lnpcoff+fp->lnpcsz, 0); + while(Bread(b, c, sizeof(c)) == sizeof(c)){ + tab->start = ta + (c[0]<<24)|(c[1]<<16)|(c[2]<<8)|c[3]; + tab->stop = ta + (c[4]<<24)|(c[5]<<16)|(c[6]<<8)|c[7]; + tab++; + } + npctab = n/sizeof(c); +} + +int +thumbpclookup(uvlong pc) +{ + uvlong l, u, m; + pcentry *tab = pctab; + + l = 0; + u = npctab-1; + while(l < u){ + m = (l+u)/2; + if(pc < tab[m].start) + u = m-1; + else if(pc > tab[m].stop) + l = m+1; + else + l = u = m; + } + if(l == u && u < npctab && tab[u].start <= pc && pc <= tab[u].stop) + return 1; // thumb + return 0; // arm +} diff --git a/utils/libmach/tdb.c b/utils/libmach/tdb.c new file mode 100644 index 0000000..8838d85 --- /dev/null +++ b/utils/libmach/tdb.c @@ -0,0 +1,839 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + +static int debug = 0; + +typedef 
struct Instr Instr; +struct Instr +{ + Map *map; + ulong w; + ulong addr; + uchar op; /* super opcode */ + + uchar rd; + uchar rn; + uchar rs; + + long imm; /* imm */ + + char* curr; /* fill point in buffer */ + char* end; /* end of buffer */ + char* err; /* error message */ +}; + +typedef struct Opcode Opcode; +struct Opcode +{ + char* o; + void (*fmt)(Opcode*, Instr*); + uvlong (*foll)(Map*, Rgetter, Instr*, uvlong); + char* a; +}; + +static void format(char*, Instr*, char*); +static char FRAMENAME[] = ".frame"; + +/* + * Thumb-specific debugger interface + */ + +static char *thumbexcep(Map*, Rgetter); +static int thumbfoll(Map*, uvlong, Rgetter, uvlong*); +static int thumbinst(Map*, uvlong, char, char*, int); +static int thumbdas(Map*, uvlong, char*, int); +static int thumbinstlen(Map*, uvlong); + +/* + * Debugger interface + */ +Machdata thumbmach = +{ + {0x0, 0xE8}, /* break point */ + 2, /* break point size */ + + leswab, /* short to local byte order */ + leswal, /* long to local byte order */ + leswav, /* long to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + thumbexcep, /* print exception */ + 0, /* breakpoint fixup */ + 0, /* single precision float printer */ + 0, /* double precision float printer */ + thumbfoll, /* following addresses */ + thumbinst, /* print instruction */ + thumbdas, /* dissembler */ + thumbinstlen, /* instruction size */ +}; + +static void thumbrrh(Opcode *, Instr *); +static void thumbbcc(Opcode *, Instr *); +static void thumbb(Opcode *, Instr *); +static void thumbbl(Opcode *, Instr *); + +static char* +thumbexcep(Map *map, Rgetter rget) +{ + long c; + + c = (*rget)(map, "TYPE"); + switch (c&0x1f) { + case 0x11: + return "Fiq interrupt"; + case 0x12: + return "Mirq interrupt"; + case 0x13: + return "SVC/SWI Exception"; + case 0x17: + return "Prefetch Abort/Data Abort"; + case 0x18: + return "Data Abort"; + case 0x1b: + return "Undefined instruction/Breakpoint"; + case 0x1f: + return "Sys trap"; + 
default: + return "Undefined trap"; + } +} + +static +char* cond[16] = +{ + "EQ", "NE", "CS", "CC", + "MI", "PL", "VS", "VC", + "HI", "LS", "GE", "LT", + "GT", "LE", "\0", "NV" +}; + +#define B(h, l) bits(ins, h, l) + +static int +bits(int i, int h, int l) +{ + if(h < l) + print("h < l in bits"); + return (i&(((1<<(h-l+1))-1)<<l))>>l; +} + +int +thumbclass(long w) +{ + int o; + int ins = w; + + if(ins&0xffff0000) + return 3+2+2+4+16+4+1+8+6+2+2+2+4+1+1+1+2; + o = B(15, 13); + switch(o){ + case 0: + o = B(12, 11); + switch(o){ + case 0: + case 1: + case 2: + return B(12, 11); + case 3: + if(B(10, 10) == 0) + return 3+B(9, 9); + else + return 3+2+B(9, 9); + } + case 1: + return 3+2+2+B(12, 11); + case 2: + o = B(12, 10); + if(o == 0) + return 3+2+2+4+B(9, 6); + if(o == 1){ + o = B(9, 8); + if(o == 3) + return 3+2+2+4+16+B(9, 8); + return 3+2+2+4+16+B(9, 8); + } + if(o == 2 || o == 3) + return 3+2+2+4+16+4; + return 3+2+2+4+16+4+1+B(11, 9); + case 3: + return 3+2+2+4+16+4+1+8+B(12, 11); + case 4: + if(B(12, 12) == 0) + return 3+2+2+4+16+4+1+8+4+B(11, 11); + return 3+2+2+4+16+4+1+8+6+B(11, 11); + case 5: + if(B(12, 12) == 0) + return 3+2+2+4+16+4+1+8+6+2+B(11, 11); + if(B(11, 8) == 0) + return 3+2+2+4+16+4+1+8+6+2+2+B(7, 7); + return 3+2+2+4+16+4+1+8+6+2+2+2+B(11, 11); + case 6: + if(B(12, 12) == 0) + return 3+2+2+4+16+4+1+8+6+2+2+2+2+B(11, 11); + if(B(11, 8) == 0xf) + return 3+2+2+4+16+4+1+8+6+2+2+2+4; + return 3+2+2+4+16+4+1+8+6+2+2+2+4+1; + case 7: + o = B(12, 11); + switch(o){ + case 0: + return 3+2+2+4+16+4+1+8+6+2+2+2+4+1+1; + case 1: + return 3+2+2+4+16+4+1+8+6+2+2+2+4+1+1+1+2; + case 2: + return 3+2+2+4+16+4+1+8+6+2+2+2+4+1+1+1; + case 3: + return 3+2+2+4+16+4+1+8+6+2+2+2+4+1+1+1+1; + } + } + return 0; +} + +static int +decode(Map *map, uvlong pc, Instr *i) +{ + ushort w; + + if(get2(map, pc, &w) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + i->w = w; + i->addr = pc; + i->op = thumbclass(w); + i->map = map; + return 1; +} + +static void 
+bprint(Instr *i, char *fmt, ...) +{ + va_list arg; + + va_start(arg, fmt); + i->curr = vseprint(i->curr, i->end, fmt, arg); + va_end(arg); +} + +static int +plocal(Instr *i) +{ + char *reg; + Symbol s; + char *fn; + int class; + int offset; + + if(!findsym(i->addr, CTEXT, &s)) { + if(debug)fprint(2,"fn not found @%lux: %r\n", i->addr); + return 0; + } + fn = s.name; + if (!findlocal(&s, FRAMENAME, &s)) { + if(debug)fprint(2,"%s.%s not found @%s: %r\n", fn, FRAMENAME, s.name); + return 0; + } + if(s.value > i->imm) { + class = CAUTO; + offset = s.value-i->imm; + reg = "(SP)"; + } else { + class = CPARAM; + offset = i->imm-s.value-4; + reg = "(FP)"; + } + if(!getauto(&s, offset, class, &s)) { + if(debug)fprint(2,"%s %s not found @%ux: %r\n", fn, + class == CAUTO ? " auto" : "param", offset); + return 0; + } + bprint(i, "%s%c%d%s", s.name, class == CPARAM ? '+' : '-', s.value, reg); + return 1; +} + +/* + * Print value v as name[+offset] + */ +static int +gsymoff(char *buf, int n, long v, int space) +{ + Symbol s; + int r; + long delta; + + r = delta = 0; /* to shut compiler up */ + if (v) { + r = findsym(v, space, &s); + if (r) + delta = v-s.value; + if (delta < 0) + delta = -delta; + } + if (v == 0 || r == 0 || delta >= 4096) + return snprint(buf, n, "#%lux", v); + if (strcmp(s.name, ".string") == 0) + return snprint(buf, n, "#%lux", v); + if (!delta) + return snprint(buf, n, "%s", s.name); + if (s.type != 't' && s.type != 'T') + return snprint(buf, n, "%s+%llux", s.name, v-s.value); + else + return snprint(buf, n, "#%lux", v); +} + +static int +thumbcondpass(Map *map, Rgetter rget, uchar cond) +{ + ulong psr; + uchar n; + uchar z; + uchar c; + uchar v; + + psr = rget(map, "PSR"); + n = (psr >> 31) & 1; + z = (psr >> 30) & 1; + c = (psr >> 29) & 1; + v = (psr >> 28) & 1; + + switch(cond) { + case 0: return z; + case 1: return !z; + case 2: return c; + case 3: return !c; + case 4: return n; + case 5: return !n; + case 6: return v; + case 7: return !v; + case 8: 
return c && !z; + case 9: return !c || z; + case 10: return n == v; + case 11: return n != v; + case 12: return !z && (n == v); + case 13: return z && (n != v); + case 14: return 1; + case 15: return 0; + } + return 0; +} + +static uvlong +thumbfbranch(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + char buf[8]; + + if(i->op == 30){ // BX + thumbrrh(nil, i); + sprint(buf, "R%ud", i->rn); + return rget(map, buf)&~1; // clear T bit + } + if(i->op == 57){ // Bcc + thumbbcc(nil, i); + if(thumbcondpass(map, rget, (i->w >> 8) & 0xf)) + return i->imm; + return pc+2; + } + if(i->op == 58){ // B + thumbb(nil, i); + return i->imm; + } + if(i->op == 60){ // BL + thumbbl(nil, i); + return i->imm; + } + print("bad thumbfbranch call"); + return 0; +} + +static uvlong +thumbfmov(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + char buf[8]; + ulong rd; + + thumbrrh(nil, i); + rd = i->rd; + if(rd != 15) + return pc+2; + sprint(buf, "R%ud", i->rn); + return rget(map, buf); +} + +static uvlong +thumbfadd(Map *map, Rgetter rget, Instr *i, uvlong pc) +{ + char buf[8]; + ulong rd, v; + + thumbrrh(nil, i); + rd = i->rd; + if(rd != 15) + return pc+2; + sprint(buf, "R%ud", i->rn); + v = rget(map, buf); + sprint(buf, "R15"); + return rget(map, buf) + v; +} + +static void +thumbshift(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(2, 0); + i->rn = B(5, 3); + i->imm = B(10, 6); + format(o->o, i, o->a); +} + +static void +thumbrrr(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(2, 0); + i->rn = B(5, 3); + i->rs = B(8, 6); + format(o->o, i, o->a); +} + +static void +thumbirr(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(2, 0); + i->rn = B(5, 3); + i->imm = B(8, 6); + format(o->o, i, o->a); +} + +static void +thumbir(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(10, 8); + i->imm = B(7, 0); + format(o->o, i, o->a); +} + +static void +thumbrr(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(2, 0); + i->rn = B(5, 3); + format(o->o, i, o->a); +} + 
+static void +thumbrrh(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(2, 0); + i->rn = B(5, 3); + if(B(6, 6)) + i->rn += 8; + if(B(7, 7)) + i->rd += 8; + if(o != nil){ + if(i->w == 0x46b7 || i->w == 0x46f7 || i->w == 0x4730 || i->w == 0x4770) // mov r6, pc or mov lr, pc or bx r6 or bx lr + format("RET", i, ""); + else + format(o->o, i, o->a); + } +} + +static void +thumbpcrel(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rn = 15; + i->rd = B(10, 8); + i->imm = 4*(B(7, 0)+1); + if(i->addr & 3) + i->imm -= 2; + format(o->o, i, o->a); +} + +static void +thumbmovirr(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(2, 0); + i->rn = B(5, 3); + i->imm = B(10, 6); + if(strcmp(o->o, "MOVW") == 0) + i->imm *= 4; + else if(strncmp(o->o, "MOVH", 4) == 0) + i->imm *= 2; + format(o->o, i, o->a); +} + +static void +thumbmovsp(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rn = 13; + i->rd = B(10, 8); + i->imm = 4*B(7, 0); + format(o->o, i, o->a); +} + +static void +thumbaddsppc(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->rd = B(10, 8); + i->imm = 4*B(7, 0); + if(i->op == 48) + i->imm += 4; + format(o->o, i, o->a); +} + +static void +thumbaddsp(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->imm = 4*B(6, 0); + format(o->o, i, o->a); +} + +static void +thumbswi(Opcode *o, Instr *i) +{ + int ins = i->w; + + i->imm = B(7, 0); + format(o->o, i, o->a); +} + +static void +thumbbcc(Opcode *o, Instr *i) +{ + int off, ins = i->w; + + off = B(7, 0); + if(off & 0x80) + off |= 0xffffff00; + i->imm = i->addr + 2*off + 4; + if(o != nil) + format(o->o, i, o->a); +} + +static void +thumbb(Opcode *o, Instr *i) +{ + int off, ins = i->w; + + off = B(10, 0); + if(off & 0x400) + off |= 0xfffff800; + i->imm = i->addr + 2*off + 4; + if(o != nil) + format(o->o, i, o->a); +} + +static void +thumbbl(Opcode *o, Instr *i) +{ + int off, h, ins = i->w; + static int reglink; + + h = B(11, 11); + off = B(10, 0); + if(h == 0){ + if(off & 0x400) + off |= 0xfffff800; + i->imm = i->addr + 
(off<<12) + 4; + reglink = i->imm; + } + else{ + i->imm = reglink + 2*off; + } + if(o != nil) + format(o->o, i, o->a); +} + +static void +thumbregs(Opcode *o, Instr *i) +{ + int ins = i->w; + + if(i->op == 52 || i->op == 53) + i->rd = 13; + else + i->rd = B(10, 8); + i->imm = B(7, 0); + format(o->o, i, o->a); +} + +static void +thumbunk(Opcode *o, Instr *i) +{ + format(o->o, i, o->a); +} + +static Opcode opcodes[] = +{ + "LSL", thumbshift, 0, "$#%i,R%n,R%d", // 0 + "LSR", thumbshift, 0, "$#%i,R%n,R%d", // 1 + "ASR", thumbshift, 0, "$#%i,R%n,R%d", // 2 + "ADD", thumbrrr, 0, "R%s,R%n,R%d", // 3 + "SUB", thumbrrr, 0, "R%s,R%n,R%d", // 4 + "ADD", thumbirr, 0, "$#%i,R%n,R%d", // 5 + "SUB", thumbirr, 0, "$#%i,R%n,R%d", // 6 + "MOVW", thumbir, 0, "$#%i,R%d", // 7 + "CMP", thumbir, 0, "$#%i,R%d", // 8 + "ADD", thumbir, 0, "$#%i,R%d,R%d", // 9 + "SUB", thumbir, 0, "$#%i,R%d,R%d", // 10 + "AND", thumbrr, 0, "R%n,R%d,R%d", // 11 + "EOR", thumbrr, 0, "R%n,R%d,R%d", // 12 + "LSL", thumbrr, 0, "R%n,R%d,R%d", // 13 + "LSR", thumbrr, 0, "R%n,R%d,R%d", // 14 + "ASR", thumbrr, 0, "R%n,R%d,R%d", // 15 + "ADC", thumbrr, 0, "R%n,R%d,R%d", // 16 + "SBC", thumbrr, 0, "R%n,R%d,R%d", // 17 + "ROR", thumbrr, 0, "R%n,R%d,R%d", // 18 + "TST", thumbrr, 0, "R%n,R%d", // 19 + "NEG", thumbrr, 0, "R%n,R%d", // 20 + "CMP", thumbrr, 0, "R%n,R%d", // 21 + "CMPN", thumbrr, 0, "R%n,R%d", // 22 + "OR", thumbrr, 0, "R%n,R%d,R%d", // 23 + "MUL", thumbrr, 0, "R%n,R%d,R%d", // 24 + "BITC", thumbrr, 0, "R%n,R%d,R%d", // 25 + "MOVN", thumbrr, 0, "R%n,R%d", // 26 + "ADD", thumbrrh, thumbfadd, "R%n,R%d,R%d", // 27 + "CMP", thumbrrh, 0, "R%n,R%d", // 28 + "MOVW", thumbrrh, thumbfmov, "R%n,R%d", // 29 + "BX", thumbrrh, thumbfbranch, "R%n", // 30 + "MOVW", thumbpcrel, 0, "$%I,R%d", // 31 + "MOVW", thumbrrr, 0, "R%d, [R%s,R%n]", // 32 + "MOVH", thumbrrr, 0, "R%d, [R%s,R%n]", // 33 + "MOVB", thumbrrr, 0, "R%d, [R%s,R%n]", // 34 + "MOVB", thumbrrr, 0, "[R%s,R%n],R%d", // 35 + "MOVW", thumbrrr, 0, "[R%s,R%n],R%d", // 
36 + "MOVHU", thumbrrr, 0, "[R%s,R%n],R%d", // 37 + "MOVBU", thumbrrr, 0, "[R%s,R%n],R%d", // 38 + "MOVH", thumbrrr, 0, "[R%s,R%n],R%d", // 39 + "MOVW", thumbmovirr, 0, "R%d,%I", // 40 + "MOVW", thumbmovirr, 0, "%I,R%d", // 41 + "MOVB", thumbmovirr, 0, "R%d,%I", // 42 + "MOVBU", thumbmovirr, 0, "$%I,R%d", // 43 + "MOVH", thumbmovirr, 0, "R%d,%I", // 44 + "MOVHU", thumbmovirr, 0, "%I,R%d", // 45 + "MOVW", thumbmovsp, 0, "R%d,%I", // 46 + "MOVW", thumbmovsp, 0, "%I,R%d", // 47 + "ADD", thumbaddsppc,0, "$#%i,PC,R%d", // 48 + "ADD", thumbaddsppc,0, "$#%i,SP,R%d", // 49 + "ADD", thumbaddsp, 0, "$#%i,SP,SP", // 50 + "SUB", thumbaddsp, 0, "$#%i,SP,SP", // 51 + "PUSH", thumbregs, 0, "R%d, %r", // 52 + "POP", thumbregs, 0, "R%d, %r", // 53 + "STMIA", thumbregs, 0, "R%d, %r", // 54 + "LDMIA", thumbregs, 0, "R%d, %r", // 55 + "SWI", thumbswi, 0, "$#%i", // 56 + "B%c", thumbbcc, thumbfbranch, "%b", // 57 + "B", thumbb, thumbfbranch, "%b", // 58 + "BL", thumbbl, 0, "", // 59 + "BL", thumbbl, thumbfbranch, "%b", // 60 + "UNK", thumbunk, 0, "", // 61 +}; + +static void +gaddr(Instr *i) +{ + *i->curr++ = '$'; + i->curr += gsymoff(i->curr, i->end-i->curr, i->imm, CANY); +} + +static void +format(char *mnemonic, Instr *i, char *f) +{ + int j, k, m, n; + int g; + char *fmt; + int ins = i->w; + + if(mnemonic) + format(0, i, mnemonic); + if(f == 0) + return; + if(mnemonic) + if(i->curr < i->end) + *i->curr++ = '\t'; + for ( ; *f && i->curr < i->end; f++) { + if(*f != '%') { + *i->curr++ = *f; + continue; + } + switch (*++f) { + + case 'c': /*Bcc */ + bprint(i, "%s", cond[B(11, 8)]); + break; + + case 's': + bprint(i, "%d", i->rs); + break; + + case 'n': + bprint(i, "%d", i->rn); + break; + + case 'd': + bprint(i, "%d", i->rd); + break; + + case 'i': + bprint(i, "%lux", i->imm); + break; + + case 'b': + i->curr += symoff(i->curr, i->end-i->curr, + i->imm, CTEXT); + break; + + case 'I': + if (i->rn == 13) { + if (plocal(i)) + break; + } + g = 0; + fmt = "#%lx(R%d)"; + if (i->rn == 15) { 
+ /* convert load of offset(PC) to a load immediate */ + if (get4(i->map, i->addr + i->imm, (ulong*)&i->imm) > 0) + { + g = 1; + fmt = ""; + } + } + if (mach->sb) + { + if (i->rn == 12) + { + i->imm += mach->sb; + g = 1; + fmt = "-SB(SB)"; + } + } + if (g) + { + gaddr(i); + bprint(i, fmt, i->rn); + } + else + bprint(i, fmt, i->imm, i->rn); + break; + + case 'r': + n = i->imm&0xff; + j = 0; + k = 0; + while(n) { + m = j; + while(n&0x1) { + j++; + n >>= 1; + } + if(j != m) { + if(k) + bprint(i, ","); + if(j == m+1) + bprint(i, "R%d", m); + else + bprint(i, "R%d-R%d", m, j-1); + k = 1; + } + j++; + n >>= 1; + } + break; + + case '\0': + *i->curr++ = '%'; + return; + + default: + bprint(i, "%%%c", *f); + break; + } + } + *i->curr = 0; +} + +static int +printins(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + + i.curr = buf; + i.end = buf+n-1; + if(decode(map, pc, &i) < 0) + return -1; + + (*opcodes[i.op].fmt)(&opcodes[i.op], &i); + return 2; +} + +static int +thumbinst(Map *map, uvlong pc, char modifier, char *buf, int n) +{ + USED(modifier); + return printins(map, pc, buf, n); +} + +static int +thumbdas(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + + i.curr = buf; + i.end = buf+n; + if(decode(map, pc, &i) < 0) + return -1; + if(i.end-i.curr > 8) + i.curr = _hexify(buf, i.w, 7); + *i.curr = 0; + return 2; +} + +static int +thumbinstlen(Map *map, uvlong pc) +{ + Instr i; + + if(decode(map, pc, &i) < 0) + return -1; + return 2; +} + +static int +thumbfoll(Map *map, uvlong pc, Rgetter rget, uvlong *foll) +{ + ulong d; + Instr i; + + if(decode(map, pc, &i) < 0) + return -1; + + if(opcodes[i.op].foll) { + d = (*opcodes[i.op].foll)(map, rget, &i, pc); + if(d == -1) + return -1; + } else + d = pc+2; + + foll[0] = d; + return 1; +} diff --git a/utils/libmach/ureg4.h b/utils/libmach/ureg4.h new file mode 100644 index 0000000..5f95dcd --- /dev/null +++ b/utils/libmach/ureg4.h @@ -0,0 +1,46 @@ +struct Ureg +{ + ulong status; + long pc; + union + { + long sp; /* 
r29 */ + long usp; /* r29 */ + } u0; + ulong cause; + ulong badvaddr; + ulong tlbvirt; + + long hhi; long hi; + long hlo; long lo; + long hr31; long r31; + long hr30; long r30; + long hr28; long r28; + long hr27; long r27; + long hr26; long r26; + long hr25; long r25; + long hr24; long r24; + long hr23; long r23; + long hr22; long r22; + long hr21; long r21; + long hr20; long r20; + long hr19; long r19; + long hr18; long r18; + long hr17; long r17; + long hr16; long r16; + long hr15; long r15; + long hr14; long r14; + long hr13; long r13; + long hr12; long r12; + long hr11; long r11; + long hr10; long r10; + long hr9; long r9; + long hr8; long r8; + long hr7; long r7; + long hr6; long r6; + long hr5; long r5; + long hr4; long r4; + long hr3; long r3; + long hr2; long r2; + long hr1; long r1; +}; diff --git a/utils/libmach/ureg5.h b/utils/libmach/ureg5.h new file mode 100644 index 0000000..ffdad42 --- /dev/null +++ b/utils/libmach/ureg5.h @@ -0,0 +1,21 @@ +struct Ureg { + uint r0; + uint r1; + uint r2; + uint r3; + uint r4; + uint r5; + uint r6; + uint r7; + uint r8; + uint r9; + uint r10; + uint r11; + uint r12; + uint r13; + uint r14; + uint link; + uint type; + uint psr; + uint pc; +}; diff --git a/utils/libmach/ureg6.h b/utils/libmach/ureg6.h new file mode 100644 index 0000000..6e58d25 --- /dev/null +++ b/utils/libmach/ureg6.h @@ -0,0 +1,30 @@ +struct Ureg { + u64int ax; + u64int bx; + u64int cx; + u64int dx; + u64int si; + u64int di; + u64int bp; + u64int r8; + u64int r9; + u64int r10; + u64int r11; + u64int r12; + u64int r13; + u64int r14; + u64int r15; + + u16int ds; + u16int es; + u16int fs; + u16int gs; + + u64int type; + u64int error; /* error code (or zero) */ + u64int ip; /* pc */ + u64int cs; /* old context */ + u64int flags; /* old flags */ + u64int sp; /* sp */ + u64int ss; /* old stack segment */ +}; diff --git a/utils/libmach/ureg8.h b/utils/libmach/ureg8.h new file mode 100644 index 0000000..8bdf178 --- /dev/null +++ b/utils/libmach/ureg8.h @@ -0,0 
+1,25 @@ +struct Ureg +{ + ulong di; /* general registers */ + ulong si; /* ... */ + ulong bp; /* ... */ + ulong nsp; + ulong bx; /* ... */ + ulong dx; /* ... */ + ulong cx; /* ... */ + ulong ax; /* ... */ + ulong gs; /* data segments */ + ulong fs; /* ... */ + ulong es; /* ... */ + ulong ds; /* ... */ + ulong trap; /* trap type */ + ulong ecode; /* error code (or zero) */ + ulong pc; /* pc */ + ulong cs; /* old context */ + ulong flags; /* old flags */ + union { + ulong usp; + ulong sp; + } u0; + ulong ss; /* old stack segment */ +}; diff --git a/utils/libmach/ureg9.h b/utils/libmach/ureg9.h new file mode 100644 index 0000000..676f5a5 --- /dev/null +++ b/utils/libmach/ureg9.h @@ -0,0 +1,44 @@ +struct Ureg +{ +/* 0*/ u64int cause; /* trap or interrupt vector */ +/* 8*/ u64int msr; /* SRR1 */ +/* 16*/ u64int pc; /* SRR0 */ +/* 24*/ u64int unused; +/* 32*/ u64int lr; +/* 40*/ u32int pad; +/* 44*/ u32int cr; +/* 48*/ u64int xer; +/* 56*/ u64int ctr; +/* 64*/ u64int r0; +/* 72*/ union{ u64int r1; u64int sp; u64int usp; }; +/* 80*/ u64int r2; +/* 88*/ u64int r3; +/* 96*/ u64int r4; +/*104*/ u64int r5; +/*112*/ u64int r6; +/*120*/ u64int r7; +/*128*/ u64int r8; +/*136*/ u64int r9; +/*144*/ u64int r10; +/*152*/ u64int r11; +/*160*/ u64int r12; +/*168*/ u64int r13; +/*176*/ u64int r14; +/*184*/ u64int r15; +/*192*/ u64int r16; +/*200*/ u64int r17; +/*208*/ u64int r18; +/*216*/ u64int r19; +/*224*/ u64int r20; +/*232*/ u64int r21; +/*240*/ u64int r22; +/*248*/ u64int r23; +/*256*/ u64int r24; +/*264*/ u64int r25; +/*272*/ u64int r26; +/*280*/ u64int r27; +/*288*/ u64int r28; +/*296*/ u64int r29; +/*304*/ u64int r30; +/*312*/ u64int r31; +}; diff --git a/utils/libmach/uregk.h b/utils/libmach/uregk.h new file mode 100644 index 0000000..4ff12ed --- /dev/null +++ b/utils/libmach/uregk.h @@ -0,0 +1,45 @@ +struct Ureg +{ + ulong r0; /* unnecessary; just for symmetry */ + union{ + ulong sp; /* r1 */ + ulong usp; /* r1 */ + ulong r1; + } u0; + ulong r2; + ulong r3; + ulong r4; + 
ulong r5; + ulong r6; + ulong r7; + ulong r8; + ulong r9; + ulong r10; + ulong r11; + ulong r12; + ulong r13; + ulong r14; + ulong r15; + ulong r16; + ulong r17; + ulong r18; + ulong r19; + ulong r20; + ulong r21; + ulong r22; + ulong r23; + ulong r24; + ulong r25; + ulong r26; + ulong r27; + ulong r28; + ulong r29; + ulong r30; + ulong r31; + ulong y; + ulong tbr; + ulong psr; + ulong npc; + ulong pc; + ulong pad; /* so structure is double word aligned */ +}; diff --git a/utils/libmach/uregq.h b/utils/libmach/uregq.h new file mode 100644 index 0000000..d412b05 --- /dev/null +++ b/utils/libmach/uregq.h @@ -0,0 +1,43 @@ +struct Ureg +{ + ulong cause; + ulong srr1; + ulong pc; /* SRR0 */ + ulong pad; + ulong lr; + ulong cr; + ulong xer; + ulong ctr; + ulong r0; + ulong sp; + ulong r2; + ulong r3; + ulong r4; + ulong r5; + ulong r6; + ulong r7; + ulong r8; + ulong r9; + ulong r10; + ulong r11; + ulong r12; + ulong r13; + ulong r14; + ulong r15; + ulong r16; + ulong r17; + ulong r18; + ulong r19; + ulong r20; + ulong r21; + ulong r22; + ulong r23; + ulong r24; + ulong r25; + ulong r26; + ulong r27; + ulong r28; + ulong r29; + ulong r30; + ulong r31; +}; diff --git a/utils/libmach/uregt.h b/utils/libmach/uregt.h new file mode 100644 index 0000000..705a867 --- /dev/null +++ b/utils/libmach/uregt.h @@ -0,0 +1,21 @@ +struct Ureg { + u32int r0; + u32int r1; + u32int r2; + u32int r3; + u32int r4; + u32int r5; + u32int r6; + u32int r7; + u32int r8; + u32int r9; + u32int r10; + u32int r11; + u32int r12; + u32int r13; + u32int r14; + u32int link; + u32int type; + u32int psr; + u32int pc; +}; diff --git a/utils/libmach/uregv.h b/utils/libmach/uregv.h new file mode 100644 index 0000000..def45d2 --- /dev/null +++ b/utils/libmach/uregv.h @@ -0,0 +1,44 @@ +struct Ureg +{ + ulong status; + ulong pc; + union{ + ulong sp; /* r29 */ + ulong usp; /* r29 */ + } u0; + ulong cause; + ulong badvaddr; + ulong tlbvirt; + ulong hi; + ulong lo; + ulong r31; + ulong r30; + ulong r28; + ulong r27; 
/* unused */ + ulong r26; /* unused */ + ulong r25; + ulong r24; + ulong r23; + ulong r22; + ulong r21; + ulong r20; + ulong r19; + ulong r18; + ulong r17; + ulong r16; + ulong r15; + ulong r14; + ulong r13; + ulong r12; + ulong r11; + ulong r10; + ulong r9; + ulong r8; + ulong r7; + ulong r6; + ulong r5; + ulong r4; + ulong r3; + ulong r2; + ulong r1; +}; diff --git a/utils/libmach/v.c b/utils/libmach/v.c new file mode 100644 index 0000000..3b2daf8 --- /dev/null +++ b/utils/libmach/v.c @@ -0,0 +1,117 @@ +/* + * mips definition + */ +#include <lib9.h> +#include <bio.h> +#include "uregv.h" +#include "mach.h" + +#define REGOFF(x) (ulong)(&((struct Ureg *) 0)->x) + +#define SP REGOFF(u0.sp) +#define PC REGOFF(pc) +#define R1 REGOFF(r1) +#define R31 REGOFF(r31) +#define FP_REG(x) (R1+4+4*(x)) + +#define REGSIZE sizeof(struct Ureg) +#define FPREGSIZE (4*33) + +Reglist mipsreglist[] = { + {"STATUS", REGOFF(status), RINT|RRDONLY, 'X'}, + {"CAUSE", REGOFF(cause), RINT|RRDONLY, 'X'}, + {"BADVADDR", REGOFF(badvaddr), RINT|RRDONLY, 'X'}, + {"TLBVIRT", REGOFF(tlbvirt), RINT|RRDONLY, 'X'}, + {"HI", REGOFF(hi), RINT|RRDONLY, 'X'}, + {"LO", REGOFF(lo), RINT|RRDONLY, 'X'}, + {"PC", PC, RINT, 'X'}, + {"SP", SP, RINT, 'X'}, + {"R31", R31, RINT, 'X'}, + {"R30", REGOFF(r30), RINT, 'X'}, + {"R28", REGOFF(r28), RINT, 'X'}, + {"R27", REGOFF(r27), RINT, 'X'}, + {"R26", REGOFF(r26), RINT, 'X'}, + {"R25", REGOFF(r25), RINT, 'X'}, + {"R24", REGOFF(r24), RINT, 'X'}, + {"R23", REGOFF(r23), RINT, 'X'}, + {"R22", REGOFF(r22), RINT, 'X'}, + {"R21", REGOFF(r21), RINT, 'X'}, + {"R20", REGOFF(r20), RINT, 'X'}, + {"R19", REGOFF(r19), RINT, 'X'}, + {"R18", REGOFF(r18), RINT, 'X'}, + {"R17", REGOFF(r17), RINT, 'X'}, + {"R16", REGOFF(r16), RINT, 'X'}, + {"R15", REGOFF(r15), RINT, 'X'}, + {"R14", REGOFF(r14), RINT, 'X'}, + {"R13", REGOFF(r13), RINT, 'X'}, + {"R12", REGOFF(r12), RINT, 'X'}, + {"R11", REGOFF(r11), RINT, 'X'}, + {"R10", REGOFF(r10), RINT, 'X'}, + {"R9", REGOFF(r9), RINT, 'X'}, + {"R8", 
REGOFF(r8), RINT, 'X'}, + {"R7", REGOFF(r7), RINT, 'X'}, + {"R6", REGOFF(r6), RINT, 'X'}, + {"R5", REGOFF(r5), RINT, 'X'}, + {"R4", REGOFF(r4), RINT, 'X'}, + {"R3", REGOFF(r3), RINT, 'X'}, + {"R2", REGOFF(r2), RINT, 'X'}, + {"R1", REGOFF(r1), RINT, 'X'}, + {"F0", FP_REG(0), RFLT, 'F'}, + {"F1", FP_REG(1), RFLT, 'f'}, + {"F2", FP_REG(2), RFLT, 'F'}, + {"F3", FP_REG(3), RFLT, 'f'}, + {"F4", FP_REG(4), RFLT, 'F'}, + {"F5", FP_REG(5), RFLT, 'f'}, + {"F6", FP_REG(6), RFLT, 'F'}, + {"F7", FP_REG(7), RFLT, 'f'}, + {"F8", FP_REG(8), RFLT, 'F'}, + {"F9", FP_REG(9), RFLT, 'f'}, + {"F10", FP_REG(10), RFLT, 'F'}, + {"F11", FP_REG(11), RFLT, 'f'}, + {"F12", FP_REG(12), RFLT, 'F'}, + {"F13", FP_REG(13), RFLT, 'f'}, + {"F14", FP_REG(14), RFLT, 'F'}, + {"F15", FP_REG(15), RFLT, 'f'}, + {"F16", FP_REG(16), RFLT, 'F'}, + {"F17", FP_REG(17), RFLT, 'f'}, + {"F18", FP_REG(18), RFLT, 'F'}, + {"F19", FP_REG(19), RFLT, 'f'}, + {"F20", FP_REG(20), RFLT, 'F'}, + {"F21", FP_REG(21), RFLT, 'f'}, + {"F22", FP_REG(22), RFLT, 'F'}, + {"F23", FP_REG(23), RFLT, 'f'}, + {"F24", FP_REG(24), RFLT, 'F'}, + {"F25", FP_REG(25), RFLT, 'f'}, + {"F26", FP_REG(26), RFLT, 'F'}, + {"F27", FP_REG(27), RFLT, 'f'}, + {"F28", FP_REG(28), RFLT, 'F'}, + {"F29", FP_REG(29), RFLT, 'f'}, + {"F30", FP_REG(30), RFLT, 'F'}, + {"F31", FP_REG(31), RFLT, 'f'}, + {"FPCR", FP_REG(32), RFLT, 'X'}, + { 0 } +}; + + /* the machine description */ +Mach mmips = +{ + "mips", + MMIPS, /* machine type */ + mipsreglist, /* register set */ + REGSIZE, /* number of bytes in reg set */ + FPREGSIZE, /* number of bytes in fp reg set */ + "PC", /* name of PC */ + "SP", /* name of SP */ + "R31", /* name of link register */ + "setR30", /* static base register name */ + 0, /* value */ + 0x1000, /* page size */ + 0xC0000000, /* kernel base */ + 0x40000000, /* kernel text mask */ + 0x7FFFFFFF, /* user stack top */ + 4, /* quantization of pc */ + 4, /* szaddr */ + 4, /* szreg */ + 4, /* szfloat */ + 8, /* szdouble */ +}; diff --git 
a/utils/libmach/vcodas.c b/utils/libmach/vcodas.c new file mode 100644 index 0000000..b31fdb3 --- /dev/null +++ b/utils/libmach/vcodas.c @@ -0,0 +1,555 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" + + /* mips native disassembler */ + +typedef struct { + uvlong addr; /* pc of instr */ + uchar op; /* bits 31-26 */ + uchar rs; /* bits 25-21 */ + uchar rt; /* bits 20-16 */ + uchar rd; /* bits 15-11 */ + uchar sa; /* bits 10-6 */ + uchar function; /* bits 5-0 */ + long immediate; /* bits 15-0 */ + ulong cofun; /* bits 24-0 */ + ulong target; /* bits 25-0 */ + long w0; + char *curr; /* current fill point */ + char *end; /* end of buffer */ + char *err; +} Instr; + +typedef struct { + char *mnemonic; + char *mipsco; +} Opcode; + +static char mipscoload[] = "r%t,%l"; +static char mipscoalui[] = "r%t,r%s,%i"; +static char mipscoalu3op[] = "r%d,r%s,r%t"; +static char mipscoboc[] = "r%s,r%t,%b"; +static char mipscoboc0[] = "r%s,%b"; +static char mipscorsrt[] = "r%s,r%t"; +static char mipscorsi[] = "r%s,%i"; +static char mipscoxxx[] = "%w"; +static char mipscofp3[] = "f%a,f%d,f%t"; /* fd,fs,ft */ +static char mipscofp2[] = "f%a,f%d"; /* fd,fs */ +static char mipscofpc[] = "f%d,f%t"; /* fs,ft */ + +static Opcode opcodes[64] = { + 0, 0, + 0, 0, + "j", "%j", + "jal", "%j", + "beq", mipscoboc, + "bne", mipscoboc, + "blez", mipscoboc0, + "bgtz", mipscoboc0, + "addi", mipscoalui, + "addiu", mipscoalui, + "slti", mipscoalui, + "sltiu", mipscoalui, + "andi", mipscoalui, + "ori", mipscoalui, + "xori", mipscoalui, + "lui", "r%t,%u", + "cop0", 0, + "cop1", 0, + "cop2", 0, + "cop3", 0, + "beql", mipscoboc, + "bnel", mipscoboc, + "blezl", mipscoboc0, + "bgtzl", mipscoboc0, + "instr18", mipscoxxx, + "instr19", mipscoxxx, + "instr1A", mipscoxxx, + "instr1B", mipscoxxx, + "instr1C", mipscoxxx, + "instr1D", mipscoxxx, + "instr1E", mipscoxxx, + "instr1F", mipscoxxx, + "lb", mipscoload, + "lh", mipscoload, + "lwl", mipscoload, + "lw", mipscoload, + "lbu", mipscoload, + "lhu", 
mipscoload, + "lwr", mipscoload, + "instr27", mipscoxxx, + "sb", mipscoload, + "sh", mipscoload, + "swl", mipscoload, + "sw", mipscoload, + "instr2C", mipscoxxx, + "instr2D", mipscoxxx, + "swr", mipscoload, + "cache", "", + "ll", mipscoload, + "lwc1", mipscoload, + "lwc2", mipscoload, + "lwc3", mipscoload, + "instr34", mipscoxxx, + "ld", mipscoload, + "ld", mipscoload, + "ld", mipscoload, + "sc", mipscoload, + "swc1", mipscoload, + "swc2", mipscoload, + "swc3", mipscoload, + "instr3C", mipscoxxx, + "sd", mipscoload, + "sd", mipscoload, + "sd", mipscoload, +}; + +static Opcode sopcodes[64] = { /* op 0x00 (SPECIAL): indexed by the function field, bits 5-0 */ + "sll", "r%d,r%t,$%a", + "special01", mipscoxxx, + "srl", "r%d,r%t,$%a", + "sra", "r%d,r%t,$%a", + "sllv", "r%d,r%t,r%s", + "special05", mipscoxxx, + "srlv", "r%d,r%t,r%s", + "srav", "r%d,r%t,r%s", + "jr", "r%s", + "jalr", "r%d,r%s", + "special0A", mipscoxxx, + "special0B", mipscoxxx, + "syscall", "", + "break", "", + "special0E", mipscoxxx, + "sync", "", + "mfhi", "r%d", + "mthi", "r%s", + "mflo", "r%d", + "mtlo", "r%s", + "special14", mipscoxxx, + "special15", mipscoxxx, + "special16", mipscoxxx, + "special17", mipscoxxx, + "mult", mipscorsrt, + "multu", mipscorsrt, + "div", mipscorsrt, + "divu", mipscorsrt, + "special1C", mipscoxxx, + "special1D", mipscoxxx, + "special1E", mipscoxxx, + "special1F", mipscoxxx, + "add", mipscoalu3op, + "addu", mipscoalu3op, + "sub", mipscoalu3op, + "subu", mipscoalu3op, + "and", mipscoalu3op, + "or", mipscoalu3op, + "xor", mipscoalu3op, + "nor", mipscoalu3op, + "special28", mipscoxxx, + "special29", mipscoxxx, + "slt", mipscoalu3op, + "sltu", mipscoalu3op, + "special2C", mipscoxxx, + "special2D", mipscoxxx, + "special2E", mipscoxxx, + "special2F", mipscoxxx, + "tge", mipscorsrt, + "tgeu", mipscorsrt, + "tlt", mipscorsrt, + "tltu", mipscorsrt, + "teq", mipscorsrt, + "special35", mipscoxxx, + "tne", mipscorsrt, + "special37", mipscoxxx, + "special38", mipscoxxx, + "special39", mipscoxxx, + "special3A", mipscoxxx, + "special3B", mipscoxxx, + 
"special3C", mipscoxxx, + "special3D", mipscoxxx, + "special3E", mipscoxxx, + "special3F", mipscoxxx, +}; + +static Opcode ropcodes[32] = { /* op 0x01 (REGIMM): indexed by the rt field, bits 20-16 */ + "bltz", mipscoboc0, + "bgez", mipscoboc0, + "bltzl", mipscoboc0, + "bgezl", mipscoboc0, + "regimm04", mipscoxxx, + "regimm05", mipscoxxx, + "regimm06", mipscoxxx, + "regimm07", mipscoxxx, + "tgei", mipscorsi, + "tgeiu", mipscorsi, + "tlti", mipscorsi, + "tltiu", mipscorsi, + "teqi", mipscorsi, + "regimm0D", mipscoxxx, + "tnei", mipscorsi, + "regimm0F", mipscoxxx, + "bltzal", mipscoboc0, + "bgezal", mipscoboc0, + "bltzall", mipscoboc0, + "bgezall", mipscoboc0, + "regimm14", mipscoxxx, + "regimm15", mipscoxxx, + "regimm16", mipscoxxx, + "regimm17", mipscoxxx, + "regimm18", mipscoxxx, + "regimm19", mipscoxxx, + "regimm1A", mipscoxxx, + "regimm1B", mipscoxxx, + "regimm1C", mipscoxxx, + "regimm1D", mipscoxxx, + "regimm1E", mipscoxxx, + "regimm1F", mipscoxxx, +}; + +static Opcode fopcodes[64] = { /* op 0x11 (COP1) with rs bit 0x10 set: indexed by the function field; %f expands to the letter fsub[] selects from rs */ + "add.%f", mipscofp3, + "sub.%f", mipscofp3, + "mul.%f", mipscofp3, + "div.%f", mipscofp3, + "sqrt.%f", mipscofp2, + "abs.%f", mipscofp2, + "mov.%f", mipscofp2, + "neg.%f", mipscofp2, + "finstr08", mipscoxxx, + "finstr09", mipscoxxx, + "finstr0A", mipscoxxx, + "finstr0B", mipscoxxx, + "round.w.%f", mipscofp2, + "trunc.w.%f", mipscofp2, + "ceil.w.%f", mipscofp2, + "floor.w.%f", mipscofp2, + "finstr10", mipscoxxx, + "finstr11", mipscoxxx, + "finstr12", mipscoxxx, + "finstr13", mipscoxxx, + "finstr14", mipscoxxx, + "finstr15", mipscoxxx, + "finstr16", mipscoxxx, + "finstr17", mipscoxxx, + "finstr18", mipscoxxx, + "finstr19", mipscoxxx, + "finstr1A", mipscoxxx, + "finstr1B", mipscoxxx, + "finstr1C", mipscoxxx, + "finstr1D", mipscoxxx, + "finstr1E", mipscoxxx, + "finstr1F", mipscoxxx, + "cvt.s.%f", mipscofp2, + "cvt.d.%f", mipscofp2, + "cvt.e.%f", mipscofp2, + "cvt.q.%f", mipscofp2, + "cvt.w.%f", mipscofp2, + "finstr25", mipscoxxx, + "finstr26", mipscoxxx, + "finstr27", mipscoxxx, + "finstr28", mipscoxxx, + "finstr29", mipscoxxx, + "finstr2A", 
mipscoxxx, + "finstr2B", mipscoxxx, + "finstr2C", mipscoxxx, + "finstr2D", mipscoxxx, + "finstr2E", mipscoxxx, + "finstr2F", mipscoxxx, + "c.f.%f", mipscofpc, + "c.un.%f", mipscofpc, + "c.eq.%f", mipscofpc, + "c.ueq.%f", mipscofpc, + "c.olt.%f", mipscofpc, + "c.ult.%f", mipscofpc, + "c.ole.%f", mipscofpc, + "c.ule.%f", mipscofpc, + "c.sf.%f", mipscofpc, + "c.ngle.%f", mipscofpc, + "c.seq.%f", mipscofpc, + "c.ngl.%f", mipscofpc, + "c.lt.%f", mipscofpc, + "c.nge.%f", mipscofpc, + "c.le.%f", mipscofpc, + "c.ngt.%f", mipscofpc, +}; + +static char fsub[16] = { + 's', 'd', 'e', 'q', 'w', '?', '?', '?', + '?', '?', '?', '?', '?', '?', '?', '?' +}; + + +static int +mkinstr(Instr *i, Map *map, uvlong pc) +{ + ulong w; + + if (get4(map, pc, &w) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + i->addr = pc; + i->op = (w >> 26) & 0x3F; + i->rs = (w >> 21) & 0x1F; + i->rt = (w >> 16) & 0x1F; + i->rd = (w >> 11) & 0x1F; + i->sa = (w >> 6) & 0x1F; + i->function = w & 0x3F; + i->immediate = w & 0x0000FFFF; + if (i->immediate & 0x8000) + i->immediate |= ~0x0000FFFF; + i->cofun = w & 0x01FFFFFF; + i->target = w & 0x03FFFFFF; + i->w0 = w; + return 1; +} + +#pragma varargck argpos bprint 2 + +static void +bprint(Instr *i, char *fmt, ...) 
+{ + va_list arg; + + va_start(arg, fmt); + i->curr = vseprint(i->curr, i->end, fmt, arg); + va_end(arg); +} + +/* + * Append the mnemonic (itself expanded as a template) and then the operand + * template f to the buffer described by i->curr/i->end; a tab precedes each + * template. Escapes: %s %t %d %a print the rs, rt, rd and sa fields, %l a + * load/store address, %i and %u immediates, %j and %b jump/branch targets, + * %c cofun, %w the raw word, %f the letter fsub[] selects from rs. + * The buffer is left NUL-terminated; i->end must therefore be a writable + * byte, which _mipscoinst guarantees by setting end to buf+n-1. + */ +static void +format(char *mnemonic, Instr *i, char *f) +{ + if (mnemonic) + format(0, i, mnemonic); + if (f == 0) + return; + if (i->curr < i->end) + *i->curr++ = '\t'; + for ( ; *f && i->curr < i->end; f++) { + if (*f != '%') { + *i->curr++ = *f; + continue; + } + switch (*++f) { + + case 's': + bprint(i, "%d", i->rs); + break; + + case 't': + bprint(i, "%d", i->rt); + break; + + case 'd': + bprint(i, "%d", i->rd); + break; + + case 'a': + bprint(i, "%d", i->sa); + break; + + case 'l': + if (i->rs == 30) { + i->curr += symoff(i->curr, i->end-i->curr, i->immediate+mach->sb, CANY); + bprint(i, "(SB)"); + } else + bprint(i, "%lx(r%d)", i->immediate, i->rs); + break; + + case 'i': + bprint(i, "$%lx", i->immediate); + break; + + case 'u': + *i->curr++ = '$'; + i->curr += symoff(i->curr, i->end-i->curr, i->immediate, CANY); + bprint(i, "(SB)"); + break; + + case 'j': + i->curr += symoff(i->curr, i->end-i->curr, + (i->target<<2)|(i->addr & 0xF0000000), CANY); + bprint(i, "(SB)"); + break; + + case 'b': + i->curr += symoff(i->curr, i->end-i->curr, + (i->immediate<<2)+i->addr+4, CANY); + break; + + case 'c': + bprint(i, "%lux", i->cofun); + break; + + case 'w': + bprint(i, "[%lux]", i->w0); + break; + + case 'f': + *i->curr++ = fsub[i->rs & 0x0F]; + break; + + case '\0': + *i->curr++ = '%'; + *i->curr = 0; /* template ended on a bare '%': terminate before leaving */ + return; + + default: + bprint(i, "%%%c", *f); + break; + } + } + *i->curr = 0; /* raw character stores above do not terminate the string */ +} + +static void +copz(int cop, Instr *i) +{ + char *f, *m, buf[16]; + + m = buf; + f = "%t,%d"; + switch (i->rs) { + + case 0: + sprint(buf, "mfc%d", cop); + break; + + case 2: + sprint(buf, "cfc%d", cop); + break; + + case 4: + sprint(buf, "mtc%d", cop); + break; + + case 6: + sprint(buf, "ctc%d", cop); + break; + + case 8: + f = "%b"; + switch (i->rt) { + + case 0: + sprint(buf, "bc%df", cop); + break; + + case 1: + sprint(buf, "bc%dt", cop); + break; + + case 2: + sprint(buf, "bc%dfl", cop); + break; + + 
case 3: + sprint(buf, "bc%dtl", cop); + break; + + default: + sprint(buf, "cop%d", cop); + f = mipscoxxx; + break; + } + break; + + default: + sprint(buf, "cop%d", cop); + if (i->rs & 0x10) + f = "function %c"; + else + f = mipscoxxx; + break; + } + format(m, i, f); +} + +static void +cop0(Instr *i) +{ + char *m = 0; + + if (i->rs >= 0x10) { + switch (i->cofun) { + + case 1: + m = "tlbr"; + break; + + case 2: + m = "tlbwi"; + break; + + case 6: + m = "tlbwr"; + break; + + case 8: + m = "tlbp"; + break; + + case 16: + m = "rfe"; + break; + + case 32: + m = "eret"; + break; + } + if (m) { + format(m, i, 0); + if (i->curr < i->end) + *i->curr++ = 0; + return; + } + } + copz(0, i); +} + +int +_mipscoinst(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + Opcode *o; + uchar op; + + i.curr = buf; + i.end = buf+n-1; + if (mkinstr(&i, map, pc) < 0) + return -1; + switch (i.op) { + + case 0x00: /* SPECIAL */ + o = sopcodes; + op = i.function; + break; + + case 0x01: /* REGIMM */ + o = ropcodes; + op = i.rt; + break; + + case 0x10: /* COP0 */ + cop0(&i); + return 4; + + case 0x11: /* COP1 */ + if (i.rs & 0x10) { + o = fopcodes; + op = i.function; + break; + } + /*FALLTHROUGH*/ + case 0x12: /* COP2 */ + case 0x13: /* COP3 */ + copz(i.op-0x10, &i); + return 4; + + default: + o = opcodes; + op = i.op; + break; + } + format(o[op].mnemonic, &i, o[op].mipsco); + return 4; +} diff --git a/utils/libmach/vdb.c b/utils/libmach/vdb.c new file mode 100644 index 0000000..5579897 --- /dev/null +++ b/utils/libmach/vdb.c @@ -0,0 +1,1165 @@ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +/* + * Mips-specific debugger interface + */ + +static char *mipsexcep(Map*, Rgetter); +static int mipsfoll(Map*, uvlong, Rgetter, uvlong*); +static int mipsinst(Map*, uvlong, char, char*, int); +static int mipsdas(Map*, uvlong, char*, int); +static int mipsinstlen(Map*, uvlong); + +/* + * Debugger interface + */ +Machdata mipsmach = +{ + {0, 0, 0, 0xD}, /* break point */ + 4, /* break point 
size */ + + beswab, /* short to local byte order */ + beswal, /* long to local byte order */ + beswav, /* vlong to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + mipsexcep, /* print exception */ + 0, /* breakpoint fixup */ + beieeesftos, /* single precision float printer */ + beieeedftos, /* double precision float printer */ + mipsfoll, /* following addresses */ + mipsinst, /* print instruction */ + mipsdas, /* disassembler */ + mipsinstlen, /* instruction size */ +}; + +Machdata mipsmachle = +{ + {0, 0, 0, 0xD}, /* break point */ + 4, /* break point size */ + + leswab, /* short to local byte order */ + leswal, /* long to local byte order */ + leswav, /* vlong to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + mipsexcep, /* print exception */ + 0, /* breakpoint fixup */ + leieeesftos, /* single precision float printer */ + leieeedftos, /* double precision float printer */ + mipsfoll, /* following addresses */ + mipsinst, /* print instruction */ + mipsdas, /* disassembler */ + mipsinstlen, /* instruction size */ +}; + +/* + * mips r4k little-endian + */ +Machdata mipsmach2le = +{ + {0, 0, 0, 0xD}, /* break point */ + 4, /* break point size */ + + leswab, /* short to local byte order */ + leswal, /* long to local byte order */ + leswav, /* vlong to local byte order */ + risctrace, /* C traceback */ + riscframe, /* Frame finder */ + mipsexcep, /* print exception */ + 0, /* breakpoint fixup */ + leieeesftos, /* single precision float printer */ + leieeedftos, /* double precision float printer */ + mipsfoll, /* following addresses */ + mipsinst, /* print instruction */ + mipsdas, /* disassembler */ + mipsinstlen, /* instruction size */ +}; + +/* + * mips r4k big-endian + */ +Machdata mipsmach2be = +{ + {0, 0, 0, 0xD}, /* break point */ + 4, /* break point size */ + + beswab, /* short to local byte order */ + beswal, /* long to local byte order */ + beswav, /* vlong to local byte order */ + 
risctrace, /* C traceback */ + riscframe, /* Frame finder */ + mipsexcep, /* print exception */ + 0, /* breakpoint fixup */ + beieeesftos, /* single precision float printer */ + beieeedftos, /* double precision float printer */ + mipsfoll, /* following addresses */ + mipsinst, /* print instruction */ + mipsdas, /* disassembler */ + mipsinstlen, /* instruction size */ +}; + + +static char *excname[] = +{ + "external interrupt", + "TLB modification", + "TLB miss (load or fetch)", + "TLB miss (store)", + "address error (load or fetch)", + "address error (store)", + "bus error (fetch)", + "bus error (data load or store)", + "system call", + "breakpoint", + "reserved instruction", + "coprocessor unusable", + "arithmetic overflow", + "undefined 13", + "undefined 14", + "system call", + /* the following is made up */ + "floating point exception" /* FPEXC */ +}; + +static char* +mipsexcep(Map *map, Rgetter rget) +{ + int e; + long c; + + c = (*rget)(map, "CAUSE"); + if(c & 0x00002000) /* INTR3 */ + e = 16; /* Floating point exception */ + else + e = (c>>2)&0x0F; + return excname[e]; +} + + /* mips disassembler and related functions */ + +static char FRAMENAME[] = ".frame"; + +typedef struct { + uvlong addr; + uchar op; /* bits 31-26 */ + uchar rs; /* bits 25-21 */ + uchar rt; /* bits 20-16 */ + uchar rd; /* bits 15-11 */ + uchar sa; /* bits 10-6 */ + uchar function; /* bits 5-0 */ + long immediate; /* bits 15-0 */ + ulong cofun; /* bits 24-0 */ + ulong target; /* bits 25-0 */ + long w0; + long w1; + int size; /* instruction size */ + char *curr; /* fill point in buffer */ + char *end; /* end of buffer */ + char *err; /* error message */ +} Instr; + +static Map *mymap; + +static int +decode(uvlong pc, Instr *i) +{ + ulong w; + + if (get4(mymap, pc, &w) < 0) { + werrstr("can't read instruction: %r"); + return -1; + } + + i->addr = pc; + i->size = 1; + i->op = (w >> 26) & 0x3F; + i->rs = (w >> 21) & 0x1F; + i->rt = (w >> 16) & 0x1F; + i->rd = (w >> 11) & 0x1F; + i->sa = (w >> 
6) & 0x1F; + i->function = w & 0x3F; + i->immediate = w & 0x0000FFFF; + if (i->immediate & 0x8000) + i->immediate |= ~0x0000FFFF; + i->cofun = w & 0x01FFFFFF; + i->target = w & 0x03FFFFFF; + i->w0 = w; + return 1; +} + +static int +mkinstr(uvlong pc, Instr *i) +{ + Instr x; + + if (decode(pc, i) < 0) + return -1; + /* + * if it's a LUI followed by an ORI, + * it's an immediate load of a large constant. + * fix the LUI immediate in any case. + */ + if (i->op == 0x0F) { + if (decode(pc+4, &x) < 0) + return 0; + i->immediate <<= 16; + if (x.op == 0x0D && x.rs == x.rt && x.rt == i->rt) { + i->immediate |= (x.immediate & 0xFFFF); + i->w1 = x.w0; + i->size++; + return 1; + } + } + /* + * if it's a LWC1 followed by another LWC1 + * into an adjacent register, it's a load of + * a floating point double. + */ + else if (i->op == 0x31 && (i->rt & 0x01)) { + if (decode(pc+4, &x) < 0) + return 0; + if (x.op == 0x31 && x.rt == (i->rt - 1) && x.rs == i->rs) { + i->rt -= 1; + i->w1 = x.w0; + i->size++; + return 1; + } + } + /* + * similarly for double stores + */ + else if (i->op == 0x39 && (i->rt & 0x01)) { + if (decode(pc+4, &x) < 0) + return 0; + if (x.op == 0x39 && x.rt == (i->rt - 1) && x.rs == i->rs) { + i->rt -= 1; + i->w1 = x.w0; + i->size++; + } + } + return 1; +} + +#pragma varargck argpos bprint 2 + +static void +bprint(Instr *i, char *fmt, ...) 
+{ + va_list arg; + + va_start(arg, fmt); + i->curr = vseprint(i->curr, i->end, fmt, arg); + va_end(arg); +} + +typedef struct Opcode Opcode; + +struct Opcode { + char *mnemonic; + void (*f)(Opcode *, Instr *); + char *ken; +}; + +static void format(char *, Instr *, char *); + +static void +branch(Opcode *o, Instr *i) +{ + if (i->rs == 0 && i->rt == 0) + format("JMP", i, "%b"); + else if (i->rs == 0) + format(o->mnemonic, i, "R%t,%b"); + else if (i->rt < 2) + format(o->mnemonic, i, "R%s,%b"); + else + format(o->mnemonic, i, "R%s,R%t,%b"); +} + +static void +addi(Opcode *o, Instr *i) +{ + if (i->rs == i->rt) + format(o->mnemonic, i, "%i,R%t"); + else if (i->rs == 0) + format("MOVW", i, "%i,R%t"); + else if (i->rs == 30) { + bprint(i, "MOVW\t$"); + i->curr += symoff(i->curr, i->end-i->curr, + i->immediate+mach->sb, CANY); + bprint(i, "(SB),R%d", i->rt); + } + else + format(o->mnemonic, i, o->ken); +} + +static void +andi(Opcode *o, Instr *i) +{ + if (i->rs == i->rt) + format(o->mnemonic, i, "%i,R%t"); + else + format(o->mnemonic, i, o->ken); +} + +static int +plocal(Instr *i, char *m, char r, int store) +{ + int offset; + char *reg; + Symbol s; + + if (!findsym(i->addr, CTEXT, &s) || !findlocal(&s, FRAMENAME, &s)) + return 0; + if (s.value > i->immediate) { + if(!getauto(&s, s.value-i->immediate, CAUTO, &s)) + return 0; + reg = "(SP)"; + offset = i->immediate; + } else { + offset = i->immediate-s.value; + if (!getauto(&s, offset-4, CPARAM, &s)) + return 0; + reg = "(FP)"; + } + if (store) + bprint(i, "%s\t%c%d,%s+%d%s", m, r, i->rt, s.name, offset, reg); + else + bprint(i, "%s\t%s+%d%s,%c%d", m, s.name, offset, reg, r, i->rt); + return 1; +} + +static void +lw(Opcode *o, Instr *i, char r) +{ + char *m; + + if (r == 'F') { + if (i->size == 2) + m = "MOVD"; + else + m = "MOVF"; + } + else + m = o->mnemonic; + if (i->rs == 29 && plocal(i, m, r, 0)) + return; + + if (i->rs == 30 && mach->sb) { + bprint(i, "%s\t", m); + i->curr += symoff(i->curr, i->end-i->curr, 
i->immediate+mach->sb, CANY); + bprint(i, "(SB),%c%d", r, i->rt); + return; + } + if (r == 'F') + format(m, i, "%l,F%t"); + else + format(m, i, o->ken); +} + +static void +load(Opcode *o, Instr *i) +{ + lw(o, i, 'R'); +} + +static void +lwc1(Opcode *o, Instr *i) +{ + lw(o, i, 'F'); +} + +static void +sw(Opcode *o, Instr *i, char r) +{ + char *m; + + if (r == 'F') { + if (i->size == 2) + m = "MOVD"; + else + m = "MOVF"; + } + else + m = o->mnemonic; + if (i->rs == 29 && plocal(i, m, r, 1)) + return; + + if (i->rs == 30 && mach->sb) { + bprint(i, "%s\t%c%d,", m, r, i->rt); + i->curr += symoff(i->curr, i->end-i->curr, i->immediate+mach->sb, CANY); + bprint(i, "(SB)"); + return; + } + if (r == 'F') + format(m, i, "F%t,%l"); + else + format(m, i, o->ken); +} + +static void +store(Opcode *o, Instr *i) +{ + sw(o, i, 'R'); +} + +static void +swc1(Opcode *o, Instr *i) +{ + sw(o, i, 'F'); +} + +static void +sll(Opcode *o, Instr *i) +{ + if (i->w0 == 0) + bprint(i, "NOOP"); + else if (i->rd == i->rt) + format(o->mnemonic, i, "$%a,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +sl32(Opcode *o, Instr *i) +{ + i->sa += 32; + if (i->rd == i->rt) + format(o->mnemonic, i, "$%a,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +sllv(Opcode *o, Instr *i) +{ + if (i->rd == i->rt) + format(o->mnemonic, i, "R%s,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +jal(Opcode *o, Instr *i) +{ + if (i->rd == 31) + format("JAL", i, "(R%s)"); + else + format(o->mnemonic, i, o->ken); +} + +static void +add(Opcode *o, Instr *i) +{ + if (i->rd == i->rs) + format(o->mnemonic, i, "R%t,R%d"); + else if (i->rd == i->rt) + format(o->mnemonic, i, "R%s,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +sub(Opcode *o, Instr *i) +{ + if (i->rd == i->rs) + format(o->mnemonic, i, "R%t,R%d"); + else + format(o->mnemonic, i, o->ken); +} + +static void +or(Opcode *o, Instr *i) +{ + if (i->rs == 0 && i->rt == 0) + format("MOVW", i, "$0,R%d"); + 
else if (i->rs == 0) + format("MOVW", i, "R%t,R%d"); + else if (i->rt == 0) + format("MOVW", i, "R%s,R%d"); + else + add(o, i); +} + +static void +nor(Opcode *o, Instr *i) +{ + if (i->rs == 0 && i->rt == 0 && i->rd == 0) + format("NOP", i, 0); + else + add(o, i); +} + +static char mipscoload[] = "r%t,%l"; +static char mipsload[] = "%l,R%t"; +static char mipsstore[] = "R%t,%l"; +static char mipsalui[] = "%i,R%s,R%t"; +static char mipsalu3op[] = "R%t,R%s,R%d"; +static char mipsrtrs[] = "R%t,R%s"; +static char mipscorsrt[] = "r%s,r%t"; +static char mipscorsi[] = "r%s,%i"; +static char mipscoxxx[] = "%w"; +static char mipscofp3[] = "f%a,f%d,f%t"; /* fd,fs,ft */ +static char mipsfp3[] = "F%t,F%d,F%a"; +static char mipscofp2[] = "f%a,f%d"; /* fd,fs */ +static char mipsfp2[] = "F%d,F%a"; +static char mipscofpc[] = "f%d,f%t"; /* fs,ft */ +static char mipsfpc[] = "F%t,F%d"; + +static Opcode opcodes[64] = { + 0, 0, 0, + 0, 0, 0, + "JMP", 0, "%j", + "JAL", 0, "%j", + "BEQ", branch, 0, + "BNE", branch, 0, + "BLEZ", branch, 0, + "BGTZ", branch, 0, + "ADD", addi, mipsalui, + "ADDU", addi, mipsalui, + "SGT", 0, mipsalui, + "SGTU", 0, mipsalui, + "AND", andi, mipsalui, + "OR", andi, mipsalui, + "XOR", andi, mipsalui, + "MOVW", 0, "$%u,R%t", + "cop0", 0, 0, + "cop1", 0, 0, + "cop2", 0, 0, + "cop3", 0, 0, + "BEQL", branch, 0, + "BNEL", branch, 0, + "BLEZL", branch, 0, + "BGTZL", branch, 0, + "instr18", 0, mipscoxxx, + "instr19", 0, mipscoxxx, + "MOVVL", load, mipsload, + "MOVVR", load, mipsload, + "instr1C", 0, mipscoxxx, + "instr1D", 0, mipscoxxx, + "instr1E", 0, mipscoxxx, + "instr1F", 0, mipscoxxx, + "MOVB", load, mipsload, + "MOVH", load, mipsload, + "lwl", 0, mipscoload, + "MOVW", load, mipsload, + "MOVBU", load, mipsload, + "MOVHU", load, mipsload, + "lwr", 0, mipscoload, + "instr27", 0, mipscoxxx, + "MOVB", store, mipsstore, + "MOVH", store, mipsstore, + "swl", 0, mipscoload, + "MOVW", store, mipsstore, + "MOVVL", store, mipsstore, + "MOVVR", store, mipsstore, + "swr", 0, 
mipscoload, + "CACHE", 0, "%C,%l", + "ll", 0, mipscoload, + "MOVW", lwc1, mipscoload, + "lwc2", 0, mipscoload, + "lwc3", 0, mipscoload, + "instr34", 0, mipscoxxx, + "ldc1", 0, mipscoload, + "ldc2", 0, mipscoload, + "MOVV", load, mipsload, + "sc", 0, mipscoload, + "swc1", swc1, mipscoload, + "swc2", 0, mipscoload, + "swc3", 0, mipscoload, + "instr3C", 0, mipscoxxx, + "sdc1", 0, mipscoload, + "sdc2", 0, mipscoload, + "MOVV", store, mipsstore, +}; + +static Opcode sopcodes[64] = { + "SLL", sll, "$%a,R%t,R%d", + "special01", 0, mipscoxxx, + "SRL", sll, "$%a,R%t,R%d", + "SRA", sll, "$%a,R%t,R%d", + "SLL", sllv, "R%s,R%t,R%d", + "special05", 0, mipscoxxx, + "SRL", sllv, "R%s,R%t,R%d", + "SRA", sllv, "R%s,R%t,R%d", + "JMP", 0, "(R%s)", + "jal", jal, "r%d,r%s", + "special0A", 0, mipscoxxx, + "special0B", 0, mipscoxxx, + "SYSCALL", 0, 0, + "BREAK", 0, 0, + "special0E", 0, mipscoxxx, + "SYNC", 0, 0, + "MOVW", 0, "HI,R%d", + "MOVW", 0, "R%s,HI", + "MOVW", 0, "LO,R%d", + "MOVW", 0, "R%s,LO", + "SLLV", sllv, "R%s,R%t,R%d", + "special15", 0, mipscoxxx, + "SRLV", sllv, "R%s,R%t,R%d", + "SRAV", sllv, "R%s,R%t,R%d", + "MUL", 0, mipsrtrs, + "MULU", 0, mipsrtrs, + "DIV", 0, mipsrtrs, + "DIVU", 0, mipsrtrs, + "special1C", 0, mipscoxxx, + "special1D", 0, mipscoxxx, + "DDIV", 0, "R%s,R%t", + "special1F", 0, mipscoxxx, + "ADD", add, mipsalu3op, + "ADDU", add, mipsalu3op, + "SUB", sub, mipsalu3op, + "SUBU", sub, mipsalu3op, + "AND", add, mipsalu3op, + "OR", or, mipsalu3op, + "XOR", add, mipsalu3op, + "NOR", nor, mipsalu3op, + "special28", 0, mipscoxxx, + "special29", 0, mipscoxxx, + "SGT", 0, mipsalu3op, + "SGTU", 0, mipsalu3op, + "special2C", 0, mipscoxxx, + "special2D", 0, mipscoxxx, + "special2E", 0, mipscoxxx, + "DSUBU", 0, "R%s,R%t,R%d", + "tge", 0, mipscorsrt, + "tgeu", 0, mipscorsrt, + "tlt", 0, mipscorsrt, + "tltu", 0, mipscorsrt, + "teq", 0, mipscorsrt, + "special35", 0, mipscoxxx, + "tne", 0, mipscorsrt, + "special37", 0, mipscoxxx, + "SLLV", sll, "$%a,R%t,R%d", + "special39", 
0, mipscoxxx, + "SRLV", sll, "$%a,R%t,R%d", + "SRAV", sll, "$%a,R%t,R%d", + "SLLV", sl32, "$%a,R%t,R%d", + "special3D", 0, mipscoxxx, + "SRLV", sl32, "$%a,R%t,R%d", + "SRAV", sl32, "$%a,R%t,R%d", +}; + +static Opcode ropcodes[32] = { + "BLTZ", branch, 0, + "BGEZ", branch, 0, + "BLTZL", branch, 0, + "BGEZL", branch, 0, + "regimm04", 0, mipscoxxx, + "regimm05", 0, mipscoxxx, + "regimm06", 0, mipscoxxx, + "regimm07", 0, mipscoxxx, + "tgei", 0, mipscorsi, + "tgeiu", 0, mipscorsi, + "tlti", 0, mipscorsi, + "tltiu", 0, mipscorsi, + "teqi", 0, mipscorsi, + "regimm0D", 0, mipscoxxx, + "tnei", 0, mipscorsi, + "regimm0F", 0, mipscoxxx, + "BLTZAL", branch, 0, + "BGEZAL", branch, 0, + "BLTZALL", branch, 0, + "BGEZALL", branch, 0, + "regimm14", 0, mipscoxxx, + "regimm15", 0, mipscoxxx, + "regimm16", 0, mipscoxxx, + "regimm17", 0, mipscoxxx, + "regimm18", 0, mipscoxxx, + "regimm19", 0, mipscoxxx, + "regimm1A", 0, mipscoxxx, + "regimm1B", 0, mipscoxxx, + "regimm1C", 0, mipscoxxx, + "regimm1D", 0, mipscoxxx, + "regimm1E", 0, mipscoxxx, + "regimm1F", 0, mipscoxxx, +}; + +static Opcode fopcodes[64] = { + "ADD%f", 0, mipsfp3, + "SUB%f", 0, mipsfp3, + "MUL%f", 0, mipsfp3, + "DIV%f", 0, mipsfp3, + "sqrt.%f", 0, mipscofp2, + "ABS%f", 0, mipsfp2, + "MOV%f", 0, mipsfp2, + "NEG%f", 0, mipsfp2, + "finstr08", 0, mipscoxxx, + "finstr09", 0, mipscoxxx, + "finstr0A", 0, mipscoxxx, + "finstr0B", 0, mipscoxxx, + "round.w.%f", 0, mipscofp2, + "trunc.w%f", 0, mipscofp2, + "ceil.w%f", 0, mipscofp2, + "floor.w%f", 0, mipscofp2, + "finstr10", 0, mipscoxxx, + "finstr11", 0, mipscoxxx, + "finstr12", 0, mipscoxxx, + "finstr13", 0, mipscoxxx, + "finstr14", 0, mipscoxxx, + "finstr15", 0, mipscoxxx, + "finstr16", 0, mipscoxxx, + "finstr17", 0, mipscoxxx, + "finstr18", 0, mipscoxxx, + "finstr19", 0, mipscoxxx, + "finstr1A", 0, mipscoxxx, + "finstr1B", 0, mipscoxxx, + "finstr1C", 0, mipscoxxx, + "finstr1D", 0, mipscoxxx, + "finstr1E", 0, mipscoxxx, + "finstr1F", 0, mipscoxxx, + "cvt.s.%f", 0, mipscofp2, + 
"cvt.d.%f", 0, mipscofp2, + "cvt.e.%f", 0, mipscofp2, + "cvt.q.%f", 0, mipscofp2, + "cvt.w.%f", 0, mipscofp2, + "finstr25", 0, mipscoxxx, + "finstr26", 0, mipscoxxx, + "finstr27", 0, mipscoxxx, + "finstr28", 0, mipscoxxx, + "finstr29", 0, mipscoxxx, + "finstr2A", 0, mipscoxxx, + "finstr2B", 0, mipscoxxx, + "finstr2C", 0, mipscoxxx, + "finstr2D", 0, mipscoxxx, + "finstr2E", 0, mipscoxxx, + "finstr2F", 0, mipscoxxx, + "c.f.%f", 0, mipscofpc, + "c.un.%f", 0, mipscofpc, + "CMPEQ%f", 0, mipsfpc, + "c.ueq.%f", 0, mipscofpc, + "c.olt.%f", 0, mipscofpc, + "c.ult.%f", 0, mipscofpc, + "c.ole.%f", 0, mipscofpc, + "c.ule.%f", 0, mipscofpc, + "c.sf.%f", 0, mipscofpc, + "c.ngle.%f", 0, mipscofpc, + "c.seq.%f", 0, mipscofpc, + "c.ngl.%f", 0, mipscofpc, + "CMPGT%f", 0, mipsfpc, + "c.nge.%f", 0, mipscofpc, + "CMPGE%f", 0, mipsfpc, + "c.ngt.%f", 0, mipscofpc, +}; + +static char *cop0regs[32] = { + "INDEX", "RANDOM", "TLBPHYS", "EntryLo0", + "CONTEXT", "PageMask", "Wired", "Error", + "BADVADDR", "Count", "TLBVIRT", "Compare", + "STATUS", "CAUSE", "EPC", "PRID", + "Config", "LLadr", "WatchLo", "WatchHi", + "20", "21", "22", "23", + "24", "25", "26", "CacheErr", + "TagLo", "TagHi", "ErrorEPC", "31" +}; + +static char fsub[16] = { + 'F', 'D', 'e', 'q', 'W', '?', '?', '?', + '?', '?', '?', '?', '?', '?', '?', '?' 
+}; + +static char *cacheps[] = { + "I", "D", "SI", "SD" +}; + +static char *cacheop[] = { + "IWBI", "ILT", "IST", "CDE", "HI", "HWBI", "HWB", "HSV" +}; + +static void +format(char *mnemonic, Instr *i, char *f) +{ + if (mnemonic) + format(0, i, mnemonic); + if (f == 0) + return; + if (mnemonic) + if (i->curr < i->end) + *i->curr++ = '\t'; + for ( ; *f && i->curr < i->end; f++) { + if (*f != '%') { + *i->curr++ = *f; + continue; + } + switch (*++f) { + + case 's': + bprint(i, "%d", i->rs); + break; + + case 't': + bprint(i, "%d", i->rt); + break; + + case 'd': + bprint(i, "%d", i->rd); + break; + + case 'a': + bprint(i, "%d", i->sa); + break; + + case 'l': + bprint(i, "%lx(R%d)",i->immediate, i->rs); + break; + + case 'i': + bprint(i, "$%lx", i->immediate); + break; + + case 'u': + i->curr += symoff(i->curr, i->end-i->curr, i->immediate, CANY); + bprint(i, "(SB)"); + break; + + case 'j': + i->curr += symoff(i->curr, i->end-i->curr, + (i->target<<2)|(i->addr & 0xF0000000), CANY); + bprint(i, "(SB)"); + break; + + case 'b': + i->curr += symoff(i->curr, i->end-i->curr, + (i->immediate<<2)+i->addr+4, CANY); + break; + + case 'c': + bprint(i, "$%lx", i->cofun); + break; + + case 'w': + bprint(i, "[%lux]", i->w0); + break; + + case 'm': + bprint(i, "M(%s)", cop0regs[i->rd]); + break; + + case 'f': + *i->curr++ = fsub[i->rs & 0x0F]; + break; + + case 'C': + bprint(i, "%s%s", cacheps[i->rt & 3], cacheop[(i->rt>>2) & 7]); + break; + + case '\0': + *i->curr++ = '%'; + return; + + default: + bprint(i, "%%%c", *f); + break; + } + } + *i->curr = 0; +} + +static void +copz(int cop, Instr *i) +{ + char *f, *m, buf[16]; + + m = buf; + f = "%t,%d"; + switch (i->rs) { + + case 0: + sprint(buf, "mfc%d", cop); + break; + + case 2: + sprint(buf, "cfc%d", cop); + break; + + case 4: + sprint(buf, "mtc%d", cop); + break; + + case 6: + sprint(buf, "ctc%d", cop); + break; + + case 8: + f = "%b"; + switch (i->rt) { + + case 0: + sprint(buf, "bc%df", cop); + break; + + case 1: + sprint(buf, 
"bc%dt", cop); + break; + + case 2: + sprint(buf, "bc%dfl", cop); + break; + + case 3: + sprint(buf, "bc%dtl", cop); + break; + + default: + sprint(buf, "cop%d", cop); + f = mipscoxxx; + break; + } + break; + + default: + sprint(buf, "cop%d", cop); + if (i->rs & 0x10) + f = "function %c"; + else + f = mipscoxxx; + break; + } + format(m, i, f); +} + +static void +cop0(Instr *i) +{ + char *m = 0; + + if (i->rs < 8) { + switch (i->rs) { + + case 0: + case 1: + format("MOVW", i, "%m,R%t"); + return; + + case 4: + case 5: + format("MOVW", i, "R%t,%m"); + return; + } + } + else if (i->rs >= 0x10) { + switch (i->cofun) { + + case 1: + m = "TLBR"; + break; + + case 2: + m = "TLBWI"; + break; + + case 6: + m = "TLBWR"; + break; + + case 8: + m = "TLBP"; + break; + + case 16: + m = "RFE"; + break; + + case 32: + m = "ERET"; + break; + } + if (m) { + format(m, i, 0); + return; + } + } + copz(0, i); +} + +static void +cop1(Instr *i) +{ + char *m = "MOVW"; + + switch (i->rs) { + + case 0: + format(m, i, "F%d,R%t"); + return; + + case 2: + format(m, i, "FCR%d,R%t"); + return; + + case 4: + format(m, i, "R%t,F%d"); + return; + + case 6: + format(m, i, "R%t,FCR%d"); + return; + + case 8: + switch (i->rt) { + + case 0: + format("BFPF", i, "%b"); + return; + + case 1: + format("BFPT", i, "%b"); + return; + } + break; + } + copz(1, i); +} + +static int +printins(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + Opcode *o; + uchar op; + + i.curr = buf; + i.end = buf+n-1; + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + switch (i.op) { + + case 0x00: /* SPECIAL */ + o = sopcodes; + op = i.function; + break; + + case 0x01: /* REGIMM */ + o = ropcodes; + op = i.rt; + break; + + case 0x10: /* COP0 */ + cop0(&i); + return i.size*4; + + case 0x11: /* COP1 */ + if (i.rs & 0x10) { + o = fopcodes; + op = i.function; + break; + } + cop1(&i); + return i.size*4; + + case 0x12: /* COP2 */ + case 0x13: /* COP3 */ + copz(i.op-0x10, &i); + return i.size*4; + + default: + o = opcodes; + 
op = i.op; + break; + } + if (o[op].f) + (*o[op].f)(&o[op], &i); + else + format(o[op].mnemonic, &i, o[op].ken); + return i.size*4; +} + +extern int _mipscoinst(Map *, uvlong, char*, int); + + /* modifier 'I' toggles the default disassembler type */ +static int +mipsinst(Map *map, uvlong pc, char modifier, char *buf, int n) +{ + if ((asstype == AMIPSCO && modifier == 'i') + || (asstype == AMIPS && modifier == 'I')) + return _mipscoinst(map, pc, buf, n); + else + return printins(map, pc, buf, n); +} + +static int +mipsdas(Map *map, uvlong pc, char *buf, int n) +{ + Instr i; + + i.curr = buf; + i.end = buf+n; + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + if (i.end-i.curr > 8) + i.curr = _hexify(buf, i.w0, 7); + if (i.size == 2 && i.end-i.curr > 9) { + *i.curr++ = ' '; + i.curr = _hexify(i.curr, i.w1, 7); + } + *i.curr = 0; + return i.size*4; +} + +static int +mipsinstlen(Map *map, uvlong pc) +{ + Instr i; + + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + return i.size*4; +} + +static int +mipsfoll(Map *map, uvlong pc, Rgetter rget, uvlong *foll) +{ + ulong w, l; + char buf[8]; + Instr i; + + mymap = map; + if (mkinstr(pc, &i) < 0) + return -1; + w = i.w0; + if((w&0xF3600000) == 0x41000000){ /* branch on coprocessor */ + Conditional: + foll[0] = pc+8; + l = ((w&0xFFFF)<<2); + if(w & 0x8000) + l |= 0xFFFC0000; + foll[1] = pc+4 + l; + return 2; + } + + l = (w&0xFC000000)>>26; + switch(l){ + case 0: /* SPECIAL */ + if((w&0x3E) == 0x08){ /* JR, JALR */ + sprint(buf, "R%ld", (w>>21)&0x1F); + foll[0] = (*rget)(map, buf); + return 1; + } + foll[0] = pc+i.size*4; + return 1; + case 0x30: /* Load-Linked followed by NOP, STC */ + foll[0] = pc+12; + return 1; + case 1: /* BCOND */ + case 4: /* BEQ */ + case 20: /* BEQL */ + case 5: /* BNE */ + case 21: /* BNEL */ + case 6: /* BLEZ */ + case 22: /* BLEZL */ + case 7: /* BGTZ */ + case 23: /* BGTZL */ + goto Conditional; + case 2: /* J */ + case 3: /* JAL */ + foll[0] = (pc&0xF0000000) | ((w&0x03FFFFFF)<<2); + 
return 1; + } + + foll[0] = pc+i.size*4; + return 1; +} diff --git a/utils/libmach/vobj.c b/utils/libmach/vobj.c new file mode 100644 index 0000000..3deadb5 --- /dev/null +++ b/utils/libmach/vobj.c @@ -0,0 +1,133 @@ +/* + * vobj.c - identify and parse a mips object file + */ +#include <lib9.h> +#include <bio.h> +#include "mach.h" +#include "vc/v.out.h" +#include "obj.h" + +typedef struct Addr Addr; +struct Addr +{ + char type; + char sym; + char name; +}; +static Addr addr(Biobuf*); +static char type2char(int); +static void skip(Biobuf*, int); + +int +_isv(char *s) +{ + return s[0] == ANAME /* ANAME */ + && s[1] == D_FILE /* type */ + && s[2] == 1 /* sym */ + && s[3] == '<'; /* name of file */ +} + +int +_readv(Biobuf *bp, Prog *p) +{ + int as, n; + Addr a; + + as = Bgetc(bp); /* as */ + if(as < 0) + return 0; + p->kind = aNone; + p->sig = 0; + if(as == ANAME || as == ASIGNAME){ + if(as == ASIGNAME){ + Bread(bp, &p->sig, 4); + p->sig = leswal(p->sig); + } + p->kind = aName; + p->type = type2char(Bgetc(bp)); /* type */ + p->sym = Bgetc(bp); /* sym */ + n = 0; + for(;;) { + as = Bgetc(bp); + if(as < 0) + return 0; + n++; + if(as == 0) + break; + } + p->id = malloc(n); + if(p->id == 0) + return 0; + Bseek(bp, -n, 1); + if(Bread(bp, p->id, n) != n) + return 0; + return 1; + } + if(as == ATEXT) + p->kind = aText; + else if(as == AGLOBL) + p->kind = aData; + skip(bp, 5); /* reg(1), lineno(4) */ + a = addr(bp); + addr(bp); + if(a.type != D_OREG || a.name != D_STATIC && a.name != D_EXTERN) + p->kind = aNone; + p->sym = a.sym; + return 1; +} + +static Addr +addr(Biobuf *bp) +{ + Addr a; + long off; + + a.type = Bgetc(bp); /* a.type */ + skip(bp,1); /* reg */ + a.sym = Bgetc(bp); /* sym index */ + a.name = Bgetc(bp); /* sym type */ + switch(a.type){ + default: + case D_NONE: case D_REG: case D_FREG: case D_MREG: + case D_FCREG: case D_LO: case D_HI: + break; + case D_OREG: + case D_CONST: + case D_BRANCH: + off = Bgetc(bp); + off |= Bgetc(bp) << 8; + off |= Bgetc(bp) << 16; 
+ off |= Bgetc(bp) << 24; + if(off < 0) + off = -off; + if(a.sym && (a.name==D_PARAM || a.name==D_AUTO)) + _offset(a.sym, off); + break; + case D_SCONST: + skip(bp, NSNAME); + break; + case D_FCONST: + skip(bp, 8); + break; + } + return a; +} + +static char +type2char(int t) +{ + switch(t){ + case D_EXTERN: return 'U'; + case D_STATIC: return 'b'; + case D_AUTO: return 'a'; + case D_PARAM: return 'p'; + default: return UNKNOWN; + } +} + +static void +skip(Biobuf *bp, int n) +{ + while (n-- > 0) + Bgetc(bp); +} |
