aboutsummaryrefslogtreecommitdiff
path: root/lib/transform-dis-arm-multi.inc.h
diff options
context:
space:
mode:
Diffstat (limited to 'lib/transform-dis-arm-multi.inc.h')
-rw-r--r--lib/transform-dis-arm-multi.inc.h158
1 files changed, 158 insertions, 0 deletions
diff --git a/lib/transform-dis-arm-multi.inc.h b/lib/transform-dis-arm-multi.inc.h
new file mode 100644
index 0000000..3c99911
--- /dev/null
+++ b/lib/transform-dis-arm-multi.inc.h
@@ -0,0 +1,158 @@
+static inline void PUSHone(struct transform_dis_ctx *ctx, int Rt) {
+ if (ctx->pc_low_bit)
+ op32(ctx, 0x0d04f84d | Rt << 28);
+ else
+ op32(ctx, 0xe52d0004 | Rt << 12);
+
+}
+
+static inline void POPone(struct transform_dis_ctx *ctx, int Rt) {
+ if (ctx->pc_low_bit)
+ op32(ctx, 0x0b04f85d | Rt << 28);
+ else
+ op32(ctx, 0xe49d0004 | Rt << 12);
+}
+
+static inline void POPmulti(struct transform_dis_ctx *ctx, uint16_t mask) {
+ if (ctx->pc_low_bit)
+ op32(ctx, 0x0000e8bd | mask << 16);
+ else
+ op32(ctx, 0xe8bd0000 | mask);
+}
+
+static inline void MOVW_MOVT(struct transform_dis_ctx *ctx, int Rd, uint32_t val) {
+ uint16_t hi = val >> 16, lo = (uint16_t) val;
+ if (ctx->pc_low_bit) {
+ op32(ctx, 0x0000f240 | Rd << 24 | lo >> 12 | (lo >> 11 & 1) << 10 |
+ (lo >> 8 & 7) << 28 | (lo & 0xff) << 16);
+ op32(ctx, 0x0000f2c0 | Rd << 24 | hi >> 12 | (hi >> 11 & 1) << 10 |
+ (hi >> 8 & 7) << 28 | (hi & 0xff) << 16);
+
+ } else {
+ op32(ctx, 0xe3000000 | Rd << 12 | (lo >> 12) << 16 | (lo & 0xfff));
+ op32(ctx, 0xe3400000 | Rd << 12 | (hi >> 12) << 16 | (hi & 0xfff));
+ }
+
+}
+
+static inline void STRri(struct transform_dis_ctx *ctx, int Rt, int Rn, uint32_t off) {
+ if (ctx->pc_low_bit)
+ op32(ctx, 0x0000f8c0 | Rn | Rt << 28 | off << 16);
+ else
+ op32(ctx, 0xe4800000 | Rn << 16 | Rt << 12 | off);
+}
+
+static inline void LDRxi(struct transform_dis_ctx *ctx, int Rt, int Rn, uint32_t off,
+ enum pcrel_load_mode load_mode) {
+ if (ctx->pc_low_bit) {
+ int subop, sign;
+ switch (load_mode) {
+ case PLM_U8: subop = 0; sign = 0;
+ case PLM_S8: subop = 0; sign = 1;
+ case PLM_U16: subop = 1; sign = 0;
+ case PLM_S16: subop = 1; sign = 1;
+ case PLM_U32: subop = 2; sign = 0;
+ default: __builtin_abort();
+ }
+ op32(ctx, 0x0000f8d0 | Rn | Rt << 28 | subop << 5 | sign << 8 | off << 16);
+ } else {
+ int is_byte, subop;
+ switch (load_mode) {
+ case PLM_U8: is_byte = 1; goto type1;
+ case PLM_S8: subop = 13; goto type2;
+ case PLM_U16: subop = 11; goto type2;
+ case PLM_S16: subop = 15; goto type2;
+ case PLM_U32: is_byte = 0; goto type1;
+ type1:
+ op32(ctx, 0xe5900000 | Rn << 16 | Rt << 12 | off);
+ break;
+ type2:
+ op32(ctx, 0xe1d00000 | Rn << 16 | Rt << 12 | subop << 4 |
+ (off & 0xf) | (off & 0xf0) << 4);
+ break;
+ default:
+ __builtin_abort();
+ }
+ }
+}
+
+static NOINLINE UNUSED void transform_dis_data(struct transform_dis_ctx *ctx,
+ unsigned o0, unsigned o1, unsigned o2, unsigned o3, unsigned out_mask) {
+ /* We only care if at least one op is PC, so quickly test that. */
+ if (((o0 | o1 | o2 | o3) & 15) != 15)
+ return;
+ unsigned *newval = ctx->newval;
+ newval[0] = o0;
+ newval[1] = o1;
+ newval[2] = o2;
+ newval[3] = o3;
+
+ void **rpp = ctx->rewritten_ptr_ptr;
+
+ /* A few cases:
+ * 1. Move to PC that does not read PC. Probably fine.
+ * 2. Move to PC that does read PC, e.g. 'ldrls pc, [pc, r0, lsl #2]'.
+ * This is different from #4 mainly in that we can't need to do
+ * something like pop {temp, pc}. Not terribly plausible (only likely
+ * in non-position-independent code in ARM mode, and I can't get it to
+ * happen in the first 8 bytes then), but we may as well handle it.
+ * 3. Read of PC that does not read the register(s) it writes, e.g. adr r3,
+ * X. In this case we can use that register as a temporary.
+ * 4. Read of PC that does, or doesn't have any output register, e.g. add
+ * r3, pc. In this case we use the stack because reliably finding a
+ * free register would be work, and might not even be possible (thumb
+ * mov r9, r0; mov r12, r1; <some PC using insn(s)>)
+ * the out register is always first.
+ */
+ uint16_t in_regs = 0;
+ int out_reg = -1;
+ for (int i = 0; i < 4; i++) {
+ if (out_mask & 1 << i)
+ out_reg = i;
+ else
+ in_regs |= 1 << newval[i];
+ }
+ uint32_t pc = ctx->pc + (ctx->pc_low_bit ? 4 : 8);
+ int scratch = __builtin_ctz(~(in_regs | (1 << out_reg)));
+ if (out_reg == 15) {
+ if (in_regs & 1 << 15)
+ return; /* case 1 */
+ /* case 2 */
+ PUSHone(ctx, scratch);
+ PUSHone(ctx, scratch);
+ MOVW_MOVT(ctx, scratch, pc);
+ for (int i = 0; i < 4; i++)
+ if (newval[i] == 15)
+ newval[i] = scratch;
+ ctx->write_newop_here = *rpp; *rpp += ctx->op_size;
+ STRri(ctx, scratch, 13, 4);
+ POPmulti(ctx, 1 << scratch | 1 << 15);
+ } else {
+ if (out_reg != -1 && !(in_regs & 1 << out_reg)) {
+ /* case 3 - ignore scratch */
+ MOVW_MOVT(ctx, out_reg, pc);
+ for (int i = 1; i < 4; i++)
+ if (newval[i] == 15)
+ newval[i] = out_reg;
+ ctx->write_newop_here = *rpp; *rpp += ctx->op_size;
+ } else {
+ /* case 4 */
+ PUSHone(ctx, scratch);
+ MOVW_MOVT(ctx, scratch, pc);
+ for (int i = 1; i < 4; i++)
+ if (newval[i] == 15)
+ newval[i] = scratch;
+ ctx->write_newop_here = *rpp; *rpp += ctx->op_size;
+ POPone(ctx, 1 << scratch);
+ }
+ }
+ ctx->modify = true;
+}
+
+static NOINLINE UNUSED void transform_dis_pcrel(struct transform_dis_ctx *ctx,
+ uintptr_t dpc, unsigned reg, enum pcrel_load_mode load_mode) {
+ ctx->write_newop_here = NULL;
+ MOVW_MOVT(ctx, reg, dpc);
+ if (load_mode != PLM_ADR)
+ LDRxi(ctx, reg, reg, 0, load_mode);
+}