tcg-aarch64: Introduce tcg_out_insn_3312, _3310, _3313

Replace aarch64_ldst_op_data with AArch64LdstType, as it wasn't encoded
for the proper shift for the field and was confusing.

Merge aarch64_ldst_op_data, AArch64LdstType, and a few stray opcode bits
into a single I3312_* argument, eliminating some magic numbers from the
helper functions.

Reviewed-by: Claudio Fontana <claudio.fontana@huawei.com>
Signed-off-by: Richard Henderson <rth@twiddle.net>
This commit is contained in:
Richard Henderson 2014-03-03 17:11:49 -08:00 committed by Richard Henderson
parent dc73dfd4bc
commit 3d4299f425
1 changed files with 90 additions and 88 deletions

View File

@ -242,19 +242,12 @@ static const enum aarch64_cond_code tcg_cond_to_aarch64[] = {
[TCG_COND_LEU] = COND_LS, [TCG_COND_LEU] = COND_LS,
}; };
/* opcodes for LDR / STR instructions with base + simm9 addressing */ typedef enum {
enum aarch64_ldst_op_data { /* size of the data moved */ LDST_ST = 0, /* store */
LDST_8 = 0x38, LDST_LD = 1, /* load */
LDST_16 = 0x78, LDST_LD_S_X = 2, /* load and sign-extend into Xt */
LDST_32 = 0xb8, LDST_LD_S_W = 3, /* load and sign-extend into Wt */
LDST_64 = 0xf8, } AArch64LdstType;
};
enum aarch64_ldst_op_type { /* type of operation */
LDST_ST = 0x0, /* store */
LDST_LD = 0x4, /* load */
LDST_LD_S_X = 0x8, /* load and sign-extend into Xt */
LDST_LD_S_W = 0xc, /* load and sign-extend into Wt */
};
/* We encode the format of the insn into the beginning of the name, so that /* We encode the format of the insn into the beginning of the name, so that
we can have the preprocessor help "typecheck" the insn vs the output we can have the preprocessor help "typecheck" the insn vs the output
@ -278,6 +271,28 @@ typedef enum {
I3207_BLR = 0xd63f0000, I3207_BLR = 0xd63f0000,
I3207_RET = 0xd65f0000, I3207_RET = 0xd65f0000,
/* Load/store register. Described here as 3.3.12, but the helper
that emits them can transform to 3.3.10 or 3.3.13. */
I3312_STRB = 0x38000000 | LDST_ST << 22 | MO_8 << 30,
I3312_STRH = 0x38000000 | LDST_ST << 22 | MO_16 << 30,
I3312_STRW = 0x38000000 | LDST_ST << 22 | MO_32 << 30,
I3312_STRX = 0x38000000 | LDST_ST << 22 | MO_64 << 30,
I3312_LDRB = 0x38000000 | LDST_LD << 22 | MO_8 << 30,
I3312_LDRH = 0x38000000 | LDST_LD << 22 | MO_16 << 30,
I3312_LDRW = 0x38000000 | LDST_LD << 22 | MO_32 << 30,
I3312_LDRX = 0x38000000 | LDST_LD << 22 | MO_64 << 30,
I3312_LDRSBW = 0x38000000 | LDST_LD_S_W << 22 | MO_8 << 30,
I3312_LDRSHW = 0x38000000 | LDST_LD_S_W << 22 | MO_16 << 30,
I3312_LDRSBX = 0x38000000 | LDST_LD_S_X << 22 | MO_8 << 30,
I3312_LDRSHX = 0x38000000 | LDST_LD_S_X << 22 | MO_16 << 30,
I3312_LDRSWX = 0x38000000 | LDST_LD_S_X << 22 | MO_32 << 30,
I3312_TO_I3310 = 0x00206800,
I3312_TO_I3313 = 0x01000000,
/* Load/store register pair instructions. */ /* Load/store register pair instructions. */
I3314_LDP = 0x28400000, I3314_LDP = 0x28400000,
I3314_STP = 0x28000000, I3314_STP = 0x28000000,
@ -490,26 +505,25 @@ static void tcg_out_insn_3509(TCGContext *s, AArch64Insn insn, TCGType ext,
tcg_out32(s, insn | ext << 31 | rm << 16 | ra << 10 | rn << 5 | rd); tcg_out32(s, insn | ext << 31 | rm << 16 | ra << 10 | rn << 5 | rd);
} }
static void tcg_out_insn_3310(TCGContext *s, AArch64Insn insn,
static inline void tcg_out_ldst_9(TCGContext *s, TCGReg rd, TCGReg base, TCGReg regoff)
enum aarch64_ldst_op_data op_data,
enum aarch64_ldst_op_type op_type,
TCGReg rd, TCGReg rn, intptr_t offset)
{ {
/* use LDUR with BASE register with 9bit signed unscaled offset */ /* Note the AArch64Insn constants above are for C3.3.12. Adjust. */
tcg_out32(s, op_data << 24 | op_type << 20 tcg_out32(s, insn | I3312_TO_I3310 | regoff << 16 | base << 5 | rd);
| (offset & 0x1ff) << 12 | rn << 5 | rd);
} }
/* tcg_out_ldst_12 expects a scaled unsigned immediate offset */
static inline void tcg_out_ldst_12(TCGContext *s, static void tcg_out_insn_3312(TCGContext *s, AArch64Insn insn,
enum aarch64_ldst_op_data op_data, TCGReg rd, TCGReg rn, intptr_t offset)
enum aarch64_ldst_op_type op_type,
TCGReg rd, TCGReg rn,
tcg_target_ulong scaled_uimm)
{ {
tcg_out32(s, (op_data | 1) << 24 tcg_out32(s, insn | (offset & 0x1ff) << 12 | rn << 5 | rd);
| op_type << 20 | scaled_uimm << 10 | rn << 5 | rd); }
static void tcg_out_insn_3313(TCGContext *s, AArch64Insn insn,
TCGReg rd, TCGReg rn, uintptr_t scaled_uimm)
{
/* Note the AArch64Insn constants above are for C3.3.12. Adjust. */
tcg_out32(s, insn | I3312_TO_I3313 | scaled_uimm << 10 | rn << 5 | rd);
} }
/* Register to register move using ORR (shifted register with no shift). */ /* Register to register move using ORR (shifted register with no shift). */
@ -647,44 +661,32 @@ static void tcg_out_movi(TCGContext *s, TCGType type, TCGReg rd,
} }
} }
static inline void tcg_out_ldst_r(TCGContext *s, /* Define something more legible for general use. */
enum aarch64_ldst_op_data op_data, #define tcg_out_ldst_r tcg_out_insn_3310
enum aarch64_ldst_op_type op_type,
TCGReg rd, TCGReg base, TCGReg regoff)
{
/* load from memory to register using base + 64bit register offset */
/* using f.e. STR Wt, [Xn, Xm] 0xb8600800|(regoff << 16)|(base << 5)|rd */
/* the 0x6000 is for the "no extend field" */
tcg_out32(s, 0x00206800
| op_data << 24 | op_type << 20 | regoff << 16 | base << 5 | rd);
}
/* solve the whole ldst problem */ static void tcg_out_ldst(TCGContext *s, AArch64Insn insn,
static inline void tcg_out_ldst(TCGContext *s, enum aarch64_ldst_op_data data,
enum aarch64_ldst_op_type type,
TCGReg rd, TCGReg rn, intptr_t offset) TCGReg rd, TCGReg rn, intptr_t offset)
{ {
TCGMemOp size = (uint32_t)insn >> 30;
if (offset >= -256 && offset < 256) { if (offset >= -256 && offset < 256) {
tcg_out_ldst_9(s, data, type, rd, rn, offset); tcg_out_insn_3312(s, insn, rd, rn, offset);
return; return;
} }
if (offset >= 256) { /* If the offset is naturally aligned and in range, then we can
/* if the offset is naturally aligned and in range, use the scaled uimm12 encoding */
then we can use the scaled uimm12 encoding */ if (offset >= 0 && !(offset & ((1 << size) - 1))) {
unsigned int s_bits = data >> 6; uintptr_t scaled_uimm = offset >> size;
if (!(offset & ((1 << s_bits) - 1))) {
tcg_target_ulong scaled_uimm = offset >> s_bits;
if (scaled_uimm <= 0xfff) { if (scaled_uimm <= 0xfff) {
tcg_out_ldst_12(s, data, type, rd, rn, scaled_uimm); tcg_out_insn_3313(s, insn, rd, rn, scaled_uimm);
return; return;
} }
} }
}
/* worst-case scenario, move offset to temp register, use reg offset */ /* Worst-case scenario, move offset to temp register, use reg offset. */
tcg_out_movi(s, TCG_TYPE_I64, TCG_REG_TMP, offset); tcg_out_movi(s, TCG_TYPE_I64, TCG_REG_TMP, offset);
tcg_out_ldst_r(s, data, type, rd, rn, TCG_REG_TMP); tcg_out_ldst_r(s, insn, rd, rn, TCG_REG_TMP);
} }
static inline void tcg_out_mov(TCGContext *s, static inline void tcg_out_mov(TCGContext *s,
@ -698,14 +700,14 @@ static inline void tcg_out_mov(TCGContext *s,
static inline void tcg_out_ld(TCGContext *s, TCGType type, TCGReg arg, static inline void tcg_out_ld(TCGContext *s, TCGType type, TCGReg arg,
TCGReg arg1, intptr_t arg2) TCGReg arg1, intptr_t arg2)
{ {
tcg_out_ldst(s, (type == TCG_TYPE_I64) ? LDST_64 : LDST_32, LDST_LD, tcg_out_ldst(s, type == TCG_TYPE_I32 ? I3312_LDRW : I3312_LDRX,
arg, arg1, arg2); arg, arg1, arg2);
} }
static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg, static inline void tcg_out_st(TCGContext *s, TCGType type, TCGReg arg,
TCGReg arg1, intptr_t arg2) TCGReg arg1, intptr_t arg2)
{ {
tcg_out_ldst(s, (type == TCG_TYPE_I64) ? LDST_64 : LDST_32, LDST_ST, tcg_out_ldst(s, type == TCG_TYPE_I32 ? I3312_STRW : I3312_STRX,
arg, arg1, arg2); arg, arg1, arg2);
} }
@ -1108,12 +1110,12 @@ static void tcg_out_tlb_read(TCGContext *s, TCGReg addr_reg, TCGMemOp s_bits,
/* Merge "low bits" from tlb offset, load the tlb comparator into X0. /* Merge "low bits" from tlb offset, load the tlb comparator into X0.
X0 = load [X2 + (tlb_offset & 0x000fff)] */ X0 = load [X2 + (tlb_offset & 0x000fff)] */
tcg_out_ldst(s, TARGET_LONG_BITS == 64 ? LDST_64 : LDST_32, tcg_out_ldst(s, TARGET_LONG_BITS == 32 ? I3312_LDRW : I3312_LDRX,
LDST_LD, TCG_REG_X0, TCG_REG_X2, tlb_offset & 0xfff); TCG_REG_X0, TCG_REG_X2, tlb_offset & 0xfff);
/* Load the tlb addend. Do that early to avoid stalling. /* Load the tlb addend. Do that early to avoid stalling.
X1 = load [X2 + (tlb_offset & 0xfff) + offsetof(addend)] */ X1 = load [X2 + (tlb_offset & 0xfff) + offsetof(addend)] */
tcg_out_ldst(s, LDST_64, LDST_LD, TCG_REG_X1, TCG_REG_X2, tcg_out_ldst(s, I3312_LDRX, TCG_REG_X1, TCG_REG_X2,
(tlb_offset & 0xfff) + (offsetof(CPUTLBEntry, addend)) - (tlb_offset & 0xfff) + (offsetof(CPUTLBEntry, addend)) -
(is_read ? offsetof(CPUTLBEntry, addr_read) (is_read ? offsetof(CPUTLBEntry, addr_read)
: offsetof(CPUTLBEntry, addr_write))); : offsetof(CPUTLBEntry, addr_write)));
@ -1135,43 +1137,43 @@ static void tcg_out_qemu_ld_direct(TCGContext *s, TCGMemOp memop,
switch (memop & MO_SSIZE) { switch (memop & MO_SSIZE) {
case MO_UB: case MO_UB:
tcg_out_ldst_r(s, LDST_8, LDST_LD, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRB, data_r, addr_r, off_r);
break; break;
case MO_SB: case MO_SB:
tcg_out_ldst_r(s, LDST_8, LDST_LD_S_X, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRSBX, data_r, addr_r, off_r);
break; break;
case MO_UW: case MO_UW:
tcg_out_ldst_r(s, LDST_16, LDST_LD, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRH, data_r, addr_r, off_r);
if (bswap) { if (bswap) {
tcg_out_rev16(s, data_r, data_r); tcg_out_rev16(s, data_r, data_r);
} }
break; break;
case MO_SW: case MO_SW:
if (bswap) { if (bswap) {
tcg_out_ldst_r(s, LDST_16, LDST_LD, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRH, data_r, addr_r, off_r);
tcg_out_rev16(s, data_r, data_r); tcg_out_rev16(s, data_r, data_r);
tcg_out_sxt(s, TCG_TYPE_I64, MO_16, data_r, data_r); tcg_out_sxt(s, TCG_TYPE_I64, MO_16, data_r, data_r);
} else { } else {
tcg_out_ldst_r(s, LDST_16, LDST_LD_S_X, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRSHX, data_r, addr_r, off_r);
} }
break; break;
case MO_UL: case MO_UL:
tcg_out_ldst_r(s, LDST_32, LDST_LD, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRW, data_r, addr_r, off_r);
if (bswap) { if (bswap) {
tcg_out_rev32(s, data_r, data_r); tcg_out_rev32(s, data_r, data_r);
} }
break; break;
case MO_SL: case MO_SL:
if (bswap) { if (bswap) {
tcg_out_ldst_r(s, LDST_32, LDST_LD, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRW, data_r, addr_r, off_r);
tcg_out_rev32(s, data_r, data_r); tcg_out_rev32(s, data_r, data_r);
tcg_out_sxt(s, TCG_TYPE_I64, MO_32, data_r, data_r); tcg_out_sxt(s, TCG_TYPE_I64, MO_32, data_r, data_r);
} else { } else {
tcg_out_ldst_r(s, LDST_32, LDST_LD_S_X, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRSWX, data_r, addr_r, off_r);
} }
break; break;
case MO_Q: case MO_Q:
tcg_out_ldst_r(s, LDST_64, LDST_LD, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_LDRX, data_r, addr_r, off_r);
if (bswap) { if (bswap) {
tcg_out_rev64(s, data_r, data_r); tcg_out_rev64(s, data_r, data_r);
} }
@ -1188,28 +1190,28 @@ static void tcg_out_qemu_st_direct(TCGContext *s, TCGMemOp memop,
switch (memop & MO_SIZE) { switch (memop & MO_SIZE) {
case MO_8: case MO_8:
tcg_out_ldst_r(s, LDST_8, LDST_ST, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_STRB, data_r, addr_r, off_r);
break; break;
case MO_16: case MO_16:
if (bswap && data_r != TCG_REG_XZR) { if (bswap && data_r != TCG_REG_XZR) {
tcg_out_rev16(s, TCG_REG_TMP, data_r); tcg_out_rev16(s, TCG_REG_TMP, data_r);
data_r = TCG_REG_TMP; data_r = TCG_REG_TMP;
} }
tcg_out_ldst_r(s, LDST_16, LDST_ST, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_STRH, data_r, addr_r, off_r);
break; break;
case MO_32: case MO_32:
if (bswap && data_r != TCG_REG_XZR) { if (bswap && data_r != TCG_REG_XZR) {
tcg_out_rev32(s, TCG_REG_TMP, data_r); tcg_out_rev32(s, TCG_REG_TMP, data_r);
data_r = TCG_REG_TMP; data_r = TCG_REG_TMP;
} }
tcg_out_ldst_r(s, LDST_32, LDST_ST, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_STRW, data_r, addr_r, off_r);
break; break;
case MO_64: case MO_64:
if (bswap && data_r != TCG_REG_XZR) { if (bswap && data_r != TCG_REG_XZR) {
tcg_out_rev64(s, TCG_REG_TMP, data_r); tcg_out_rev64(s, TCG_REG_TMP, data_r);
data_r = TCG_REG_TMP; data_r = TCG_REG_TMP;
} }
tcg_out_ldst_r(s, LDST_64, LDST_ST, data_r, addr_r, off_r); tcg_out_ldst_r(s, I3312_STRX, data_r, addr_r, off_r);
break; break;
default: default:
tcg_abort(); tcg_abort();
@ -1302,49 +1304,49 @@ static void tcg_out_op(TCGContext *s, TCGOpcode opc,
case INDEX_op_ld8u_i32: case INDEX_op_ld8u_i32:
case INDEX_op_ld8u_i64: case INDEX_op_ld8u_i64:
tcg_out_ldst(s, LDST_8, LDST_LD, a0, a1, a2); tcg_out_ldst(s, I3312_LDRB, a0, a1, a2);
break; break;
case INDEX_op_ld8s_i32: case INDEX_op_ld8s_i32:
tcg_out_ldst(s, LDST_8, LDST_LD_S_W, a0, a1, a2); tcg_out_ldst(s, I3312_LDRSBW, a0, a1, a2);
break; break;
case INDEX_op_ld8s_i64: case INDEX_op_ld8s_i64:
tcg_out_ldst(s, LDST_8, LDST_LD_S_X, a0, a1, a2); tcg_out_ldst(s, I3312_LDRSBX, a0, a1, a2);
break; break;
case INDEX_op_ld16u_i32: case INDEX_op_ld16u_i32:
case INDEX_op_ld16u_i64: case INDEX_op_ld16u_i64:
tcg_out_ldst(s, LDST_16, LDST_LD, a0, a1, a2); tcg_out_ldst(s, I3312_LDRH, a0, a1, a2);
break; break;
case INDEX_op_ld16s_i32: case INDEX_op_ld16s_i32:
tcg_out_ldst(s, LDST_16, LDST_LD_S_W, a0, a1, a2); tcg_out_ldst(s, I3312_LDRSHW, a0, a1, a2);
break; break;
case INDEX_op_ld16s_i64: case INDEX_op_ld16s_i64:
tcg_out_ldst(s, LDST_16, LDST_LD_S_X, a0, a1, a2); tcg_out_ldst(s, I3312_LDRSHX, a0, a1, a2);
break; break;
case INDEX_op_ld_i32: case INDEX_op_ld_i32:
case INDEX_op_ld32u_i64: case INDEX_op_ld32u_i64:
tcg_out_ldst(s, LDST_32, LDST_LD, a0, a1, a2); tcg_out_ldst(s, I3312_LDRW, a0, a1, a2);
break; break;
case INDEX_op_ld32s_i64: case INDEX_op_ld32s_i64:
tcg_out_ldst(s, LDST_32, LDST_LD_S_X, a0, a1, a2); tcg_out_ldst(s, I3312_LDRSWX, a0, a1, a2);
break; break;
case INDEX_op_ld_i64: case INDEX_op_ld_i64:
tcg_out_ldst(s, LDST_64, LDST_LD, a0, a1, a2); tcg_out_ldst(s, I3312_LDRX, a0, a1, a2);
break; break;
case INDEX_op_st8_i32: case INDEX_op_st8_i32:
case INDEX_op_st8_i64: case INDEX_op_st8_i64:
tcg_out_ldst(s, LDST_8, LDST_ST, REG0(0), a1, a2); tcg_out_ldst(s, I3312_STRB, REG0(0), a1, a2);
break; break;
case INDEX_op_st16_i32: case INDEX_op_st16_i32:
case INDEX_op_st16_i64: case INDEX_op_st16_i64:
tcg_out_ldst(s, LDST_16, LDST_ST, REG0(0), a1, a2); tcg_out_ldst(s, I3312_STRH, REG0(0), a1, a2);
break; break;
case INDEX_op_st_i32: case INDEX_op_st_i32:
case INDEX_op_st32_i64: case INDEX_op_st32_i64:
tcg_out_ldst(s, LDST_32, LDST_ST, REG0(0), a1, a2); tcg_out_ldst(s, I3312_STRW, REG0(0), a1, a2);
break; break;
case INDEX_op_st_i64: case INDEX_op_st_i64:
tcg_out_ldst(s, LDST_64, LDST_ST, REG0(0), a1, a2); tcg_out_ldst(s, I3312_STRX, REG0(0), a1, a2);
break; break;
case INDEX_op_add_i32: case INDEX_op_add_i32: