Message ID | 20210430011543.1017113-28-richard.henderson@linaro.org |
---|---|
State | Superseded |
Headers | show |
Series | Base for adding PowerPC 64-bit instructions | expand |
On 29/04/2021 22:15, Richard Henderson wrote: > These are all connected by macros in the legacy decoding. > Decode the D and DS forms into the PLS_D argument set so > that prefixed insns can share code. > > Signed-off-by: Richard Henderson <richard.henderson@linaro.org> > --- > target/ppc/insn32.decode | 37 ++++++ > target/ppc/translate.c | 145 ++++----------------- > target/ppc/translate/fixedpoint-impl.c.inc | 114 ++++++++++++++++ > 3 files changed, 174 insertions(+), 122 deletions(-) > > diff --git a/target/ppc/insn32.decode b/target/ppc/insn32.decode > index 2ed25c7e67..1c1b4620fc 100644 > --- a/target/ppc/insn32.decode > +++ b/target/ppc/insn32.decode > @@ -26,6 +26,43 @@ > &PLS_D rt ra si:int64_t r:bool > @PLS_D ...... rt:5 ra:5 si:s16 &PLS_D r=0 > > +%ds_si 2:s14 !function=times_4 > +@PLS_DS ...... rt:5 ra:5 .............. .. &PLS_D si=%ds_si r=0 > + > +&X rt ra rb > +@X ...... rt:5 ra:5 rb:5 .......... . &X > + > +### Fixed-Point Load Instructions > + > +LBZ 100010 ..... ..... ................ @PLS_D > +LBZU 100011 ..... ..... ................ @PLS_D > +LBZX 011111 ..... ..... ..... 0001010111 - @X > +LBZUX 011111 ..... ..... ..... 0001110111 - @X > + > +LHZ 101000 ..... ..... ................ @PLS_D > +LHZU 101001 ..... ..... ................ @PLS_D > +LHZX 011111 ..... ..... ..... 0100010111 - @X > +LHZUX 011111 ..... ..... ..... 0100110111 - @X > + > +LHA 101010 ..... ..... ................ @PLS_D > +LHAU 101011 ..... ..... ................ @PLS_D > +LHAX 011111 ..... ..... ..... 0101010111 - @X > +LHAXU 011111 ..... ..... ..... 0101110111 - @X > + > +LWZ 100000 ..... ..... ................ @PLS_D > +LWZU 100001 ..... ..... ................ @PLS_D > +LWZX 011111 ..... ..... ..... 0000010111 - @X > +LWZUX 011111 ..... ..... ..... 0000110111 - @X > + > +LWA 111010 ..... ..... ..............10 @PLS_DS > +LWAX 011111 ..... ..... ..... 0101010101 - @X > +LWAUX 011111 ..... ..... ..... 0101110101 - @X > + > +LD 111010 ..... ..... ..............00 @PLS_DS > +LDU 111010 ..... ..... ..............01 @PLS_DS > +LDX 011111 ..... ..... ..... 0000010101 - @X > +LDUX 011111 ..... ..... ..... 0000110101 - @X > + > ### Fixed-Point Arithmetic Instructions > > ADDI 001110 ..... ..... ................ @PLS_D > diff --git a/target/ppc/translate.c b/target/ppc/translate.c > index 5a8a3c39c3..1fdb501ee9 100644 > --- a/target/ppc/translate.c > +++ b/target/ppc/translate.c > @@ -2487,54 +2487,6 @@ GEN_QEMU_STORE_64(st64, DEF_MEMOP(MO_Q)) > GEN_QEMU_STORE_64(st64r, BSWAP_MEMOP(MO_Q)) > #endif > > -#define GEN_LD(name, ldop, opc, type) \ > -static void glue(gen_, name)(DisasContext *ctx) \ > -{ \ > - TCGv EA; \ > - gen_set_access_type(ctx, ACCESS_INT); \ > - EA = tcg_temp_new(); \ > - gen_addr_imm_index(ctx, EA, 0); \ > - gen_qemu_##ldop(ctx, cpu_gpr[rD(ctx->opcode)], EA); \ > - tcg_temp_free(EA); \ > -} > - > -#define GEN_LDU(name, ldop, opc, type) \ > -static void glue(gen_, name##u)(DisasContext *ctx) \ > -{ \ > - TCGv EA; \ > - if (unlikely(rA(ctx->opcode) == 0 || \ > - rA(ctx->opcode) == rD(ctx->opcode))) { \ > - gen_inval_exception(ctx, POWERPC_EXCP_INVAL_INVAL); \ > - return; \ > - } \ > - gen_set_access_type(ctx, ACCESS_INT); \ > - EA = tcg_temp_new(); \ > - if (type == PPC_64B) \ > - gen_addr_imm_index(ctx, EA, 0x03); \ > - else \ > - gen_addr_imm_index(ctx, EA, 0); \ > - gen_qemu_##ldop(ctx, cpu_gpr[rD(ctx->opcode)], EA); \ > - tcg_gen_mov_tl(cpu_gpr[rA(ctx->opcode)], EA); \ > - tcg_temp_free(EA); \ > -} > - > -#define GEN_LDUX(name, ldop, opc2, opc3, type) \ > -static void glue(gen_, name##ux)(DisasContext *ctx) \ > -{ \ > - TCGv EA; \ > - if (unlikely(rA(ctx->opcode) == 0 || \ > - rA(ctx->opcode) == rD(ctx->opcode))) { \ > - gen_inval_exception(ctx, POWERPC_EXCP_INVAL_INVAL); \ > - return; \ > - } \ > - gen_set_access_type(ctx, ACCESS_INT); \ > - EA = tcg_temp_new(); \ > - gen_addr_reg_index(ctx, EA); \ > - gen_qemu_##ldop(ctx, cpu_gpr[rD(ctx->opcode)], EA); \ > - tcg_gen_mov_tl(cpu_gpr[rA(ctx->opcode)], EA); \ > - tcg_temp_free(EA); \ > -} > - > #define GEN_LDX_E(name, ldop, opc2, opc3, type, type2, chk) \ > static void glue(gen_, name##x)(DisasContext *ctx) \ > { \ > @@ -2553,21 +2505,6 @@ static void glue(gen_, name##x)(DisasContext *ctx) \ > #define GEN_LDX_HVRM(name, ldop, opc2, opc3, type) \ > GEN_LDX_E(name, ldop, opc2, opc3, type, PPC_NONE, CHK_HVRM) > > -#define GEN_LDS(name, ldop, op, type) \ > -GEN_LD(name, ldop, op | 0x20, type); \ > -GEN_LDU(name, ldop, op | 0x21, type); \ > -GEN_LDUX(name, ldop, 0x17, op | 0x01, type); \ > -GEN_LDX(name, ldop, 0x17, op | 0x00, type) > - > -/* lbz lbzu lbzux lbzx */ > -GEN_LDS(lbz, ld8u, 0x02, PPC_INTEGER); > -/* lha lhau lhaux lhax */ > -GEN_LDS(lha, ld16s, 0x0A, PPC_INTEGER); > -/* lhz lhzu lhzux lhzx */ > -GEN_LDS(lhz, ld16u, 0x08, PPC_INTEGER); > -/* lwz lwzu lwzux lwzx */ > -GEN_LDS(lwz, ld32u, 0x00, PPC_INTEGER); > - > #define GEN_LDEPX(name, ldop, opc2, opc3) \ > static void glue(gen_, name##epx)(DisasContext *ctx) \ > { \ > @@ -2588,47 +2525,12 @@ GEN_LDEPX(ld, DEF_MEMOP(MO_Q), 0x1D, 0x00) > #endif > > #if defined(TARGET_PPC64) > -/* lwaux */ > -GEN_LDUX(lwa, ld32s, 0x15, 0x0B, PPC_64B); > -/* lwax */ > -GEN_LDX(lwa, ld32s, 0x15, 0x0A, PPC_64B); > -/* ldux */ > -GEN_LDUX(ld, ld64_i64, 0x15, 0x01, PPC_64B); > -/* ldx */ > -GEN_LDX(ld, ld64_i64, 0x15, 0x00, PPC_64B); > - > /* CI load/store variants */ > GEN_LDX_HVRM(ldcix, ld64_i64, 0x15, 0x1b, PPC_CILDST) > GEN_LDX_HVRM(lwzcix, ld32u, 0x15, 0x15, PPC_CILDST) > GEN_LDX_HVRM(lhzcix, ld16u, 0x15, 0x19, PPC_CILDST) > GEN_LDX_HVRM(lbzcix, ld8u, 0x15, 0x1a, PPC_CILDST) > > -static void gen_ld(DisasContext *ctx) > -{ > - TCGv EA; > - if (Rc(ctx->opcode)) { > - if (unlikely(rA(ctx->opcode) == 0 || > - rA(ctx->opcode) == rD(ctx->opcode))) { > - gen_inval_exception(ctx, POWERPC_EXCP_INVAL_INVAL); > - return; > - } > - } > - gen_set_access_type(ctx, ACCESS_INT); > - EA = tcg_temp_new(); > - gen_addr_imm_index(ctx, EA, 0x03); > - if (ctx->opcode & 0x02) { > - /* lwa (lwau is undefined) */ > - gen_qemu_ld32s(ctx, cpu_gpr[rD(ctx->opcode)], EA); > - } else { > - /* ld - ldu */ > - gen_qemu_ld64_i64(ctx, cpu_gpr[rD(ctx->opcode)], EA); > - } > - if (Rc(ctx->opcode)) { > - tcg_gen_mov_tl(cpu_gpr[rA(ctx->opcode)], EA); > - } > - tcg_temp_free(EA); > -} > - > /* lq */ > static void gen_lq(DisasContext *ctx) > { > @@ -6849,6 +6751,14 @@ static inline void set_avr64(int regno, TCGv_i64 src, bool high) > tcg_gen_st_i64(src, cpu_env, avr64_offset(regno, high)); > } > > +/* > + * Helpers for decodetree used by !function for decoding arguments. > + */ > +static int times_4(DisasContext *ctx, int x) > +{ > + return x * 4; > +} > + > /* > * Helpers for trans_* functions to check for specific insns flags. > * Use token pasting to ensure that we use the proper flag with the > @@ -6875,6 +6785,21 @@ static inline void set_avr64(int regno, TCGv_i64 src, bool high) > # define REQUIRE_64BIT(CTX) REQUIRE_INSNS_FLAGS(CTX, 64B) > #endif > > +/* > + * Helpers for implementing sets of trans_* functions. > + * Defer the implementation of NAME to FUNC, with optional extra arguments. > + */ > +#define TRANS(NAME, FUNC, ...) \ > + static bool trans_##NAME(DisasContext *ctx, arg_##NAME *a) \ > + { return FUNC(ctx, a, __VA_ARGS__); } > + > +#define TRANS64(NAME, FUNC, ...) \ > + static bool trans_##NAME(DisasContext *ctx, arg_##NAME *a) \ > + { REQUIRE_64BIT(ctx); return FUNC(ctx, a, __VA_ARGS__); } > + > +/* TODO: More TRANS* helpers for extra insn_flags checks. */ > + > + > #include "decode-insn32.c.inc" > #include "decode-insn64.c.inc" > #include "translate/fixedpoint-impl.c.inc" > @@ -7059,7 +6984,6 @@ GEN_HANDLER2_E(extswsli1, "extswsli", 0x1F, 0x1B, 0x1B, 0x00000000, > PPC_NONE, PPC2_ISA300), > #endif > #if defined(TARGET_PPC64) > -GEN_HANDLER(ld, 0x3A, 0xFF, 0xFF, 0x00000000, PPC_64B), > GEN_HANDLER(lq, 0x38, 0xFF, 0xFF, 0x00000000, PPC_64BX), > GEN_HANDLER(std, 0x3E, 0xFF, 0xFF, 0x00000000, PPC_64B), > #endif > @@ -7425,34 +7349,11 @@ GEN_PPC64_R2(rldcr, 0x1E, 0x09), > GEN_PPC64_R4(rldimi, 0x1E, 0x06), > #endif > > -#undef GEN_LD > -#undef GEN_LDU > -#undef GEN_LDUX > #undef GEN_LDX_E > -#undef GEN_LDS > -#define GEN_LD(name, ldop, opc, type) \ > -GEN_HANDLER(name, opc, 0xFF, 0xFF, 0x00000000, type), > -#define GEN_LDU(name, ldop, opc, type) \ > -GEN_HANDLER(name##u, opc, 0xFF, 0xFF, 0x00000000, type), > -#define GEN_LDUX(name, ldop, opc2, opc3, type) \ > -GEN_HANDLER(name##ux, 0x1F, opc2, opc3, 0x00000001, type), > #define GEN_LDX_E(name, ldop, opc2, opc3, type, type2, chk) \ > GEN_HANDLER_E(name##x, 0x1F, opc2, opc3, 0x00000001, type, type2), > -#define GEN_LDS(name, ldop, op, type) \ > -GEN_LD(name, ldop, op | 0x20, type) \ > -GEN_LDU(name, ldop, op | 0x21, type) \ > -GEN_LDUX(name, ldop, 0x17, op | 0x01, type) \ > -GEN_LDX(name, ldop, 0x17, op | 0x00, type) > > -GEN_LDS(lbz, ld8u, 0x02, PPC_INTEGER) > -GEN_LDS(lha, ld16s, 0x0A, PPC_INTEGER) > -GEN_LDS(lhz, ld16u, 0x08, PPC_INTEGER) > -GEN_LDS(lwz, ld32u, 0x00, PPC_INTEGER) > #if defined(TARGET_PPC64) > -GEN_LDUX(lwa, ld32s, 0x15, 0x0B, PPC_64B) > -GEN_LDX(lwa, ld32s, 0x15, 0x0A, PPC_64B) > -GEN_LDUX(ld, ld64_i64, 0x15, 0x01, PPC_64B) > -GEN_LDX(ld, ld64_i64, 0x15, 0x00, PPC_64B) > GEN_LDX_E(ldbr, ld64ur_i64, 0x14, 0x10, PPC_NONE, PPC2_DBRX, CHK_NONE) > > /* HV/P7 and later only */ > diff --git a/target/ppc/translate/fixedpoint-impl.c.inc b/target/ppc/translate/fixedpoint-impl.c.inc > index 96b8c38f60..cb3219c996 100644 > --- a/target/ppc/translate/fixedpoint-impl.c.inc > +++ b/target/ppc/translate/fixedpoint-impl.c.inc > @@ -33,6 +33,120 @@ static bool resolve_PLS_D(DisasContext *ctx, arg_PLS_D *a) > return true; > } > > +/* > + * Fixed-Point Load/Store Instructions > + */ > + > +static bool do_ldst_PLS_D(DisasContext *ctx, arg_PLS_D *a, bool update, > + bool store, MemOp mop) > +{ > + TCGv ea; > + > + if (!resolve_PLS_D(ctx, a)) { > + return true; > + } > + if (update && (a->ra == 0 || (!store && a->ra == a->rt))) { > + gen_invalid(ctx); > + return true; > + } > + gen_set_access_type(ctx, ACCESS_INT); > + > + ea = tcg_temp_new(); > + if (a->ra) { > + tcg_gen_addi_tl(ea, cpu_gpr[a->ra], a->si); > + } else { > + tcg_gen_movi_tl(ea, a->si); > + } > + if (NARROW_MODE(ctx)) { > + tcg_gen_ext32u_tl(ea, ea); > + } > + mop ^= ctx->default_tcg_memop_mask; > + if (store) { > + tcg_gen_qemu_st_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); > + } else { > + tcg_gen_qemu_ld_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); > + } > + if (update) { > + tcg_gen_mov_tl(cpu_gpr[a->ra], ea); > + } > + tcg_temp_free(ea); > + > + return true; > +} > + > +static bool do_ldst_X(DisasContext *ctx, arg_X *a, bool update, > + bool store, MemOp mop) > +{ > + TCGv ea; > + > + if (update && (a->ra == 0 || (!store && a->ra == a->rt))) { > + gen_invalid(ctx); > + return true; > + } > + gen_set_access_type(ctx, ACCESS_INT); > + > + ea = tcg_temp_new(); > + if (a->ra) { > + tcg_gen_add_tl(ea, cpu_gpr[a->ra], cpu_gpr[a->rb]); > + } else { > + tcg_gen_mov_tl(ea, cpu_gpr[a->rb]); > + } > + if (NARROW_MODE(ctx)) { > + tcg_gen_ext32u_tl(ea, ea); > + } > + mop ^= ctx->default_tcg_memop_mask; > + if (store) { > + tcg_gen_qemu_st_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); > + } else { > + tcg_gen_qemu_ld_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); > + } > + if (update) { > + tcg_gen_mov_tl(cpu_gpr[a->ra], ea); > + } > + tcg_temp_free(ea); > + > + return true; > +} > + The only difference between those two is tcg_gen_addi_tl/tcg_gen_movi_tl and tcg_gen_add_tl/tcg_gen_mov_tl. We could do this in a single method if we tcg_const_tl(a->si) in do_ldst_D. I'm not sure about the costs involved, and we'd need to tcg_temp_free it. If you want to give it a look, I did some tests on https://github.com/ppc64/qemu/tree/ferst-tcg-decodetree64 . Thanks, Matheus K. Ferst Instituto de Pesquisas ELDORADO <http://www.eldorado.org.br/> Analista de Software Júnior Aviso Legal - Disclaimer <https://www.eldorado.org.br/disclaimer.html>
On 4/30/21 4:54 PM, Matheus K. Ferst wrote: > The only difference between those two is tcg_gen_addi_tl/tcg_gen_movi_tl and > tcg_gen_add_tl/tcg_gen_mov_tl. We could do this in a single method if we > tcg_const_tl(a->si) in do_ldst_D. I'm not sure about the costs involved, and > we'd need to tcg_temp_free it. If you want to give it a look, I did some tests > on https://github.com/ppc64/qemu/tree/ferst-tcg-decodetree64 . I guess it works, but it feels ugly with the comparison vs cpu_gpr[0]. Maybe pass in rt and ra as integers, and only pass in rb/si as TCGv addend? The upper-case argument names clash with docs/devel/style.rst. You can use tcg_constant_tl() to grab a hashed constant that need not be freed. BTW, I thought I had a comment about PLS being used for both MLS and 8LS. I guess that must have gotten lost at some point. If you go with your renaming to MLS, you'll want a different comment about PLD et al. r~
On 30/04/2021 21:50, Richard Henderson wrote: > On 4/30/21 4:54 PM, Matheus K. Ferst wrote: >> The only difference between those two is >> tcg_gen_addi_tl/tcg_gen_movi_tl and tcg_gen_add_tl/tcg_gen_mov_tl. We >> could do this in a single method if we tcg_const_tl(a->si) in >> do_ldst_D. I'm not sure about the costs involved, and we'd need to >> tcg_temp_free it. If you want to give it a look, I did some tests on >> https://github.com/ppc64/qemu/tree/ferst-tcg-decodetree64 . > > I guess it works, but it feels ugly with the comparison vs cpu_gpr[0]. > Maybe pass in rt and ra as integers, and only pass in rb/si as TCGv addend? > I tried that first and it looked just as weird, but if you prefer I'll change it back. We could also hide the ugliness in a helper e.g. bool gpr_is_zero(TCGv). > The upper-case argument names clash with docs/devel/style.rst. > Good call, I'll fix this before push this branch again; > You can use tcg_constant_tl() to grab a hashed constant that need not be > freed. > Then we could > return do_ldst(ctx, cpu_gpr[a->rt], a->ra?cpu->gpr[a->ra]:tcg_const_tl(0), ... At the cost of always calling tcg_gen_add_tl and repeating the RA=0 logic in do_ldst_X and do_ldst_D. > BTW, I thought I had a comment about PLS being used for both MLS and > 8LS. I guess that must have gotten lost at some point. If you go with > your renaming to MLS, you'll want a different comment about PLD et al. > > > r~ Don't mind that, it was a bad idea, I gave up on this change while rebasing v3. Thanks, Matheus K. Ferst Instituto de Pesquisas ELDORADO <http://www.eldorado.org.br/> Analista de Software Júnior Aviso Legal - Disclaimer <https://www.eldorado.org.br/disclaimer.html>
diff --git a/target/ppc/insn32.decode b/target/ppc/insn32.decode index 2ed25c7e67..1c1b4620fc 100644 --- a/target/ppc/insn32.decode +++ b/target/ppc/insn32.decode @@ -26,6 +26,43 @@ &PLS_D rt ra si:int64_t r:bool @PLS_D ...... rt:5 ra:5 si:s16 &PLS_D r=0 +%ds_si 2:s14 !function=times_4 +@PLS_DS ...... rt:5 ra:5 .............. .. &PLS_D si=%ds_si r=0 + +&X rt ra rb +@X ...... rt:5 ra:5 rb:5 .......... . &X + +### Fixed-Point Load Instructions + +LBZ 100010 ..... ..... ................ @PLS_D +LBZU 100011 ..... ..... ................ @PLS_D +LBZX 011111 ..... ..... ..... 0001010111 - @X +LBZUX 011111 ..... ..... ..... 0001110111 - @X + +LHZ 101000 ..... ..... ................ @PLS_D +LHZU 101001 ..... ..... ................ @PLS_D +LHZX 011111 ..... ..... ..... 0100010111 - @X +LHZUX 011111 ..... ..... ..... 0100110111 - @X + +LHA 101010 ..... ..... ................ @PLS_D +LHAU 101011 ..... ..... ................ @PLS_D +LHAX 011111 ..... ..... ..... 0101010111 - @X +LHAXU 011111 ..... ..... ..... 0101110111 - @X + +LWZ 100000 ..... ..... ................ @PLS_D +LWZU 100001 ..... ..... ................ @PLS_D +LWZX 011111 ..... ..... ..... 0000010111 - @X +LWZUX 011111 ..... ..... ..... 0000110111 - @X + +LWA 111010 ..... ..... ..............10 @PLS_DS +LWAX 011111 ..... ..... ..... 0101010101 - @X +LWAUX 011111 ..... ..... ..... 0101110101 - @X + +LD 111010 ..... ..... ..............00 @PLS_DS +LDU 111010 ..... ..... ..............01 @PLS_DS +LDX 011111 ..... ..... ..... 0000010101 - @X +LDUX 011111 ..... ..... ..... 0000110101 - @X + ### Fixed-Point Arithmetic Instructions ADDI 001110 ..... ..... ................ @PLS_D diff --git a/target/ppc/translate.c b/target/ppc/translate.c index 5a8a3c39c3..1fdb501ee9 100644 --- a/target/ppc/translate.c +++ b/target/ppc/translate.c @@ -2487,54 +2487,6 @@ GEN_QEMU_STORE_64(st64, DEF_MEMOP(MO_Q)) GEN_QEMU_STORE_64(st64r, BSWAP_MEMOP(MO_Q)) #endif -#define GEN_LD(name, ldop, opc, type) \ -static void glue(gen_, name)(DisasContext *ctx) \ -{ \ - TCGv EA; \ - gen_set_access_type(ctx, ACCESS_INT); \ - EA = tcg_temp_new(); \ - gen_addr_imm_index(ctx, EA, 0); \ - gen_qemu_##ldop(ctx, cpu_gpr[rD(ctx->opcode)], EA); \ - tcg_temp_free(EA); \ -} - -#define GEN_LDU(name, ldop, opc, type) \ -static void glue(gen_, name##u)(DisasContext *ctx) \ -{ \ - TCGv EA; \ - if (unlikely(rA(ctx->opcode) == 0 || \ - rA(ctx->opcode) == rD(ctx->opcode))) { \ - gen_inval_exception(ctx, POWERPC_EXCP_INVAL_INVAL); \ - return; \ - } \ - gen_set_access_type(ctx, ACCESS_INT); \ - EA = tcg_temp_new(); \ - if (type == PPC_64B) \ - gen_addr_imm_index(ctx, EA, 0x03); \ - else \ - gen_addr_imm_index(ctx, EA, 0); \ - gen_qemu_##ldop(ctx, cpu_gpr[rD(ctx->opcode)], EA); \ - tcg_gen_mov_tl(cpu_gpr[rA(ctx->opcode)], EA); \ - tcg_temp_free(EA); \ -} - -#define GEN_LDUX(name, ldop, opc2, opc3, type) \ -static void glue(gen_, name##ux)(DisasContext *ctx) \ -{ \ - TCGv EA; \ - if (unlikely(rA(ctx->opcode) == 0 || \ - rA(ctx->opcode) == rD(ctx->opcode))) { \ - gen_inval_exception(ctx, POWERPC_EXCP_INVAL_INVAL); \ - return; \ - } \ - gen_set_access_type(ctx, ACCESS_INT); \ - EA = tcg_temp_new(); \ - gen_addr_reg_index(ctx, EA); \ - gen_qemu_##ldop(ctx, cpu_gpr[rD(ctx->opcode)], EA); \ - tcg_gen_mov_tl(cpu_gpr[rA(ctx->opcode)], EA); \ - tcg_temp_free(EA); \ -} - #define GEN_LDX_E(name, ldop, opc2, opc3, type, type2, chk) \ static void glue(gen_, name##x)(DisasContext *ctx) \ { \ @@ -2553,21 +2505,6 @@ static void glue(gen_, name##x)(DisasContext *ctx) \ #define GEN_LDX_HVRM(name, ldop, opc2, opc3, type) \ GEN_LDX_E(name, ldop, opc2, opc3, type, PPC_NONE, CHK_HVRM) -#define GEN_LDS(name, ldop, op, type) \ -GEN_LD(name, ldop, op | 0x20, type); \ -GEN_LDU(name, ldop, op | 0x21, type); \ -GEN_LDUX(name, ldop, 0x17, op | 0x01, type); \ -GEN_LDX(name, ldop, 0x17, op | 0x00, type) - -/* lbz lbzu lbzux lbzx */ -GEN_LDS(lbz, ld8u, 0x02, PPC_INTEGER); -/* lha lhau lhaux lhax */ -GEN_LDS(lha, ld16s, 0x0A, PPC_INTEGER); -/* lhz lhzu lhzux lhzx */ -GEN_LDS(lhz, ld16u, 0x08, PPC_INTEGER); -/* lwz lwzu lwzux lwzx */ -GEN_LDS(lwz, ld32u, 0x00, PPC_INTEGER); - #define GEN_LDEPX(name, ldop, opc2, opc3) \ static void glue(gen_, name##epx)(DisasContext *ctx) \ { \ @@ -2588,47 +2525,12 @@ GEN_LDEPX(ld, DEF_MEMOP(MO_Q), 0x1D, 0x00) #endif #if defined(TARGET_PPC64) -/* lwaux */ -GEN_LDUX(lwa, ld32s, 0x15, 0x0B, PPC_64B); -/* lwax */ -GEN_LDX(lwa, ld32s, 0x15, 0x0A, PPC_64B); -/* ldux */ -GEN_LDUX(ld, ld64_i64, 0x15, 0x01, PPC_64B); -/* ldx */ -GEN_LDX(ld, ld64_i64, 0x15, 0x00, PPC_64B); - /* CI load/store variants */ GEN_LDX_HVRM(ldcix, ld64_i64, 0x15, 0x1b, PPC_CILDST) GEN_LDX_HVRM(lwzcix, ld32u, 0x15, 0x15, PPC_CILDST) GEN_LDX_HVRM(lhzcix, ld16u, 0x15, 0x19, PPC_CILDST) GEN_LDX_HVRM(lbzcix, ld8u, 0x15, 0x1a, PPC_CILDST) -static void gen_ld(DisasContext *ctx) -{ - TCGv EA; - if (Rc(ctx->opcode)) { - if (unlikely(rA(ctx->opcode) == 0 || - rA(ctx->opcode) == rD(ctx->opcode))) { - gen_inval_exception(ctx, POWERPC_EXCP_INVAL_INVAL); - return; - } - } - gen_set_access_type(ctx, ACCESS_INT); - EA = tcg_temp_new(); - gen_addr_imm_index(ctx, EA, 0x03); - if (ctx->opcode & 0x02) { - /* lwa (lwau is undefined) */ - gen_qemu_ld32s(ctx, cpu_gpr[rD(ctx->opcode)], EA); - } else { - /* ld - ldu */ - gen_qemu_ld64_i64(ctx, cpu_gpr[rD(ctx->opcode)], EA); - } - if (Rc(ctx->opcode)) { - tcg_gen_mov_tl(cpu_gpr[rA(ctx->opcode)], EA); - } - tcg_temp_free(EA); -} - /* lq */ static void gen_lq(DisasContext *ctx) { @@ -6849,6 +6751,14 @@ static inline void set_avr64(int regno, TCGv_i64 src, bool high) tcg_gen_st_i64(src, cpu_env, avr64_offset(regno, high)); } +/* + * Helpers for decodetree used by !function for decoding arguments. + */ +static int times_4(DisasContext *ctx, int x) +{ + return x * 4; +} + /* * Helpers for trans_* functions to check for specific insns flags. * Use token pasting to ensure that we use the proper flag with the @@ -6875,6 +6785,21 @@ static inline void set_avr64(int regno, TCGv_i64 src, bool high) # define REQUIRE_64BIT(CTX) REQUIRE_INSNS_FLAGS(CTX, 64B) #endif +/* + * Helpers for implementing sets of trans_* functions. + * Defer the implementation of NAME to FUNC, with optional extra arguments. + */ +#define TRANS(NAME, FUNC, ...) \ + static bool trans_##NAME(DisasContext *ctx, arg_##NAME *a) \ + { return FUNC(ctx, a, __VA_ARGS__); } + +#define TRANS64(NAME, FUNC, ...) \ + static bool trans_##NAME(DisasContext *ctx, arg_##NAME *a) \ + { REQUIRE_64BIT(ctx); return FUNC(ctx, a, __VA_ARGS__); } + +/* TODO: More TRANS* helpers for extra insn_flags checks. */ + + #include "decode-insn32.c.inc" #include "decode-insn64.c.inc" #include "translate/fixedpoint-impl.c.inc" @@ -7059,7 +6984,6 @@ GEN_HANDLER2_E(extswsli1, "extswsli", 0x1F, 0x1B, 0x1B, 0x00000000, PPC_NONE, PPC2_ISA300), #endif #if defined(TARGET_PPC64) -GEN_HANDLER(ld, 0x3A, 0xFF, 0xFF, 0x00000000, PPC_64B), GEN_HANDLER(lq, 0x38, 0xFF, 0xFF, 0x00000000, PPC_64BX), GEN_HANDLER(std, 0x3E, 0xFF, 0xFF, 0x00000000, PPC_64B), #endif @@ -7425,34 +7349,11 @@ GEN_PPC64_R2(rldcr, 0x1E, 0x09), GEN_PPC64_R4(rldimi, 0x1E, 0x06), #endif -#undef GEN_LD -#undef GEN_LDU -#undef GEN_LDUX #undef GEN_LDX_E -#undef GEN_LDS -#define GEN_LD(name, ldop, opc, type) \ -GEN_HANDLER(name, opc, 0xFF, 0xFF, 0x00000000, type), -#define GEN_LDU(name, ldop, opc, type) \ -GEN_HANDLER(name##u, opc, 0xFF, 0xFF, 0x00000000, type), -#define GEN_LDUX(name, ldop, opc2, opc3, type) \ -GEN_HANDLER(name##ux, 0x1F, opc2, opc3, 0x00000001, type), #define GEN_LDX_E(name, ldop, opc2, opc3, type, type2, chk) \ GEN_HANDLER_E(name##x, 0x1F, opc2, opc3, 0x00000001, type, type2), -#define GEN_LDS(name, ldop, op, type) \ -GEN_LD(name, ldop, op | 0x20, type) \ -GEN_LDU(name, ldop, op | 0x21, type) \ -GEN_LDUX(name, ldop, 0x17, op | 0x01, type) \ -GEN_LDX(name, ldop, 0x17, op | 0x00, type) -GEN_LDS(lbz, ld8u, 0x02, PPC_INTEGER) -GEN_LDS(lha, ld16s, 0x0A, PPC_INTEGER) -GEN_LDS(lhz, ld16u, 0x08, PPC_INTEGER) -GEN_LDS(lwz, ld32u, 0x00, PPC_INTEGER) #if defined(TARGET_PPC64) -GEN_LDUX(lwa, ld32s, 0x15, 0x0B, PPC_64B) -GEN_LDX(lwa, ld32s, 0x15, 0x0A, PPC_64B) -GEN_LDUX(ld, ld64_i64, 0x15, 0x01, PPC_64B) -GEN_LDX(ld, ld64_i64, 0x15, 0x00, PPC_64B) GEN_LDX_E(ldbr, ld64ur_i64, 0x14, 0x10, PPC_NONE, PPC2_DBRX, CHK_NONE) /* HV/P7 and later only */ diff --git a/target/ppc/translate/fixedpoint-impl.c.inc b/target/ppc/translate/fixedpoint-impl.c.inc index 96b8c38f60..cb3219c996 100644 --- a/target/ppc/translate/fixedpoint-impl.c.inc +++ b/target/ppc/translate/fixedpoint-impl.c.inc @@ -33,6 +33,120 @@ static bool resolve_PLS_D(DisasContext *ctx, arg_PLS_D *a) return true; } +/* + * Fixed-Point Load/Store Instructions + */ + +static bool do_ldst_PLS_D(DisasContext *ctx, arg_PLS_D *a, bool update, + bool store, MemOp mop) +{ + TCGv ea; + + if (!resolve_PLS_D(ctx, a)) { + return true; + } + if (update && (a->ra == 0 || (!store && a->ra == a->rt))) { + gen_invalid(ctx); + return true; + } + gen_set_access_type(ctx, ACCESS_INT); + + ea = tcg_temp_new(); + if (a->ra) { + tcg_gen_addi_tl(ea, cpu_gpr[a->ra], a->si); + } else { + tcg_gen_movi_tl(ea, a->si); + } + if (NARROW_MODE(ctx)) { + tcg_gen_ext32u_tl(ea, ea); + } + mop ^= ctx->default_tcg_memop_mask; + if (store) { + tcg_gen_qemu_st_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); + } else { + tcg_gen_qemu_ld_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); + } + if (update) { + tcg_gen_mov_tl(cpu_gpr[a->ra], ea); + } + tcg_temp_free(ea); + + return true; +} + +static bool do_ldst_X(DisasContext *ctx, arg_X *a, bool update, + bool store, MemOp mop) +{ + TCGv ea; + + if (update && (a->ra == 0 || (!store && a->ra == a->rt))) { + gen_invalid(ctx); + return true; + } + gen_set_access_type(ctx, ACCESS_INT); + + ea = tcg_temp_new(); + if (a->ra) { + tcg_gen_add_tl(ea, cpu_gpr[a->ra], cpu_gpr[a->rb]); + } else { + tcg_gen_mov_tl(ea, cpu_gpr[a->rb]); + } + if (NARROW_MODE(ctx)) { + tcg_gen_ext32u_tl(ea, ea); + } + mop ^= ctx->default_tcg_memop_mask; + if (store) { + tcg_gen_qemu_st_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); + } else { + tcg_gen_qemu_ld_tl(cpu_gpr[a->rt], ea, ctx->mem_idx, mop); + } + if (update) { + tcg_gen_mov_tl(cpu_gpr[a->ra], ea); + } + tcg_temp_free(ea); + + return true; +} + +/* Load Byte and Zero */ +TRANS(LBZ, do_ldst_PLS_D, false, false, MO_UB) +TRANS(LBZX, do_ldst_X, false, false, MO_UB) +TRANS(LBZU, do_ldst_PLS_D, true, false, MO_UB) +TRANS(LBZUX, do_ldst_X, true, false, MO_UB) + +/* Load Halfword and Zero */ +TRANS(LHZ, do_ldst_PLS_D, false, false, MO_UW) +TRANS(LHZX, do_ldst_X, false, false, MO_UW) +TRANS(LHZU, do_ldst_PLS_D, true, false, MO_UW) +TRANS(LHZUX, do_ldst_X, true, false, MO_UW) + +/* Load Halfword Algebraic */ +TRANS(LHA, do_ldst_PLS_D, false, false, MO_SW) +TRANS(LHAX, do_ldst_X, false, false, MO_SW) +TRANS(LHAU, do_ldst_PLS_D, true, false, MO_SW) +TRANS(LHAXU, do_ldst_X, true, false, MO_SW) + +/* Load Word and Zero */ +TRANS(LWZ, do_ldst_PLS_D, false, false, MO_UL) +TRANS(LWZX, do_ldst_X, false, false, MO_UL) +TRANS(LWZU, do_ldst_PLS_D, true, false, MO_UL) +TRANS(LWZUX, do_ldst_X, true, false, MO_UL) + +/* Load Word Algebraic */ +TRANS64(LWA, do_ldst_PLS_D, false, false, MO_SL) +TRANS64(LWAX, do_ldst_X, false, false, MO_SL) +TRANS64(LWAUX, do_ldst_X, true, false, MO_SL) + +/* Load Doubleword */ +TRANS64(LD, do_ldst_PLS_D, false, false, MO_Q) +TRANS64(LDX, do_ldst_X, false, false, MO_Q) +TRANS64(LDU, do_ldst_PLS_D, true, false, MO_Q) +TRANS64(LDUX, do_ldst_X, true, false, MO_Q) + +/* + * Fixed-Point Arithmetic Instructions + */ + static bool trans_ADDI(DisasContext *ctx, arg_PLS_D *a) { if (resolve_PLS_D(ctx, a)) {
These are all connected by macros in the legacy decoding. Decode the D and DS forms into the PLS_D argument set so that prefixed insns can share code. Signed-off-by: Richard Henderson <richard.henderson@linaro.org> --- target/ppc/insn32.decode | 37 ++++++ target/ppc/translate.c | 145 ++++----------------- target/ppc/translate/fixedpoint-impl.c.inc | 114 ++++++++++++++++ 3 files changed, 174 insertions(+), 122 deletions(-) -- 2.25.1