target/hppa: Implement CF_PCREL

Now that the groundwork has been laid, enabling CF_PCREL within the
translator proper is a simple matter of updating copy_iaoq_entry
and install_iaq_entries.

We also need to modify the unwind info, since we no longer have
absolute addresses to install.

As expected, this reduces the runtime overhead of compilation when
running a Linux kernel with address space randomization enabled.

Reviewed-by: Helge Deller <deller@gmx.de>
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
This commit is contained in:
Richard Henderson 2024-04-13 20:57:13 -07:00
parent 804cd52d3a
commit 6dd9b145f6
2 changed files with 55 additions and 32 deletions

View File

@ -62,10 +62,6 @@ void cpu_get_tb_cpu_state(CPUHPPAState *env, vaddr *pc,
*pc = hppa_cpu_get_pc(env_cpu(env)); *pc = hppa_cpu_get_pc(env_cpu(env));
flags |= (env->iaoq_f & 3) << TB_FLAG_PRIV_SHIFT; flags |= (env->iaoq_f & 3) << TB_FLAG_PRIV_SHIFT;
if (hppa_is_pa20(env)) {
cs_base = env->iaoq_f & MAKE_64BIT_MASK(32, 32);
}
/* /*
* The only really interesting case is if IAQ_Back is on the same page * The only really interesting case is if IAQ_Back is on the same page
* as IAQ_Front, so that we can use goto_tb between the blocks. In all * as IAQ_Front, so that we can use goto_tb between the blocks. In all
@ -113,19 +109,19 @@ static void hppa_restore_state_to_opc(CPUState *cs,
const TranslationBlock *tb, const TranslationBlock *tb,
const uint64_t *data) const uint64_t *data)
{ {
HPPACPU *cpu = HPPA_CPU(cs); CPUHPPAState *env = cpu_env(cs);
cpu->env.iaoq_f = data[0]; env->iaoq_f = (env->iaoq_f & TARGET_PAGE_MASK) | data[0];
if (data[1] != (target_ulong)-1) { if (data[1] != INT32_MIN) {
cpu->env.iaoq_b = data[1]; env->iaoq_b = env->iaoq_f + data[1];
} }
cpu->env.unwind_breg = data[2]; env->unwind_breg = data[2];
/* /*
* Since we were executing the instruction at IAOQ_F, and took some * Since we were executing the instruction at IAOQ_F, and took some
* sort of action that provoked the cpu_restore_state, we can infer * sort of action that provoked the cpu_restore_state, we can infer
* that the instruction was not nullified. * that the instruction was not nullified.
*/ */
cpu->env.psw_n = 0; env->psw_n = 0;
} }
static bool hppa_cpu_has_work(CPUState *cs) static bool hppa_cpu_has_work(CPUState *cs)
@ -191,6 +187,9 @@ static void hppa_cpu_realizefn(DeviceState *dev, Error **errp)
hppa_ptlbe(&cpu->env); hppa_ptlbe(&cpu->env);
} }
#endif #endif
/* Use pc-relative instructions always to simplify the translator. */
tcg_cflags_set(cs, CF_PCREL);
} }
static void hppa_cpu_initfn(Object *obj) static void hppa_cpu_initfn(Object *obj)

View File

@ -47,7 +47,7 @@ typedef struct DisasIAQE {
TCGv_i64 space; TCGv_i64 space;
/* IAOQ base; may be null for relative address. */ /* IAOQ base; may be null for relative address. */
TCGv_i64 base; TCGv_i64 base;
/* IAOQ addend; if base is null, relative to ctx->iaoq_first. */ /* IAOQ addend; if base is null, relative to cpu_iaoq_f. */
int64_t disp; int64_t disp;
} DisasIAQE; } DisasIAQE;
@ -664,11 +664,7 @@ static DisasIAQE iaqe_next_absv(DisasContext *ctx, TCGv_i64 var)
static void copy_iaoq_entry(DisasContext *ctx, TCGv_i64 dest, static void copy_iaoq_entry(DisasContext *ctx, TCGv_i64 dest,
const DisasIAQE *src) const DisasIAQE *src)
{ {
if (src->base == NULL) { tcg_gen_addi_i64(dest, src->base ? : cpu_iaoq_f, src->disp);
tcg_gen_movi_i64(dest, ctx->iaoq_first + src->disp);
} else {
tcg_gen_addi_i64(dest, src->base, src->disp);
}
} }
static void install_iaq_entries(DisasContext *ctx, const DisasIAQE *f, static void install_iaq_entries(DisasContext *ctx, const DisasIAQE *f,
@ -680,8 +676,28 @@ static void install_iaq_entries(DisasContext *ctx, const DisasIAQE *f,
b_next = iaqe_incr(f, 4); b_next = iaqe_incr(f, 4);
b = &b_next; b = &b_next;
} }
copy_iaoq_entry(ctx, cpu_iaoq_f, f);
/*
* There is an edge case
* bv r0(rN)
* b,l disp,r0
* for which F will use cpu_iaoq_b (from the indirect branch),
* and B will use cpu_iaoq_f (from the direct branch).
* In this case we need an extra temporary.
*/
if (f->base != cpu_iaoq_b) {
copy_iaoq_entry(ctx, cpu_iaoq_b, b); copy_iaoq_entry(ctx, cpu_iaoq_b, b);
copy_iaoq_entry(ctx, cpu_iaoq_f, f);
} else if (f->base == b->base) {
copy_iaoq_entry(ctx, cpu_iaoq_f, f);
tcg_gen_addi_i64(cpu_iaoq_b, cpu_iaoq_f, b->disp - f->disp);
} else {
TCGv_i64 tmp = tcg_temp_new_i64();
copy_iaoq_entry(ctx, tmp, b);
copy_iaoq_entry(ctx, cpu_iaoq_f, f);
tcg_gen_mov_i64(cpu_iaoq_b, tmp);
}
if (f->space) { if (f->space) {
tcg_gen_mov_i64(cpu_iasq_f, f->space); tcg_gen_mov_i64(cpu_iasq_f, f->space);
} }
@ -3980,9 +3996,8 @@ static bool trans_b_gate(DisasContext *ctx, arg_b_gate *a)
/* Adjust the dest offset for the privilege change from the PTE. */ /* Adjust the dest offset for the privilege change from the PTE. */
TCGv_i64 off = tcg_temp_new_i64(); TCGv_i64 off = tcg_temp_new_i64();
gen_helper_b_gate_priv(off, tcg_env, copy_iaoq_entry(ctx, off, &ctx->iaq_f);
tcg_constant_i64(ctx->iaoq_first gen_helper_b_gate_priv(off, tcg_env, off);
+ ctx->iaq_f.disp));
ctx->iaq_j.base = off; ctx->iaq_j.base = off;
ctx->iaq_j.disp = disp + 8; ctx->iaq_j.disp = disp + 8;
@ -4603,7 +4618,7 @@ static bool trans_diag_unimp(DisasContext *ctx, arg_diag_unimp *a)
static void hppa_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs) static void hppa_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
{ {
DisasContext *ctx = container_of(dcbase, DisasContext, base); DisasContext *ctx = container_of(dcbase, DisasContext, base);
uint64_t cs_base, iaoq_f, iaoq_b; uint64_t cs_base;
int bound; int bound;
ctx->cs = cs; ctx->cs = cs;
@ -4622,12 +4637,8 @@ static void hppa_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
: ctx->tb_flags & PSW_W ? MMU_ABS_W_IDX : MMU_ABS_IDX); : ctx->tb_flags & PSW_W ? MMU_ABS_W_IDX : MMU_ABS_IDX);
#endif #endif
/* Recover the IAOQ values from the GVA + PRIV. */
cs_base = ctx->base.tb->cs_base; cs_base = ctx->base.tb->cs_base;
iaoq_f = cs_base & MAKE_64BIT_MASK(32, 32); ctx->iaoq_first = ctx->base.pc_first + ctx->privilege;
iaoq_f |= ctx->base.pc_first & MAKE_64BIT_MASK(2, 30);
iaoq_f |= ctx->privilege;
ctx->iaoq_first = iaoq_f;
if (unlikely(cs_base & CS_BASE_DIFFSPACE)) { if (unlikely(cs_base & CS_BASE_DIFFSPACE)) {
ctx->iaq_b.space = cpu_iasq_b; ctx->iaq_b.space = cpu_iasq_b;
@ -4635,8 +4646,9 @@ static void hppa_tr_init_disas_context(DisasContextBase *dcbase, CPUState *cs)
} else if (unlikely(cs_base & CS_BASE_DIFFPAGE)) { } else if (unlikely(cs_base & CS_BASE_DIFFPAGE)) {
ctx->iaq_b.base = cpu_iaoq_b; ctx->iaq_b.base = cpu_iaoq_b;
} else { } else {
iaoq_b = (iaoq_f & TARGET_PAGE_MASK) | (cs_base & ~TARGET_PAGE_MASK); uint64_t iaoq_f_pgofs = ctx->iaoq_first & ~TARGET_PAGE_MASK;
ctx->iaq_b.disp = iaoq_b - iaoq_f; uint64_t iaoq_b_pgofs = cs_base & ~TARGET_PAGE_MASK;
ctx->iaq_b.disp = iaoq_b_pgofs - iaoq_f_pgofs;
} }
ctx->zero = tcg_constant_i64(0); ctx->zero = tcg_constant_i64(0);
@ -4663,11 +4675,23 @@ static void hppa_tr_tb_start(DisasContextBase *dcbase, CPUState *cs)
static void hppa_tr_insn_start(DisasContextBase *dcbase, CPUState *cs) static void hppa_tr_insn_start(DisasContextBase *dcbase, CPUState *cs)
{ {
DisasContext *ctx = container_of(dcbase, DisasContext, base); DisasContext *ctx = container_of(dcbase, DisasContext, base);
uint64_t iaoq_f, iaoq_b;
int64_t diff;
tcg_debug_assert(!iaqe_variable(&ctx->iaq_f)); tcg_debug_assert(!iaqe_variable(&ctx->iaq_f));
tcg_gen_insn_start(ctx->iaoq_first + ctx->iaq_f.disp,
(iaqe_variable(&ctx->iaq_b) ? -1 : iaoq_f = ctx->iaoq_first + ctx->iaq_f.disp;
ctx->iaoq_first + ctx->iaq_b.disp), 0); if (iaqe_variable(&ctx->iaq_b)) {
diff = INT32_MIN;
} else {
iaoq_b = ctx->iaoq_first + ctx->iaq_b.disp;
diff = iaoq_b - iaoq_f;
/* Direct branches can only produce a 24-bit displacement. */
tcg_debug_assert(diff == (int32_t)diff);
tcg_debug_assert(diff != INT32_MIN);
}
tcg_gen_insn_start(iaoq_f & ~TARGET_PAGE_MASK, diff, 0);
ctx->insn_start_updated = false; ctx->insn_start_updated = false;
} }