target/sparc: Fix FMUL8x16A{U,L}
These instructions have f32 inputs, which changes the decode
of the register numbers. While we're fixing things, use a
common helper for both insns, extracting the 16-bit scalar
in tcg beforehand.
Signed-off-by: Richard Henderson <richard.henderson@linaro.org>
Reviewed-by: Philippe Mathieu-Daudé <philmd@linaro.org>
Message-Id: <20240502165528.244004-5-richard.henderson@linaro.org>
Signed-off-by: Mark Cave-Ayland <mark.cave-ayland@ilande.co.uk>
(cherry picked from commit a859602c74
)
Signed-off-by: Michael Tokarev <mjt@tls.msk.ru>
This commit is contained in:
parent
6d027e1bf9
commit
098f10e9a8
@ -96,8 +96,7 @@ DEF_HELPER_FLAGS_2(fqtox, TCG_CALL_NO_WG, s64, env, i128)
|
|||||||
|
|
||||||
DEF_HELPER_FLAGS_2(fpmerge, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
DEF_HELPER_FLAGS_2(fpmerge, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
||||||
DEF_HELPER_FLAGS_2(fmul8x16, TCG_CALL_NO_RWG_SE, i64, i32, i64)
|
DEF_HELPER_FLAGS_2(fmul8x16, TCG_CALL_NO_RWG_SE, i64, i32, i64)
|
||||||
DEF_HELPER_FLAGS_2(fmul8x16al, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
DEF_HELPER_FLAGS_2(fmul8x16a, TCG_CALL_NO_RWG_SE, i64, i32, s32)
|
||||||
DEF_HELPER_FLAGS_2(fmul8x16au, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
|
||||||
DEF_HELPER_FLAGS_2(fmul8sux16, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
DEF_HELPER_FLAGS_2(fmul8sux16, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
||||||
DEF_HELPER_FLAGS_2(fmul8ulx16, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
DEF_HELPER_FLAGS_2(fmul8ulx16, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
||||||
DEF_HELPER_FLAGS_2(fmuld8sux16, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
DEF_HELPER_FLAGS_2(fmuld8sux16, TCG_CALL_NO_RWG_SE, i64, i64, i64)
|
||||||
|
@ -45,6 +45,7 @@
|
|||||||
# define gen_helper_clear_softint(E, S) qemu_build_not_reached()
|
# define gen_helper_clear_softint(E, S) qemu_build_not_reached()
|
||||||
# define gen_helper_done(E) qemu_build_not_reached()
|
# define gen_helper_done(E) qemu_build_not_reached()
|
||||||
# define gen_helper_flushw(E) qemu_build_not_reached()
|
# define gen_helper_flushw(E) qemu_build_not_reached()
|
||||||
|
# define gen_helper_fmul8x16a(D, S1, S2) qemu_build_not_reached()
|
||||||
# define gen_helper_rdccr(D, E) qemu_build_not_reached()
|
# define gen_helper_rdccr(D, E) qemu_build_not_reached()
|
||||||
# define gen_helper_rdcwp(D, E) qemu_build_not_reached()
|
# define gen_helper_rdcwp(D, E) qemu_build_not_reached()
|
||||||
# define gen_helper_restored(E) qemu_build_not_reached()
|
# define gen_helper_restored(E) qemu_build_not_reached()
|
||||||
@ -72,8 +73,6 @@
|
|||||||
# define gen_helper_fexpand ({ qemu_build_not_reached(); NULL; })
|
# define gen_helper_fexpand ({ qemu_build_not_reached(); NULL; })
|
||||||
# define gen_helper_fmul8sux16 ({ qemu_build_not_reached(); NULL; })
|
# define gen_helper_fmul8sux16 ({ qemu_build_not_reached(); NULL; })
|
||||||
# define gen_helper_fmul8ulx16 ({ qemu_build_not_reached(); NULL; })
|
# define gen_helper_fmul8ulx16 ({ qemu_build_not_reached(); NULL; })
|
||||||
# define gen_helper_fmul8x16al ({ qemu_build_not_reached(); NULL; })
|
|
||||||
# define gen_helper_fmul8x16au ({ qemu_build_not_reached(); NULL; })
|
|
||||||
# define gen_helper_fmul8x16 ({ qemu_build_not_reached(); NULL; })
|
# define gen_helper_fmul8x16 ({ qemu_build_not_reached(); NULL; })
|
||||||
# define gen_helper_fmuld8sux16 ({ qemu_build_not_reached(); NULL; })
|
# define gen_helper_fmuld8sux16 ({ qemu_build_not_reached(); NULL; })
|
||||||
# define gen_helper_fmuld8ulx16 ({ qemu_build_not_reached(); NULL; })
|
# define gen_helper_fmuld8ulx16 ({ qemu_build_not_reached(); NULL; })
|
||||||
@ -719,6 +718,18 @@ static void gen_op_bshuffle(TCGv_i64 dst, TCGv_i64 src1, TCGv_i64 src2)
|
|||||||
#endif
|
#endif
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static void gen_op_fmul8x16al(TCGv_i64 dst, TCGv_i32 src1, TCGv_i32 src2)
|
||||||
|
{
|
||||||
|
tcg_gen_ext16s_i32(src2, src2);
|
||||||
|
gen_helper_fmul8x16a(dst, src1, src2);
|
||||||
|
}
|
||||||
|
|
||||||
|
static void gen_op_fmul8x16au(TCGv_i64 dst, TCGv_i32 src1, TCGv_i32 src2)
|
||||||
|
{
|
||||||
|
tcg_gen_sari_i32(src2, src2, 16);
|
||||||
|
gen_helper_fmul8x16a(dst, src1, src2);
|
||||||
|
}
|
||||||
|
|
||||||
static void finishing_insn(DisasContext *dc)
|
static void finishing_insn(DisasContext *dc)
|
||||||
{
|
{
|
||||||
/*
|
/*
|
||||||
@ -4583,6 +4594,27 @@ TRANS(FSUBs, ALL, do_env_fff, a, gen_helper_fsubs)
|
|||||||
TRANS(FMULs, ALL, do_env_fff, a, gen_helper_fmuls)
|
TRANS(FMULs, ALL, do_env_fff, a, gen_helper_fmuls)
|
||||||
TRANS(FDIVs, ALL, do_env_fff, a, gen_helper_fdivs)
|
TRANS(FDIVs, ALL, do_env_fff, a, gen_helper_fdivs)
|
||||||
|
|
||||||
|
static bool do_dff(DisasContext *dc, arg_r_r_r *a,
|
||||||
|
void (*func)(TCGv_i64, TCGv_i32, TCGv_i32))
|
||||||
|
{
|
||||||
|
TCGv_i64 dst;
|
||||||
|
TCGv_i32 src1, src2;
|
||||||
|
|
||||||
|
if (gen_trap_ifnofpu(dc)) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
dst = gen_dest_fpr_D(dc, a->rd);
|
||||||
|
src1 = gen_load_fpr_F(dc, a->rs1);
|
||||||
|
src2 = gen_load_fpr_F(dc, a->rs2);
|
||||||
|
func(dst, src1, src2);
|
||||||
|
gen_store_fpr_D(dc, a->rd, dst);
|
||||||
|
return advance_pc(dc);
|
||||||
|
}
|
||||||
|
|
||||||
|
TRANS(FMUL8x16AU, VIS1, do_dff, a, gen_op_fmul8x16au)
|
||||||
|
TRANS(FMUL8x16AL, VIS1, do_dff, a, gen_op_fmul8x16al)
|
||||||
|
|
||||||
static bool do_dfd(DisasContext *dc, arg_r_r_r *a,
|
static bool do_dfd(DisasContext *dc, arg_r_r_r *a,
|
||||||
void (*func)(TCGv_i64, TCGv_i32, TCGv_i64))
|
void (*func)(TCGv_i64, TCGv_i32, TCGv_i64))
|
||||||
{
|
{
|
||||||
@ -4620,8 +4652,6 @@ static bool do_ddd(DisasContext *dc, arg_r_r_r *a,
|
|||||||
return advance_pc(dc);
|
return advance_pc(dc);
|
||||||
}
|
}
|
||||||
|
|
||||||
TRANS(FMUL8x16AU, VIS1, do_ddd, a, gen_helper_fmul8x16au)
|
|
||||||
TRANS(FMUL8x16AL, VIS1, do_ddd, a, gen_helper_fmul8x16al)
|
|
||||||
TRANS(FMUL8SUx16, VIS1, do_ddd, a, gen_helper_fmul8sux16)
|
TRANS(FMUL8SUx16, VIS1, do_ddd, a, gen_helper_fmul8sux16)
|
||||||
TRANS(FMUL8ULx16, VIS1, do_ddd, a, gen_helper_fmul8ulx16)
|
TRANS(FMUL8ULx16, VIS1, do_ddd, a, gen_helper_fmul8ulx16)
|
||||||
TRANS(FMULD8SUx16, VIS1, do_ddd, a, gen_helper_fmuld8sux16)
|
TRANS(FMULD8SUx16, VIS1, do_ddd, a, gen_helper_fmuld8sux16)
|
||||||
|
@ -119,44 +119,23 @@ uint64_t helper_fmul8x16(uint32_t src1, uint64_t src2)
|
|||||||
return d.ll;
|
return d.ll;
|
||||||
}
|
}
|
||||||
|
|
||||||
uint64_t helper_fmul8x16al(uint64_t src1, uint64_t src2)
|
uint64_t helper_fmul8x16a(uint32_t src1, int32_t src2)
|
||||||
{
|
{
|
||||||
VIS64 s, d;
|
VIS32 s;
|
||||||
|
VIS64 d;
|
||||||
uint32_t tmp;
|
uint32_t tmp;
|
||||||
|
|
||||||
s.ll = src1;
|
s.l = src1;
|
||||||
d.ll = src2;
|
d.ll = 0;
|
||||||
|
|
||||||
#define PMUL(r) \
|
#define PMUL(r) \
|
||||||
tmp = (int32_t)d.VIS_SW64(1) * (int32_t)s.VIS_B64(r); \
|
do { \
|
||||||
if ((tmp & 0xff) > 0x7f) { \
|
tmp = src2 * (int32_t)s.VIS_B32(r); \
|
||||||
tmp += 0x100; \
|
if ((tmp & 0xff) > 0x7f) { \
|
||||||
} \
|
tmp += 0x100; \
|
||||||
d.VIS_W64(r) = tmp >> 8;
|
} \
|
||||||
|
d.VIS_W64(r) = tmp >> 8; \
|
||||||
PMUL(0);
|
} while (0)
|
||||||
PMUL(1);
|
|
||||||
PMUL(2);
|
|
||||||
PMUL(3);
|
|
||||||
#undef PMUL
|
|
||||||
|
|
||||||
return d.ll;
|
|
||||||
}
|
|
||||||
|
|
||||||
uint64_t helper_fmul8x16au(uint64_t src1, uint64_t src2)
|
|
||||||
{
|
|
||||||
VIS64 s, d;
|
|
||||||
uint32_t tmp;
|
|
||||||
|
|
||||||
s.ll = src1;
|
|
||||||
d.ll = src2;
|
|
||||||
|
|
||||||
#define PMUL(r) \
|
|
||||||
tmp = (int32_t)d.VIS_SW64(0) * (int32_t)s.VIS_B64(r); \
|
|
||||||
if ((tmp & 0xff) > 0x7f) { \
|
|
||||||
tmp += 0x100; \
|
|
||||||
} \
|
|
||||||
d.VIS_W64(r) = tmp >> 8;
|
|
||||||
|
|
||||||
PMUL(0);
|
PMUL(0);
|
||||||
PMUL(1);
|
PMUL(1);
|
||||||
|
Loading…
Reference in New Issue
Block a user