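/*
 * Test program that runs the RISC-V fcvt.w.d (static rounding mode rtz) and
 * fcvtmod.w.d instructions over a table of double-precision inputs and
 * compares the integer results and FP exception flags with expected values.
 */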
#include <inttypes.h>
#include <stddef.h>
#include <stdint.h>
#include <stdio.h>

/* Bit positions of the individual FP exception flags. */
#define FFLAG_NX_SHIFT 0 /* inexact */
#define FFLAG_UF_SHIFT 1 /* underflow */
#define FFLAG_OF_SHIFT 2 /* overflow */
#define FFLAG_DZ_SHIFT 3 /* divide by zero */
#define FFLAG_NV_SHIFT 4 /* invalid operation */

/* Single-bit masks derived from the bit positions above. */
#define FFLAG_NV (1UL << FFLAG_NV_SHIFT)
#define FFLAG_DZ (1UL << FFLAG_DZ_SHIFT)
#define FFLAG_OF (1UL << FFLAG_OF_SHIFT)
#define FFLAG_UF (1UL << FFLAG_UF_SHIFT)
#define FFLAG_NX (1UL << FFLAG_NX_SHIFT)

/*
 * One test vector: a double-precision input together with the expected
 * result and expected FP flags for both fcvt.w.d and fcvtmod.w.d.
 */
typedef struct fp64_fcvt_fcvtmod_testcase {
    const char *name;            /* human-readable label used in failure output */
    union {
        uint64_t inp_lu;         /* input given as a raw 64-bit pattern */
        double inp_lf;           /* the same storage viewed as a double */
    };
    uint64_t exp_fcvt;           /* expected fcvt.w.d result */
    uint8_t exp_fcvt_fflags;     /* expected FFLAG_* mask after fcvt.w.d */
    uint64_t exp_fcvtmod;        /* expected fcvtmod.w.d result */
    uint8_t exp_fcvtmod_fflags;  /* expected FFLAG_* mask after fcvtmod.w.d */
} fp64_fcvt_fcvtmod_testcase_t;

void print_fflags(uint8_t fflags)
|
||
|
{
|
||
|
int set = 0;
|
||
|
|
||
|
if (fflags == 0) {
|
||
|
printf("-");
|
||
|
return;
|
||
|
}
|
||
|
|
||
|
if (fflags & FFLAG_NV) {
|
||
|
printf("%sFFLAG_NV", set ? " | " : "");
|
||
|
set = 1;
|
||
|
}
|
||
|
if (fflags & FFLAG_DZ) {
|
||
|
printf("%sFFLAG_DZ", set ? " | " : "");
|
||
|
set = 1;
|
||
|
}
|
||
|
if (fflags & FFLAG_OF) {
|
||
|
printf("%sFFLAG_OF", set ? " | " : "");
|
||
|
set = 1;
|
||
|
}
|
||
|
if (fflags & FFLAG_UF) {
|
||
|
printf("%sFFLAG_UF", set ? " | " : "");
|
||
|
set = 1;
|
||
|
}
|
||
|
if (fflags & FFLAG_NX) {
|
||
|
printf("%sFFLAG_NX", set ? " | " : "");
|
||
|
set = 1;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* Clear all FP flags by writing the zero register to fflags. */
static inline void clear_fflags(void)
{
    __asm__ __volatile__("fsflags zero");
}

/*
 * Read all FP flags.
 *
 * The value is read into a 64-bit integer register with frflags and then
 * truncated to its low 8 bits for the return value.
 */
static inline uint8_t get_fflags(void)
{
    uint64_t raw;

    __asm__ __volatile__("frflags %0" : "=r"(raw));
    return (uint8_t)raw;
}

/*
 * Move the input value (without conversion) from an integer register into
 * an FP register using fmv.d.x, and return it as a double.
 */
static inline double do_fmv_d_x(uint64_t inp)
{
    double fpr;

    __asm__ __volatile__("fmv.d.x %0, %1" : "=f"(fpr) : "r"(inp));
    return fpr;
}

/*
 * Execute fcvt.w.d with static rounding mode rtz on the double whose raw
 * bit pattern is inp.
 *
 * inp:    raw 64-bit pattern of the double-precision input.
 * fflags: out parameter; receives the FP flags read right after the
 *         conversion.  The flags are cleared just before the conversion.
 *
 * Returns the contents of the integer destination register.
 */
static inline uint64_t do_fcvt_w_d(uint64_t inp, uint8_t *fflags)
{
    uint64_t ret;
    /* Load the operand first so only the conversion runs between clear and read. */
    double fpr = do_fmv_d_x(inp);

    clear_fflags();
    __asm__ __volatile__("fcvt.w.d %0, %1, rtz" : "=r"(ret) : "f"(fpr));
    *fflags = get_fflags();

    return ret;
}

/*
 * Execute fcvtmod.w.d (rtz) on the double whose raw bit pattern is inp.
 *
 * inp:    raw 64-bit pattern of the double-precision input.
 * fflags: out parameter; receives the FP flags read right after the
 *         conversion.  The flags are cleared just before the conversion.
 *
 * Returns the contents of the integer destination register.
 */
static inline uint64_t do_fcvtmod_w_d(uint64_t inp, uint8_t *fflags)
{
    uint64_t ret;
    /* Load the operand first so only the conversion runs between clear and read. */
    double fpr = do_fmv_d_x(inp);

    clear_fflags();

    /*
     * fcvtmod.w.d rd, rs1, rtz = 1100001 01000 rs1 001 rd 1010011
     *
     * The instruction is emitted with .insn; the rs2 field is written as f8
     * to produce the fixed 01000 bits of the encoding.
     *
     * The statement must be volatile: the instruction's effect on the FP
     * flags is not expressed in its operands, so a non-volatile asm could be
     * moved by the compiler to before clear_fflags() or after get_fflags().
     */
    __asm__ __volatile__(".insn r 0x53, 0x1, 0x61, %0, %1, f8"
                         : "=r"(ret)
                         : "f"(fpr));

    *fflags = get_fflags();

    return ret;
}

static const fp64_fcvt_fcvtmod_testcase_t tests[] = {
|
||
|
/* Zero (exp=0, frac=0) */
|
||
|
{ .name = "+0.0",
|
||
|
.inp_lf = 0x0p0,
|
||
|
.exp_fcvt = 0x0000000000000000,
|
||
|
.exp_fcvt_fflags = 0,
|
||
|
.exp_fcvtmod = 0x0000000000000000,
|
||
|
.exp_fcvtmod_fflags = 0 },
|
||
|
{ .name = "-0.0",
|
||
|
.inp_lf = -0x0p0,
|
||
|
.exp_fcvt = 0x0000000000000000,
|
||
|
.exp_fcvt_fflags = 0,
|
||
|
.exp_fcvtmod = 0x0000000000000000,
|
||
|
.exp_fcvtmod_fflags = 0 },
|
||
|
|
||
|
/* Subnormal: exp=0 frac!=0 */
|
||
|
{ .name = "Subnormal frac=1",
|
||
|
.inp_lu = 0x0000000000000001,
|
||
|
.exp_fcvt = 0x0000000000000000,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "Subnormal frac=0xf..f",
|
||
|
.inp_lu = 0x0000ffffffffffff,
|
||
|
.exp_fcvt = 0x0000000000000000,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "Neg subnormal frac=1",
|
||
|
.inp_lu = 0x0000000000000001,
|
||
|
.exp_fcvt = 0x0000000000000000,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "Neg subnormal frac=0xf..f",
|
||
|
.inp_lu = 0x8000ffffffffffff,
|
||
|
.exp_fcvt = 0x0000000000000000,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
|
||
|
/* Infinity: exp=0x7ff, frac=0 */
|
||
|
{ .name = "+INF",
|
||
|
.inp_lu = 0x7ff0000000000000,
|
||
|
.exp_fcvt = 0x000000007fffffff, /* int32 max */
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
{ .name = "-INF",
|
||
|
.inp_lu = 0xfff0000000000000,
|
||
|
.exp_fcvt = 0xffffffff80000000, /* int32 min */
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
|
||
|
/* NaN: exp=7ff, frac!=0 */
|
||
|
{ .name = "canonical NaN",
|
||
|
.inp_lu = 0x7ff8000000000000,
|
||
|
.exp_fcvt = 0x000000007fffffff, /* int32 max */
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
{ .name = "non-canonical NaN",
|
||
|
.inp_lu = 0x7ff8000000100000,
|
||
|
.exp_fcvt = 0x000000007fffffff, /* int32 min */
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
|
||
|
/* Normal numbers: exp!=0, exp!=7ff */
|
||
|
{ .name = "+smallest normal value",
|
||
|
.inp_lu = 0x0010000000000000,
|
||
|
.exp_fcvt = 0,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "-smallest normal value",
|
||
|
.inp_lu = 0x8010000000000000,
|
||
|
.exp_fcvt = 0,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
|
||
|
{ .name = "+0.5",
|
||
|
.inp_lf = 0x1p-1,
|
||
|
.exp_fcvt = 0,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "-0.5",
|
||
|
.inp_lf = -0x1p-1,
|
||
|
.exp_fcvt = 0,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
|
||
|
{ .name = "+value just below 1.0",
|
||
|
.inp_lu = 0x3fefffffffffffff,
|
||
|
.exp_fcvt = 0,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "-value just above -1.0",
|
||
|
.inp_lu = 0xbfefffffffffffff,
|
||
|
.exp_fcvt = 0,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
|
||
|
{ .name = "+1.0",
|
||
|
.inp_lf = 0x1p0,
|
||
|
.exp_fcvt = 0x0000000000000001,
|
||
|
.exp_fcvt_fflags = 0,
|
||
|
.exp_fcvtmod = 0x0000000000000001,
|
||
|
.exp_fcvtmod_fflags = 0 },
|
||
|
{ .name = "-1.0",
|
||
|
.inp_lf = -0x1p0,
|
||
|
.exp_fcvt = 0xffffffffffffffff,
|
||
|
.exp_fcvt_fflags = 0,
|
||
|
.exp_fcvtmod = 0xffffffffffffffff,
|
||
|
.exp_fcvtmod_fflags = 0 },
|
||
|
|
||
|
{ .name = "+1.5",
|
||
|
.inp_lu = 0x3ff8000000000000,
|
||
|
.exp_fcvt = 1,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 1,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
{ .name = "-1.5",
|
||
|
.inp_lu = 0xbff8000000000000,
|
||
|
.exp_fcvt = 0xffffffffffffffff,
|
||
|
.exp_fcvt_fflags = FFLAG_NX,
|
||
|
.exp_fcvtmod = 0xffffffffffffffff,
|
||
|
.exp_fcvtmod_fflags = FFLAG_NX },
|
||
|
|
||
|
{ .name = "+max int32 (2147483647)",
|
||
|
.inp_lu = 0x41dfffffffc00000,
|
||
|
.exp_fcvt = 0x000000007fffffff,
|
||
|
.exp_fcvt_fflags = 0,
|
||
|
.exp_fcvtmod = 0x000000007fffffff,
|
||
|
.exp_fcvtmod_fflags = 0 },
|
||
|
{ .name = "+max int32 +1 (2147483648)",
|
||
|
.inp_lf = 0x1p31,
|
||
|
.exp_fcvt = 0x000000007fffffff,
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = (uint64_t)-2147483648l, /* int32 min */
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
{ .name = "+max int32 +2 (2147483649)",
|
||
|
.inp_lu = 0x41e0000000200000,
|
||
|
.exp_fcvt = 0x000000007fffffff,
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = (uint64_t)-2147483647l, /* int32 min +1 */
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
|
||
|
{ .name = "-max int32 (-2147483648)",
|
||
|
.inp_lf = -0x1p31,
|
||
|
.exp_fcvt = 0xffffffff80000000,
|
||
|
.exp_fcvt_fflags = 0,
|
||
|
.exp_fcvtmod = 0xffffffff80000000,
|
||
|
.exp_fcvtmod_fflags = 0 },
|
||
|
{ .name = "-max int32 -1 (-2147483649)",
|
||
|
.inp_lf = -0x1.00000002p+31,
|
||
|
.exp_fcvt = 0xffffffff80000000,
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = 2147483647, /* int32 max */
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
{ .name = "-max int32 -2 (-2147483650)",
|
||
|
.inp_lf = -0x1.00000004p+31,
|
||
|
.exp_fcvt = 0xffffffff80000000,
|
||
|
.exp_fcvt_fflags = FFLAG_NV,
|
||
|
.exp_fcvtmod = 2147483646, /* int32 max -1 */
|
||
|
.exp_fcvtmod_fflags = FFLAG_NV },
|
||
|
};
|
||
|
|
||
|
int run_fcvtmod_tests()
|
||
|
{
|
||
|
uint64_t act_fcvt;
|
||
|
uint8_t act_fcvt_fflags;
|
||
|
uint64_t act_fcvtmod;
|
||
|
uint8_t act_fcvtmod_fflags;
|
||
|
|
||
|
for (size_t i = 0; i < sizeof(tests)/sizeof(tests[0]); i++) {
|
||
|
const fp64_fcvt_fcvtmod_testcase_t *t = &tests[i];
|
||
|
|
||
|
act_fcvt = do_fcvt_w_d(t->inp_lu, &act_fcvt_fflags);
|
||
|
int fcvt_correct = act_fcvt == t->exp_fcvt &&
|
||
|
act_fcvt_fflags == t->exp_fcvt_fflags;
|
||
|
act_fcvtmod = do_fcvtmod_w_d(t->inp_lu, &act_fcvtmod_fflags);
|
||
|
int fcvtmod_correct = act_fcvtmod == t->exp_fcvtmod &&
|
||
|
act_fcvtmod_fflags == t->exp_fcvtmod_fflags;
|
||
|
|
||
|
if (fcvt_correct && fcvtmod_correct) {
|
||
|
continue;
|
||
|
}
|
||
|
|
||
|
printf("Test %zu (%s) failed!\n", i, t->name);
|
||
|
|
||
|
double fpr = do_fmv_d_x(t->inp_lu);
|
||
|
printf("inp_lu: 0x%016lx == %lf\n", t->inp_lu, fpr);
|
||
|
printf("inp_lf: %lf\n", t->inp_lf);
|
||
|
|
||
|
uint32_t sign = (t->inp_lu >> 63);
|
||
|
uint32_t exp = (uint32_t)(t->inp_lu >> 52) & 0x7ff;
|
||
|
uint64_t frac = t->inp_lu & 0xfffffffffffffull; /* significand */
|
||
|
int true_exp = exp - 1023;
|
||
|
int shift = true_exp - 52;
|
||
|
uint64_t true_frac = frac | 1ull << 52;
|
||
|
|
||
|
printf("sign=%d, exp=0x%03x, frac=0x%012lx\n", sign, exp, frac);
|
||
|
printf("true_exp=%d, shift=%d, true_frac=0x%016lx\n", true_exp, shift, true_frac);
|
||
|
|
||
|
if (!fcvt_correct) {
|
||
|
printf("act_fcvt: 0x%016lx == %li\n", act_fcvt, act_fcvt);
|
||
|
printf("exp_fcvt: 0x%016lx == %li\n", t->exp_fcvt, t->exp_fcvt);
|
||
|
printf("act_fcvt_fflags: "); print_fflags(act_fcvt_fflags); printf("\n");
|
||
|
printf("exp_fcvt_fflags: "); print_fflags(t->exp_fcvt_fflags); printf("\n");
|
||
|
}
|
||
|
|
||
|
if (!fcvtmod_correct) {
|
||
|
printf("act_fcvtmod: 0x%016lx == %li\n", act_fcvtmod, act_fcvtmod);
|
||
|
printf("exp_fcvtmod: 0x%016lx == %li\n", t->exp_fcvtmod, t->exp_fcvtmod);
|
||
|
printf("act_fcvtmod_fflags: "); print_fflags(act_fcvtmod_fflags); printf("\n");
|
||
|
printf("exp_fcvtmod_fflags: "); print_fflags(t->exp_fcvtmod_fflags); printf("\n");
|
||
|
}
|
||
|
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
/* Program entry point: the exit status is the result of run_fcvtmod_tests(). */
int main(void)
{
    return run_fcvtmod_tests();
}