#include #include #include #define FFLAG_NX_SHIFT 0 /* inexact */ #define FFLAG_UF_SHIFT 1 /* underflow */ #define FFLAG_OF_SHIFT 2 /* overflow */ #define FFLAG_DZ_SHIFT 3 /* divide by zero */ #define FFLAG_NV_SHIFT 4 /* invalid operation */ #define FFLAG_NV (1UL << FFLAG_NV_SHIFT) #define FFLAG_DZ (1UL << FFLAG_DZ_SHIFT) #define FFLAG_OF (1UL << FFLAG_OF_SHIFT) #define FFLAG_UF (1UL << FFLAG_UF_SHIFT) #define FFLAG_NX (1UL << FFLAG_NX_SHIFT) typedef struct fp64_fcvt_fcvtmod_testcase { const char* name; union { uint64_t inp_lu; double inp_lf; }; uint64_t exp_fcvt; uint8_t exp_fcvt_fflags; uint64_t exp_fcvtmod; uint8_t exp_fcvtmod_fflags; } fp64_fcvt_fcvtmod_testcase_t; void print_fflags(uint8_t fflags) { int set = 0; if (fflags == 0) { printf("-"); return; } if (fflags & FFLAG_NV) { printf("%sFFLAG_NV", set ? " | " : ""); set = 1; } if (fflags & FFLAG_DZ) { printf("%sFFLAG_DZ", set ? " | " : ""); set = 1; } if (fflags & FFLAG_OF) { printf("%sFFLAG_OF", set ? " | " : ""); set = 1; } if (fflags & FFLAG_UF) { printf("%sFFLAG_UF", set ? " | " : ""); set = 1; } if (fflags & FFLAG_NX) { printf("%sFFLAG_NX", set ? " | " : ""); set = 1; } } /* Clear all FP flags. */ static inline void clear_fflags() { __asm__ __volatile__("fsflags zero"); } /* Read all FP flags. */ static inline uint8_t get_fflags() { uint64_t v; __asm__ __volatile__("frflags %0" : "=r"(v)); return (uint8_t)v; } /* Move input value (without conversations) into an FP register. */ static inline double do_fmv_d_x(uint64_t inp) { double fpr; __asm__ __volatile__("fmv.d.x %0, %1" : "=f"(fpr) : "r"(inp)); return fpr; } static inline uint64_t do_fcvt_w_d(uint64_t inp, uint8_t *fflags) { uint64_t ret; double fpr = do_fmv_d_x(inp); clear_fflags(); __asm__ __volatile__("fcvt.w.d %0, %1, rtz" : "=r"(ret) : "f"(fpr)); *fflags = get_fflags(); return ret; } static inline uint64_t do_fcvtmod_w_d(uint64_t inp, uint8_t *fflags) { uint64_t ret; double fpr = do_fmv_d_x(inp); clear_fflags(); /* fcvtmod.w.d rd, rs1, rtz = 1100001 01000 rs1 001 rd 1010011 */ asm(".insn r 0x53, 0x1, 0x61, %0, %1, f8" : "=r"(ret) : "f"(fpr)); *fflags = get_fflags(); return ret; } static const fp64_fcvt_fcvtmod_testcase_t tests[] = { /* Zero (exp=0, frac=0) */ { .name = "+0.0", .inp_lf = 0x0p0, .exp_fcvt = 0x0000000000000000, .exp_fcvt_fflags = 0, .exp_fcvtmod = 0x0000000000000000, .exp_fcvtmod_fflags = 0 }, { .name = "-0.0", .inp_lf = -0x0p0, .exp_fcvt = 0x0000000000000000, .exp_fcvt_fflags = 0, .exp_fcvtmod = 0x0000000000000000, .exp_fcvtmod_fflags = 0 }, /* Subnormal: exp=0 frac!=0 */ { .name = "Subnormal frac=1", .inp_lu = 0x0000000000000001, .exp_fcvt = 0x0000000000000000, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "Subnormal frac=0xf..f", .inp_lu = 0x0000ffffffffffff, .exp_fcvt = 0x0000000000000000, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "Neg subnormal frac=1", .inp_lu = 0x0000000000000001, .exp_fcvt = 0x0000000000000000, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "Neg subnormal frac=0xf..f", .inp_lu = 0x8000ffffffffffff, .exp_fcvt = 0x0000000000000000, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, /* Infinity: exp=0x7ff, frac=0 */ { .name = "+INF", .inp_lu = 0x7ff0000000000000, .exp_fcvt = 0x000000007fffffff, /* int32 max */ .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NV }, { .name = "-INF", .inp_lu = 0xfff0000000000000, .exp_fcvt = 0xffffffff80000000, /* int32 min */ .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NV }, /* NaN: exp=7ff, frac!=0 */ { .name = "canonical NaN", .inp_lu = 0x7ff8000000000000, .exp_fcvt = 0x000000007fffffff, /* int32 max */ .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NV }, { .name = "non-canonical NaN", .inp_lu = 0x7ff8000000100000, .exp_fcvt = 0x000000007fffffff, /* int32 min */ .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NV }, /* Normal numbers: exp!=0, exp!=7ff */ { .name = "+smallest normal value", .inp_lu = 0x0010000000000000, .exp_fcvt = 0, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "-smallest normal value", .inp_lu = 0x8010000000000000, .exp_fcvt = 0, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "+0.5", .inp_lf = 0x1p-1, .exp_fcvt = 0, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "-0.5", .inp_lf = -0x1p-1, .exp_fcvt = 0, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "+value just below 1.0", .inp_lu = 0x3fefffffffffffff, .exp_fcvt = 0, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "-value just above -1.0", .inp_lu = 0xbfefffffffffffff, .exp_fcvt = 0, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "+1.0", .inp_lf = 0x1p0, .exp_fcvt = 0x0000000000000001, .exp_fcvt_fflags = 0, .exp_fcvtmod = 0x0000000000000001, .exp_fcvtmod_fflags = 0 }, { .name = "-1.0", .inp_lf = -0x1p0, .exp_fcvt = 0xffffffffffffffff, .exp_fcvt_fflags = 0, .exp_fcvtmod = 0xffffffffffffffff, .exp_fcvtmod_fflags = 0 }, { .name = "+1.5", .inp_lu = 0x3ff8000000000000, .exp_fcvt = 1, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 1, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "-1.5", .inp_lu = 0xbff8000000000000, .exp_fcvt = 0xffffffffffffffff, .exp_fcvt_fflags = FFLAG_NX, .exp_fcvtmod = 0xffffffffffffffff, .exp_fcvtmod_fflags = FFLAG_NX }, { .name = "+max int32 (2147483647)", .inp_lu = 0x41dfffffffc00000, .exp_fcvt = 0x000000007fffffff, .exp_fcvt_fflags = 0, .exp_fcvtmod = 0x000000007fffffff, .exp_fcvtmod_fflags = 0 }, { .name = "+max int32 +1 (2147483648)", .inp_lf = 0x1p31, .exp_fcvt = 0x000000007fffffff, .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = (uint64_t)-2147483648l, /* int32 min */ .exp_fcvtmod_fflags = FFLAG_NV }, { .name = "+max int32 +2 (2147483649)", .inp_lu = 0x41e0000000200000, .exp_fcvt = 0x000000007fffffff, .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = (uint64_t)-2147483647l, /* int32 min +1 */ .exp_fcvtmod_fflags = FFLAG_NV }, { .name = "-max int32 (-2147483648)", .inp_lf = -0x1p31, .exp_fcvt = 0xffffffff80000000, .exp_fcvt_fflags = 0, .exp_fcvtmod = 0xffffffff80000000, .exp_fcvtmod_fflags = 0 }, { .name = "-max int32 -1 (-2147483649)", .inp_lf = -0x1.00000002p+31, .exp_fcvt = 0xffffffff80000000, .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = 2147483647, /* int32 max */ .exp_fcvtmod_fflags = FFLAG_NV }, { .name = "-max int32 -2 (-2147483650)", .inp_lf = -0x1.00000004p+31, .exp_fcvt = 0xffffffff80000000, .exp_fcvt_fflags = FFLAG_NV, .exp_fcvtmod = 2147483646, /* int32 max -1 */ .exp_fcvtmod_fflags = FFLAG_NV }, }; int run_fcvtmod_tests() { uint64_t act_fcvt; uint8_t act_fcvt_fflags; uint64_t act_fcvtmod; uint8_t act_fcvtmod_fflags; for (size_t i = 0; i < sizeof(tests)/sizeof(tests[0]); i++) { const fp64_fcvt_fcvtmod_testcase_t *t = &tests[i]; act_fcvt = do_fcvt_w_d(t->inp_lu, &act_fcvt_fflags); int fcvt_correct = act_fcvt == t->exp_fcvt && act_fcvt_fflags == t->exp_fcvt_fflags; act_fcvtmod = do_fcvtmod_w_d(t->inp_lu, &act_fcvtmod_fflags); int fcvtmod_correct = act_fcvtmod == t->exp_fcvtmod && act_fcvtmod_fflags == t->exp_fcvtmod_fflags; if (fcvt_correct && fcvtmod_correct) { continue; } printf("Test %zu (%s) failed!\n", i, t->name); double fpr = do_fmv_d_x(t->inp_lu); printf("inp_lu: 0x%016lx == %lf\n", t->inp_lu, fpr); printf("inp_lf: %lf\n", t->inp_lf); uint32_t sign = (t->inp_lu >> 63); uint32_t exp = (uint32_t)(t->inp_lu >> 52) & 0x7ff; uint64_t frac = t->inp_lu & 0xfffffffffffffull; /* significand */ int true_exp = exp - 1023; int shift = true_exp - 52; uint64_t true_frac = frac | 1ull << 52; printf("sign=%d, exp=0x%03x, frac=0x%012lx\n", sign, exp, frac); printf("true_exp=%d, shift=%d, true_frac=0x%016lx\n", true_exp, shift, true_frac); if (!fcvt_correct) { printf("act_fcvt: 0x%016lx == %li\n", act_fcvt, act_fcvt); printf("exp_fcvt: 0x%016lx == %li\n", t->exp_fcvt, t->exp_fcvt); printf("act_fcvt_fflags: "); print_fflags(act_fcvt_fflags); printf("\n"); printf("exp_fcvt_fflags: "); print_fflags(t->exp_fcvt_fflags); printf("\n"); } if (!fcvtmod_correct) { printf("act_fcvtmod: 0x%016lx == %li\n", act_fcvtmod, act_fcvtmod); printf("exp_fcvtmod: 0x%016lx == %li\n", t->exp_fcvtmod, t->exp_fcvtmod); printf("act_fcvtmod_fflags: "); print_fflags(act_fcvtmod_fflags); printf("\n"); printf("exp_fcvtmod_fflags: "); print_fflags(t->exp_fcvtmod_fflags); printf("\n"); } return 1; } return 0; } int main() { return run_fcvtmod_tests(); }