| #include <stdio.h> |
| #include <stddef.h> |
| #include <stdint.h> |
| |
| #define FFLAG_NX_SHIFT 0 /* inexact */ |
| #define FFLAG_UF_SHIFT 1 /* underflow */ |
| #define FFLAG_OF_SHIFT 2 /* overflow */ |
| #define FFLAG_DZ_SHIFT 3 /* divide by zero */ |
| #define FFLAG_NV_SHIFT 4 /* invalid operation */ |
| |
| #define FFLAG_NV (1UL << FFLAG_NV_SHIFT) |
| #define FFLAG_DZ (1UL << FFLAG_DZ_SHIFT) |
| #define FFLAG_OF (1UL << FFLAG_OF_SHIFT) |
| #define FFLAG_UF (1UL << FFLAG_UF_SHIFT) |
| #define FFLAG_NX (1UL << FFLAG_NX_SHIFT) |
| |
| typedef struct fp64_fcvt_fcvtmod_testcase { |
| const char* name; |
| union { |
| uint64_t inp_lu; |
| double inp_lf; |
| }; |
| uint64_t exp_fcvt; |
| uint8_t exp_fcvt_fflags; |
| uint64_t exp_fcvtmod; |
| uint8_t exp_fcvtmod_fflags; |
| } fp64_fcvt_fcvtmod_testcase_t; |
| |
| void print_fflags(uint8_t fflags) |
| { |
| int set = 0; |
| |
| if (fflags == 0) { |
| printf("-"); |
| return; |
| } |
| |
| if (fflags & FFLAG_NV) { |
| printf("%sFFLAG_NV", set ? " | " : ""); |
| set = 1; |
| } |
| if (fflags & FFLAG_DZ) { |
| printf("%sFFLAG_DZ", set ? " | " : ""); |
| set = 1; |
| } |
| if (fflags & FFLAG_OF) { |
| printf("%sFFLAG_OF", set ? " | " : ""); |
| set = 1; |
| } |
| if (fflags & FFLAG_UF) { |
| printf("%sFFLAG_UF", set ? " | " : ""); |
| set = 1; |
| } |
| if (fflags & FFLAG_NX) { |
| printf("%sFFLAG_NX", set ? " | " : ""); |
| set = 1; |
| } |
| } |
| |
| /* Clear all FP flags. */ |
| static inline void clear_fflags() |
| { |
| __asm__ __volatile__("fsflags zero"); |
| } |
| |
| /* Read all FP flags. */ |
| static inline uint8_t get_fflags() |
| { |
| uint64_t v; |
| __asm__ __volatile__("frflags %0" : "=r"(v)); |
| return (uint8_t)v; |
| } |
| |
| /* Move input value (without conversations) into an FP register. */ |
| static inline double do_fmv_d_x(uint64_t inp) |
| { |
| double fpr; |
| __asm__ __volatile__("fmv.d.x %0, %1" : "=f"(fpr) : "r"(inp)); |
| return fpr; |
| } |
| |
| static inline uint64_t do_fcvt_w_d(uint64_t inp, uint8_t *fflags) |
| { |
| uint64_t ret; |
| double fpr = do_fmv_d_x(inp); |
| |
| clear_fflags(); |
| |
| __asm__ __volatile__("fcvt.w.d %0, %1, rtz" : "=r"(ret) : "f"(fpr)); |
| |
| *fflags = get_fflags(); |
| |
| return ret; |
| } |
| |
| static inline uint64_t do_fcvtmod_w_d(uint64_t inp, uint8_t *fflags) |
| { |
| uint64_t ret; |
| double fpr = do_fmv_d_x(inp); |
| |
| clear_fflags(); |
| |
| /* fcvtmod.w.d rd, rs1, rtz = 1100001 01000 rs1 001 rd 1010011 */ |
| asm(".insn r 0x53, 0x1, 0x61, %0, %1, f8" : "=r"(ret) : "f"(fpr)); |
| |
| *fflags = get_fflags(); |
| |
| return ret; |
| } |
| |
| static const fp64_fcvt_fcvtmod_testcase_t tests[] = { |
| /* Zero (exp=0, frac=0) */ |
| { .name = "+0.0", |
| .inp_lf = 0x0p0, |
| .exp_fcvt = 0x0000000000000000, |
| .exp_fcvt_fflags = 0, |
| .exp_fcvtmod = 0x0000000000000000, |
| .exp_fcvtmod_fflags = 0 }, |
| { .name = "-0.0", |
| .inp_lf = -0x0p0, |
| .exp_fcvt = 0x0000000000000000, |
| .exp_fcvt_fflags = 0, |
| .exp_fcvtmod = 0x0000000000000000, |
| .exp_fcvtmod_fflags = 0 }, |
| |
| /* Subnormal: exp=0 frac!=0 */ |
| { .name = "Subnormal frac=1", |
| .inp_lu = 0x0000000000000001, |
| .exp_fcvt = 0x0000000000000000, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "Subnormal frac=0xf..f", |
| .inp_lu = 0x0000ffffffffffff, |
| .exp_fcvt = 0x0000000000000000, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "Neg subnormal frac=1", |
| .inp_lu = 0x0000000000000001, |
| .exp_fcvt = 0x0000000000000000, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "Neg subnormal frac=0xf..f", |
| .inp_lu = 0x8000ffffffffffff, |
| .exp_fcvt = 0x0000000000000000, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| |
| /* Infinity: exp=0x7ff, frac=0 */ |
| { .name = "+INF", |
| .inp_lu = 0x7ff0000000000000, |
| .exp_fcvt = 0x000000007fffffff, /* int32 max */ |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| { .name = "-INF", |
| .inp_lu = 0xfff0000000000000, |
| .exp_fcvt = 0xffffffff80000000, /* int32 min */ |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| |
| /* NaN: exp=7ff, frac!=0 */ |
| { .name = "canonical NaN", |
| .inp_lu = 0x7ff8000000000000, |
| .exp_fcvt = 0x000000007fffffff, /* int32 max */ |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| { .name = "non-canonical NaN", |
| .inp_lu = 0x7ff8000000100000, |
| .exp_fcvt = 0x000000007fffffff, /* int32 min */ |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| |
| /* Normal numbers: exp!=0, exp!=7ff */ |
| { .name = "+smallest normal value", |
| .inp_lu = 0x0010000000000000, |
| .exp_fcvt = 0, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "-smallest normal value", |
| .inp_lu = 0x8010000000000000, |
| .exp_fcvt = 0, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| |
| { .name = "+0.5", |
| .inp_lf = 0x1p-1, |
| .exp_fcvt = 0, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "-0.5", |
| .inp_lf = -0x1p-1, |
| .exp_fcvt = 0, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| |
| { .name = "+value just below 1.0", |
| .inp_lu = 0x3fefffffffffffff, |
| .exp_fcvt = 0, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "-value just above -1.0", |
| .inp_lu = 0xbfefffffffffffff, |
| .exp_fcvt = 0, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| |
| { .name = "+1.0", |
| .inp_lf = 0x1p0, |
| .exp_fcvt = 0x0000000000000001, |
| .exp_fcvt_fflags = 0, |
| .exp_fcvtmod = 0x0000000000000001, |
| .exp_fcvtmod_fflags = 0 }, |
| { .name = "-1.0", |
| .inp_lf = -0x1p0, |
| .exp_fcvt = 0xffffffffffffffff, |
| .exp_fcvt_fflags = 0, |
| .exp_fcvtmod = 0xffffffffffffffff, |
| .exp_fcvtmod_fflags = 0 }, |
| |
| { .name = "+1.5", |
| .inp_lu = 0x3ff8000000000000, |
| .exp_fcvt = 1, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 1, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| { .name = "-1.5", |
| .inp_lu = 0xbff8000000000000, |
| .exp_fcvt = 0xffffffffffffffff, |
| .exp_fcvt_fflags = FFLAG_NX, |
| .exp_fcvtmod = 0xffffffffffffffff, |
| .exp_fcvtmod_fflags = FFLAG_NX }, |
| |
| { .name = "+max int32 (2147483647)", |
| .inp_lu = 0x41dfffffffc00000, |
| .exp_fcvt = 0x000000007fffffff, |
| .exp_fcvt_fflags = 0, |
| .exp_fcvtmod = 0x000000007fffffff, |
| .exp_fcvtmod_fflags = 0 }, |
| { .name = "+max int32 +1 (2147483648)", |
| .inp_lf = 0x1p31, |
| .exp_fcvt = 0x000000007fffffff, |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = (uint64_t)-2147483648l, /* int32 min */ |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| { .name = "+max int32 +2 (2147483649)", |
| .inp_lu = 0x41e0000000200000, |
| .exp_fcvt = 0x000000007fffffff, |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = (uint64_t)-2147483647l, /* int32 min +1 */ |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| |
| { .name = "-max int32 (-2147483648)", |
| .inp_lf = -0x1p31, |
| .exp_fcvt = 0xffffffff80000000, |
| .exp_fcvt_fflags = 0, |
| .exp_fcvtmod = 0xffffffff80000000, |
| .exp_fcvtmod_fflags = 0 }, |
| { .name = "-max int32 -1 (-2147483649)", |
| .inp_lf = -0x1.00000002p+31, |
| .exp_fcvt = 0xffffffff80000000, |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = 2147483647, /* int32 max */ |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| { .name = "-max int32 -2 (-2147483650)", |
| .inp_lf = -0x1.00000004p+31, |
| .exp_fcvt = 0xffffffff80000000, |
| .exp_fcvt_fflags = FFLAG_NV, |
| .exp_fcvtmod = 2147483646, /* int32 max -1 */ |
| .exp_fcvtmod_fflags = FFLAG_NV }, |
| }; |
| |
| int run_fcvtmod_tests() |
| { |
| uint64_t act_fcvt; |
| uint8_t act_fcvt_fflags; |
| uint64_t act_fcvtmod; |
| uint8_t act_fcvtmod_fflags; |
| |
| for (size_t i = 0; i < sizeof(tests)/sizeof(tests[0]); i++) { |
| const fp64_fcvt_fcvtmod_testcase_t *t = &tests[i]; |
| |
| act_fcvt = do_fcvt_w_d(t->inp_lu, &act_fcvt_fflags); |
| int fcvt_correct = act_fcvt == t->exp_fcvt && |
| act_fcvt_fflags == t->exp_fcvt_fflags; |
| act_fcvtmod = do_fcvtmod_w_d(t->inp_lu, &act_fcvtmod_fflags); |
| int fcvtmod_correct = act_fcvtmod == t->exp_fcvtmod && |
| act_fcvtmod_fflags == t->exp_fcvtmod_fflags; |
| |
| if (fcvt_correct && fcvtmod_correct) { |
| continue; |
| } |
| |
| printf("Test %zu (%s) failed!\n", i, t->name); |
| |
| double fpr = do_fmv_d_x(t->inp_lu); |
| printf("inp_lu: 0x%016lx == %lf\n", t->inp_lu, fpr); |
| printf("inp_lf: %lf\n", t->inp_lf); |
| |
| uint32_t sign = (t->inp_lu >> 63); |
| uint32_t exp = (uint32_t)(t->inp_lu >> 52) & 0x7ff; |
| uint64_t frac = t->inp_lu & 0xfffffffffffffull; /* significand */ |
| int true_exp = exp - 1023; |
| int shift = true_exp - 52; |
| uint64_t true_frac = frac | 1ull << 52; |
| |
| printf("sign=%d, exp=0x%03x, frac=0x%012lx\n", sign, exp, frac); |
| printf("true_exp=%d, shift=%d, true_frac=0x%016lx\n", true_exp, shift, true_frac); |
| |
| if (!fcvt_correct) { |
| printf("act_fcvt: 0x%016lx == %li\n", act_fcvt, act_fcvt); |
| printf("exp_fcvt: 0x%016lx == %li\n", t->exp_fcvt, t->exp_fcvt); |
| printf("act_fcvt_fflags: "); print_fflags(act_fcvt_fflags); printf("\n"); |
| printf("exp_fcvt_fflags: "); print_fflags(t->exp_fcvt_fflags); printf("\n"); |
| } |
| |
| if (!fcvtmod_correct) { |
| printf("act_fcvtmod: 0x%016lx == %li\n", act_fcvtmod, act_fcvtmod); |
| printf("exp_fcvtmod: 0x%016lx == %li\n", t->exp_fcvtmod, t->exp_fcvtmod); |
| printf("act_fcvtmod_fflags: "); print_fflags(act_fcvtmod_fflags); printf("\n"); |
| printf("exp_fcvtmod_fflags: "); print_fflags(t->exp_fcvtmod_fflags); printf("\n"); |
| } |
| |
| return 1; |
| } |
| |
| return 0; |
| } |
| |
| int main() |
| { |
| return run_fcvtmod_tests(); |
| } |