test-i386-fprem.c - qemu - FORK: QEMU emulator

test-i386-fprem.c (9669B)
      1 /*
      2  *  x86 FPREM test - executes the FPREM and FPREM1 instructions with corner case
      3  *  operands and prints the operands, result and FPU status word.
      4  *
      5  *  Run this on real hardware, then under QEMU, and diff the outputs, to compare
      6  *  QEMU's implementation to your hardware. The 'run-test-i386-fprem' make
      7  *  target does this.
      8  *
      9  *  Copyright (c) 2003 Fabrice Bellard
     10  *  Copyright (c) 2012 Catalin Patulea
     11  *
     12  *  This program is free software; you can redistribute it and/or modify
     13  *  it under the terms of the GNU General Public License as published by
     14  *  the Free Software Foundation; either version 2 of the License, or
     15  *  (at your option) any later version.
     16  *
     17  *  This program is distributed in the hope that it will be useful,
     18  *  but WITHOUT ANY WARRANTY; without even the implied warranty of
     19  *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
     20  *  GNU General Public License for more details.
     21  *
     22  *  You should have received a copy of the GNU General Public License
     23  *  along with this program; if not, see <http://www.gnu.org/licenses/>.
     24  */
     25 
     26 #include <stdio.h>
     27 #include <stdint.h>
     28 
     29 #define ARRAY_SIZE(x) (sizeof(x) / sizeof((x)[0]))
     30 
     31 /*
     32  * Inspired by <ieee754.h>'s union ieee854_long_double, but with single
     33  * long long mantissa fields and assuming little-endianness for simplicity.
     34  */
     35 union float80u {
     36     long double d;
     37 
     38     /* This is the IEEE 854 double-extended-precision format.  */
     39     struct {
     40         unsigned long long mantissa:63;
     41         unsigned int one:1;
     42         unsigned int exponent:15;
     43         unsigned int negative:1;
     44         unsigned int empty:16;
     45     } __attribute__((packed)) ieee;
     46 
     47     /* This is for NaNs in the IEEE 854 double-extended-precision format.  */
     48     struct {
     49         unsigned long long mantissa:62;
     50         unsigned int quiet_nan:1;
     51         unsigned int one:1;
     52         unsigned int exponent:15;
     53         unsigned int negative:1;
     54         unsigned int empty:16;
     55     } __attribute__((packed)) ieee_nan;
     56 };
     57 
     58 #define IEEE854_LONG_DOUBLE_BIAS 0x3fff
     59 
     60 static const union float80u q_nan = {
     61     .ieee_nan.negative = 0,  /* X */
     62     .ieee_nan.exponent = 0x7fff,
     63     .ieee_nan.one = 1,
     64     .ieee_nan.quiet_nan = 1,
     65     .ieee_nan.mantissa = 0,
     66 };
     67 
     68 static const union float80u s_nan = {
     69     .ieee_nan.negative = 0,  /* X */
     70     .ieee_nan.exponent = 0x7fff,
     71     .ieee_nan.one = 1,
     72     .ieee_nan.quiet_nan = 0,
     73     .ieee_nan.mantissa = 1,  /* nonzero */
     74 };
     75 
     76 static const union float80u pos_inf = {
     77     .ieee.negative = 0,
     78     .ieee.exponent = 0x7fff,
     79     .ieee.one = 1,
     80     .ieee.mantissa = 0,
     81 };
     82 
     83 static const union float80u pseudo_pos_inf = {  /* "unsupported" */
     84     .ieee.negative = 0,
     85     .ieee.exponent = 0x7fff,
     86     .ieee.one = 0,
     87     .ieee.mantissa = 0,
     88 };
     89 
     90 static const union float80u pos_denorm = {
     91     .ieee.negative = 0,
     92     .ieee.exponent = 0,
     93     .ieee.one = 0,
     94     .ieee.mantissa = 1,
     95 };
     96 
     97 static const union float80u smallest_positive_norm = {
     98     .ieee.negative = 0,
     99     .ieee.exponent = 1,
    100     .ieee.one = 1,
    101     .ieee.mantissa = 0,
    102 };
    103 
    104 static void fninit()
    105 {
    106     asm volatile ("fninit\n");
    107 }
    108 
    109 static long double fprem(long double a, long double b, uint16_t *sw)
    110 {
    111     long double result;
    112     asm volatile ("fprem\n"
    113                   "fnstsw %1\n"
    114                   : "=t" (result), "=m" (*sw)
    115                   : "0" (a), "u" (b)
    116                   : "st(1)");
    117     return result;
    118 }
    119 
    120 static long double fprem1(long double a, long double b, uint16_t *sw)
    121 {
    122     long double result;
    123     asm volatile ("fprem1\n"
    124                   "fnstsw %1\n"
    125                   : "=t" (result), "=m" (*sw)
    126                   : "0" (a), "u" (b)
    127                   : "st(1)");
    128     return result;
    129 }
    130 
    131 #define FPUS_IE (1 << 0)
    132 #define FPUS_DE (1 << 1)
    133 #define FPUS_ZE (1 << 2)
    134 #define FPUS_OE (1 << 3)
    135 #define FPUS_UE (1 << 4)
    136 #define FPUS_PE (1 << 5)
    137 #define FPUS_SF (1 << 6)
    138 #define FPUS_SE (1 << 7)
    139 #define FPUS_C0 (1 << 8)
    140 #define FPUS_C1 (1 << 9)
    141 #define FPUS_C2 (1 << 10)
    142 #define FPUS_TOP 0x3800
    143 #define FPUS_C3 (1 << 14)
    144 #define FPUS_B  (1 << 15)
    145 
    146 #define FPUS_EMASK 0x007f
    147 
    148 #define FPUC_EM 0x3f
    149 
    150 static void psw(uint16_t sw)
    151 {
    152     printf("SW:  C3 TopC2C1C0\n");
    153     printf("SW: %c %d %3d %d %d %d %c %c %c %c %c %c %c %c\n",
    154            sw & FPUS_B ? 'B' : 'b',
    155            !!(sw & FPUS_C3),
    156            (sw & FPUS_TOP) >> 11,
    157            !!(sw & FPUS_C2),
    158            !!(sw & FPUS_C1),
    159            !!(sw & FPUS_C0),
    160            (sw & FPUS_SE) ? 'S' : 's',
    161            (sw & FPUS_SF) ? 'F' : 'f',
    162            (sw & FPUS_PE) ? 'P' : 'p',
    163            (sw & FPUS_UE) ? 'U' : 'u',
    164            (sw & FPUS_OE) ? 'O' : 'o',
    165            (sw & FPUS_ZE) ? 'Z' : 'z',
    166            (sw & FPUS_DE) ? 'D' : 'd',
    167            (sw & FPUS_IE) ? 'I' : 'i');
    168 }
    169 
    170 static void do_fprem(long double a, long double b)
    171 {
    172     const union float80u au = {.d = a};
    173     const union float80u bu = {.d = b};
    174     union float80u ru;
    175     uint16_t sw;
    176 
    177     printf("A: S=%d Exp=%04x Int=%d (QNaN=%d) Sig=%016llx (%.06Le)\n",
    178            au.ieee.negative, au.ieee.exponent, au.ieee.one,
    179            au.ieee_nan.quiet_nan, (unsigned long long)au.ieee.mantissa,
    180            a);
    181     printf("B: S=%d Exp=%04x Int=%d (QNaN=%d) Sig=%016llx (%.06Le)\n",
    182            bu.ieee.negative, bu.ieee.exponent, bu.ieee.one,
    183            bu.ieee_nan.quiet_nan, (unsigned long long)bu.ieee.mantissa,
    184            b);
    185     fflush(stdout);
    186 
    187     fninit();
    188     ru.d = fprem(a, b, &sw);
    189     psw(sw);
    190 
    191     printf("R : S=%d Exp=%04x Int=%d (QNaN=%d) Sig=%016llx (%.06Le)\n",
    192            ru.ieee.negative, ru.ieee.exponent, ru.ieee.one,
    193            ru.ieee_nan.quiet_nan, (unsigned long long)ru.ieee.mantissa,
    194            ru.d);
    195 
    196     fninit();
    197     ru.d = fprem1(a, b, &sw);
    198     psw(sw);
    199 
    200     printf("R1: S=%d Exp=%04x Int=%d (QNaN=%d) Sig=%016llx (%.06Le)\n",
    201            ru.ieee.negative, ru.ieee.exponent, ru.ieee.one,
    202            ru.ieee_nan.quiet_nan, (unsigned long long)ru.ieee.mantissa,
    203            ru.d);
    204 
    205     printf("\n");
    206 }
    207 
    208 static void do_fprem_stack_underflow(void)
    209 {
    210     const long double a = 1.0;
    211     union float80u ru;
    212     uint16_t sw;
    213 
    214     fninit();
    215     asm volatile ("fprem\n"
    216                   "fnstsw %1\n"
    217                   : "=t" (ru.d), "=m" (sw)
    218                   : "0" (a)
    219                   : "st(1)");
    220     psw(sw);
    221 
    222     printf("R: S=%d Exp=%04x Int=%d (QNaN=%d) Sig=%016llx (%.06Le)\n",
    223            ru.ieee.negative, ru.ieee.exponent, ru.ieee.one,
    224            ru.ieee_nan.quiet_nan, (unsigned long long)ru.ieee.mantissa,
    225            ru.d);
    226     printf("\n");
    227 }
    228 
    229 static void test_fprem_cases(void)
    230 {
    231     printf("= stack underflow =\n");
    232     do_fprem_stack_underflow();
    233 
    234     printf("= invalid operation =\n");
    235     do_fprem(q_nan.d, 1.0);
    236     do_fprem(s_nan.d, 1.0);
    237     do_fprem(1.0, 0.0);
    238     do_fprem(pos_inf.d, 1.0);
    239     do_fprem(pseudo_pos_inf.d, 1.0);
    240 
    241     printf("= denormal =\n");
    242     do_fprem(pos_denorm.d, 1.0);
    243     do_fprem(1.0, pos_denorm.d);
    244 
    245     do_fprem(smallest_positive_norm.d, smallest_positive_norm.d);
    246 
    247     /* printf("= underflow =\n"); */
    248     /* TODO: Is there a case where FPREM raises underflow? */
    249 }
    250 
    251 static void test_fprem_pairs(void)
    252 {
    253     unsigned long long count;
    254 
    255     unsigned int negative_index_a = 0;
    256     unsigned int negative_index_b = 0;
    257     static const unsigned int negative_values[] = {
    258         0,
    259         1,
    260     };
    261 
    262     unsigned int exponent_index_a = 0;
    263     unsigned int exponent_index_b = 0;
    264     static const unsigned int exponent_values[] = {
    265         0,
    266         1,
    267         2,
    268         IEEE854_LONG_DOUBLE_BIAS - 1,
    269         IEEE854_LONG_DOUBLE_BIAS,
    270         IEEE854_LONG_DOUBLE_BIAS + 1,
    271         0x7ffd,
    272         0x7ffe,
    273         0x7fff,
    274     };
    275 
    276     unsigned int one_index_a = 0;
    277     unsigned int one_index_b = 0;
    278     static const unsigned int one_values[] = {
    279         0,
    280         1,
    281     };
    282 
    283     unsigned int quiet_nan_index_a = 0;
    284     unsigned int quiet_nan_index_b = 0;
    285     static const unsigned int quiet_nan_values[] = {
    286         0,
    287         1,
    288     };
    289 
    290     unsigned int mantissa_index_a = 0;
    291     unsigned int mantissa_index_b = 0;
    292     static const unsigned long long mantissa_values[] = {
    293         0,
    294         1,
    295         2,
    296         0x3ffffffffffffffdULL,
    297         0x3ffffffffffffffeULL,
    298         0x3fffffffffffffffULL,
    299     };
    300 
    301     for (count = 0; ; ++count) {
    302 #define INIT_FIELD(var, field) \
    303             .ieee_nan.field = field##_values[field##_index_##var]
    304         const union float80u a = {
    305             INIT_FIELD(a, negative),
    306             INIT_FIELD(a, exponent),
    307             INIT_FIELD(a, one),
    308             INIT_FIELD(a, quiet_nan),
    309             INIT_FIELD(a, mantissa),
    310         };
    311         const union float80u b = {
    312             INIT_FIELD(b, negative),
    313             INIT_FIELD(b, exponent),
    314             INIT_FIELD(b, one),
    315             INIT_FIELD(b, quiet_nan),
    316             INIT_FIELD(b, mantissa),
    317         };
    318 #undef INIT_FIELD
    319 
    320         do_fprem(a.d, b.d);
    321 
    322         int carry = 1;
    323 #define CARRY_INTO(var, field) do { \
    324             if (carry) { \
    325                 if (++field##_index_##var == ARRAY_SIZE(field##_values)) { \
    326                     field##_index_##var = 0; \
    327                 } else { \
    328                     carry = 0; \
    329                 } \
    330             } \
    331         } while (0)
    332         CARRY_INTO(b, mantissa);
    333         CARRY_INTO(b, quiet_nan);
    334         CARRY_INTO(b, one);
    335         CARRY_INTO(b, exponent);
    336         CARRY_INTO(b, negative);
    337         CARRY_INTO(a, mantissa);
    338         CARRY_INTO(a, quiet_nan);
    339         CARRY_INTO(a, one);
    340         CARRY_INTO(a, exponent);
    341         CARRY_INTO(a, negative);
    342 #undef CARRY_INTO
    343 
    344         if (carry) {
    345             break;
    346         }
    347     }
    348 
    349     fprintf(stderr, "test-i386-fprem: tested %llu cases\n", count);
    350 }
    351 
    352 int main(int argc, char **argv)
    353 {
    354     test_fprem_cases();
    355     test_fprem_pairs();
    356     return 0;
    357 }
	qemu FORK: QEMU emulator
	git clone https://git.neptards.moe/neptards/qemu.git
	Log \| Files \| Refs \| Submodules \| LICENSE