none/tests/ppc32/test_dfp4.c - platform/external/valgrind - Git at Google

 /*  Copyright (C) 2012 IBM

  Author: Maynard Johnson <maynardj@us.ibm.com>

  This program is free software; you can redistribute it and/or
  modify it under the terms of the GNU General Public License as
  published by the Free Software Foundation; either version 2 of the
  License, or (at your option) any later version.

  This program is distributed in the hope that it will be useful, but
  WITHOUT ANY WARRANTY; without even the implied warranty of
  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  General Public License for more details.

  You should have received a copy of the GNU General Public License
  along with this program; if not, write to the Free Software
  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
  02111-1307, USA.

  The GNU General Public License is contained in the file COPYING.
  */

 #include <stdio.h>
 #include <stdlib.h>
 #include <stdint.h>

 #if defined(HAS_DFP)

 typedef union stuff {
    _Decimal64  dec_val;
    _Decimal128  dec_val128;
    unsigned long long u64_val;
    struct {
 #if defined(VGP_ppc64le_linux)
       unsigned long long vall;
       unsigned long long valu;
 #else
       unsigned long long valu;
       unsigned long long vall;
 #endif
    } u128;
 } dfp_val_t;


 typedef unsigned char Bool;
 #define True 1
 #define False 0


 #define ALLCR "cr0","cr1","cr2","cr3","cr4","cr5","cr6","cr7"

 #define SET_CR(_arg) \
       __asm__ __volatile__ ("mtcr  %0" : : "b"(_arg) : ALLCR );

 #define SET_XER(_arg) \
       __asm__ __volatile__ ("mtxer %0" : : "b"(_arg) : "xer" );

 #define GET_CR(_lval) \
       __asm__ __volatile__ ("mfcr %0"  : "=b"(_lval) )

 #define GET_XER(_lval) \
       __asm__ __volatile__ ("mfxer %0" : "=b"(_lval) )

 #define GET_CR_XER(_lval_cr,_lval_xer) \
    do { GET_CR(_lval_cr); GET_XER(_lval_xer); } while (0)

 #define SET_CR_ZERO \
       SET_CR(0)

 #define SET_XER_ZERO \
       SET_XER(0)

 #define SET_CR_XER_ZERO \
    do { SET_CR_ZERO; SET_XER_ZERO; } while (0)

 #define SET_FPSCR_ZERO \
    do { double _d = 0.0; \
         __asm__ __volatile__ ("mtfsf 0xFF, %0" : : "f"(_d) ); \
    } while (0)

 #define GET_FPSCR(_arg) \
     __asm__ __volatile__ ("mffs %0"  : "=f"(_arg) )

 #define SET_FPSCR_DRN \
     __asm__ __volatile__ ("mtfsf  1, %0, 0, 1" :  : "f"(f14) )


 // The assembly-level instructions being tested

 /* In _test_dtstdc[q], DCM can be one of 6 possible data classes, numbered 0-5.
  * In reality, DCM is a 6-bit mask field.  We just test the individual values
  * and assume that masking multiple values would work OK.
  * BF is the condition register bit field which can range from 0-7.  But for
  * testing purposes, we only use BF values of '0' and '5'.
  */
 static void _test_dtstdc(int BF, int DCM, dfp_val_t *val1, dfp_val_t *x1 __attribute__((unused)))
 {
    _Decimal64 f14 = val1->dec_val;
    if (DCM < 0 || DCM > 5 || !(BF == 0 || BF == 5)) {
       fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DCM);
       return;
    }
    switch (DCM) {
       case 0:
          if (BF)
             __asm__ __volatile__ ("dtstdc 5, %0, 1" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdc 0, %0, 1" : : "f" (f14));
          break;
       case 1:
          if (BF)
             __asm__ __volatile__ ("dtstdc 5, %0, 2" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdc 0, %0, 2" : : "f" (f14));
          break;
       case 2:
          if (BF)
             __asm__ __volatile__ ("dtstdc 5, %0, 4" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdc 0, %0, 4" : : "f" (f14));
          break;
       case 3:
          if (BF)
             __asm__ __volatile__ ("dtstdc 5, %0, 8" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdc 0, %0, 8" : : "f" (f14));
          break;
       case 4:
          if (BF)
             __asm__ __volatile__ ("dtstdc 5, %0, 16" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdc 0, %0, 16" : : "f" (f14));
          break;
       case 5:
          if (BF)
             __asm__ __volatile__ ("dtstdc 5, %0, 32" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdc 0, %0, 32" : : "f" (f14));
          break;
       default:
          break;
    }
 }

 static void _test_dtstdcq(int BF, int DCM, dfp_val_t *val1, dfp_val_t *x1 __attribute__((unused)))
 {
    _Decimal128 f14 = val1->dec_val128;
    if (DCM < 0 || DCM > 5 || !(BF == 0 || BF == 5)) {
       fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DCM);
       return;
    }
    switch (DCM) {
       case 0:
          if (BF)
             __asm__ __volatile__ ("dtstdcq 5, %0, 1" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdcq 0, %0, 1" : : "f" (f14));
          break;
       case 1:
          if (BF)
             __asm__ __volatile__ ("dtstdcq 5, %0, 2" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdcq 0, %0, 2" : : "f" (f14));
          break;
       case 2:
          if (BF)
             __asm__ __volatile__ ("dtstdcq 5, %0, 4" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdcq 0, %0, 4" : : "f" (f14));
          break;
       case 3:
          if (BF)
             __asm__ __volatile__ ("dtstdcq 5, %0, 8" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdcq 0, %0, 8" : : "f" (f14));
          break;
       case 4:
          if (BF)
             __asm__ __volatile__ ("dtstdcq 5, %0, 16" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdcq 0, %0, 16" : : "f" (f14));
          break;
       case 5:
          if (BF)
             __asm__ __volatile__ ("dtstdcq 5, %0, 32" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdcq 0, %0, 32" : : "f" (f14));
          break;
       default:
          break;
    }
 }

 /* In _test_dtstdg[q], DGM can be one of 6 possible data groups, numbered 0-5.
  * In reality, DGM is a 6-bit mask field.  We just test the individual values
  * and assume that masking multiple values would work OK.
  * BF is the condition register bit field which can range from 0-7.  But for
  * testing purposes, we only use BF values of '0' and '5'.
  */
 static void _test_dtstdg(int BF, int DGM, dfp_val_t *val1, dfp_val_t *x1 __attribute__((unused)))
 {
    _Decimal64 f14 = val1->dec_val;
    if (DGM < 0 || DGM > 5 || !(BF == 0 || BF == 5)) {
       fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DGM);
       return;
    }
    switch (DGM) {
       case 0:
          if (BF)
             __asm__ __volatile__ ("dtstdg 5, %0, 1" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdg 0, %0, 1" : : "f" (f14));
          break;
       case 1:
          if (BF)
             __asm__ __volatile__ ("dtstdg 5, %0, 2" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdg 0, %0, 2" : : "f" (f14));
          break;
       case 2:
          if (BF)
             __asm__ __volatile__ ("dtstdg 5, %0, 4" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdg 0, %0, 4" : : "f" (f14));
          break;
       case 3:
          if (BF)
             __asm__ __volatile__ ("dtstdg 5, %0, 8" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdg 0, %0, 8" : : "f" (f14));
          break;
       case 4:
          if (BF)
             __asm__ __volatile__ ("dtstdg 5, %0, 16" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdg 0, %0, 16" : : "f" (f14));
          break;
       case 5:
          if (BF)
             __asm__ __volatile__ ("dtstdg 5, %0, 32" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdg 0, %0, 32" : : "f" (f14));
          break;
       default:
          break;
    }
 }

 static void _test_dtstdgq(int BF, int DGM, dfp_val_t *val1, dfp_val_t *x1 __attribute__((unused)))
 {
    _Decimal128 f14 = val1->dec_val128;
    if (DGM < 0 || DGM > 5 || !(BF == 0 || BF == 5)) {
       fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DGM);
       return;
    }
    switch (DGM) {
       case 0:
          if (BF)
             __asm__ __volatile__ ("dtstdgq 5, %0, 1" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdgq 0, %0, 1" : : "f" (f14));
          break;
       case 1:
          if (BF)
             __asm__ __volatile__ ("dtstdgq 5, %0, 2" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdgq 0, %0, 2" : : "f" (f14));
          break;
       case 2:
          if (BF)
             __asm__ __volatile__ ("dtstdgq 5, %0, 4" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdgq 0, %0, 4" : : "f" (f14));
          break;
       case 3:
          if (BF)
             __asm__ __volatile__ ("dtstdgq 5, %0, 8" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdgq 0, %0, 8" : : "f" (f14));
          break;
       case 4:
          if (BF)
             __asm__ __volatile__ ("dtstdgq 5, %0, 16" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdgq 0, %0, 16" : : "f" (f14));
          break;
       case 5:
          if (BF)
             __asm__ __volatile__ ("dtstdgq 5, %0, 32" : : "f" (f14));
          else
             __asm__ __volatile__ ("dtstdgq 0, %0, 32" : : "f" (f14));
          break;
       default:
          break;
    }
 }

 /* In _test_dtstex[q], BF is the condition register bit field indicating the
  * CR field in which the result of the test should be placed.  BF can range
  * from 0-7, but for testing purposes, we only use BF values of '4' and '7'.
  */
 static void
 _test_dtstex(int BF, int x __attribute__((unused)), dfp_val_t *val1, dfp_val_t *val2)
 {
    _Decimal64 f14 = val1->dec_val;
    _Decimal64 f16 = val2->dec_val;
    if (!(BF == 4 || BF == 7)) {
       fprintf(stderr, "Invalid input to asm test: a=%d\n", BF);
       return;
    }
    switch (BF) {
       case 4:
          __asm__ __volatile__ ("dtstex  4, %0, %1" :  : "f" (f14),"f" (f16));
          break;
       case 7:
          __asm__ __volatile__ ("dtstex  7, %0, %1" :  : "f" (f14),"f" (f16));
          break;
       default:
          break;
    }
 }

 static void _test_dtstexq(int BF, int x __attribute__((unused)), dfp_val_t *val1, dfp_val_t *val2)
 {
    _Decimal128 f14 = val1->dec_val128;
    _Decimal128 f16 = val2->dec_val128;
    if (!(BF == 4 || BF == 7)) {
       fprintf(stderr, "Invalid input to asm test: a=%d\n", BF);
       return;
    }
    switch (BF) {
       case 4:
          __asm__ __volatile__ ("dtstexq  4, %0, %1" :  : "f" (f14),"f" (f16));
          break;
       case 7:
          __asm__ __volatile__ ("dtstexq  7, %0, %1" :  : "f" (f14),"f" (f16));
          break;
       default:
          break;
    }
 }


 typedef void (*test_funcp_t)(int a, int b,  dfp_val_t *val1,  dfp_val_t *val2);
 typedef void (*test_driver_func_t)(void);
 typedef struct test_table
 {
    test_driver_func_t test_category;
    char * name;
 } test_table_t;

 /*
  *  345.0DD (0x2207c00000000000 0xe50)
  *  1.2300e+5DD (0x2207c00000000000 0x14c000)
  *  -16.0DD (0xa207c00000000000 0xe0)
  *  0.00189DD (0x2206c00000000000 0xcf)
  *  -4.1235DD (0xa205c00000000000 0x10a395bcf)
  *  9.8399e+20DD (0x2209400000000000 0x253f1f534acdd4)
  *  0DD (0x2208000000000000 0x0)
  *  0DD (0x2208000000000000 0x0)
  *  infDD (0x7800000000000000 0x0)
  *  nanDD (0x7c00000000000000 0x0
  */
 static unsigned long long dfp128_vals[] = {
                                     // Some finite numbers
                                     0x2207c00000000000ULL, 0x0000000000000e50ULL,
                                     0x2207c00000000000ULL, 0x000000000014c000ULL,
                                     0xa207c00000000000ULL, 0x00000000000000e0ULL,
                                     0x2206c00000000000ULL, 0x00000000000000cfULL,
                                     0xa205c00000000000ULL, 0x000000010a395bcfULL,
                                     0x6209400000fd0000ULL, 0x00253f1f534acdd4ULL, // huge number
                                     0x000400000089b000ULL, 0x0a6000d000000049ULL, // very small number
                                     // flavors of zero
                                     0x2208000000000000ULL, 0x0000000000000000ULL,
                                     0xa208000000000000ULL, 0x0000000000000000ULL, // negative
                                     0xa248000000000000ULL, 0x0000000000000000ULL,
                                     // flavors of NAN
                                     0x7c00000000000000ULL, 0x0000000000000000ULL, // quiet
                                     0xfc00000000000000ULL, 0xc00100035b007700ULL,
                                     0x7e00000000000000ULL, 0xfe000000d0e0a0d0ULL, // signaling
                                     // flavors of Infinity
                                     0x7800000000000000ULL, 0x0000000000000000ULL,
                                     0xf800000000000000ULL, 0x0000000000000000ULL, // negative
                                     0xf900000000000000ULL, 0x0000000000000000ULL
 };

 static unsigned long long dfp64_vals[] = {
                                  // various finite numbers
                                  0x2234000000000e50ULL,
                                  0x223400000014c000ULL,
                                  0xa2340000000000e0ULL,// negative
                                  0x22240000000000cfULL,
                                  0xa21400010a395bcfULL,// negative
                                  0x6e4d3f1f534acdd4ULL,// huge number
                                  0x000400000089b000ULL,// very small number
                                  // flavors of zero
                                  0x2238000000000000ULL,
                                  0xa238000000000000ULL,
                                  0x4248000000000000ULL,
                                  // flavors of NAN
                                  0x7e34000000000111ULL,
                                  0xfe000000d0e0a0d0ULL,//signaling
                                  0xfc00000000000000ULL,//quiet
                                  // flavors of Infinity
                                  0x7800000000000000ULL,
                                  0xf800000000000000ULL,//negative
                                  0x7a34000000000000ULL,
 };

 // Both Long and Quad arrays of DFP values should have the same length, so it
 // doesn't matter which array I use for calculating the following #define.
 #define NUM_DFP_VALS (sizeof(dfp64_vals)/8)

 typedef struct dfp_test_args {
    int fra_idx;
    int frb_idx;
 } dfp_test_args_t;


 // Index pairs from dfp64_vals array to be used with dfp_two_arg_tests
 static dfp_test_args_t dfp_2args_x1[] = {
                                     {0, 1},
                                     {2, 1},
                                     {4, 3},
                                     {6, 0},
                                     {2, 4},
                                     {5, 1},
                                     {5, 2},
                                     {7, 1},
                                     {7, 2},
                                     {8, 0},
                                     {8, 1},
                                     {8, 2},
                                     {7, 8},
                                     {12, 14},
                                     {12, 1},
                                     {12, 13},
                                     {12, 12},
                                     {12, 11},
                                     {11, 14},
                                     {11, 0},
                                     {11, 13},
                                     {11, 11},
                                     {14, 14},
                                     {14, 3},
                                     {14, 15},
 };

 typedef enum {
    LONG_TEST,
    QUAD_TEST
 } precision_type_t;

 typedef struct dfp_test
 {
    test_funcp_t test_func;
    const char * name;
    dfp_test_args_t * targs;
    int num_tests;
    precision_type_t precision;
    const char * op;
 } dfp_test_t;

 typedef struct dfp_one_arg_test
 {
    test_funcp_t test_func;
    const char * name;
    precision_type_t precision;
    const char * op;
 } dfp_one_arg_test_t;


 static dfp_one_arg_test_t
 dfp_ClassAndGroupTest_tests[] = {
                                  { &_test_dtstdc,  "dtstdc", LONG_TEST, "[tCls]"},
                                  { &_test_dtstdcq, "dtstdcq", QUAD_TEST, "[tCls]"},
                                  { &_test_dtstdg,  "dtstdg", LONG_TEST, "[tGrp]"},
                                  { &_test_dtstdgq, "dtstdgq", QUAD_TEST, "[tGrp]"},
                                  { NULL, NULL, 0, NULL}
 };

 static void test_dfp_ClassAndGroupTest_ops(void)
 {
    test_funcp_t func;
    dfp_val_t test_val, dummy;

    int k = 0;

    while ((func = dfp_ClassAndGroupTest_tests[k].test_func)) {
       int i;
       dfp_one_arg_test_t test_def = dfp_ClassAndGroupTest_tests[k];

       for (i = 0; i < NUM_DFP_VALS; i++) {
          int data_class_OR_group, BF = 0;
          Bool repeat = True;

          if (test_def.precision == LONG_TEST) {
             test_val.u64_val = dfp64_vals[i];
          } else {
             test_val.u128.valu = dfp128_vals[i * 2];
             test_val.u128.vall = dfp128_vals[(i * 2) + 1];
          }

 again:
          for (data_class_OR_group = 0; data_class_OR_group < 6; data_class_OR_group++) {
             unsigned int condreg;
             unsigned int flags;
             SET_FPSCR_ZERO;
             SET_CR_XER_ZERO;

 	    /* There is an ABI change in how 128 bit arguments are aligned
              * with GCC 5.0.  The compiler generates a "note" about this
              * starting with GCC 4.8.  To avoid generating the "note", pass
              * the address of the 128-bit arguments rather then the value.
 	     */
             (*func)(BF, data_class_OR_group, &test_val, &dummy);
             GET_CR(flags);

             condreg = ((flags >> (4 * (7-BF)))) & 0xf;
             printf("%s (DC/DG=%d) %s", test_def.name, data_class_OR_group,
                    test_def.op);
             if (test_def.precision == QUAD_TEST) {
                printf("%016llx %016llx", test_val.u128.valu, test_val.u128.vall);
             } else {
                printf("%016llx", test_val.u64_val);
             }

                //%016llx
             printf(" => %x (BF=%d)\n", condreg, BF);
          }
          if (repeat) {
             repeat = False;
             BF = 5;
             goto again;
          }
       }
       k++;
       printf( "\n" );
    }
 }


 static dfp_test_t
 dfp_ExpTest_tests[] = {
                    { &_test_dtstex, "dtstex", dfp_2args_x1, 25, LONG_TEST, "[tExp]"},
                    { &_test_dtstexq, "dtstexq", dfp_2args_x1, 25, QUAD_TEST, "[tExp]"},
                    { NULL, NULL, NULL, 0, 0, NULL}
 };


 static void test_dfp_ExpTest_ops(void)
 {
    dfp_val_t test_val1, test_val2;
    test_funcp_t func;
    int k = 0;

    while ((func = dfp_ExpTest_tests[k].test_func)) {
       /* BF is a 3-bit instruction field that indicates the CR field in which the
        * result of the test should be placed.  We won't iterate through all
        * 8 possible BF values since storing compare results to a given field is
        * a well-tested mechanism in VEX.  But we will test two BF values, just as
        * a sniff-test.
        */
       int i, repeat = 1, BF = 4;
       dfp_test_t test_def = dfp_ExpTest_tests[k];

 again:
       for (i = 0; i < test_def.num_tests; i++) {
          unsigned int condreg;
          unsigned int flags;

          if (test_def.precision == LONG_TEST) {
             test_val1.u64_val = dfp64_vals[test_def.targs[i].fra_idx];
             test_val2.u64_val  = dfp64_vals[test_def.targs[i].frb_idx];
          } else {
             test_val1.u128.valu = dfp128_vals[test_def.targs[i].fra_idx * 2];
             test_val1.u128.vall = dfp128_vals[(test_def.targs[i].fra_idx * 2) + 1];
             test_val2.u128.valu = dfp128_vals[test_def.targs[i].frb_idx * 2];
             test_val2.u128.vall = dfp128_vals[(test_def.targs[i].frb_idx * 2) + 1];
          }

          SET_FPSCR_ZERO;
          SET_CR_XER_ZERO;
          /* There is an ABI change in how 128 bit arguments are aligned
           * with GCC 5.0.  The compiler generates a "note" about this
           * starting with GCC 4.8.  To avoid generating the "note", pass
           * the address of the 128-bit arguments rather then the value.
           */
          (*func)(BF, 0, &test_val1, &test_val2);
          GET_CR(flags);

          condreg = ((flags >> (4 * (7-BF)))) & 0xf;
          printf("%s ", test_def.name);
          if (test_def.precision == LONG_TEST) {
             printf("%016llx %s %016llx ",
                    test_val1.u64_val, test_def.op, test_val2.u64_val);
          } else {
             printf("%016llx %016llx %s %016llx %016llx ",
                    test_val1.u128.valu, test_val1.u128.vall, test_def.op, test_val2.u128.valu, test_val2.u128.vall);
          }
          printf(" => %x (BF=%d)\n", condreg, BF);
       }
       if (repeat) {
          repeat = 0;
          BF = 7;
          goto again;
       }
       k++;
       printf( "\n" );
    }
 }


 static test_table_t
          all_tests[] =
 {
                     { &test_dfp_ExpTest_ops,
                       "Test DFP exponent test instructions"},
                     { &test_dfp_ClassAndGroupTest_ops,
                       "Test DFP class and group test instructions"},
                     { NULL, NULL }
 };
 #endif // HAS_DFP

 int main() {
 #if defined(HAS_DFP)

    test_table_t aTest;
    test_driver_func_t func;
    int i = 0;

    while ((func = all_tests[i].test_category)) {
       aTest = all_tests[i];
       printf( "%s\n", aTest.name );
       (*func)();
       i++;
    }

 #endif // HAS_DFP
    return 0;
 }
	/* Copyright (C) 2012 IBM

	Author: Maynard Johnson <maynardj@us.ibm.com>

	This program is free software; you can redistribute it and/or
	modify it under the terms of the GNU General Public License as
	published by the Free Software Foundation; either version 2 of the
	License, or (at your option) any later version.

	This program is distributed in the hope that it will be useful, but
	WITHOUT ANY WARRANTY; without even the implied warranty of
	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
	General Public License for more details.

	You should have received a copy of the GNU General Public License
	along with this program; if not, write to the Free Software
	Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA
	02111-1307, USA.

	The GNU General Public License is contained in the file COPYING.
	*/

	#include <stdio.h>
	#include <stdlib.h>
	#include <stdint.h>

	#if defined(HAS_DFP)

	typedef union stuff {
	_Decimal64 dec_val;
	_Decimal128 dec_val128;
	unsigned long long u64_val;
	struct {
	#if defined(VGP_ppc64le_linux)
	unsigned long long vall;
	unsigned long long valu;
	#else
	unsigned long long valu;
	unsigned long long vall;
	#endif
	} u128;
	} dfp_val_t;


	typedef unsigned char Bool;
	#define True 1
	#define False 0


	#define ALLCR "cr0","cr1","cr2","cr3","cr4","cr5","cr6","cr7"

	#define SET_CR(_arg) \
	__asm__ __volatile__ ("mtcr %0" : : "b"(_arg) : ALLCR );

	#define SET_XER(_arg) \
	__asm__ __volatile__ ("mtxer %0" : : "b"(_arg) : "xer" );

	#define GET_CR(_lval) \
	__asm__ __volatile__ ("mfcr %0" : "=b"(_lval) )

	#define GET_XER(_lval) \
	__asm__ __volatile__ ("mfxer %0" : "=b"(_lval) )

	#define GET_CR_XER(_lval_cr,_lval_xer) \
	do { GET_CR(_lval_cr); GET_XER(_lval_xer); } while (0)

	#define SET_CR_ZERO \
	SET_CR(0)

	#define SET_XER_ZERO \
	SET_XER(0)

	#define SET_CR_XER_ZERO \
	do { SET_CR_ZERO; SET_XER_ZERO; } while (0)

	#define SET_FPSCR_ZERO \
	do { double _d = 0.0; \
	__asm__ __volatile__ ("mtfsf 0xFF, %0" : : "f"(_d) ); \
	} while (0)

	#define GET_FPSCR(_arg) \
	__asm__ __volatile__ ("mffs %0" : "=f"(_arg) )

	#define SET_FPSCR_DRN \
	__asm__ __volatile__ ("mtfsf 1, %0, 0, 1" : : "f"(f14) )


	// The assembly-level instructions being tested

	/* In _test_dtstdc[q], DCM can be one of 6 possible data classes, numbered 0-5.
	* In reality, DCM is a 6-bit mask field. We just test the individual values
	* and assume that masking multiple values would work OK.
	* BF is the condition register bit field which can range from 0-7. But for
	* testing purposes, we only use BF values of '0' and '5'.
	*/
	static void _test_dtstdc(int BF, int DCM, dfp_val_t val1, dfp_val_t x1 __attribute__((unused)))
	{
	_Decimal64 f14 = val1->dec_val;
	if (DCM < 0 \|\| DCM > 5 \|\| !(BF == 0 \|\| BF == 5)) {
	fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DCM);
	return;
	}
	switch (DCM) {
	case 0:
	if (BF)
	__asm__ __volatile__ ("dtstdc 5, %0, 1" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdc 0, %0, 1" : : "f" (f14));
	break;
	case 1:
	if (BF)
	__asm__ __volatile__ ("dtstdc 5, %0, 2" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdc 0, %0, 2" : : "f" (f14));
	break;
	case 2:
	if (BF)
	__asm__ __volatile__ ("dtstdc 5, %0, 4" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdc 0, %0, 4" : : "f" (f14));
	break;
	case 3:
	if (BF)
	__asm__ __volatile__ ("dtstdc 5, %0, 8" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdc 0, %0, 8" : : "f" (f14));
	break;
	case 4:
	if (BF)
	__asm__ __volatile__ ("dtstdc 5, %0, 16" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdc 0, %0, 16" : : "f" (f14));
	break;
	case 5:
	if (BF)
	__asm__ __volatile__ ("dtstdc 5, %0, 32" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdc 0, %0, 32" : : "f" (f14));
	break;
	default:
	break;
	}
	}

	static void _test_dtstdcq(int BF, int DCM, dfp_val_t val1, dfp_val_t x1 __attribute__((unused)))
	{
	_Decimal128 f14 = val1->dec_val128;
	if (DCM < 0 \|\| DCM > 5 \|\| !(BF == 0 \|\| BF == 5)) {
	fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DCM);
	return;
	}
	switch (DCM) {
	case 0:
	if (BF)
	__asm__ __volatile__ ("dtstdcq 5, %0, 1" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdcq 0, %0, 1" : : "f" (f14));
	break;
	case 1:
	if (BF)
	__asm__ __volatile__ ("dtstdcq 5, %0, 2" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdcq 0, %0, 2" : : "f" (f14));
	break;
	case 2:
	if (BF)
	__asm__ __volatile__ ("dtstdcq 5, %0, 4" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdcq 0, %0, 4" : : "f" (f14));
	break;
	case 3:
	if (BF)
	__asm__ __volatile__ ("dtstdcq 5, %0, 8" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdcq 0, %0, 8" : : "f" (f14));
	break;
	case 4:
	if (BF)
	__asm__ __volatile__ ("dtstdcq 5, %0, 16" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdcq 0, %0, 16" : : "f" (f14));
	break;
	case 5:
	if (BF)
	__asm__ __volatile__ ("dtstdcq 5, %0, 32" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdcq 0, %0, 32" : : "f" (f14));
	break;
	default:
	break;
	}
	}

	/* In _test_dtstdg[q], DGM can be one of 6 possible data groups, numbered 0-5.
	* In reality, DGM is a 6-bit mask field. We just test the individual values
	* and assume that masking multiple values would work OK.
	* BF is the condition register bit field which can range from 0-7. But for
	* testing purposes, we only use BF values of '0' and '5'.
	*/
	static void _test_dtstdg(int BF, int DGM, dfp_val_t val1, dfp_val_t x1 __attribute__((unused)))
	{
	_Decimal64 f14 = val1->dec_val;
	if (DGM < 0 \|\| DGM > 5 \|\| !(BF == 0 \|\| BF == 5)) {
	fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DGM);
	return;
	}
	switch (DGM) {
	case 0:
	if (BF)
	__asm__ __volatile__ ("dtstdg 5, %0, 1" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdg 0, %0, 1" : : "f" (f14));
	break;
	case 1:
	if (BF)
	__asm__ __volatile__ ("dtstdg 5, %0, 2" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdg 0, %0, 2" : : "f" (f14));
	break;
	case 2:
	if (BF)
	__asm__ __volatile__ ("dtstdg 5, %0, 4" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdg 0, %0, 4" : : "f" (f14));
	break;
	case 3:
	if (BF)
	__asm__ __volatile__ ("dtstdg 5, %0, 8" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdg 0, %0, 8" : : "f" (f14));
	break;
	case 4:
	if (BF)
	__asm__ __volatile__ ("dtstdg 5, %0, 16" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdg 0, %0, 16" : : "f" (f14));
	break;
	case 5:
	if (BF)
	__asm__ __volatile__ ("dtstdg 5, %0, 32" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdg 0, %0, 32" : : "f" (f14));
	break;
	default:
	break;
	}
	}

	static void _test_dtstdgq(int BF, int DGM, dfp_val_t val1, dfp_val_t x1 __attribute__((unused)))
	{
	_Decimal128 f14 = val1->dec_val128;
	if (DGM < 0 \|\| DGM > 5 \|\| !(BF == 0 \|\| BF == 5)) {
	fprintf(stderr, "Invalid inputs to asm test: a=%d, b=%d\n", BF, DGM);
	return;
	}
	switch (DGM) {
	case 0:
	if (BF)
	__asm__ __volatile__ ("dtstdgq 5, %0, 1" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdgq 0, %0, 1" : : "f" (f14));
	break;
	case 1:
	if (BF)
	__asm__ __volatile__ ("dtstdgq 5, %0, 2" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdgq 0, %0, 2" : : "f" (f14));
	break;
	case 2:
	if (BF)
	__asm__ __volatile__ ("dtstdgq 5, %0, 4" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdgq 0, %0, 4" : : "f" (f14));
	break;
	case 3:
	if (BF)
	__asm__ __volatile__ ("dtstdgq 5, %0, 8" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdgq 0, %0, 8" : : "f" (f14));
	break;
	case 4:
	if (BF)
	__asm__ __volatile__ ("dtstdgq 5, %0, 16" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdgq 0, %0, 16" : : "f" (f14));
	break;
	case 5:
	if (BF)
	__asm__ __volatile__ ("dtstdgq 5, %0, 32" : : "f" (f14));
	else
	__asm__ __volatile__ ("dtstdgq 0, %0, 32" : : "f" (f14));
	break;
	default:
	break;
	}
	}

	/* In _test_dtstex[q], BF is the condition register bit field indicating the
	* CR field in which the result of the test should be placed. BF can range
	* from 0-7, but for testing purposes, we only use BF values of '4' and '7'.
	*/
	static void
	_test_dtstex(int BF, int x __attribute__((unused)), dfp_val_t val1, dfp_val_t val2)
	{
	_Decimal64 f14 = val1->dec_val;
	_Decimal64 f16 = val2->dec_val;
	if (!(BF == 4 \|\| BF == 7)) {
	fprintf(stderr, "Invalid input to asm test: a=%d\n", BF);
	return;
	}
	switch (BF) {
	case 4:
	__asm__ __volatile__ ("dtstex 4, %0, %1" : : "f" (f14),"f" (f16));
	break;
	case 7:
	__asm__ __volatile__ ("dtstex 7, %0, %1" : : "f" (f14),"f" (f16));
	break;
	default:
	break;
	}
	}

	static void _test_dtstexq(int BF, int x __attribute__((unused)), dfp_val_t val1, dfp_val_t val2)
	{
	_Decimal128 f14 = val1->dec_val128;
	_Decimal128 f16 = val2->dec_val128;
	if (!(BF == 4 \|\| BF == 7)) {
	fprintf(stderr, "Invalid input to asm test: a=%d\n", BF);
	return;
	}
	switch (BF) {
	case 4:
	__asm__ __volatile__ ("dtstexq 4, %0, %1" : : "f" (f14),"f" (f16));
	break;
	case 7:
	__asm__ __volatile__ ("dtstexq 7, %0, %1" : : "f" (f14),"f" (f16));
	break;
	default:
	break;
	}
	}



	typedef void (test_funcp_t)(int a, int b, dfp_val_t val1, dfp_val_t *val2);
	typedef void (*test_driver_func_t)(void);
	typedef struct test_table
	{
	test_driver_func_t test_category;
	char * name;
	} test_table_t;

	/*
	* 345.0DD (0x2207c00000000000 0xe50)
	* 1.2300e+5DD (0x2207c00000000000 0x14c000)
	* -16.0DD (0xa207c00000000000 0xe0)
	* 0.00189DD (0x2206c00000000000 0xcf)
	* -4.1235DD (0xa205c00000000000 0x10a395bcf)
	* 9.8399e+20DD (0x2209400000000000 0x253f1f534acdd4)
	* 0DD (0x2208000000000000 0x0)
	* 0DD (0x2208000000000000 0x0)
	* infDD (0x7800000000000000 0x0)
	* nanDD (0x7c00000000000000 0x0
	*/
	static unsigned long long dfp128_vals[] = {
	// Some finite numbers
	0x2207c00000000000ULL, 0x0000000000000e50ULL,
	0x2207c00000000000ULL, 0x000000000014c000ULL,
	0xa207c00000000000ULL, 0x00000000000000e0ULL,
	0x2206c00000000000ULL, 0x00000000000000cfULL,
	0xa205c00000000000ULL, 0x000000010a395bcfULL,
	0x6209400000fd0000ULL, 0x00253f1f534acdd4ULL, // huge number
	0x000400000089b000ULL, 0x0a6000d000000049ULL, // very small number
	// flavors of zero
	0x2208000000000000ULL, 0x0000000000000000ULL,
	0xa208000000000000ULL, 0x0000000000000000ULL, // negative
	0xa248000000000000ULL, 0x0000000000000000ULL,
	// flavors of NAN
	0x7c00000000000000ULL, 0x0000000000000000ULL, // quiet
	0xfc00000000000000ULL, 0xc00100035b007700ULL,
	0x7e00000000000000ULL, 0xfe000000d0e0a0d0ULL, // signaling
	// flavors of Infinity
	0x7800000000000000ULL, 0x0000000000000000ULL,
	0xf800000000000000ULL, 0x0000000000000000ULL, // negative
	0xf900000000000000ULL, 0x0000000000000000ULL
	};

	static unsigned long long dfp64_vals[] = {
	// various finite numbers
	0x2234000000000e50ULL,
	0x223400000014c000ULL,
	0xa2340000000000e0ULL,// negative
	0x22240000000000cfULL,
	0xa21400010a395bcfULL,// negative
	0x6e4d3f1f534acdd4ULL,// huge number
	0x000400000089b000ULL,// very small number
	// flavors of zero
	0x2238000000000000ULL,
	0xa238000000000000ULL,
	0x4248000000000000ULL,
	// flavors of NAN
	0x7e34000000000111ULL,
	0xfe000000d0e0a0d0ULL,//signaling
	0xfc00000000000000ULL,//quiet
	// flavors of Infinity
	0x7800000000000000ULL,
	0xf800000000000000ULL,//negative
	0x7a34000000000000ULL,
	};

	// Both Long and Quad arrays of DFP values should have the same length, so it
	// doesn't matter which array I use for calculating the following #define.
	#define NUM_DFP_VALS (sizeof(dfp64_vals)/8)

	typedef struct dfp_test_args {
	int fra_idx;
	int frb_idx;
	} dfp_test_args_t;


	// Index pairs from dfp64_vals array to be used with dfp_two_arg_tests
	static dfp_test_args_t dfp_2args_x1[] = {
	{0, 1},
	{2, 1},
	{4, 3},
	{6, 0},
	{2, 4},
	{5, 1},
	{5, 2},
	{7, 1},
	{7, 2},
	{8, 0},
	{8, 1},
	{8, 2},
	{7, 8},
	{12, 14},
	{12, 1},
	{12, 13},
	{12, 12},
	{12, 11},
	{11, 14},
	{11, 0},
	{11, 13},
	{11, 11},
	{14, 14},
	{14, 3},
	{14, 15},
	};

	typedef enum {
	LONG_TEST,
	QUAD_TEST
	} precision_type_t;

	typedef struct dfp_test
	{
	test_funcp_t test_func;
	const char * name;
	dfp_test_args_t * targs;
	int num_tests;
	precision_type_t precision;
	const char * op;
	} dfp_test_t;

	typedef struct dfp_one_arg_test
	{
	test_funcp_t test_func;
	const char * name;
	precision_type_t precision;
	const char * op;
	} dfp_one_arg_test_t;



	static dfp_one_arg_test_t
	dfp_ClassAndGroupTest_tests[] = {
	{ &_test_dtstdc, "dtstdc", LONG_TEST, "[tCls]"},
	{ &_test_dtstdcq, "dtstdcq", QUAD_TEST, "[tCls]"},
	{ &_test_dtstdg, "dtstdg", LONG_TEST, "[tGrp]"},
	{ &_test_dtstdgq, "dtstdgq", QUAD_TEST, "[tGrp]"},
	{ NULL, NULL, 0, NULL}
	};

	static void test_dfp_ClassAndGroupTest_ops(void)
	{
	test_funcp_t func;
	dfp_val_t test_val, dummy;

	int k = 0;

	while ((func = dfp_ClassAndGroupTest_tests[k].test_func)) {
	int i;
	dfp_one_arg_test_t test_def = dfp_ClassAndGroupTest_tests[k];

	for (i = 0; i < NUM_DFP_VALS; i++) {
	int data_class_OR_group, BF = 0;
	Bool repeat = True;

	if (test_def.precision == LONG_TEST) {
	test_val.u64_val = dfp64_vals[i];
	} else {
	test_val.u128.valu = dfp128_vals[i * 2];
	test_val.u128.vall = dfp128_vals[(i * 2) + 1];
	}

	again:
	for (data_class_OR_group = 0; data_class_OR_group < 6; data_class_OR_group++) {
	unsigned int condreg;
	unsigned int flags;
	SET_FPSCR_ZERO;
	SET_CR_XER_ZERO;

	/* There is an ABI change in how 128 bit arguments are aligned
	* with GCC 5.0. The compiler generates a "note" about this
	* starting with GCC 4.8. To avoid generating the "note", pass
	* the address of the 128-bit arguments rather then the value.
	*/
	(*func)(BF, data_class_OR_group, &test_val, &dummy);
	GET_CR(flags);

	condreg = ((flags >> (4 * (7-BF)))) & 0xf;
	printf("%s (DC/DG=%d) %s", test_def.name, data_class_OR_group,
	test_def.op);
	if (test_def.precision == QUAD_TEST) {
	printf("%016llx %016llx", test_val.u128.valu, test_val.u128.vall);
	} else {
	printf("%016llx", test_val.u64_val);
	}

	//%016llx
	printf(" => %x (BF=%d)\n", condreg, BF);
	}
	if (repeat) {
	repeat = False;
	BF = 5;
	goto again;
	}
	}
	k++;
	printf( "\n" );
	}
	}


	static dfp_test_t
	dfp_ExpTest_tests[] = {
	{ &_test_dtstex, "dtstex", dfp_2args_x1, 25, LONG_TEST, "[tExp]"},
	{ &_test_dtstexq, "dtstexq", dfp_2args_x1, 25, QUAD_TEST, "[tExp]"},
	{ NULL, NULL, NULL, 0, 0, NULL}
	};


	static void test_dfp_ExpTest_ops(void)
	{
	dfp_val_t test_val1, test_val2;
	test_funcp_t func;
	int k = 0;

	while ((func = dfp_ExpTest_tests[k].test_func)) {
	/* BF is a 3-bit instruction field that indicates the CR field in which the
	* result of the test should be placed. We won't iterate through all
	* 8 possible BF values since storing compare results to a given field is
	* a well-tested mechanism in VEX. But we will test two BF values, just as
	* a sniff-test.
	*/
	int i, repeat = 1, BF = 4;
	dfp_test_t test_def = dfp_ExpTest_tests[k];

	again:
	for (i = 0; i < test_def.num_tests; i++) {
	unsigned int condreg;
	unsigned int flags;

	if (test_def.precision == LONG_TEST) {
	test_val1.u64_val = dfp64_vals[test_def.targs[i].fra_idx];
	test_val2.u64_val = dfp64_vals[test_def.targs[i].frb_idx];
	} else {
	test_val1.u128.valu = dfp128_vals[test_def.targs[i].fra_idx * 2];
	test_val1.u128.vall = dfp128_vals[(test_def.targs[i].fra_idx * 2) + 1];
	test_val2.u128.valu = dfp128_vals[test_def.targs[i].frb_idx * 2];
	test_val2.u128.vall = dfp128_vals[(test_def.targs[i].frb_idx * 2) + 1];
	}

	SET_FPSCR_ZERO;
	SET_CR_XER_ZERO;
	/* There is an ABI change in how 128 bit arguments are aligned
	* with GCC 5.0. The compiler generates a "note" about this
	* starting with GCC 4.8. To avoid generating the "note", pass
	* the address of the 128-bit arguments rather then the value.
	*/
	(*func)(BF, 0, &test_val1, &test_val2);
	GET_CR(flags);

	condreg = ((flags >> (4 * (7-BF)))) & 0xf;
	printf("%s ", test_def.name);
	if (test_def.precision == LONG_TEST) {
	printf("%016llx %s %016llx ",
	test_val1.u64_val, test_def.op, test_val2.u64_val);
	} else {
	printf("%016llx %016llx %s %016llx %016llx ",
	test_val1.u128.valu, test_val1.u128.vall, test_def.op, test_val2.u128.valu, test_val2.u128.vall);
	}
	printf(" => %x (BF=%d)\n", condreg, BF);
	}
	if (repeat) {
	repeat = 0;
	BF = 7;
	goto again;
	}
	k++;
	printf( "\n" );
	}
	}


	static test_table_t
	all_tests[] =
	{
	{ &test_dfp_ExpTest_ops,
	"Test DFP exponent test instructions"},
	{ &test_dfp_ClassAndGroupTest_ops,
	"Test DFP class and group test instructions"},
	{ NULL, NULL }
	};
	#endif // HAS_DFP

	int main() {
	#if defined(HAS_DFP)

	test_table_t aTest;
	test_driver_func_t func;
	int i = 0;

	while ((func = all_tests[i].test_category)) {
	aTest = all_tests[i];
	printf( "%s\n", aTest.name );
	(*func)();
	i++;
	}

	#endif // HAS_DFP
	return 0;
	}