il_11210 Cdiff usr/src/lib/libm/common/m9x/fmaf.c

Print this page

11210 libm should be cstyle(1ONBLD) clean


*** 20,29 ****
--- 20,30 ----
   */
  
  /*
   * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
   */
+ 
  /*
   * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
   * Use is subject to license terms.
   */
  
*** 32,89 ****
  #include "libm.h"
  #include "fma.h"
  #include "fenv_inlines.h"
  
  #if defined(__sparc)
- 
  /*
   * fmaf for SPARC: 32-bit single precision, big-endian
   */
  float
! __fmaf(float x, float y, float z) {
          union {
                  unsigned i[2];
                  double d;
          } xy, zz;
          unsigned u, s;
          int exy, ez;
  
          /*
           * the following operations can only raise the invalid exception,
           * and then only if either x*y is of the form Inf*0 or one of x,
           * y, or z is a signaling NaN
           */
!         xy.d = (double) x * y;
!         zz.d = (double) z;
  
          /*
           * if the sum xy + z will be exact, just compute it and cast the
           * result to float
           */
          exy = (xy.i[0] >> 20) & 0x7ff;
          ez = (zz.i[0] >> 20) & 0x7ff;
          if ((ez - exy <= 4 && exy - ez <= 28) || exy == 0x7ff || exy == 0 ||
!                 ez == 0x7ff || ez == 0) {
!                 return ((float) (xy.d + zz.d));
!         }
  
          /*
           * collapse the tail of the smaller summand into a "sticky bit"
           * so that the sum can be computed without error
           */
          if (ez > exy) {
                  if (ez - exy < 31) {
                          u = xy.i[1];
                          s = 2 << (ez - exy);
                          if (u & (s - 1))
                                  u |= s;
                          xy.i[1] = u & ~(s - 1);
                  } else if (ez - exy < 51) {
                          u = xy.i[0];
                          s = 1 << (ez - exy - 31);
                          if ((u & (s - 1)) | xy.i[1])
                                  u |= s;
                          xy.i[0] = u & ~(s - 1);
                          xy.i[1] = 0;
                  } else {
                          /* collapse all of xy into a single bit */
                          xy.i[0] = (xy.i[0] & 0x80000000) | ((ez - 51) << 20);
--- 33,95 ----
  #include "libm.h"
  #include "fma.h"
  #include "fenv_inlines.h"
  
  #if defined(__sparc)
  /*
   * fmaf for SPARC: 32-bit single precision, big-endian
   */
  float
! __fmaf(float x, float y, float z)
! {
          union {
                  unsigned i[2];
                  double d;
          } xy, zz;
+ 
          unsigned u, s;
          int exy, ez;
  
          /*
           * the following operations can only raise the invalid exception,
           * and then only if either x*y is of the form Inf*0 or one of x,
           * y, or z is a signaling NaN
           */
!         xy.d = (double)x * y;
!         zz.d = (double)z;
  
          /*
           * if the sum xy + z will be exact, just compute it and cast the
           * result to float
           */
          exy = (xy.i[0] >> 20) & 0x7ff;
          ez = (zz.i[0] >> 20) & 0x7ff;
+ 
          if ((ez - exy <= 4 && exy - ez <= 28) || exy == 0x7ff || exy == 0 ||
!             ez == 0x7ff || ez == 0)
!                 return ((float)(xy.d + zz.d));
  
          /*
           * collapse the tail of the smaller summand into a "sticky bit"
           * so that the sum can be computed without error
           */
          if (ez > exy) {
                  if (ez - exy < 31) {
                          u = xy.i[1];
                          s = 2 << (ez - exy);
+ 
                          if (u & (s - 1))
                                  u |= s;
+ 
                          xy.i[1] = u & ~(s - 1);
                  } else if (ez - exy < 51) {
                          u = xy.i[0];
                          s = 1 << (ez - exy - 31);
+ 
                          if ((u & (s - 1)) | xy.i[1])
                                  u |= s;
+ 
                          xy.i[0] = u & ~(s - 1);
                          xy.i[1] = 0;
                  } else {
                          /* collapse all of xy into a single bit */
                          xy.i[0] = (xy.i[0] & 0x80000000) | ((ez - 51) << 20);
*** 91,137 ****
                  }
          } else {
                  if (exy - ez < 31) {
                          u = zz.i[1];
                          s = 2 << (exy - ez);
                          if (u & (s - 1))
                                  u |= s;
                          zz.i[1] = u & ~(s - 1);
                  } else if (exy - ez < 51) {
                          u = zz.i[0];
                          s = 1 << (exy - ez - 31);
                          if ((u & (s - 1)) | zz.i[1])
                                  u |= s;
                          zz.i[0] = u & ~(s - 1);
                          zz.i[1] = 0;
                  } else {
                          /* collapse all of zz into a single bit */
                          zz.i[0] = (zz.i[0] & 0x80000000) | ((exy - 51) << 20);
                          zz.i[1] = 0;
                  }
          }
  
!         return ((float) (xy.d + zz.d));
  }
- 
  #elif defined(__x86)
- 
  #if defined(__amd64)
  #define NI      4
  #else
  #define NI      3
  #endif
  
  /*
   * fmaf for x86: 32-bit single precision, little-endian
   */
  float
! __fmaf(float x, float y, float z) {
          union {
                  unsigned i[NI];
                  long double e;
          } xy, zz;
          unsigned u, s, cwsw, oldcwsw;
          int exy, ez;
  
          /* set rounding precision to 64 bits */
          __fenv_getcwsw(&oldcwsw);
--- 97,147 ----
                  }
          } else {
                  if (exy - ez < 31) {
                          u = zz.i[1];
                          s = 2 << (exy - ez);
+ 
                          if (u & (s - 1))
                                  u |= s;
+ 
                          zz.i[1] = u & ~(s - 1);
                  } else if (exy - ez < 51) {
                          u = zz.i[0];
                          s = 1 << (exy - ez - 31);
+ 
                          if ((u & (s - 1)) | zz.i[1])
                                  u |= s;
+ 
                          zz.i[0] = u & ~(s - 1);
                          zz.i[1] = 0;
                  } else {
                          /* collapse all of zz into a single bit */
                          zz.i[0] = (zz.i[0] & 0x80000000) | ((exy - 51) << 20);
                          zz.i[1] = 0;
                  }
          }
  
!         return ((float)(xy.d + zz.d));
  }
  #elif defined(__x86)
  #if defined(__amd64)
  #define NI              4
  #else
  #define NI              3
  #endif
  
  /*
   * fmaf for x86: 32-bit single precision, little-endian
   */
  float
! __fmaf(float x, float y, float z)
! {
          union {
                  unsigned i[NI];
                  long double e;
          } xy, zz;
+ 
          unsigned u, s, cwsw, oldcwsw;
          int exy, ez;
  
          /* set rounding precision to 64 bits */
          __fenv_getcwsw(&oldcwsw);
*** 141,180 ****
          /*
           * the following operations can only raise the invalid exception,
           * and then only if either x*y is of the form Inf*0 or one of x,
           * y, or z is a signaling NaN
           */
!         xy.e = (long double) x * y;
!         zz.e = (long double) z;
  
          /*
           * if the sum xy + z will be exact, just compute it and cast the
           * result to float
           */
          exy = xy.i[2] & 0x7fff;
          ez = zz.i[2] & 0x7fff;
          if ((ez - exy <= 15 && exy - ez <= 39) || exy == 0x7fff || exy == 0 ||
!                 ez == 0x7fff || ez == 0) {
                  goto cont;
-         }
  
          /*
           * collapse the tail of the smaller summand into a "sticky bit"
           * so that the sum can be computed without error
           */
          if (ez > exy) {
                  if (ez - exy < 31) {
                          u = xy.i[0];
                          s = 2 << (ez - exy);
                          if (u & (s - 1))
                                  u |= s;
                          xy.i[0] = u & ~(s - 1);
                  } else if (ez - exy < 62) {
                          u = xy.i[1];
                          s = 1 << (ez - exy - 31);
                          if ((u & (s - 1)) | xy.i[0])
                                  u |= s;
                          xy.i[1] = u & ~(s - 1);
                          xy.i[0] = 0;
                  } else {
                          /* collapse all of xy into a single bit */
                          xy.i[0] = 0;
--- 151,194 ----
          /*
           * the following operations can only raise the invalid exception,
           * and then only if either x*y is of the form Inf*0 or one of x,
           * y, or z is a signaling NaN
           */
!         xy.e = (long double)x * y;
!         zz.e = (long double)z;
  
          /*
           * if the sum xy + z will be exact, just compute it and cast the
           * result to float
           */
          exy = xy.i[2] & 0x7fff;
          ez = zz.i[2] & 0x7fff;
+ 
          if ((ez - exy <= 15 && exy - ez <= 39) || exy == 0x7fff || exy == 0 ||
!             ez == 0x7fff || ez == 0)
                  goto cont;
  
          /*
           * collapse the tail of the smaller summand into a "sticky bit"
           * so that the sum can be computed without error
           */
          if (ez > exy) {
                  if (ez - exy < 31) {
                          u = xy.i[0];
                          s = 2 << (ez - exy);
+ 
                          if (u & (s - 1))
                                  u |= s;
+ 
                          xy.i[0] = u & ~(s - 1);
                  } else if (ez - exy < 62) {
                          u = xy.i[1];
                          s = 1 << (ez - exy - 31);
+ 
                          if ((u & (s - 1)) | xy.i[0])
                                  u |= s;
+ 
                          xy.i[1] = u & ~(s - 1);
                          xy.i[0] = 0;
                  } else {
                          /* collapse all of xy into a single bit */
                          xy.i[0] = 0;
*** 183,194 ****
--- 197,210 ----
                  }
          } else {
                  if (exy - ez < 62) {
                          u = zz.i[1];
                          s = 1 << (exy - ez - 31);
+ 
                          if ((u & (s - 1)) | zz.i[0])
                                  u |= s;
+ 
                          zz.i[1] = u & ~(s - 1);
                          zz.i[0] = 0;
                  } else {
                          /* collapse all of zz into a single bit */
                          zz.i[0] = 0;
*** 203,222 ****
          /* restore the rounding precision */
          __fenv_getcwsw(&cwsw);
          cwsw = (cwsw & 0xfcffffff) | (oldcwsw & 0x03000000);
          __fenv_setcwsw(&cwsw);
  
!         return ((float) xy.e);
  }
  
  #if 0
  /*
   * another fmaf for x86: assumes return value will be left in
   * long double (80-bit double extended) precision
   */
  long double
! __fmaf(float x, float y, float z) {
          /*
           * Note: This implementation assumes the rounding precision mode
           * is set to the default, rounding to 64 bit precision.  If this
           * routine must work in non-default rounding precision modes, do
           * the following instead:
--- 219,239 ----
          /* restore the rounding precision */
          __fenv_getcwsw(&cwsw);
          cwsw = (cwsw & 0xfcffffff) | (oldcwsw & 0x03000000);
          __fenv_setcwsw(&cwsw);
  
!         return ((float)xy.e);
  }
  
  #if 0
  /*
   * another fmaf for x86: assumes return value will be left in
   * long double (80-bit double extended) precision
   */
  long double
! __fmaf(float x, float y, float z)
! {
          /*
           * Note: This implementation assumes the rounding precision mode
           * is set to the default, rounding to 64 bit precision.  If this
           * routine must work in non-default rounding precision modes, do
           * the following instead:
*** 230,241 ****
           *
           * Note that the code to change rounding precision must not alter
           * the exception masks or flags, since the product x * y may raise
           * an invalid operation exception.
           */
!         return ((long double) x * y + z);
  }
  #endif
- 
  #else
  #error Unknown architecture
  #endif
--- 247,257 ----
           *
           * Note that the code to change rounding precision must not alter
           * the exception masks or flags, since the product x * y may raise
           * an invalid operation exception.
           */
!         return ((long double)x * y + z);
  }
  #endif
  #else
  #error Unknown architecture
  #endif