il_11210 Wdiff usr/src/lib/libm/common/Q/log1pl.c

Print this page

11210 libm should be cstyle(1ONBLD) clean

Split	Close
Expand all
Collapse all

          --- old/usr/src/lib/libm/common/Q/log1pl.c
          +++ new/usr/src/lib/libm/common/Q/log1pl.c

   1    1  /*
   2    2   * CDDL HEADER START
   3    3   *
   4    4   * The contents of this file are subject to the terms of the
   5    5   * Common Development and Distribution License (the "License").
   6    6   * You may not use this file except in compliance with the License.
   7    7   *
   8    8   * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
   9    9   * or http://www.opensolaris.org/os/licensing.
  10   10   * See the License for the specific language governing permissions
  11   11   * and limitations under the License.
  12   12   *
  13   13   * When distributing Covered Code, include this CDDL HEADER in each
  14   14   * file and include the License file at usr/src/OPENSOLARIS.LICENSE.

↓ open down ↓

14 lines elided

↑ open up ↑

  15   15   * If applicable, add the following below this CDDL HEADER, with the
  16   16   * fields enclosed by brackets "[]" replaced with your own identifying
  17   17   * information: Portions Copyright [yyyy] [name of copyright owner]
  18   18   *
  19   19   * CDDL HEADER END
  20   20   */
  21   21  
  22   22  /*
  23   23   * Copyright 2011 Nexenta Systems, Inc.  All rights reserved.
  24   24   */
       25 +
  25   26  /*
  26   27   * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
  27   28   * Use is subject to license terms.
  28   29   */
  29   30  
  30   31  #ifdef __LITTLE_ENDIAN
  31      -#define H0(x)   *(3 + (int *) &x)
  32      -#define H1(x)   *(2 + (int *) &x)
  33      -#define H2(x)   *(1 + (int *) &x)
  34      -#define H3(x)   *(int *) &x
       32 +#define H0(x)           *(3 + (int *)&x)
       33 +#define H1(x)           *(2 + (int *)&x)
       34 +#define H2(x)           *(1 + (int *)&x)
       35 +#define H3(x)           *(int *)&x
  35   36  #else
  36      -#define H0(x)   *(int *) &x
  37      -#define H1(x)   *(1 + (int *) &x)
  38      -#define H2(x)   *(2 + (int *) &x)
  39      -#define H3(x)   *(3 + (int *) &x)
       37 +#define H0(x)           *(int *)&x
       38 +#define H1(x)           *(1 + (int *)&x)
       39 +#define H2(x)           *(2 + (int *)&x)
       40 +#define H3(x)           *(3 + (int *)&x)
  40   41  #endif
  41   42  
  42   43  /*
  43   44   * log1pl(x)
  44   45   * Table look-up algorithm by modifying logl.c
  45   46   * By K.C. Ng, July 6, 1995
  46   47   *
  47   48   * (a). For 1+x in [31/33,33/31], using a special approximation:
  48   49   *      s = x/(2.0+x);  ... here |s| <= 0.03125
  49   50   *      z = s*s;
  50   51   *      return x-s*(x-z*(B1+z*(B2+z*(B3+z*(B4+...+z*B9)...))));
  51   52   *      (i.e., x is in [-2/33,2/31])
  52   53   *
  53   54   * (b). Otherwise, normalize 1+x = 2^n * 1.f.
  54      - *      Here we may need a correction term for 1+x rounded.
       55 + *      Here we may need a correction term for 1+x rounded.
  55   56   *      Use a 6-bit table look-up: find a 6 bit g that match f to 6.5 bits,
  56   57   *      then
  57   58   *          log(1+x) = n*ln2 + log(1.g) + log(1.f/1.g).
  58   59   *      Here the leading and trailing values of log(1.g) are obtained from
  59   60   *      a size-64 table.
  60   61   *      For log(1.f/1.g), let s = (1.f-1.g)/(1.f+1.g). Note that
  61   62   *              1.f = 2^-n(1+x)
  62   63   *
  63   64   *      then
  64   65   *          log(1.f/1.g) = log((1+s)/(1-s)) = 2s + 2/3 s^3 + 2/5 s^5 +...

  65   66   *      Note that |s|<2**-8=0.00390625. We use an odd s-polynomial
  66   67   *      approximation to compute log(1.f/1.g):

↓ open down ↓

2 lines elided

↑ open up ↑

  67   68   *              s*(A1+s^2*(A2+s^2*(A3+s^2*(A4+s^2*(A5+s^2*(A6+s^2*A7))))))
  68   69   *      (Precision is 2**-136.91 bits, absolute error)
  69   70   *
  70   71   *      CAUTION:
  71   72   *      For x>=1, compute 1+x will lost one bit (OK).
  72   73   *      For x in [-0.5,-1), 1+x is exact.
  73   74   *      For x in (-0.5,-2/33]U[2/31,1), up to 4 last bits of x will be lost
  74   75   *      in 1+x.  Therefore, to recover the lost bits, one need to compute
  75   76   *      1.f-1.g accurately.
  76   77   *
  77      - *      Let hx = HI(x), m = (hx>>16)-0x3fff (=ilogbl(x)), note that
       78 + *      Let hx = HI(x), m = (hx>>16)-0x3fff (=ilogbl(x)), note that
  78   79   *              -2/33 = -0.0606...= 2^-5 * 1.939...,
  79   80   *               2/31 =  0.09375  = 2^-4 * 1.500...,
  80   81   *      so for x in (-0.5,-2/33], -5<=m<=-2,  n= -1, 1+f=2*(1+x)
  81   82   *         for x in [2/33,1),     -4<=m<=-1,  n=  0, f=x
  82   83   *
  83   84   *      In short:
  84      - *      if x>0, let g: hg= ((hx + (0x200<<(-m)))>>(10-m))<<(10-m)
       85 + *      if x>0, let g: hg= ((hx + (0x200<<(-m)))>>(10-m))<<(10-m)
  85   86   *      then 1.f-1.g = x-g
  86   87   *      if x<0, let g': hg' =((ix-(0x200)<<(-m-1))>>(9-m))<<(9-m)
  87   88   *      (ix=hx&0x7fffffff)
  88   89   *      then 1.f-1.g = 2*(g'+x),
  89   90   *
  90   91   * (c). The final result is computed by
  91   92   *              (n*ln2_hi+_TBL_logl_hi[j]) +
  92   93   *                      ( (n*ln2_lo+_TBL_logl_lo[j]) + s*(A1+...) )
  93   94   *
  94   95   * Note.

  95   96   *      For ln2_hi and _TBL_logl_hi[j], we force their last 32 bit to be zero
  96   97   *      so that n*ln2_hi + _TBL_logl_hi[j] is exact. Here
  97   98   *      _TBL_logl_hi[j] + _TBL_logl_lo[j] match log(1+j*2**-6) to 194 bits
  98   99   *
  99  100   *
 100  101   * Special cases:
 101  102   *      log(x) is NaN with signal if x < 0 (including -INF) ;
 102  103   *      log(+INF) is +INF; log(0) is -INF with signal;
 103  104   *      log(NaN) is that NaN with no signal.
 104  105   *
 105  106   * Constants:
 106  107   * The hexadecimal values are the intended ones for the following constants.

↓ open down ↓

12 lines elided

↑ open up ↑

 107  108   * The decimal values may be used, provided that the compiler will convert
 108  109   * from decimal to binary accurately enough to produce the hexadecimal values
 109  110   * shown.
 110  111   */
 111  112  
 112  113  #pragma weak __log1pl = log1pl
 113  114  
 114  115  #include "libm.h"
 115  116  
 116  117  extern const long double _TBL_logl_hi[], _TBL_logl_lo[];
 117      -
 118      -static const long double
 119      -zero    =   0.0L,
 120      -one     =   1.0L,
 121      -two     =   2.0L,
 122      -ln2hi   =   6.931471805599453094172319547495844850203e-0001L,
 123      -ln2lo   =   1.667085920830552208890449330400379754169e-0025L,
 124      -A1      =   2.000000000000000000000000000000000000024e+0000L,
 125      -A2      =   6.666666666666666666666666666666091393804e-0001L,
 126      -A3      =   4.000000000000000000000000407167070220671e-0001L,
 127      -A4      =   2.857142857142857142730077490612903681164e-0001L,
 128      -A5      =   2.222222222222242577702836920812882605099e-0001L,
 129      -A6      =   1.818181816435493395985912667105885828356e-0001L,
 130      -A7      =   1.538537835211839751112067512805496931725e-0001L,
 131      -B1      =   6.666666666666666666666666666666961498329e-0001L,
 132      -B2      =   3.999999999999999999999999990037655042358e-0001L,
 133      -B3      =   2.857142857142857142857273426428347457918e-0001L,
 134      -B4      =   2.222222222222222221353229049747910109566e-0001L,
 135      -B5      =   1.818181818181821503532559306309070138046e-0001L,
 136      -B6      =   1.538461538453809210486356084587356788556e-0001L,
 137      -B7      =   1.333333344463358756121456892645178795480e-0001L,
 138      -B8      =   1.176460904783899064854645174603360383792e-0001L,
 139      -B9      =   1.057293869956598995326368602518056990746e-0001L;
      118 +static const long double zero = 0.0L,
      119 +        one = 1.0L,
      120 +        two = 2.0L,
      121 +        ln2hi = 6.931471805599453094172319547495844850203e-0001L,
      122 +        ln2lo = 1.667085920830552208890449330400379754169e-0025L,
      123 +        A1 = 2.000000000000000000000000000000000000024e+0000L,
      124 +        A2 = 6.666666666666666666666666666666091393804e-0001L,
      125 +        A3 = 4.000000000000000000000000407167070220671e-0001L,
      126 +        A4 = 2.857142857142857142730077490612903681164e-0001L,
      127 +        A5 = 2.222222222222242577702836920812882605099e-0001L,
      128 +        A6 = 1.818181816435493395985912667105885828356e-0001L,
      129 +        A7 = 1.538537835211839751112067512805496931725e-0001L,
      130 +        B1 = 6.666666666666666666666666666666961498329e-0001L,
      131 +        B2 = 3.999999999999999999999999990037655042358e-0001L,
      132 +        B3 = 2.857142857142857142857273426428347457918e-0001L,
      133 +        B4 = 2.222222222222222221353229049747910109566e-0001L,
      134 +        B5 = 1.818181818181821503532559306309070138046e-0001L,
      135 +        B6 = 1.538461538453809210486356084587356788556e-0001L,
      136 +        B7 = 1.333333344463358756121456892645178795480e-0001L,
      137 +        B8 = 1.176460904783899064854645174603360383792e-0001L,
      138 +        B9 = 1.057293869956598995326368602518056990746e-0001L;
 140  139  
 141  140  long double
 142      -log1pl(long double x) {
      141 +log1pl(long double x)
      142 +{
 143  143          long double f, s, z, qn, h, t, y, g;
 144  144          int i, j, ix, iy, n, hx, m;
 145  145  
 146  146          hx = H0(x);
 147  147          ix = hx & 0x7fffffff;
 148      -        if (ix < 0x3ffaf07c) {  /* |x|<2/33 */
      148 +
      149 +        if (ix < 0x3ffaf07c) {          /* |x|<2/33 */
 149  150                  if (ix <= 0x3f8d0000) { /* x <= 2**-114, return x */
 150      -                        if ((int) x == 0)
      151 +                        if ((int)x == 0)
 151  152                                  return (x);
 152  153                  }
      154 +
 153  155                  s = x / (two + x);      /* |s|<2**-8 */
 154  156                  z = s * s;
 155      -                return (x - s * (x - z * (B1 + z * (B2 + z * (B3 + z * (B4 +
 156      -                    z * (B5 + z * (B6 + z * (B7 + z * (B8 + z * B9))))))))));
      157 +                return (x - s * (x - z * (B1 + z * (B2 + z * (B3 + z * (B4 + z *
      158 +                    (B5 + z * (B6 + z * (B7 + z * (B8 + z * B9))))))))));
 157  159          }
 158      -        if (ix >= 0x7fff0000) { /* x is +inf or NaN */
      160 +
      161 +        if (ix >= 0x7fff0000)           /* x is +inf or NaN */
 159  162                  return (x + fabsl(x));
 160      -        }
      163 +
 161  164          if (hx < 0 && ix >= 0x3fff0000) {
 162  165                  if (ix > 0x3fff0000 || (H1(x) | H2(x) | H3(x)) != 0)
 163  166                          x = zero;
      167 +
 164  168                  return (x / zero);      /* log1p(x) is NaN  if x<-1 */
 165  169                  /* log1p(-1) is -inf */
 166  170          }
      171 +
 167  172          if (ix >= 0x7ffeffff)
 168      -                y = x;          /* avoid spurious overflow */
      173 +                y = x;                  /* avoid spurious overflow */
 169  174          else
 170  175                  y = one + x;
      176 +
 171  177          iy = H0(y);
 172  178          n = ((iy + 0x200) >> 16) - 0x3fff;
 173  179          iy = (iy & 0x0000ffff) | 0x3fff0000;    /* scale 1+x to [1,2] */
 174  180          H0(y) = iy;
 175  181          z = zero;
 176  182          m = (ix >> 16) - 0x3fff;
      183 +
 177  184          /* HI(1+x) = (((hx&0xffff)|0x10000)>>(-m))|0x3fff0000 */
 178      -        if (n == 0) {           /* x in [2/33,1) */
      185 +        if (n == 0) {                   /* x in [2/33,1) */
 179  186                  g = zero;
 180  187                  H0(g) = ((hx + (0x200 << (-m))) >> (10 - m)) << (10 - m);
 181  188                  t = x - g;
 182  189                  i = (((((hx & 0xffff) | 0x10000) >> (-m)) | 0x3fff0000) +
 183      -                        0x200) >> 10;
      190 +                    0x200) >> 10;
 184  191                  H0(z) = i << 10;
 185      -
 186  192          } else if ((1 + n) == 0 && (ix < 0x3ffe0000)) { /* x in (-0.5,-2/33] */
 187  193                  g = zero;
 188  194                  H0(g) = ((ix + (0x200 << (-m - 1))) >> (9 - m)) << (9 - m);
 189  195                  t = g + x;
 190  196                  t = t + t;
      197 +
 191  198                  /*
 192  199                   * HI(2*(1+x)) =
 193  200                   * ((0x10000-(((hx&0xffff)|0x10000)>>(-m)))<<1)|0x3fff0000
 194  201                   */
      202 +
 195  203                  /*
 196  204                   * i =
 197  205                   * ((((0x10000-(((hx&0xffff)|0x10000)>>(-m)))<<1)|0x3fff0000)+
 198  206                   * 0x200)>>10; H0(z)=i<<10;
 199  207                   */
 200  208                  z = two * (one - g);
 201  209                  i = H0(z) >> 10;
 202  210          } else {
 203  211                  i = (iy + 0x200) >> 10;
 204  212                  H0(z) = i << 10;
 205  213                  t = y - z;
 206  214          }
 207  215  
 208  216          s = t / (y + z);
 209  217          j = i & 0x3f;
 210  218          z = s * s;
 211      -        qn = (long double) n;
      219 +        qn = (long double)n;
 212  220          t = qn * ln2lo + _TBL_logl_lo[j];
 213  221          h = qn * ln2hi + _TBL_logl_hi[j];
 214      -        f = t + s * (A1 + z * (A2 + z * (A3 + z * (A4 + z * (A5 + z * (A6 +
 215      -                z * A7))))));
      222 +        f = t + s * (A1 + z * (A2 + z * (A3 + z * (A4 + z * (A5 + z * (A6 + z *
      223 +            A7))))));
 216  224          return (h + f);
 217  225  }

XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX