/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */

/*
 * Copyright 2006 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */

/*
 * Copyright 2011, Richard Lowe.
 */

/* Functions in this file are duplicated in locallibm.il.
Keep them in sync */ 32 33 #ifndef _LIBM_INLINES_H 34 #define _LIBM_INLINES_H 35 36 #ifdef __GNUC__ 37 38 #include <sys/types.h> 39 #include <sys/ieeefp.h> 40 41 #ifdef __cplusplus 42 extern "C" { 43 #endif 44 45 extern __inline__ enum fp_class_type 46 fp_classf(float f) 47 { 48 enum fp_class_type ret; 49 int fint; /* scratch for f as int */ 50 uint64_t tmp; 51 52 __asm__ __volatile__( 53 "fabss %3,%3\n\t" 54 "st %3,%1\n\t" 55 "ld %1,%0\n\t" 56 "orcc %%g0,%0,%%g0\n\t" 57 "be,pn %%icc,2f\n\t" 58 "nop\n\t" 59 "1:\n\t" 60 "sethi %%hi(0x7f800000),%2\n\t" 61 "andcc %0,%2,%%g0\n\t" 62 "bne,pt %%icc,1f\n\t" 63 "nop\n\t" 64 "or %%g0,1,%0\n\t" 65 "ba 2f\n\t" /* subnormal */ 66 "nop\n\t" 67 "1:\n\t" 68 "subcc %0,%2,%%g0\n\t" 69 "bge,pn %%icc,1f\n\t" 70 "nop\n\t" 71 "or %%g0,2,%0\n\t" 72 "ba 2f\n\t" /* normal */ 73 "nop\n\t" 74 "1:\n\t" 75 "bg,pn %%icc,1f\n\t" 76 "nop\n\t" 77 "or %%g0,3,%0\n\t" 78 "ba 2f\n\t" /* infinity */ 79 "nop\n\t" 80 "1:\n\t" 81 "sethi %%hi(0x00400000),%2\n\t" 82 "andcc %0,%2,%%g0\n\t" 83 "or %%g0,4,%0\n\t" 84 "bne,pt %%icc,2f\n\t" /* quiet NaN */ 85 "nop\n\t" 86 "or %%g0,5,%0\n\t" /* signalling NaN */ 87 "2:\n\t" 88 : "=r" (ret), "=m" (fint), "=r" (tmp) 89 : "f" (f) 90 : "cc"); 91 92 return (ret); 93 } 94 95 extern __inline__ enum fp_class_type 96 fp_class(double d) 97 { 98 enum fp_class_type ret; 99 uint64_t dint; /* Scratch for d-as-long */ 100 uint64_t tmp; 101 102 __asm__ __volatile__( 103 "fabsd %3,%3\n\t" 104 "std %3,%1\n\t" 105 "ldx %1,%0\n\t" 106 "orcc %%g0,%0,%%g0\n\t" 107 "be,pn %%xcc,2f\n\t" 108 "nop\n\t" 109 "sethi %%hi(0x7ff00000),%2\n\t" 110 "sllx %2,32,%2\n\t" 111 "andcc %0,%2,%%g0\n\t" 112 "bne,pt %%xcc,1f\n\t" 113 "nop\n\t" 114 "or %%g0,1,%0\n\t" 115 "ba 2f\n\t" 116 "nop\n\t" 117 "1:\n\t" 118 "subcc %0,%2,%%g0\n\t" 119 "bge,pn %%xcc,1f\n\t" 120 "nop\n\t" 121 "or %%g0,2,%0\n\t" 122 "ba 2f\n\t" 123 "nop\n\t" 124 "1:\n\t" 125 "andncc %0,%2,%0\n\t" 126 "bne,pn %%xcc,1f\n\t" 127 "nop\n\t" 128 "or %%g0,3,%0\n\t" 129 "ba 2f\n\t" 130 "nop\n\t" 
131 "1:\n\t" 132 "sethi %%hi(0x00080000),%2\n\t" 133 "sllx %2,32,%2\n\t" 134 "andcc %0,%2,%%g0\n\t" 135 "or %%g0,4,%0\n\t" 136 "bne,pt %%xcc,2f\n\t" 137 "nop\n\t" 138 "or %%g0,5,%0\n\t" 139 "2:\n\t" 140 : "=r" (ret), "=m" (dint), "=r" (tmp) 141 : "e" (d) 142 : "cc"); 143 144 return (ret); 145 } 146 147 extern __inline__ float 148 __inline_sqrtf(float f) 149 { 150 float ret; 151 152 __asm__ __volatile__("fsqrts %1,%0\n\t" : "=f" (ret) : "f" (f)); 153 return (ret); 154 } 155 156 extern __inline__ double 157 __inline_sqrt(double d) 158 { 159 double ret; 160 161 __asm__ __volatile__("fsqrtd %1,%0\n\t" : "=f" (ret) : "f" (d)); 162 return (ret); 163 } 164 165 extern __inline__ int 166 __swapEX(int i) 167 { 168 int ret; 169 uint32_t fsr; 170 uint64_t tmp1, tmp2; 171 172 __asm__ __volatile__( 173 "and %4,0x1f,%2\n\t" 174 "sll %2,5,%2\n\t" /* shift input to aexc bit location */ 175 ".volatile\n\t" 176 "st %%fsr,%1\n\t" 177 "ld %1,%0\n\t" /* %0 = fsr */ 178 "andn %0,0x3e0,%3\n\t" 179 "or %2,%3,%2\n\t" /* %2 = new fsr */ 180 "st %2,%1\n\t" 181 "ld %1,%%fsr\n\t" 182 "srl %0,5,%0\n\t" 183 "and %0,0x1f,%0\n\t" 184 ".nonvolatile\n\t" 185 : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2) 186 : "r" (i) 187 : "cc"); 188 189 return (ret); 190 } 191 192 /* 193 * On the SPARC, __swapRP is a no-op; always return 0 for backward 194 * compatibility 195 */ 196 /* ARGSUSED */ 197 extern __inline__ enum fp_precision_type 198 __swapRP(enum fp_precision_type i) 199 { 200 return (0); 201 } 202 203 extern __inline__ enum fp_direction_type 204 __swapRD(enum fp_direction_type d) 205 { 206 enum fp_direction_type ret; 207 uint32_t fsr; 208 uint64_t tmp1, tmp2, tmp3; 209 210 __asm__ __volatile__( 211 "and %5,0x3,%0\n\t" 212 "sll %0,30,%2\n\t" /* shift input to RD bit location */ 213 ".volatile\n\t" 214 "st %%fsr,%1\n\t" 215 "ld %1,%0\n\t" /* %0 = fsr */ 216 /* mask of rounding direction bits */ 217 "sethi %%hi(0xc0000000),%4\n\t" 218 "andn %0,%4,%3\n\t" 219 "or %2,%3,%2\n\t" /* %2 = new fsr */ 220 
"st %2,%1\n\t" 221 "ld %1,%%fsr\n\t" 222 "srl %0,30,%0\n\t" 223 "and %0,0x3,%0\n\t" 224 ".nonvolatile\n\t" 225 : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2), "=r" (tmp3) 226 : "r" (d) 227 : "cc"); 228 229 return (ret); 230 } 231 232 extern __inline__ int 233 __swapTE(int i) 234 { 235 int ret; 236 uint32_t fsr; 237 uint64_t tmp1, tmp2, tmp3; 238 239 __asm__ __volatile__( 240 "and %5,0x1f,%0\n\t" 241 "sll %0,23,%2\n\t" /* shift input to TEM bit location */ 242 ".volatile\n\t" 243 "st %%fsr,%1\n\t" 244 "ld %1,%0\n\t" /* %0 = fsr */ 245 /* mask of TEM (Trap Enable Mode bits) */ 246 "sethi %%hi(0x0f800000),%4\n\t" 247 "andn %0,%4,%3\n\t" 248 "or %2,%3,%2\n\t" /* %2 = new fsr */ 249 "st %2,%1\n\t" 250 "ld %1,%%fsr\n\t" 251 "srl %0,23,%0\n\t" 252 "and %0,0x1f,%0\n\t" 253 ".nonvolatile\n\t" 254 : "=r" (ret), "=m" (fsr), "=r" (tmp1), "=r" (tmp2), "=r" (tmp3) 255 : "r" (i) 256 : "cc"); 257 258 return (ret); 259 } 260 261 262 extern __inline__ double 263 sqrt(double d) 264 { 265 return (__inline_sqrt(d)); 266 } 267 268 extern __inline__ float 269 sqrtf(float f) 270 { 271 return (__inline_sqrtf(f)); 272 } 273 274 extern __inline__ double 275 fabs(double d) 276 { 277 double ret; 278 279 __asm__ __volatile__("fabsd %1,%0\n\t" : "=e" (ret) : "e" (d)); 280 return (ret); 281 } 282 283 extern __inline__ float 284 fabsf(float f) 285 { 286 float ret; 287 288 __asm__ __volatile__("fabss %1,%0\n\t" : "=f" (ret) : "f" (f)); 289 return (ret); 290 } 291 292 #ifdef __cplusplus 293 } 294 #endif 295 296 #endif /* __GNUC__ */ 297 298 #endif /* _LIBM_INLINES_H */