/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License (the "License").
 * You may not use this file except in compliance with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2011 Nexenta Systems, Inc. All rights reserved.
 */
/*
 * Copyright 2006 Sun Microsystems, Inc. All rights reserved.
 * Use is subject to license terms.
 */

	.file	"__vsqrt.S"

#include "libm.h"

	RO_DATA
	.align	64

! Read-only constants for __vsqrt.
!
! The block opens with eight doubles (64 bytes), each written as a
! high word / low word pair: the polynomial coefficients A1-A5 at byte
! offsets 0, 8, 16, 24 and 32, followed by the bit patterns DC0, DC2
! and DC3 at offsets 40, 48 and 56.  __vsqrt loads all eight with ldd
! and then advances its table pointer by 64, so the lookup table
! documented below is what the per-element code indexes.
.CONST_TBL:
	.word	0x3fe00000, 0x00000000	! A1  =  5.00000000000000001789e-01
	.word	0xbfbfffff, 0xfffd0bfd	! A2  = -1.24999999997314110667e-01
	.word	0x3fafffff, 0xfffb5bfb	! A3  =  6.24999999978896565817e-02
	.word	0xbfa4000f, 0xc00b4fc8	! A4  = -3.90629693917215481458e-02
	.word	0x3f9c0018, 0xc012da4e	! A5  =  2.73441188080261677282e-02
	.word	0x000fffff, 0xffffffff	! DC0 = 0x000fffffffffffff
	.word	0x00001000, 0x00000000	! DC2 = 0x0000100000000000
	.word	0x7fffe000, 0x00000000	! DC3 = 0x7fffe00000000000

! Lookup table: one 64-byte record of eight doubles for every i.
! With x(i) = *(double*)&(0x3fe0000000000000LL + (i << 45)), i.e. 129
! evenly spaced points from 0.5 (i = 0) to 1.0 (i = 128):
!
! i = [0,128]
! TBL[8*i+0] = 1.0 / (*(double*)&(0x3fe0000000000000LL + (i << 45)));
! TBL[8*i+1] = (double)(2.0 * sqrtl(*(double*)&(0x3fe0000000000000LL + (i << 45))));
! TBL[8*i+2] = (double)(2.0 * sqrtl(*(double*)&(0x3fe0000000000000LL + (i << 45))) - TBL[8*i+1]);
! TBL[8*i+3] = 0
! TBL[8*i+4] = 1.0 / (*(double*)&(0x3fe0000000000000LL + (i << 45)));
! TBL[8*i+5] = (double)(2.0 * sqrtl(2.0) * sqrtl(*(double*)&(0x3fe0000000000000LL + (i << 45))));
! TBL[8*i+6] = (double)(2.0 * sqrtl(2.0) * sqrtl(*(double*)&(0x3fe0000000000000LL + (i << 45))) - TBL[8*i+5]);
! TBL[8*i+7] = 0
!
! Doubles 0-3 and 4-7 of a record hold the same reciprocal and differ
! only by the extra sqrtl(2.0) factor in the hi/lo square-root pair.
! Per the algorithm notes ahead of __vsqrt, the second half is selected
! by adding bit = (hx >> 15) & 32 to the byte offset of the record.
! Doubles 3 and 7 are zero padding.

	.word	0x40000000, 0x00000000, 0x3ff6a09e, 0x667f3bcd
	.word	0xbc9bdd34, 0x13b26456, 0x00000000, 0x00000000
	.word	0x40000000, 0x00000000, 0x40000000, 0x00000000
	.word	0xb8f00000, 0x00000000, 0x00000000, 0x00000000
	.word	0x3fffc07f, 0x01fc07f0, 0x3ff6b733, 0xbfd8c648
	.word	0x3c53b629, 0x05629048, 0x00000000, 0x00000000
	.word	0x3fffc07f, 0x01fc07f0, 0x40000ff8, 0x07f60deb
	.word	0x3c90655c, 0x648a53f1, 0x00000000, 0x00000000
	.word	0x3fff81f8, 0x1f81f820, 0x3ff6cdb2, 0xbbb212eb
	.word	0x3c960332, 0xcdbaba2d, 0x00000000, 0x00000000
	.word	0x3fff81f8, 0x1f81f820, 0x40001fe0, 0x3f61bad0
	.word	0x3ca2c41a, 0x15cbfaf2, 0x00000000, 0x00000000
	.word	0x3fff4465, 0x9e4a4271, 0x3ff6e41b, 0x9bfb3b75
	.word	0xbc925d8c, 0xfd6d5c87, 0x00000000, 0x00000000
	.word	0x3fff4465, 0x9e4a4271, 0x40002fb8, 0xd4e30f48
	.word	0xbca64203, 0xab1ba910, 0x00000000, 0x00000000
	.word	0x3fff07c1, 0xf07c1f08, 0x3ff6fa6e, 0xa162d0f0
	.word	0x3c691a24, 0x3d6297e9, 0x00000000, 0x00000000
	.word	0x3fff07c1, 0xf07c1f08, 0x40003f81, 0xf636b80c
	.word	0xbca0efc8, 0xba812a8c, 0x00000000, 0x00000000
	.word	0x3ffecc07, 0xb301ecc0, 0x3ff710ac, 0x0b5e5e32
	.word	0xbc991218, 0xb8d2850d, 0x00000000, 0x00000000
	.word	0x3ffecc07, 0xb301ecc0, 0x40004f3b, 0xd03c0a64
	.word	0x3c9ee2cf, 0x2d8ae22b, 0x00000000, 0x00000000
	.word	0x3ffe9131, 0xabf0b767, 0x3ff726d4, 0x1832a0be
	.word	0xbc2d9b1a, 0xa8ecb058, 0x00000000, 0x00000000
	.word	0x3ffe9131, 0xabf0b767, 0x40005ee6, 0x8efad48b
	.word	0xbc9c35f4, 0x8f4b89f7, 0x00000000, 0x00000000
	.word	0x3ffe573a, 0xc901e574, 0x3ff73ce7, 0x04fb7b23
	.word	0x3c91470b, 0x816b17a6, 0x00000000, 0x00000000
	.word
0x3ffe573a, 0xc901e574, 0x40006e82, 0x5da8fc2b 87 .word 0x3c9a315a, 0x8bd8a03b, 0x00000000, 0x00000000 88 .word 0x3ffe1e1e, 0x1e1e1e1e, 0x3ff752e5, 0x0db3a3a2 89 .word 0xbc939331, 0x3eea4381, 0x00000000, 0x00000000 90 .word 0x3ffe1e1e, 0x1e1e1e1e, 0x40007e0f, 0x66afed07 91 .word 0xbc74a6e1, 0xdcd59eaf, 0x00000000, 0x00000000 92 .word 0x3ffde5d6, 0xe3f8868a, 0x3ff768ce, 0x6d3c11e0 93 .word 0xbc9478b8, 0xab33074d, 0x00000000, 0x00000000 94 .word 0x3ffde5d6, 0xe3f8868a, 0x40008d8d, 0xd3b1d9aa 95 .word 0x3c81d533, 0x85fe2b96, 0x00000000, 0x00000000 96 .word 0x3ffdae60, 0x76b981db, 0x3ff77ea3, 0x5d632e43 97 .word 0x3c92f714, 0x9a22fa4f, 0x00000000, 0x00000000 98 .word 0x3ffdae60, 0x76b981db, 0x40009cfd, 0xcd8ed009 99 .word 0xbc4862a9, 0xbcf7f372, 0x00000000, 0x00000000 100 .word 0x3ffd77b6, 0x54b82c34, 0x3ff79464, 0x16ebc56c 101 .word 0x3c9a7cd5, 0x224c7375, 0x00000000, 0x00000000 102 .word 0x3ffd77b6, 0x54b82c34, 0x4000ac5f, 0x7c69a3c8 103 .word 0x3ca94dff, 0x7bfa2757, 0x00000000, 0x00000000 104 .word 0x3ffd41d4, 0x1d41d41d, 0x3ff7aa10, 0xd193c22d 105 .word 0xbc790ed9, 0x403afe85, 0x00000000, 0x00000000 106 .word 0x3ffd41d4, 0x1d41d41d, 0x4000bbb3, 0x07acafdb 107 .word 0xbc852a97, 0x686f9d2e, 0x00000000, 0x00000000 108 .word 0x3ffd0cb5, 0x8f6ec074, 0x3ff7bfa9, 0xc41ab040 109 .word 0x3c8d6bc3, 0x02ae758f, 0x00000000, 0x00000000 110 .word 0x3ffd0cb5, 0x8f6ec074, 0x4000caf8, 0x960e710d 111 .word 0x3c9caa6b, 0xe2366171, 0x00000000, 0x00000000 112 .word 0x3ffcd856, 0x89039b0b, 0x3ff7d52f, 0x244809e9 113 .word 0x3c9081f6, 0xf3b99d5f, 0x00000000, 0x00000000 114 .word 0x3ffcd856, 0x89039b0b, 0x4000da30, 0x4d95fb06 115 .word 0xbc9e1269, 0x76855586, 0x00000000, 0x00000000 116 .word 0x3ffca4b3, 0x055ee191, 0x3ff7eaa1, 0x26f15284 117 .word 0xbc846ce4, 0x68c1882b, 0x00000000, 0x00000000 118 .word 0x3ffca4b3, 0x055ee191, 0x4000e95a, 0x539f492c 119 .word 0xbc80c73f, 0xc38a2184, 0x00000000, 0x00000000 120 .word 0x3ffc71c7, 0x1c71c71c, 0x3ff80000, 0x00000000 121 .word 0x00000000, 
0x00000000, 0x00000000, 0x00000000 122 .word 0x3ffc71c7, 0x1c71c71c, 0x4000f876, 0xccdf6cd9 123 .word 0x3cab1a18, 0xf13a34c0, 0x00000000, 0x00000000 124 .word 0x3ffc3f8f, 0x01c3f8f0, 0x3ff8154b, 0xe2773526 125 .word 0xbc857147, 0xe067d0ee, 0x00000000, 0x00000000 126 .word 0x3ffc3f8f, 0x01c3f8f0, 0x40010785, 0xdd689a29 127 .word 0xbcaaabbe, 0x9e4d810a, 0x00000000, 0x00000000 128 .word 0x3ffc0e07, 0x0381c0e0, 0x3ff82a85, 0x00794e6c 129 .word 0xbc82edaa, 0x75e6ac5f, 0x00000000, 0x00000000 130 .word 0x3ffc0e07, 0x0381c0e0, 0x40011687, 0xa8ae14a3 131 .word 0x3cac9b43, 0xbcf06106, 0x00000000, 0x00000000 132 .word 0x3ffbdd2b, 0x899406f7, 0x3ff83fab, 0x8b4d4315 133 .word 0x3c829e06, 0x2d3e134d, 0x00000000, 0x00000000 134 .word 0x3ffbdd2b, 0x899406f7, 0x4001257c, 0x5187fd09 135 .word 0xbca4a750, 0xa83950a4, 0x00000000, 0x00000000 136 .word 0x3ffbacf9, 0x14c1bad0, 0x3ff854bf, 0xb363dc39 137 .word 0x3c99399f, 0xca38787e, 0x00000000, 0x00000000 138 .word 0x3ffbacf9, 0x14c1bad0, 0x40013463, 0xfa37014e 139 .word 0x3c7b295b, 0xaa698cd3, 0x00000000, 0x00000000 140 .word 0x3ffb7d6c, 0x3dda338b, 0x3ff869c1, 0xa85cc346 141 .word 0x3c9fcc99, 0xde11b1d1, 0x00000000, 0x00000000 142 .word 0x3ffb7d6c, 0x3dda338b, 0x4001433e, 0xc467effb 143 .word 0x3c92c031, 0x3b7278c8, 0x00000000, 0x00000000 144 .word 0x3ffb4e81, 0xb4e81b4f, 0x3ff87eb1, 0x990b697a 145 .word 0x3c7c43e9, 0xf593ea0f, 0x00000000, 0x00000000 146 .word 0x3ffb4e81, 0xb4e81b4f, 0x4001520c, 0xd1372feb 147 .word 0xbcadec22, 0x5d8e66d2, 0x00000000, 0x00000000 148 .word 0x3ffb2036, 0x406c80d9, 0x3ff8938f, 0xb37bc9c1 149 .word 0xbc7c115f, 0x9f5c8d6f, 0x00000000, 0x00000000 150 .word 0x3ffb2036, 0x406c80d9, 0x400160ce, 0x41341d74 151 .word 0x3c967036, 0x863a1bb2, 0x00000000, 0x00000000 152 .word 0x3ffaf286, 0xbca1af28, 0x3ff8a85c, 0x24f70659 153 .word 0x3c9f6e07, 0x6b588a50, 0x00000000, 0x00000000 154 .word 0x3ffaf286, 0xbca1af28, 0x40016f83, 0x34644df9 155 .word 0xbcae8679, 0x80a1c48e, 0x00000000, 0x00000000 156 .word 0x3ffac570, 
0x1ac5701b, 0x3ff8bd17, 0x1a07e38a 157 .word 0x3c9c20b5, 0xa697f23f, 0x00000000, 0x00000000 158 .word 0x3ffac570, 0x1ac5701b, 0x40017e2b, 0xca46bab9 159 .word 0x3ca1519b, 0x10d04d5f, 0x00000000, 0x00000000 160 .word 0x3ffa98ef, 0x606a63be, 0x3ff8d1c0, 0xbe7f20ac 161 .word 0xbc8bdb8a, 0x6df021f3, 0x00000000, 0x00000000 162 .word 0x3ffa98ef, 0x606a63be, 0x40018cc8, 0x21d6d3e3 163 .word 0xbca30af1, 0xd725cc5b, 0x00000000, 0x00000000 164 .word 0x3ffa6d01, 0xa6d01a6d, 0x3ff8e659, 0x3d77b0b8 165 .word 0xbc7d99d7, 0x64769954, 0x00000000, 0x00000000 166 .word 0x3ffa6d01, 0xa6d01a6d, 0x40019b58, 0x598f7c9f 167 .word 0xbc72e0d8, 0x51c0e011, 0x00000000, 0x00000000 168 .word 0x3ffa41a4, 0x1a41a41a, 0x3ff8fae0, 0xc15ad38a 169 .word 0xbc7db7ad, 0xb6817f6d, 0x00000000, 0x00000000 170 .word 0x3ffa41a4, 0x1a41a41a, 0x4001a9dc, 0x8f6df104 171 .word 0xbcafc519, 0xc18dc1d5, 0x00000000, 0x00000000 172 .word 0x3ffa16d3, 0xf97a4b02, 0x3ff90f57, 0x73e410e4 173 .word 0x3c6fb605, 0xcee75482, 0x00000000, 0x00000000 174 .word 0x3ffa16d3, 0xf97a4b02, 0x4001b854, 0xe0f496a0 175 .word 0x3ca27006, 0x899b7c3a, 0x00000000, 0x00000000 176 .word 0x3ff9ec8e, 0x951033d9, 0x3ff923bd, 0x7e25164d 177 .word 0xbc9278d1, 0x901d3b40, 0x00000000, 0x00000000 178 .word 0x3ff9ec8e, 0x951033d9, 0x4001c6c1, 0x6b2db870 179 .word 0x3c887e1d, 0x8335fb28, 0x00000000, 0x00000000 180 .word 0x3ff9c2d1, 0x4ee4a102, 0x3ff93813, 0x088978c5 181 .word 0xbc54312c, 0x627e5c52, 0x00000000, 0x00000000 182 .word 0x3ff9c2d1, 0x4ee4a102, 0x4001d522, 0x4aae2ee1 183 .word 0x3ca91222, 0xf6aebdc9, 0x00000000, 0x00000000 184 .word 0x3ff99999, 0x9999999a, 0x3ff94c58, 0x3ada5b53 185 .word 0xbc9b7ed7, 0x50df3cca, 0x00000000, 0x00000000 186 .word 0x3ff99999, 0x9999999a, 0x4001e377, 0x9b97f4a8 187 .word 0xbc9f5063, 0x19fcfd19, 0x00000000, 0x00000000 188 .word 0x3ff970e4, 0xf80cb872, 0x3ff9608d, 0x3c41fb4b 189 .word 0x3c73df32, 0xeaa86b83, 0x00000000, 0x00000000 190 .word 0x3ff970e4, 0xf80cb872, 0x4001f1c1, 0x799ca8ff 191 .word 0xbca28b52, 
0xeb725e0a, 0x00000000, 0x00000000 192 .word 0x3ff948b0, 0xfcd6e9e0, 0x3ff974b2, 0x334f2346 193 .word 0x3c814e4a, 0xd3ae9e3f, 0x00000000, 0x00000000 194 .word 0x3ff948b0, 0xfcd6e9e0, 0x40020000, 0x00000000 195 .word 0xb9000000, 0x00000000, 0x00000000, 0x00000000 196 .word 0x3ff920fb, 0x49d0e229, 0x3ff988c7, 0x45f88592 197 .word 0x3c95af70, 0x1a56047b, 0x00000000, 0x00000000 198 .word 0x3ff920fb, 0x49d0e229, 0x40020e33, 0x499a21a9 199 .word 0xbc924ba2, 0x74fea9a1, 0x00000000, 0x00000000 200 .word 0x3ff8f9c1, 0x8f9c18fa, 0x3ff99ccc, 0x999fff00 201 .word 0x3c866234, 0x063b88ee, 0x00000000, 0x00000000 202 .word 0x3ff8f9c1, 0x8f9c18fa, 0x40021c5b, 0x70d9f824 203 .word 0xbca844f9, 0x9eee6fc3, 0x00000000, 0x00000000 204 .word 0x3ff8d301, 0x8d3018d3, 0x3ff9b0c2, 0x5315c2ce 205 .word 0xbc87f64a, 0x65cc6887, 0x00000000, 0x00000000 206 .word 0x3ff8d301, 0x8d3018d3, 0x40022a78, 0x8fc76de5 207 .word 0x3c931e32, 0xd4e07a48, 0x00000000, 0x00000000 208 .word 0x3ff8acb9, 0x0f6bf3aa, 0x3ff9c4a8, 0x969b7077 209 .word 0xbc96ca9e, 0x5cd4517a, 0x00000000, 0x00000000 210 .word 0x3ff8acb9, 0x0f6bf3aa, 0x4002388a, 0xc0059c28 211 .word 0xbc96072f, 0xbe0e5da3, 0x00000000, 0x00000000 212 .word 0x3ff886e5, 0xf0abb04a, 0x3ff9d87f, 0x87e71422 213 .word 0xbc85fdd8, 0xb11b7b1d, 0x00000000, 0x00000000 214 .word 0x3ff886e5, 0xf0abb04a, 0x40024692, 0x1ad4ea49 215 .word 0xbcaa6d9b, 0x268ef62d, 0x00000000, 0x00000000 216 .word 0x3ff86186, 0x18618618, 0x3ff9ec47, 0x4a261264 217 .word 0xbc8540c4, 0x89ba5074, 0x00000000, 0x00000000 218 .word 0x3ff86186, 0x18618618, 0x4002548e, 0xb9151e85 219 .word 0x3c999820, 0x0a774879, 0x00000000, 0x00000000 220 .word 0x3ff83c97, 0x7ab2bedd, 0x3ffa0000, 0x00000000 221 .word 0x00000000, 0x00000000, 0x00000000, 0x00000000 222 .word 0x3ff83c97, 0x7ab2bedd, 0x40026280, 0xb3476096 223 .word 0x3c9ab88b, 0x5ffe1cf5, 0x00000000, 0x00000000 224 .word 0x3ff81818, 0x18181818, 0x3ffa13a9, 0xcb996651 225 .word 0xbc9f9ab9, 0x0e4e85c3, 0x00000000, 0x00000000 226 .word 0x3ff81818, 
0x18181818, 0x40027068, 0x21902e9a 227 .word 0x3c90ff4c, 0x20f541f6, 0x00000000, 0x00000000 228 .word 0x3ff7f405, 0xfd017f40, 0x3ffa2744, 0xce9674f5 229 .word 0xbc8b936c, 0x81e54daa, 0x00000000, 0x00000000 230 .word 0x3ff7f405, 0xfd017f40, 0x40027e45, 0x1bb944c3 231 .word 0x3c8e4a16, 0x42099ef0, 0x00000000, 0x00000000 232 .word 0x3ff7d05f, 0x417d05f4, 0x3ffa3ad1, 0x2a1da160 233 .word 0x3c951168, 0xf4be5984, 0x00000000, 0x00000000 234 .word 0x3ff7d05f, 0x417d05f4, 0x40028c17, 0xb9337834 235 .word 0xbc8af150, 0xa0e88972, 0x00000000, 0x00000000 236 .word 0x3ff7ad22, 0x08e0ecc3, 0x3ffa4e4e, 0xfeda34de 237 .word 0x3c6afbb4, 0xdbdadd0d, 0x00000000, 0x00000000 238 .word 0x3ff7ad22, 0x08e0ecc3, 0x400299e0, 0x11188575 239 .word 0xbc9a6169, 0x3fb250e5, 0x00000000, 0x00000000 240 .word 0x3ff78a4c, 0x8178a4c8, 0x3ffa61be, 0x6cfec997 241 .word 0xbc8c37ea, 0xb2bb5ca0, 0x00000000, 0x00000000 242 .word 0x3ff78a4c, 0x8178a4c8, 0x4002a79e, 0x3a2cd2e6 243 .word 0xbca5ddd4, 0x9cc9ad59, 0x00000000, 0x00000000 244 .word 0x3ff767dc, 0xe434a9b1, 0x3ffa751f, 0x9447b724 245 .word 0x3c82b909, 0x477e9ed1, 0x00000000, 0x00000000 246 .word 0x3ff767dc, 0xe434a9b1, 0x4002b552, 0x4ae1278e 247 .word 0xbca2f2a9, 0x8841b934, 0x00000000, 0x00000000 248 .word 0x3ff745d1, 0x745d1746, 0x3ffa8872, 0x93fd6f34 249 .word 0x3c768ef2, 0x4f198721, 0x00000000, 0x00000000 250 .word 0x3ff745d1, 0x745d1746, 0x4002c2fc, 0x595456a7 251 .word 0xbc996f60, 0xb0fc7e96, 0x00000000, 0x00000000 252 .word 0x3ff72428, 0x7f46debc, 0x3ffa9bb7, 0x8af6cabc 253 .word 0x3c8ba60d, 0xc999aba7, 0x00000000, 0x00000000 254 .word 0x3ff72428, 0x7f46debc, 0x4002d09c, 0x7b54e03e 255 .word 0x3c98c747, 0xfdeda6de, 0x00000000, 0x00000000 256 .word 0x3ff702e0, 0x5c0b8170, 0x3ffaaeee, 0x979b4838 257 .word 0xbc91f08a, 0xef9ef6c0, 0x00000000, 0x00000000 258 .word 0x3ff702e0, 0x5c0b8170, 0x4002de32, 0xc6628741 259 .word 0x3ca78746, 0xc499a4f7, 0x00000000, 0x00000000 260 .word 0x3ff6e1f7, 0x6b4337c7, 0x3ffac217, 0xd7e53b66 261 .word 0xbc64282a, 
0xaa967e4f, 0x00000000, 0x00000000 262 .word 0x3ff6e1f7, 0x6b4337c7, 0x4002ebbf, 0x4fafdd4b 263 .word 0xbca78a73, 0xb72d5c41, 0x00000000, 0x00000000 264 .word 0x3ff6c16c, 0x16c16c17, 0x3ffad533, 0x6963eefc 265 .word 0xbc977c4a, 0x537dbdd2, 0x00000000, 0x00000000 266 .word 0x3ff6c16c, 0x16c16c17, 0x4002f942, 0x2c23c47e 267 .word 0xbc827c85, 0xf29db65d, 0x00000000, 0x00000000 268 .word 0x3ff6a13c, 0xd1537290, 0x3ffae841, 0x693db8b4 269 .word 0x3c90f773, 0xcd7a0713, 0x00000000, 0x00000000 270 .word 0x3ff6a13c, 0xd1537290, 0x400306bb, 0x705ae7c3 271 .word 0x3caf4933, 0x907af47a, 0x00000000, 0x00000000 272 .word 0x3ff68168, 0x16816817, 0x3ffafb41, 0xf432002e 273 .word 0xbc7ac94a, 0xfdfe8c5b, 0x00000000, 0x00000000 274 .word 0x3ff68168, 0x16816817, 0x4003142b, 0x30a929ab 275 .word 0x3c98dc01, 0x081a6c5c, 0x00000000, 0x00000000 276 .word 0x3ff661ec, 0x6a5122f9, 0x3ffb0e35, 0x269b38f5 277 .word 0xbc4f69a8, 0x05c3271a, 0x00000000, 0x00000000 278 .word 0x3ff661ec, 0x6a5122f9, 0x40032191, 0x811b0a41 279 .word 0xbc9ce3f0, 0xb38c0bf7, 0x00000000, 0x00000000 280 .word 0x3ff642c8, 0x590b2164, 0x3ffb211b, 0x1c70d023 281 .word 0x3c2e4c5e, 0x66eae2f0, 0x00000000, 0x00000000 282 .word 0x3ff642c8, 0x590b2164, 0x40032eee, 0x75770416 283 .word 0x3caed8e7, 0x730eaff2, 0x00000000, 0x00000000 284 .word 0x3ff623fa, 0x77016240, 0x3ffb33f3, 0xf1490def 285 .word 0xbc95894b, 0xcb02373b, 0x00000000, 0x00000000 286 .word 0x3ff623fa, 0x77016240, 0x40033c42, 0x213ee0c9 287 .word 0x3ca84c24, 0x4ba98124, 0x00000000, 0x00000000 288 .word 0x3ff60581, 0x60581606, 0x3ffb46bf, 0xc05aeb89 289 .word 0x3c9b1c7c, 0xc39adc9f, 0x00000000, 0x00000000 290 .word 0x3ff60581, 0x60581606, 0x4003498c, 0x97b10540 291 .word 0x3c734193, 0xbc8543b4, 0x00000000, 0x00000000 292 .word 0x3ff5e75b, 0xb8d015e7, 0x3ffb597e, 0xa47fdda3 293 .word 0xbc923cc8, 0x9d1e4635, 0x00000000, 0x00000000 294 .word 0x3ff5e75b, 0xb8d015e7, 0x400356cd, 0xebc9b5e2 295 .word 0x3c96dee1, 0x46bb1571, 0x00000000, 0x00000000 296 .word 0x3ff5c988, 
0x2b931057, 0x3ffb6c30, 0xb83593e6 297 .word 0x3c8f4e3f, 0xd28d84bc, 0x00000000, 0x00000000 298 .word 0x3ff5c988, 0x2b931057, 0x40036406, 0x30445306 299 .word 0xbca78d86, 0x2327430a, 0x00000000, 0x00000000 300 .word 0x3ff5ac05, 0x6b015ac0, 0x3ffb7ed6, 0x159fadc8 301 .word 0xbc899bcf, 0xf04d134b, 0x00000000, 0x00000000 302 .word 0x3ff5ac05, 0x6b015ac0, 0x40037135, 0x779c8dcb 303 .word 0xbc8fe126, 0xce9778ae, 0x00000000, 0x00000000 304 .word 0x3ff58ed2, 0x308158ed, 0x3ffb916e, 0xd68964ec 305 .word 0x3c826a5d, 0x5dbaae29, 0x00000000, 0x00000000 306 .word 0x3ff58ed2, 0x308158ed, 0x40037e5b, 0xd40f95a1 307 .word 0x3cac6ff5, 0xeca5d122, 0x00000000, 0x00000000 308 .word 0x3ff571ed, 0x3c506b3a, 0x3ffba3fb, 0x14672d7c 309 .word 0xbc8117d3, 0x97dcefc9, 0x00000000, 0x00000000 310 .word 0x3ff571ed, 0x3c506b3a, 0x40038b79, 0x579d3eab 311 .word 0xbcac254f, 0xc0db598e, 0x00000000, 0x00000000 312 .word 0x3ff55555, 0x55555555, 0x3ffbb67a, 0xe8584caa 313 .word 0x3c9cec95, 0xd0b5c1e3, 0x00000000, 0x00000000 314 .word 0x3ff55555, 0x55555555, 0x4003988e, 0x1409212e 315 .word 0x3caf40c8, 0x6450c869, 0x00000000, 0x00000000 316 .word 0x3ff53909, 0x48f40feb, 0x3ffbc8ee, 0x6b2865b9 317 .word 0x3c9394eb, 0x90f645c8, 0x00000000, 0x00000000 318 .word 0x3ff53909, 0x48f40feb, 0x4003a59a, 0x1adbb257 319 .word 0x3ca6adce, 0x020a308d, 0x00000000, 0x00000000 320 .word 0x3ff51d07, 0xeae2f815, 0x3ffbdb55, 0xb550fdbc 321 .word 0x3c7365e9, 0x6aa5fae3, 0x00000000, 0x00000000 322 .word 0x3ff51d07, 0xeae2f815, 0x4003b29d, 0x7d635662 323 .word 0x3cac99b0, 0x5e282129, 0x00000000, 0x00000000 324 .word 0x3ff50150, 0x15015015, 0x3ffbedb0, 0xdefaf661 325 .word 0x3c91a627, 0xb279170d, 0x00000000, 0x00000000 326 .word 0x3ff50150, 0x15015015, 0x4003bf98, 0x4cb56c77 327 .word 0x3ca8f653, 0xbcc0c4a1, 0x00000000, 0x00000000 328 .word 0x3ff4e5e0, 0xa72f0539, 0x3ffc0000, 0x00000000 329 .word 0x00000000, 0x00000000, 0x00000000, 0x00000000 330 .word 0x3ff4e5e0, 0xa72f0539, 0x4003cc8a, 0x99af5453 331 .word 0xbc486364, 
0x4f05f2be, 0x00000000, 0x00000000 332 .word 0x3ff4cab8, 0x8725af6e, 0x3ffc1243, 0x2fec0329 333 .word 0x3c96e0d7, 0x8dd23a7d, 0x00000000, 0x00000000 334 .word 0x3ff4cab8, 0x8725af6e, 0x4003d974, 0x74f76df2 335 .word 0x3c82e3c9, 0xfdbbbdc2, 0x00000000, 0x00000000 336 .word 0x3ff4afd6, 0xa052bf5b, 0x3ffc247a, 0x85fe81fa 337 .word 0x3c89d8ee, 0xf6854220, 0x00000000, 0x00000000 338 .word 0x3ff4afd6, 0xa052bf5b, 0x4003e655, 0xeefe1367 339 .word 0x3c80eb35, 0xbb532559, 0x00000000, 0x00000000 340 .word 0x3ff49539, 0xe3b2d067, 0x3ffc36a6, 0x192bf168 341 .word 0xbc9083d8, 0x1a423b11, 0x00000000, 0x00000000 342 .word 0x3ff49539, 0xe3b2d067, 0x4003f32f, 0x17fe8d04 343 .word 0xbc905d6c, 0x1c437de0, 0x00000000, 0x00000000 344 .word 0x3ff47ae1, 0x47ae147b, 0x3ffc48c6, 0x001f0ac0 345 .word 0xbc92d481, 0x189efd6b, 0x00000000, 0x00000000 346 .word 0x3ff47ae1, 0x47ae147b, 0x40040000, 0x00000000 347 .word 0x00000000, 0x00000000, 0x00000000, 0x00000000 348 .word 0x3ff460cb, 0xc7f5cf9a, 0x3ffc5ada, 0x513a1593 349 .word 0xbc7aaedd, 0x014f5f03, 0x00000000, 0x00000000 350 .word 0x3ff460cb, 0xc7f5cf9a, 0x40040cc8, 0xb6d657c2 351 .word 0xbc9c05ab, 0xf480ce19, 0x00000000, 0x00000000 352 .word 0x3ff446f8, 0x6562d9fb, 0x3ffc6ce3, 0x22982a3f 353 .word 0x3c891b2d, 0xf3e15f29, 0x00000000, 0x00000000 354 .word 0x3ff446f8, 0x6562d9fb, 0x40041989, 0x4c2329f0 355 .word 0x3c976037, 0x46da0ea6, 0x00000000, 0x00000000 356 .word 0x3ff42d66, 0x25d51f87, 0x3ffc7ee0, 0x8a0e6d4c 357 .word 0x3c991c54, 0xc53e75c8, 0x00000000, 0x00000000 358 .word 0x3ff42d66, 0x25d51f87, 0x40042641, 0xcf569572 359 .word 0xbcadf80b, 0x1442c029, 0x00000000, 0x00000000 360 .word 0x3ff41414, 0x14141414, 0x3ffc90d2, 0x9d2d43ce 361 .word 0xbc9edadb, 0x07f1137a, 0x00000000, 0x00000000 362 .word 0x3ff41414, 0x14141414, 0x400432f2, 0x4fb01c7a 363 .word 0x3ca38bfe, 0x0e012c1c, 0x00000000, 0x00000000 364 .word 0x3ff3fb01, 0x3fb013fb, 0x3ffca2b9, 0x714180f7 365 .word 0xbc81a63d, 0x6750c57c, 0x00000000, 0x00000000 366 .word 0x3ff3fb01, 
0x3fb013fb, 0x40043f9a, 0xdc3f79ce 367 .word 0x3c66d2b1, 0x767ae30a, 0x00000000, 0x00000000 368 .word 0x3ff3e22c, 0xbce4a902, 0x3ffcb495, 0x1b558d17 369 .word 0x3c8fcbcb, 0x357f2308, 0x00000000, 0x00000000 370 .word 0x3ff3e22c, 0xbce4a902, 0x40044c3b, 0x83e57153 371 .word 0x3c98c853, 0xc6be5ee1, 0x00000000, 0x00000000 372 .word 0x3ff3c995, 0xa47babe7, 0x3ffcc665, 0xb0328622 373 .word 0xbc91baa4, 0xd369f814, 0x00000000, 0x00000000 374 .word 0x3ff3c995, 0xa47babe7, 0x400458d4, 0x55549c1a 375 .word 0x3ca02d72, 0x8d9a6054, 0x00000000, 0x00000000 376 .word 0x3ff3b13b, 0x13b13b14, 0x3ffcd82b, 0x446159f3 377 .word 0x3c983fb7, 0xb33cdfe8, 0x00000000, 0x00000000 378 .word 0x3ff3b13b, 0x13b13b14, 0x40046565, 0x5f122ff6 379 .word 0x3ca862c5, 0xd2f0ca4c, 0x00000000, 0x00000000 380 .word 0x3ff3991c, 0x2c187f63, 0x3ffce9e5, 0xec2bda80 381 .word 0xbc94ccf3, 0xd8e249ab, 0x00000000, 0x00000000 382 .word 0x3ff3991c, 0x2c187f63, 0x400471ee, 0xaf76c2c6 383 .word 0x3c975c62, 0xeff26e8e, 0x00000000, 0x00000000 384 .word 0x3ff38138, 0x13813814, 0x3ffcfb95, 0xbb9dcc0c 385 .word 0x3c92cea2, 0x0857ae03, 0x00000000, 0x00000000 386 .word 0x3ff38138, 0x13813814, 0x40047e70, 0x54af0989 387 .word 0x3c9d8c33, 0xc0054830, 0x00000000, 0x00000000 388 .word 0x3ff3698d, 0xf3de0748, 0x3ffd0d3a, 0xc685eda4 389 .word 0x3c94115a, 0x0ff4cf9e, 0x00000000, 0x00000000 390 .word 0x3ff3698d, 0xf3de0748, 0x40048aea, 0x5cbc935f 391 .word 0xbca8cb00, 0x12d14ff5, 0x00000000, 0x00000000 392 .word 0x3ff3521c, 0xfb2b78c1, 0x3ffd1ed5, 0x2076fbe9 393 .word 0x3c8f48a8, 0x6b72875f, 0x00000000, 0x00000000 394 .word 0x3ff3521c, 0xfb2b78c1, 0x4004975c, 0xd5768088 395 .word 0xbca1731e, 0xbc02f748, 0x00000000, 0x00000000 396 .word 0x3ff33ae4, 0x5b57bcb2, 0x3ffd3064, 0xdcc8ae67 397 .word 0x3c93480e, 0x805158ba, 0x00000000, 0x00000000 398 .word 0x3ff33ae4, 0x5b57bcb2, 0x4004a3c7, 0xcc8a358a 399 .word 0xbc9d8f7f, 0xd2726ffa, 0x00000000, 0x00000000 400 .word 0x3ff323e3, 0x4a2b10bf, 0x3ffd41ea, 0x0e98af91 401 .word 0x3c824640, 
0x0309962f, 0x00000000, 0x00000000 402 .word 0x3ff323e3, 0x4a2b10bf, 0x4004b02b, 0x4f7c0a88 403 .word 0xbcaf71e1, 0xf6cafde2, 0x00000000, 0x00000000 404 .word 0x3ff30d19, 0x0130d190, 0x3ffd5364, 0xc8cb8f86 405 .word 0x3c8ad003, 0xc00630e1, 0x00000000, 0x00000000 406 .word 0x3ff30d19, 0x0130d190, 0x4004bc87, 0x6ba7f6ec 407 .word 0x3c9c1edb, 0x2be943b8, 0x00000000, 0x00000000 408 .word 0x3ff2f684, 0xbda12f68, 0x3ffd64d5, 0x1e0db1c6 409 .word 0xbc911ed3, 0x6986d362, 0x00000000, 0x00000000 410 .word 0x3ff2f684, 0xbda12f68, 0x4004c8dc, 0x2e423980 411 .word 0xbc949d1f, 0x46ef5d2c, 0x00000000, 0x00000000 412 .word 0x3ff2e025, 0xc04b8097, 0x3ffd763b, 0x20d435ef 413 .word 0x3c9d6780, 0xf76cb258, 0x00000000, 0x00000000 414 .word 0x3ff2e025, 0xc04b8097, 0x4004d529, 0xa457fcfc 415 .word 0xbca1404a, 0x46484e3d, 0x00000000, 0x00000000 416 .word 0x3ff2c9fb, 0x4d812ca0, 0x3ffd8796, 0xe35ddbb2 417 .word 0x3c83fdd9, 0x1aeb637a, 0x00000000, 0x00000000 418 .word 0x3ff2c9fb, 0x4d812ca0, 0x4004e16f, 0xdacff937 419 .word 0xbca1deb9, 0xd3815ad2, 0x00000000, 0x00000000 420 .word 0x3ff2b404, 0xad012b40, 0x3ffd98e8, 0x77b3e207 421 .word 0xbc48c301, 0xee02dee8, 0x00000000, 0x00000000 422 .word 0x3ff2b404, 0xad012b40, 0x4004edae, 0xde6b10fe 423 .word 0x3ca99709, 0x4a91a780, 0x00000000, 0x00000000 424 .word 0x3ff29e41, 0x29e4129e, 0x3ffdaa2f, 0xefaae1d8 425 .word 0xbc63fe0e, 0x03f44594, 0x00000000, 0x00000000 426 .word 0x3ff29e41, 0x29e4129e, 0x4004f9e6, 0xbbc4ecb3 427 .word 0x3c6ce5a6, 0x018493f1, 0x00000000, 0x00000000 428 .word 0x3ff288b0, 0x1288b013, 0x3ffdbb6d, 0x5ce3a42f 429 .word 0xbc922c27, 0xf71c8337, 0x00000000, 0x00000000 430 .word 0x3ff288b0, 0x1288b013, 0x40050617, 0x7f5491bb 431 .word 0xbc9e591e, 0x7b2a6d1a, 0x00000000, 0x00000000 432 .word 0x3ff27350, 0xb8812735, 0x3ffdcca0, 0xd0cbf408 433 .word 0x3c7a6d16, 0x2310db57, 0x00000000, 0x00000000 434 .word 0x3ff27350, 0xb8812735, 0x40051241, 0x356cf6e0 435 .word 0x3ca37dc2, 0x60e8bc2d, 0x00000000, 0x00000000 436 .word 0x3ff25e22, 
0x708092f1, 0x3ffdddca, 0x5c9f6be8 437 .word 0x3c818520, 0xf0a3f809, 0x00000000, 0x00000000 438 .word 0x3ff25e22, 0x708092f1, 0x40051e63, 0xea3d95b0 439 .word 0x3caecf78, 0x2e88d5ce, 0x00000000, 0x00000000 440 .word 0x3ff24924, 0x92492492, 0x3ffdeeea, 0x11683f49 441 .word 0x3c802aae, 0x4bfa7c27, 0x00000000, 0x00000000 442 .word 0x3ff24924, 0x92492492, 0x40052a7f, 0xa9d2f8ea 443 .word 0xbca21c62, 0xb033c079, 0x00000000, 0x00000000 444 .word 0x3ff23456, 0x789abcdf, 0x3ffe0000, 0x00000000 445 .word 0x00000000, 0x00000000, 0x00000000, 0x00000000 446 .word 0x3ff23456, 0x789abcdf, 0x40053694, 0x80174810 447 .word 0xbc9c3ec1, 0xa4ee7c21, 0x00000000, 0x00000000 448 .word 0x3ff21fb7, 0x8121fb78, 0x3ffe110c, 0x39105faf 449 .word 0x3c776161, 0x4c513964, 0x00000000, 0x00000000 450 .word 0x3ff21fb7, 0x8121fb78, 0x400542a2, 0x78d2d036 451 .word 0xbca495c2, 0x45254df4, 0x00000000, 0x00000000 452 .word 0x3ff20b47, 0x0c67c0d9, 0x3ffe220e, 0xcd13ed60 453 .word 0xbc729f01, 0xf18c9dc9, 0x00000000, 0x00000000 454 .word 0x3ff20b47, 0x0c67c0d9, 0x40054ea9, 0x9fac8a0f 455 .word 0x3c80cfbb, 0x19353b3d, 0x00000000, 0x00000000 456 .word 0x3ff1f704, 0x7dc11f70, 0x3ffe3307, 0xcc56cf5c 457 .word 0xbc81f04e, 0xc3189131, 0x00000000, 0x00000000 458 .word 0x3ff1f704, 0x7dc11f70, 0x40055aaa, 0x002a9d5a 459 .word 0xbc4bf504, 0x76241f94, 0x00000000, 0x00000000 460 .word 0x3ff1e2ef, 0x3b3fb874, 0x3ffe43f7, 0x46f7795b 461 .word 0xbc931e7f, 0x8af68f8c, 0x00000000, 0x00000000 462 .word 0x3ff1e2ef, 0x3b3fb874, 0x400566a3, 0xa5b2e1b1 463 .word 0x3caa1fd2, 0x8cc92e33, 0x00000000, 0x00000000 464 .word 0x3ff1cf06, 0xada2811d, 0x3ffe54dd, 0x4ce75f1e 465 .word 0xbc811b19, 0x5dfc62e5, 0x00000000, 0x00000000 466 .word 0x3ff1cf06, 0xada2811d, 0x40057296, 0x9b8b5cd8 467 .word 0x3ca30cbf, 0x1c53312e, 0x00000000, 0x00000000 468 .word 0x3ff1bb4a, 0x4046ed29, 0x3ffe65b9, 0xedeba38e 469 .word 0xbc7bb732, 0x51e8c364, 0x00000000, 0x00000000 470 .word 0x3ff1bb4a, 0x4046ed29, 0x40057e82, 0xecdabe8d 471 .word 0xbc7c2aed, 
0xf3c4c4bd, 0x00000000, 0x00000000 472 .word 0x3ff1a7b9, 0x611a7b96, 0x3ffe768d, 0x399dc470 473 .word 0xbc9a8c81, 0x3405c01c, 0x00000000, 0x00000000 474 .word 0x3ff1a7b9, 0x611a7b96, 0x40058a68, 0xa4a8d9f3 475 .word 0x3ca50798, 0xe67012d9, 0x00000000, 0x00000000 476 .word 0x3ff19453, 0x808ca29c, 0x3ffe8757, 0x3f6c42c5 477 .word 0x3c9dbf9c, 0xf7bbcda3, 0x00000000, 0x00000000 478 .word 0x3ff19453, 0x808ca29c, 0x40059647, 0xcddf1ca5 479 .word 0x3ca14a95, 0xf35dea0b, 0x00000000, 0x00000000 480 .word 0x3ff18118, 0x11811812, 0x3ffe9818, 0x0e9b47f2 481 .word 0xbc9b6bd7, 0x4396d08e, 0x00000000, 0x00000000 482 .word 0x3ff18118, 0x11811812, 0x4005a220, 0x73490377 483 .word 0xbcadd036, 0x39925812, 0x00000000, 0x00000000 484 .word 0x3ff16e06, 0x89427379, 0x3ffea8cf, 0xb64547ab 485 .word 0x3c8721b2, 0x6374e19f, 0x00000000, 0x00000000 486 .word 0x3ff16e06, 0x89427379, 0x4005adf2, 0x9f948cfb 487 .word 0xbca42520, 0xf7716fa6, 0x00000000, 0x00000000 488 .word 0x3ff15b1e, 0x5f75270d, 0x3ffeb97e, 0x455b9edb 489 .word 0x3c999b45, 0x40857883, 0x00000000, 0x00000000 490 .word 0x3ff15b1e, 0x5f75270d, 0x4005b9be, 0x5d52a9da 491 .word 0x3c9098cd, 0x1b3af777, 0x00000000, 0x00000000 492 .word 0x3ff1485f, 0x0e0acd3b, 0x3ffeca23, 0xcaa72f73 493 .word 0x3c7e3ed5, 0x29679959, 0x00000000, 0x00000000 494 .word 0x3ff1485f, 0x0e0acd3b, 0x4005c583, 0xb6f7ab03 495 .word 0x3ca963bc, 0x9d795b51, 0x00000000, 0x00000000 496 .word 0x3ff135c8, 0x1135c811, 0x3ffedac0, 0x54c8f94c 497 .word 0x3c90b5c1, 0x15a56207, 0x00000000, 0x00000000 498 .word 0x3ff135c8, 0x1135c811, 0x4005d142, 0xb6dbadc5 499 .word 0x3ca6f1f5, 0x5323d116, 0x00000000, 0x00000000 500 .word 0x3ff12358, 0xe75d3033, 0x3ffeeb53, 0xf23ab028 501 .word 0xbc8617e4, 0xb5384f5d, 0x00000000, 0x00000000 502 .word 0x3ff12358, 0xe75d3033, 0x4005dcfb, 0x673b05df 503 .word 0xbca099df, 0xc321634f, 0x00000000, 0x00000000 504 .word 0x3ff11111, 0x11111111, 0x3ffefbde, 0xb14f4eda 505 .word 0xbc93a145, 0xfe1be078, 0x00000000, 0x00000000 506 .word 0x3ff11111, 
0x11111111, 0x4005e8ad, 0xd236a58f 507 .word 0xbc7ef8c7, 0xc0d1fec6, 0x00000000, 0x00000000 508 .word 0x3ff0fef0, 0x10fef011, 0x3fff0c60, 0xa033a7b3 509 .word 0xbc91b0fc, 0x15cd89c6, 0x00000000, 0x00000000 510 .word 0x3ff0fef0, 0x10fef011, 0x4005f45a, 0x01d483b4 511 .word 0xbc94a237, 0xdc0fa105, 0x00000000, 0x00000000 512 .word 0x3ff0ecf5, 0x6be69c90, 0x3fff1cd9, 0xcceef239 513 .word 0x3c91afd8, 0x64eab60a, 0x00000000, 0x00000000 514 .word 0x3ff0ecf5, 0x6be69c90, 0x40060000, 0x00000000 515 .word 0x00000000, 0x00000000, 0x00000000, 0x00000000 516 .word 0x3ff0db20, 0xa88f4696, 0x3fff2d4a, 0x45635640 517 .word 0xbc8eebae, 0xea670bc2, 0x00000000, 0x00000000 518 .word 0x3ff0db20, 0xa88f4696, 0x40060b9f, 0xd68a4554 519 .word 0x3ca328e1, 0x70dae176, 0x00000000, 0x00000000 520 .word 0x3ff0c971, 0x4fbcda3b, 0x3fff3db2, 0x174e7468 521 .word 0x3c9e1513, 0x2d6ac52a, 0x00000000, 0x00000000 522 .word 0x3ff0c971, 0x4fbcda3b, 0x40061739, 0x8f2aaa48 523 .word 0xbc9b672b, 0xba260735, 0x00000000, 0x00000000 524 .word 0x3ff0b7e6, 0xec259dc8, 0x3fff4e11, 0x5049ec26 525 .word 0xbc9b6656, 0xb6bd5d76, 0x00000000, 0x00000000 526 .word 0x3ff0b7e6, 0xec259dc8, 0x400622cd, 0x337f0fe8 527 .word 0x3c9fe207, 0x3279559f, 0x00000000, 0x00000000 528 .word 0x3ff0a681, 0x0a6810a7, 0x3fff5e67, 0xfdcbdf44 529 .word 0xbc98af06, 0x1849d6fc, 0x00000000, 0x00000000 530 .word 0x3ff0a681, 0x0a6810a7, 0x40062e5a, 0xcd0c3ebe 531 .word 0xbca2c50e, 0x2092203a, 0x00000000, 0x00000000 532 .word 0x3ff0953f, 0x39010954, 0x3fff6eb6, 0x2d27730d 533 .word 0xbc9401d9, 0x5ca1ce34, 0x00000000, 0x00000000 534 .word 0x3ff0953f, 0x39010954, 0x400639e2, 0x653e421b 535 .word 0xbc9f75e0, 0x5835e4b9, 0x00000000, 0x00000000 536 .word 0x3ff08421, 0x08421084, 0x3fff7efb, 0xeb8d4f12 537 .word 0xbc7e84e8, 0xa6ff3256, 0x00000000, 0x00000000 538 .word 0x3ff08421, 0x08421084, 0x40064564, 0x0568c1c3 539 .word 0x3cad1778, 0x7e4c8970, 0x00000000, 0x00000000 540 .word 0x3ff07326, 0x0a47f7c6, 0x3fff8f39, 0x460c19a8 541 .word 0x3c989b4e, 
0x16ee9aaf, 0x00000000, 0x00000000
	.word	0x3ff07326, 0x0a47f7c6, 0x400650df, 0xb6c759f4
	.word	0x3c99063c, 0x91db4c77, 0x00000000, 0x00000000
	.word	0x3ff0624d, 0xd2f1a9fc, 0x3fff9f6e, 0x4990f227
	.word	0x3c8b42e5, 0xb5d1e808, 0x00000000, 0x00000000
	.word	0x3ff0624d, 0xd2f1a9fc, 0x40065c55, 0x827df1d2
	.word	0xbca3923d, 0xf03e1e2f, 0x00000000, 0x00000000
	.word	0x3ff05197, 0xf7d73404, 0x3fffaf9b, 0x02e7e8f2
	.word	0x3c897a76, 0x8f34e1c2, 0x00000000, 0x00000000
	.word	0x3ff05197, 0xf7d73404, 0x400667c5, 0x7199104b
	.word	0x3c875b89, 0x6f332e70, 0x00000000, 0x00000000
	.word	0x3ff04104, 0x10410410, 0x3fffbfbf, 0x7ebc755f
	.word	0xbc9b2a94, 0x084da0b6, 0x00000000, 0x00000000
	.word	0x3ff04104, 0x10410410, 0x4006732f, 0x8d0e2f77
	.word	0xbc93dffd, 0x470422e3, 0x00000000, 0x00000000
	.word	0x3ff03091, 0xb51f5e1a, 0x3fffcfdb, 0xc999e97d
	.word	0x3c82be17, 0xecdd3bbc, 0x00000000, 0x00000000
	.word	0x3ff03091, 0xb51f5e1a, 0x40067e93, 0xddbc0e73
	.word	0xbc86eb9f, 0x32ac1a5c, 0x00000000, 0x00000000
	.word	0x3ff02040, 0x81020408, 0x3fffdfef, 0xefebe3d6
	.word	0xbc909afc, 0xfc7c1f3b, 0x00000000, 0x00000000
	.word	0x3ff02040, 0x81020408, 0x400689f2, 0x6c6b01d0
	.word	0x3cae816f, 0x9d2a1032, 0x00000000, 0x00000000
	.word	0x3ff01010, 0x10101010, 0x3fffeffb, 0xfdfebf1f
	.word	0x3c95dee5, 0x1994f18b, 0x00000000, 0x00000000
	.word	0x3ff01010, 0x10101010, 0x4006954b, 0x41cd4293
	.word	0x3ca3d5bc, 0xcc443076, 0x00000000, 0x00000000
! Last record, i = 128: the sample point is exactly 1.0.
	.word	0x3ff00000, 0x00000000, 0x40000000, 0x00000000
	.word	0x00000000, 0x00000000, 0x00000000, 0x00000000
	.word	0x3ff00000, 0x00000000, 0x4006a09e, 0x667f3bcd
	.word	0xbcabdd34, 0x13b26456, 0x00000000, 0x00000000

! Register and stack-slot aliases used by __vsqrt.
! Comments are kept on their own lines: text placed after a #define
! would become part of the macro body.

! Floating-point registers that hold the five polynomial coefficients.
! The __vsqrt prologue fills them with ldd from byte offsets 0, 8, 16,
! 24 and 32 of .CONST_TBL.
#define A5	%f32
#define A4	%f30
#define A3	%f28
#define A2	%f26
#define A1	%f56

! Floating-point registers that hold the three bit-pattern constants
! stored at .CONST_TBL offsets 40, 48 and 56 (mantissa mask, rounding
! increment and truncation mask in the algorithm notes below).
#define DC0	%f8
#define DC2	%f6
#define DC3	%f4

! counter - element count for the current pass, reloaded from the
!           tmp_counter stack slot and tested against zero
! TBL     - address of .CONST_TBL; bumped by 64 once the constants are
!           loaded so that it addresses the lookup records
! stridex - %i2 << 3, added to the input pointer after every element
! stridey - %i4 << 3; %l7 is first used by PIC_SETUP/PIC_SET and only
!           afterwards receives the stride
#define counter	%l3
#define TBL	%l5
#define stridex	%l6
#define stridey	%l7

! Integer registers caching the constants they are named after:
! 1023 << 3, 0x7ff << 20 and 1 << 20.  %i0 arrives holding the first
! argument, which the prologue saves to tmp_counter before %i0 is
! overwritten with 0x1ff8.
#define _0x00001ff8	%i0
#define _0x7ff00000	%o0
#define _0x00100000	%o2

! Eight 8-byte scratch slots addressed from %fp.  tmp_counter and
! tmp_px carry the count and input pointer into .begin; tmp0 and tmp1
! receive the 64-bit sqrt_exp pattern via stx.
! NOTE(review): tmp2-tmp5 are presumably used the same way by later
! pipeline stages - confirm against the rest of the function.
#define tmp_counter	STACK_BIAS-0x40
#define tmp_px		STACK_BIAS-0x38
#define tmp0		STACK_BIAS-0x30
#define tmp1		STACK_BIAS-0x28
#define tmp2		STACK_BIAS-0x20
#define tmp3		STACK_BIAS-0x18
#define tmp4		STACK_BIAS-0x10
#define tmp5		STACK_BIAS-0x08

! sizeof temp storage - must be a multiple of 16 for V9
! (eight slots of 8 bytes; subtracted from %sp by the save in __vsqrt)
#define tmps		0x40

!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
!      !!!!! algorithm !!!!!
!  ((float*)&res)[0] = ((float*)px)[0];
!  ((float*)&res)[1] = ((float*)px)[1];
!  hx = *(int*)px;
!  px += stridex;
!
!  if ( hx >= 0x7ff00000 )
!  {
!    res = sqrt(res);
!    ((float*)py)[0] = ((float*)&res)[0];
!    ((float*)py)[1] = ((float*)&res)[1];
!    py += stridey;
!    goto next;
!  }
!  if ( hx < 0x00100000 )
!  {
!    res = sqrt(res);
!    ((float*)py)[0] = ((float*)&res)[0];
!    ((float*)py)[1] = ((float*)&res)[1];
!    py += stridey;
!    goto next;
!  }
!
!  sqrt_exp = hx >> 21;
!  sqrt_exp -= 512;
!  sqrt_exp <<= 52;
!  dsqrt_exp = *(double*)&sqrt_exp;
!  bit = hx >> 15;
!  bit &= 32;
!  ind0 = hx >> 7;
!  ind0 &= 0x1ff8;
!  ind0 += 32;
!  ind0 &= -64;
!  ind1 = ind0;
!  ind1 += bit;
!
!  res = vis_fand(res,DC0);        /* DC0 = vis_to_double(0x000fffff, 0xffffffff); */
!  res = vis_for(res,A1);          /* A1 = vis_to_double(0x3fe00000, 0x00000000); */
!  res_c = vis_fpadd32(res,DC2);   /* DC2 = vis_to_double(0x00001000, 0x00000000); */
!  res_c = vis_fand(res_c,DC3);    /* DC3 = vis_to_double(0x7fffe000, 0x00000000); */
!
!  pind = (char*)TBL + ind1;
!  dexp_hi = ((double*)pind)[1];
!  dexp_lo = ((double*)pind)[2];
!
!  dtmp0 = ((double*)pind)[0];
!  xx = (res - res_c);
!  xx *= dtmp0;
!
!  res = A5 * xx;
!  res += A4;
!  res *= xx;
!  res += A3;
!
!  res *= xx;
!  res += A2;
!  res *= xx;
!  res += A1;
!  res *= xx;
!
!  res = dexp_hi * res;
!  res += dexp_lo;
!  res += dexp_hi;
!
!  dtmp0 = vis_fpadd32(dsqrt_exp,res);
!  ((float*)py)[0] = ((float*)&dtmp0)[0];
!  ((float*)py)[1] = ((float*)&dtmp0)[1];
!  py += stridey;
!
!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!

!
! __vsqrt - vector double-precision square root.
!
! Incoming arguments, as used by the code below (the C prototype is
! presumably
!     void __vsqrt(int n, double *x, int stridex, double *y, int stridey)
! -- TODO confirm against the libmvec header):
!   %i0  element count; stored as a 32-bit word in tmp_counter
!   %i1  input pointer px; stored as a 64-bit value in tmp_px
!   %i2  input stride in elements; shifted left by 3 to give bytes
!   %i3  output pointer py; copied to %o4
!   %i4  output stride in elements; shifted left by 3 to give bytes
!
! Structure:
!   .begin/.begin1  reload count and px, handle the first element, then
!                   start up to five further elements (pipeline fill)
!   .main_loop      unrolled loop, six results stored per trip
!   .tail           finishes up to five started elements
!   .spec           fsqrtd fallback for hx >= 0x7ff00000 or
!                   hx < 0x00100000 (signed 32-bit compare of hx)
!   .updateN        invoked when a started element needs .spec
!
! The (k_j) tags in the per-line comments name the element slot a line
! works on; they appear to encode slot and pipeline age.
!
! All loads of x go through %asi, which is set to 0x82 below.
! NOTE(review): 0x82 should be ASI_PRIMARY_NOFAULT on SPARC V9, which
! would make the look-ahead loads past the last element safe - confirm.
!
	ENTRY(__vsqrt)
	save	%sp,-SA(MINFRAME)-tmps,%sp
	PIC_SETUP(l7)
	PIC_SET(l7,.CONST_TBL,l5)
	wr	%g0,0x82,%asi

	ldd	[TBL],A1
	sll	%i2,3,stridex
	or	%g0,%i3,%o4

	ldd	[TBL+8],A2
	sll	%i4,3,stridey
	or	%g0,0x7ff,%o0

	ldd	[TBL+16],A3
	sll	%o0,20,_0x7ff00000
	or	%g0,0x001,%o2

	ldd	[TBL+24],A4
	sll	%o2,20,_0x00100000

	ldd	[TBL+32],A5
	ldd	[TBL+40],DC0
	ldd	[TBL+48],DC2
	ldd	[TBL+56],DC3

	add	TBL,64,TBL
	add	%g0,1023,%o5
	st	%i0,[%fp+tmp_counter]

	sll	%o5,3,_0x00001ff8
	stx	%i1,[%fp+tmp_px]

! Reload the pending element count and input pointer, and clear the
! pending count so that a pass which defers nothing ends at .exit.
.begin:
	ld	[%fp+tmp_counter],counter
	ldx	[%fp+tmp_px],%l2
	st	%g0,[%fp+tmp_counter]
.begin1:
	cmp	counter,0
	ble,pn	%icc,.exit
	lda	[%l2]%asi,%o5		! (5_1) hx = *(int*)px;

	lda	[%l2]%asi,%f10		! (5_0) ((float*)&res)[0] = ((float*)px)[0];

	lda	[%l2+4]%asi,%f11	! (5_0) ((float*)&res)[1] = ((float*)px)[1];

	cmp	%o5,_0x7ff00000		! (5_1) hx ? 0x7ff00000
	bge,pn	%icc,.spec		! (5_1) if ( hx >= 0x7ff00000 )
	nop

	cmp	%o5,_0x00100000		! (5_1) hx ? 0x00100000
	bl,pn	%icc,.spec		! (5_1) if ( hx < 0x00100000 )
	nop

	add	%l2,stridex,%l2		! px += stridex
	fand	%f10,DC0,%f50		! (5_1) res = vis_fand(res,DC0);

	for	%f50,A1,%f40		! (5_1) res = vis_for(res,A1);
	sra	%o5,21,%l1		! (5_1) sqrt_exp = hx >> 21;
	sra	%o5,15,%i1		! (5_1) bit = hx >> 15;

	sra	%o5,7,%o1		! (5_1) ind0 = hx >> 7;
	sub	%l1,512,%o3		! (5_1) sqrt_exp -= 512;

	and	%o1,_0x00001ff8,%o1	! (5_1) ind0 &= 0x1ff8;
	lda	[%l2]%asi,%f10		! (0_0) ((float*)&res)[0] = ((float*)px)[0];

	add	%o1,32,%o1		! (5_1) ind0 += 32;
	lda	[%l2+4]%asi,%f11	! (0_0) ((float*)&res)[1] = ((float*)px)[1];

	and	%i1,32,%i4		! (5_1) bit &= 32;
	and	%o1,-64,%o1		! (5_1) ind0 &= -64;

	sll	%o1,0,%o7		! (5_1) ind1 = ind0;

	sllx	%o3,52,%o3		! (5_1) sqrt_exp <<= 52;
	add	%o7,%i4,%l0		! (5_1) ind1 += bit;
	lda	[%l2]%asi,%o5		! (0_0) hx = *(int*)px;

	stx	%o3,[%fp+tmp0]		! (5_1) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (0_0) res = vis_fand(res,DC0);

	add	%l2,stridex,%l2		! px += stridex
	fpadd32	%f40,DC2,%f54		! (5_1) res_c = vis_fpadd32(res,DC2);

	add	%l0,TBL,%o1		! (5_1) pind = (char*)TBL + ind1

	cmp	%o5,_0x7ff00000		! (0_0) hx ? 0x7ff00000
	bge,pn	%icc,.update0		! (0_0) if ( hx >= 0x7ff00000 )
	for	%f50,A1,%f42		! (0_0) res = vis_for(res,A1);
.cont0:
	sra	%o5,21,%l1		! (0_0) sqrt_exp = hx >> 21;
	sra	%o5,15,%i2		! (0_0) bit = hx >> 15;
	ldd	[%o1],%f50		! (5_1) dtmp0 = ((double*)pind)[0];

	sra	%o5,7,%o1		! (0_0) ind0 = hx >> 7;
	sub	%l1,512,%o3		! (0_0) sqrt_exp -= 512;
	fand	%f54,DC3,%f54		! (5_1) res_c = vis_fand(res_c,DC3);

	and	%o1,_0x00001ff8,%o1	! (0_0) ind0 &= 0x1ff8;
	lda	[%l2]%asi,%f10		! (1_0) ((float*)&res)[0] = ((float*)px)[0];

	add	%o1,32,%o1		! (0_0) ind0 += 32;
	lda	[%l2+4]%asi,%f11	! (1_0) ((float*)&res)[1] = ((float*)px)[1];

	and	%i2,32,%i4		! (0_0) bit &= 32;
	and	%o1,-64,%o1		! (0_0) ind0 &= -64;
	fsubd	%f40,%f54,%f40		! (5_1) xx = (res - res_c);

	sll	%o1,0,%o7		! (0_0) ind1 = ind0;

	cmp	%o5,_0x00100000		! (0_0) hx ? 0x00100000
	bl,pn	%icc,.update1		! (0_0) if ( hx < 0x00100000 )
	lda	[%l2]%asi,%o5		! (1_0) hx = *(int*)px;
.cont1:
	sllx	%o3,52,%o3		! (0_0) sqrt_exp <<= 52;
	add	%o7,%i4,%i1		! (0_0) ind1 += bit;

	fmuld	%f40,%f50,%f40		! (5_1) xx *= dtmp0;
	stx	%o3,[%fp+tmp1]		! (0_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (1_0) res = vis_fand(res,DC0);

	add	%l2,stridex,%l2		! px += stridex
	fpadd32	%f42,DC2,%f54		! (0_0) res_c = vis_fpadd32(res,DC2);

	add	%i1,TBL,%o1		! (0_0) pind = (char*)TBL + ind1

	cmp	%o5,_0x7ff00000		! (1_0) hx ? 0x7ff00000
	bge,pn	%icc,.update2		! (1_0) if ( hx >= 0x7ff00000 )
	for	%f50,A1,%f14		! (1_0) res = vis_for(res,A1);
.cont2:
	sra	%o5,21,%l1		! (1_0) sqrt_exp = hx >> 21;
	sra	%o5,15,%g5		! (1_0) bit = hx >> 15;
	ldd	[%o1],%f50		! (0_0) dtmp0 = ((double*)pind)[0];

	fmuld	A5,%f40,%f52		! (5_1) res = A5 * xx;
	sra	%o5,7,%o1		! (1_0) ind0 = hx >> 7;
	sub	%l1,512,%o3		! (1_0) sqrt_exp -= 512;
	fand	%f54,DC3,%f54		! (0_0) res_c = vis_fand(res_c,DC3);

	and	%o1,_0x00001ff8,%o1	! (1_0) ind0 &= 0x1ff8;
	lda	[%l2]%asi,%f10		! (2_0) ((float*)&res)[0] = ((float*)px)[0];

	add	%o1,32,%o1		! (1_0) ind0 += 32;
	lda	[%l2+4]%asi,%f11	! (2_0) ((float*)&res)[1] = ((float*)px)[1];

	and	%g5,32,%i4		! (1_0) bit &= 32;
	and	%o1,-64,%o1		! (1_0) ind0 &= -64;
	fsubd	%f42,%f54,%f42		! (0_0) xx = (res - res_c);

	sll	%o1,0,%o7		! (1_0) ind1 = ind0;
	faddd	%f52,A4,%f54		! (5_1) res += A4;

	cmp	%o5,_0x00100000		! (1_0) hx ? 0x00100000
	bl,pn	%icc,.update3		! (1_0) if ( hx < 0x00100000 )
	lda	[%l2]%asi,%o5		! (2_0) hx = *(int*)px;
.cont3:
	sllx	%o3,52,%o3		! (1_0) sqrt_exp <<= 52;
	add	%o7,%i4,%i2		! (1_0) ind1 += bit;

	fmuld	%f42,%f50,%f42		! (0_0) xx *= dtmp0;
	stx	%o3,[%fp+tmp2]		! (1_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (2_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f40,%f34		! (5_1) res *= xx;
	fpadd32	%f14,DC2,%f54		! (1_0) res_c = vis_fpadd32(res,DC2);
	add	%l2,stridex,%l2		! px += stridex

	add	%i2,TBL,%o1		! (1_0) pind = (char*)TBL + ind1

	cmp	%o5,_0x7ff00000		! (2_0) hx ? 0x7ff00000
	bge,pn	%icc,.update4		! (2_0) if ( hx >= 0x7ff00000 )
	for	%f50,A1,%f18		! (2_0) res = vis_for(res,A1);
.cont4:
	sra	%o5,21,%l1		! (2_0) sqrt_exp = hx >> 21;
	sra	%o5,15,%g1		! (2_0) bit = hx >> 15;
	ldd	[%o1],%f50		! (1_0) dtmp0 = ((double*)pind)[0];

	fmuld	A5,%f42,%f52		! (0_0) res = A5 * xx;
	sra	%o5,7,%o1		! (2_0) ind0 = hx >> 7;
	sub	%l1,512,%o3		! (2_0) sqrt_exp -= 512;
	fand	%f54,DC3,%f54		! (1_0) res_c = vis_fand(res_c,DC3);

	and	%o1,_0x00001ff8,%o1	! (2_0) ind0 &= 0x1ff8;
	lda	[%l2]%asi,%f10		! (3_0) ((float*)&res)[0] = ((float*)px)[0];
	faddd	%f34,A3,%f62		! (5_1) res += A3;

	add	%o1,32,%o1		! (2_0) ind0 += 32;
	lda	[%l2+4]%asi,%f11	! (3_0) ((float*)&res)[1] = ((float*)px)[1];

	and	%g1,32,%i4		! (2_0) bit &= 32;
	and	%o1,-64,%o1		! (2_0) ind0 &= -64;
	fsubd	%f14,%f54,%f14		! (1_0) xx = (res - res_c);

	sll	%o1,0,%o7		! (2_0) ind1 = ind0;
	faddd	%f52,A4,%f54		! (0_0) res += A4;

	fmuld	%f62,%f40,%f52		! (5_1) res *= xx;
	cmp	%o5,_0x00100000		! (2_0) hx ? 0x00100000
	bl,pn	%icc,.update5		! (2_0) if ( hx < 0x00100000 )
	lda	[%l2]%asi,%o5		! (3_0) hx = *(int*)px;
.cont5:
	sllx	%o3,52,%o3		! (2_0) sqrt_exp <<= 52;
	add	%o7,%i4,%g5		! (2_0) ind1 += bit;

	fmuld	%f14,%f50,%f14		! (1_0) xx *= dtmp0;
	stx	%o3,[%fp+tmp3]		! (2_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (3_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f42,%f34		! (0_0) res *= xx;
	fpadd32	%f18,DC2,%f54		! (2_0) res_c = vis_fpadd32(res,DC2);
	add	%l2,stridex,%l2		! px += stridex

	add	%g5,TBL,%o1		! (2_0) pind = (char*)TBL + ind1
	faddd	%f52,A2,%f20		! (5_1) res += A2;

	cmp	%o5,_0x7ff00000		! (3_0) hx ? 0x7ff00000
	bge,pn	%icc,.update6		! (3_0) if ( hx >= 0x7ff00000 )
	for	%f50,A1,%f44		! (3_0) res = vis_for(res,A1);
.cont6:
	sra	%o5,21,%l1		! (3_0) sqrt_exp = hx >> 21;
	sra	%o5,15,%i3		! (3_0) bit = hx >> 15;
	ldd	[%o1],%f50		! (2_0) dtmp0 = ((double*)pind)[0];

	fmuld	A5,%f14,%f52		! (1_0) res = A5 * xx;
	sra	%o5,7,%o1		! (3_0) ind0 = hx >> 7;
	sub	%l1,512,%o3		! (3_0) sqrt_exp -= 512;
	fand	%f54,DC3,%f54		! (2_0) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f40,%f20		! (5_1) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (3_0) ind0 &= 0x1ff8;
	lda	[%l2]%asi,%f10		! (4_0) ((float*)&res)[0] = ((float*)px)[0];
	faddd	%f34,A3,%f62		! (0_0) res += A3;

	add	%o1,32,%o1		! (3_0) ind0 += 32;
	lda	[%l2+4]%asi,%f11	! (4_0) ((float*)&res)[1] = ((float*)px)[1];

	and	%i3,32,%i4		! (3_0) bit &= 32;
	and	%o1,-64,%o1		! (3_0) ind0 &= -64;
	fsubd	%f18,%f54,%f18		! (2_0) xx = (res - res_c);

	sll	%o1,0,%o7		! (3_0) ind1 = ind0;
	faddd	%f52,A4,%f54		! (1_0) res += A4;

	fmuld	%f62,%f42,%f52		! (0_0) res *= xx;
	cmp	%o5,_0x00100000		! (3_0) hx ? 0x00100000
	bl,pn	%icc,.update7		! (3_0) if ( hx < 0x00100000 )
	faddd	%f20,A1,%f12		! (5_1) res += A1;
.cont7:
	lda	[%l2]%asi,%o5		! (4_0) hx = *(int*)px;
	sllx	%o3,52,%o3		! (3_0) sqrt_exp <<= 52;
	add	%o7,%i4,%g1		! (3_0) ind1 += bit;

	fmuld	%f18,%f50,%f18		! (2_0) xx *= dtmp0;
	add	%l0,TBL,%l0		! (5_1) pind = (char*)TBL + ind1;
	stx	%o3,[%fp+tmp4]		! (3_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (4_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f14,%f34		! (1_0) res *= xx;
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%l0+16],%f36		! (5_1) dexp_lo = ((double*)pind)[2];
	fpadd32	%f44,DC2,%f54		! (3_0) res_c = vis_fpadd32(res,DC2);

	fmuld	%f12,%f40,%f12		! (5_1) res *= xx;
	add	%g1,TBL,%o1		! (3_0) pind = (char*)TBL + ind1
	ldd	[%l0+8],%f40		! (5_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (0_0) res += A2;

	cmp	%o5,_0x7ff00000		! (4_0) hx ? 0x7ff00000
	bge,pn	%icc,.update8		! (4_0) if ( hx >= 0x7ff00000 )
	for	%f50,A1,%f24		! (4_0) res = vis_for(res,A1);
.cont8:
	sra	%o5,21,%l1		! (4_0) sqrt_exp = hx >> 21;
	sra	%o5,15,%l0		! (4_0) bit = hx >> 15;
	ldd	[%o1],%f22		! (3_0) dtmp0 = ((double*)pind)[0];

	fmuld	A5,%f18,%f52		! (2_0) res = A5 * xx;
	sra	%o5,7,%o1		! (4_0) ind0 = hx >> 7;
	sub	%l1,512,%o3		! (4_0) sqrt_exp -= 512;
	fand	%f54,DC3,%f54		! (3_0) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f42,%f20		! (0_0) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (4_0) ind0 &= 0x1ff8;
	lda	[%l2]%asi,%f10		! (5_0) ((float*)&res)[0] = ((float*)px)[0];
	faddd	%f34,A3,%f62		! (1_0) res += A3;

	fmuld	%f40,%f12,%f34		! (5_1) res = dexp_hi * res;
	add	%o1,32,%o1		! (4_0) ind0 += 32;
	lda	[%l2+4]%asi,%f11	! (5_0) ((float*)&res)[1] = ((float*)px)[1];

	and	%l0,32,%i4		! (4_0) bit &= 32;
	cmp	%o5,_0x00100000		! (4_0) hx ? 0x00100000
	bl,pn	%icc,.update9		! (4_0) if ( hx < 0x00100000 )
	fsubd	%f44,%f54,%f44		! (3_0) xx = (res - res_c);
.cont9:
	and	%o1,-64,%o1		! (4_0) ind0 &= -64;
	faddd	%f52,A4,%f54		! (2_0) res += A4;

! Fewer than six elements left: skip the unrolled loop and let .tail
! finish the elements already started.  %l0 carries py from here on.
	cmp	counter,6
	bl,pn	%icc,.tail
	or	%g0,%o4,%l0

	ba	.main_loop
	nop

! Unrolled steady-state loop: each trip stores six results and
! subtracts six from counter.
	.align	16
.main_loop:
	fmuld	%f62,%f14,%f52		! (1_1) res *= xx;
	sll	%o1,0,%i3		! (4_1) ind1 = ind0;
	add	%i1,TBL,%i1		! (0_1) pind = (char*)TBL + ind1;
	faddd	%f20,A1,%f12		! (0_1) res += A1;

	lda	[%l2]%asi,%o5		! (5_1) hx = *(int*)px;
	sllx	%o3,52,%o3		! (4_1) sqrt_exp <<= 52;
	add	%i3,%i4,%i3		! (4_1) ind1 += bit;
	faddd	%f34,%f36,%f60		! (5_2) res += dexp_lo;

	fmuld	%f44,%f22,%f44		! (3_1) xx *= dtmp0;
	add	%l2,stridex,%l2		! px += stridex
	stx	%o3,[%fp+tmp5]		! (4_1) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (5_1) res = vis_fand(res,DC0);

	fmuld	%f54,%f18,%f34		! (2_1) res *= xx;
	nop
	ldd	[%i1+16],%f36		! (0_1) dexp_lo = ((double*)pind)[2];
	fpadd32	%f24,DC2,%f54		! (4_1) res_c = vis_fpadd32(res,DC2);

	fmuld	%f12,%f42,%f16		! (0_1) res *= xx;
	sra	%o5,21,%l1		! (5_1) sqrt_exp = hx >> 21;
	ldd	[%i1+8],%f42		! (0_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (1_1) res += A2;

	ldd	[%fp+tmp0],%f48		! (5_2) dsqrt_exp = *(double*)&sqrt_exp;
	cmp	%o5,_0x7ff00000		! (5_1) hx ? 0x7ff00000
	bge,pn	%icc,.update10		! (5_1) if ( hx >= 0x7ff00000 )
	faddd	%f60,%f40,%f60		! (5_2) res += dexp_hi;
.cont10:
	lda	[%l2]%asi,%f10		! (0_0) ((float*)&res)[0] = ((float*)px)[0];
	sra	%o5,15,%i1		! (5_1) bit = hx >> 15;
	add	%i3,TBL,%o7		! (4_1) pind = (char*)TBL + ind1
	for	%f50,A1,%f40		! (5_1) res = vis_for(res,A1);

	fmuld	A5,%f44,%f52		! (3_1) res = A5 * xx;
	sra	%o5,7,%o1		! (5_1) ind0 = hx >> 7;
	ldd	[%o7],%f22		! (4_1) dtmp0 = ((double*)pind)[0];
	fand	%f54,DC3,%f54		! (4_1) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f14,%f20		! (1_1) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (5_1) ind0 &= 0x1ff8;
	sub	%l1,512,%o3		! (5_1) sqrt_exp -= 512;
	faddd	%f34,A3,%f62		! (2_1) res += A3;

	fpadd32	%f48,%f60,%f12		! (5_2) dtmp0 = vis_fpadd32(dsqrt_exp,res);
	add	%o1,32,%o1		! (5_1) ind0 += 32;
	st	%f12,[%l0]		! (5_2) ((float*)py)[0] = ((float*)&dtmp0)[0];
	fmuld	%f42,%f16,%f34		! (0_1) res = dexp_hi * res;

	lda	[%l2+4]%asi,%f11	! (0_0) ((float*)&res)[1] = ((float*)px)[1];
	and	%i1,32,%i4		! (5_1) bit &= 32;
	and	%o1,-64,%o1		! (5_1) ind0 &= -64;
	fsubd	%f24,%f54,%f24		! (4_1) xx = (res - res_c);

	sll	%o1,0,%o7		! (5_1) ind1 = ind0;
	add	%l0,stridey,%i1		! py += stridey
	st	%f13,[%l0+4]		! (5_2) ((float*)py)[1] = ((float*)&dtmp0)[1];
	faddd	%f52,A4,%f54		! (3_1) res += A4;

	fmuld	%f62,%f18,%f52		! (2_1) res *= xx;
	cmp	%o5,_0x00100000		! (5_1) hx ? 0x00100000
	bl,pn	%icc,.update11		! (5_1) if ( hx < 0x00100000 )
	faddd	%f20,A1,%f12		! (1_1) res += A1;
.cont11:
	sllx	%o3,52,%o3		! (5_1) sqrt_exp <<= 52;
	add	%o7,%i4,%l0		! (5_1) ind1 += bit;
	lda	[%l2]%asi,%o5		! (0_0) hx = *(int*)px;
	faddd	%f34,%f36,%f60		! (0_1) res += dexp_lo;

	fmuld	%f24,%f22,%f24		! (4_1) xx *= dtmp0;
	add	%i2,TBL,%i2		! (1_1) pind = (char*)TBL + ind1;
	stx	%o3,[%fp+tmp0]		! (5_1) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (0_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f44,%f34		! (3_1) res *= xx;
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%i2+16],%f36		! (1_1) dexp_lo = ((double*)pind)[2];
	fpadd32	%f40,DC2,%f54		! (5_1) res_c = vis_fpadd32(res,DC2);

	fmuld	%f12,%f14,%f16		! (1_1) res *= xx;
	sra	%o5,21,%l1		! (0_0) sqrt_exp = hx >> 21;
	ldd	[%i2+8],%f14		! (1_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (2_1) res += A2;

	ldd	[%fp+tmp1],%f48		! (0_1) dsqrt_exp = *(double*)&sqrt_exp;
	cmp	%o5,_0x7ff00000		! (0_0) hx ? 0x7ff00000
	bge,pn	%icc,.update12		! (0_0) if ( hx >= 0x7ff00000 )
	faddd	%f60,%f42,%f60		! (0_1) res += dexp_hi;
.cont12:
	lda	[%l2]%asi,%f10		! (1_0) ((float*)&res)[0] = ((float*)px)[0];
	sra	%o5,15,%i2		! (0_0) bit = hx >> 15;
	add	%l0,TBL,%o7		! (5_1) pind = (char*)TBL + ind1
	for	%f50,A1,%f42		! (0_0) res = vis_for(res,A1);

	fmuld	A5,%f24,%f52		! (4_1) res = A5 * xx;
	sra	%o5,7,%o1		! (0_0) ind0 = hx >> 7;
	ldd	[%o7],%f22		! (5_1) dtmp0 = ((double*)pind)[0];
	fand	%f54,DC3,%f54		! (5_1) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f18,%f20		! (2_1) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (0_0) ind0 &= 0x1ff8;
	sub	%l1,512,%o3		! (0_0) sqrt_exp -= 512;
	faddd	%f34,A3,%f62		! (3_1) res += A3;

	fpadd32	%f48,%f60,%f12		! (0_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);
	add	%o1,32,%o1		! (0_0) ind0 += 32;
	st	%f12,[%i1]		! (0_1) ((float*)py)[0] = ((float*)&dtmp0)[0];
	fmuld	%f14,%f16,%f34		! (1_1) res = dexp_hi * res;

	lda	[%l2+4]%asi,%f11	! (1_0) ((float*)&res)[1] = ((float*)px)[1];
	and	%i2,32,%i4		! (0_0) bit &= 32;
	and	%o1,-64,%o1		! (0_0) ind0 &= -64;
	fsubd	%f40,%f54,%f40		! (5_1) xx = (res - res_c);

	sll	%o1,0,%o7		! (0_0) ind1 = ind0;
	add	%i1,stridey,%i2		! py += stridey
	st	%f13,[%i1+4]		! (0_1) ((float*)py)[1] = ((float*)&dtmp0)[1];
	faddd	%f52,A4,%f54		! (4_1) res += A4;

	fmuld	%f62,%f44,%f52		! (3_1) res *= xx;
	cmp	%o5,_0x00100000		! (0_0) hx ? 0x00100000
	bl,pn	%icc,.update13		! (0_0) if ( hx < 0x00100000 )
	faddd	%f20,A1,%f12		! (2_1) res += A1;
.cont13:
	lda	[%l2]%asi,%o5		! (1_0) hx = *(int*)px;
	sllx	%o3,52,%o3		! (0_0) sqrt_exp <<= 52;
	add	%o7,%i4,%i1		! (0_0) ind1 += bit;
	faddd	%f34,%f36,%f60		! (1_1) res += dexp_lo;

	fmuld	%f40,%f22,%f40		! (5_1) xx *= dtmp0;
	add	%g5,TBL,%g5		! (2_1) pind = (char*)TBL + ind1;
	stx	%o3,[%fp+tmp1]		! (0_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (1_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f24,%f34		! (4_1) res *= xx;
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%g5+16],%f36		! (2_1) dexp_lo = ((double*)pind)[2];
	fpadd32	%f42,DC2,%f54		! (0_0) res_c = vis_fpadd32(res,DC2);

	fmuld	%f12,%f18,%f16		! (2_1) res *= xx;
	sra	%o5,21,%l1		! (1_0) sqrt_exp = hx >> 21;
	ldd	[%g5+8],%f18		! (2_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (3_1) res += A2;

	ldd	[%fp+tmp2],%f48		! (1_1) dsqrt_exp = *(double*)&sqrt_exp;
	cmp	%o5,_0x7ff00000		! (1_0) hx ? 0x7ff00000
	bge,pn	%icc,.update14		! (1_0) if ( hx >= 0x7ff00000 )
	faddd	%f60,%f14,%f60		! (1_1) res += dexp_hi;
.cont14:
	lda	[%l2]%asi,%f10		! (2_0) ((float*)&res)[0] = ((float*)px)[0];
	sra	%o5,15,%g5		! (1_0) bit = hx >> 15;
	add	%i1,TBL,%o7		! (0_0) pind = (char*)TBL + ind1
	for	%f50,A1,%f14		! (1_0) res = vis_for(res,A1);

	fmuld	A5,%f40,%f52		! (5_1) res = A5 * xx;
	sra	%o5,7,%o1		! (1_0) ind0 = hx >> 7;
	ldd	[%o7],%f22		! (0_0) dtmp0 = ((double*)pind)[0];
	fand	%f54,DC3,%f54		! (0_0) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f44,%f20		! (3_1) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (1_0) ind0 &= 0x1ff8;
	sub	%l1,512,%o3		! (1_0) sqrt_exp -= 512;
	faddd	%f34,A3,%f62		! (4_1) res += A3;

	fpadd32	%f48,%f60,%f12		! (1_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);
	add	%o1,32,%o1		! (1_0) ind0 += 32;
	st	%f12,[%i2]		! (1_1) ((float*)py)[0] = ((float*)&dtmp0)[0];
	fmuld	%f18,%f16,%f34		! (2_1) res = dexp_hi * res;

	lda	[%l2+4]%asi,%f11	! (2_0) ((float*)&res)[1] = ((float*)px)[1];
	and	%g5,32,%i4		! (1_0) bit &= 32;
	and	%o1,-64,%o1		! (1_0) ind0 &= -64;
	fsubd	%f42,%f54,%f42		! (0_0) xx = (res - res_c);

	sll	%o1,0,%o7		! (1_0) ind1 = ind0;
	add	%i2,stridey,%g5		! py += stridey
	st	%f13,[%i2+4]		! (1_1) ((float*)py)[1] = ((float*)&dtmp0)[1];
	faddd	%f52,A4,%f54		! (5_1) res += A4;

	fmuld	%f62,%f24,%f52		! (4_1) res *= xx;
	cmp	%o5,_0x00100000		! (1_0) hx ? 0x00100000
	bl,pn	%icc,.update15		! (1_0) if ( hx < 0x00100000 )
	faddd	%f20,A1,%f12		! (3_1) res += A1;
.cont15:
	lda	[%l2]%asi,%o5		! (2_0) hx = *(int*)px;
	sllx	%o3,52,%o3		! (1_0) sqrt_exp <<= 52;
	add	%o7,%i4,%i2		! (1_0) ind1 += bit;
	faddd	%f34,%f36,%f60		! (2_1) res += dexp_lo;

	fmuld	%f42,%f22,%f42		! (0_0) xx *= dtmp0;
	add	%g1,TBL,%g1		! (3_1) pind = (char*)TBL + ind1;
	stx	%o3,[%fp+tmp2]		! (1_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (2_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f40,%f34		! (5_1) res *= xx;
	fpadd32	%f14,DC2,%f54		! (1_0) res_c = vis_fpadd32(res,DC2);
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%g1+16],%f36		! (3_1) dexp_lo = ((double*)pind)[2];

	fmuld	%f12,%f44,%f16		! (3_1) res *= xx;
	sra	%o5,21,%l1		! (2_0) sqrt_exp = hx >> 21;
	ldd	[%g1+8],%f44		! (3_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (4_1) res += A2;

	ldd	[%fp+tmp3],%f48		! (2_1) dsqrt_exp = *(double*)&sqrt_exp;
	cmp	%o5,_0x7ff00000		! (2_0) hx ? 0x7ff00000
	bge,pn	%icc,.update16		! (2_0) if ( hx >= 0x7ff00000 )
	faddd	%f60,%f18,%f60		! (2_1) res += dexp_hi;
.cont16:
	lda	[%l2]%asi,%f10		! (3_0) ((float*)&res)[0] = ((float*)px)[0];
	sra	%o5,15,%g1		! (2_0) bit = hx >> 15;
	add	%i2,TBL,%o7		! (1_0) pind = (char*)TBL + ind1
	for	%f50,A1,%f18		! (2_0) res = vis_for(res,A1);

	fmuld	A5,%f42,%f52		! (0_0) res = A5 * xx;
	sra	%o5,7,%o1		! (2_0) ind0 = hx >> 7;
	ldd	[%o7],%f22		! (1_0) dtmp0 = ((double*)pind)[0];
	fand	%f54,DC3,%f54		! (1_0) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f24,%f20		! (4_1) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (2_0) ind0 &= 0x1ff8;
	sub	%l1,512,%o3		! (2_0) sqrt_exp -= 512;
	faddd	%f34,A3,%f62		! (5_1) res += A3;

	fpadd32	%f48,%f60,%f12		! (2_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);
	add	%o1,32,%o1		! (2_0) ind0 += 32;
	st	%f12,[%g5]		! (2_1) ((float*)py)[0] = ((float*)&dtmp0)[0];
	fmuld	%f44,%f16,%f34		! (3_1) res = dexp_hi * res;

	lda	[%l2+4]%asi,%f11	! (3_0) ((float*)&res)[1] = ((float*)px)[1];
	and	%g1,32,%i4		! (2_0) bit &= 32;
	and	%o1,-64,%o1		! (2_0) ind0 &= -64;
	fsubd	%f14,%f54,%f14		! (1_0) xx = (res - res_c);

	sll	%o1,0,%o7		! (2_0) ind1 = ind0;
	add	%g5,stridey,%g1		! py += stridey
	st	%f13,[%g5+4]		! (2_1) ((float*)py)[1] = ((float*)&dtmp0)[1];
	faddd	%f52,A4,%f54		! (0_0) res += A4;

	fmuld	%f62,%f40,%f52		! (5_1) res *= xx;
	cmp	%o5,_0x00100000		! (2_0) hx ? 0x00100000
	bl,pn	%icc,.update17		! (2_0) if ( hx < 0x00100000 )
	faddd	%f20,A1,%f12		! (4_1) res += A1;
.cont17:
	lda	[%l2]%asi,%o5		! (3_0) hx = *(int*)px;
	sllx	%o3,52,%o3		! (2_0) sqrt_exp <<= 52;
	add	%o7,%i4,%g5		! (2_0) ind1 += bit;
	faddd	%f34,%f36,%f60		! (3_1) res += dexp_lo;

	fmuld	%f14,%f22,%f14		! (1_0) xx *= dtmp0;
	add	%i3,TBL,%i3		! (4_1) pind = (char*)TBL + ind1;
	stx	%o3,[%fp+tmp3]		! (2_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (3_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f42,%f34		! (0_0) res *= xx;
	fpadd32	%f18,DC2,%f54		! (2_0) res_c = vis_fpadd32(res,DC2);
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%i3+16],%f36		! (4_1) dexp_lo = ((double*)pind)[2];

	fmuld	%f12,%f24,%f16		! (4_1) res *= xx;
	sra	%o5,21,%l1		! (3_0) sqrt_exp = hx >> 21;
	ldd	[%i3+8],%f24		! (4_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (5_1) res += A2;

	ldd	[%fp+tmp4],%f48		! (3_1) dsqrt_exp = *(double*)&sqrt_exp;
	cmp	%o5,_0x7ff00000		! (3_0) hx ? 0x7ff00000
	bge,pn	%icc,.update18		! (3_0) if ( hx >= 0x7ff00000 )
	faddd	%f60,%f44,%f60		! (3_1) res += dexp_hi;
.cont18:
	lda	[%l2]%asi,%f10		! (4_0) ((float*)&res)[0] = ((float*)px)[0];
	sra	%o5,15,%i3		! (3_0) bit = hx >> 15;
	add	%g5,TBL,%o7		! (2_0) pind = (char*)TBL + ind1
	for	%f50,A1,%f44		! (3_0) res = vis_for(res,A1);

	fmuld	A5,%f14,%f52		! (1_0) res = A5 * xx;
	sra	%o5,7,%o1		! (3_0) ind0 = hx >> 7;
	ldd	[%o7],%f22		! (2_0) dtmp0 = ((double*)pind)[0];
	fand	%f54,DC3,%f54		! (2_0) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f40,%f20		! (5_1) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (3_0) ind0 &= 0x1ff8;
	sub	%l1,512,%o3		! (3_0) sqrt_exp -= 512;
	faddd	%f34,A3,%f62		! (0_0) res += A3;

	fpadd32	%f48,%f60,%f12		! (3_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);
	add	%o1,32,%o1		! (3_0) ind0 += 32;
	st	%f12,[%g1]		! (3_1) ((float*)py)[0] = ((float*)&dtmp0)[0];
	fmuld	%f24,%f16,%f34		! (4_1) res = dexp_hi * res;

	lda	[%l2+4]%asi,%f11	! (4_0) ((float*)&res)[1] = ((float*)px)[1];
	and	%i3,32,%i4		! (3_0) bit &= 32;
	and	%o1,-64,%o1		! (3_0) ind0 &= -64;
	fsubd	%f18,%f54,%f18		! (2_0) xx = (res - res_c);

	or	%g0,%o1,%o7		! (3_0) ind1 = ind0;
	add	%g1,stridey,%i3		! py += stridey
	st	%f13,[%g1+4]		! (3_1) ((float*)py)[1] = ((float*)&dtmp0)[1];
	faddd	%f52,A4,%f54		! (1_0) res += A4;

	fmuld	%f62,%f42,%f52		! (0_0) res *= xx;
	cmp	%o5,_0x00100000		! (3_0) hx ? 0x00100000
	bl,pn	%icc,.update19		! (3_0) if ( hx < 0x00100000 )
	faddd	%f20,A1,%f12		! (5_1) res += A1;
.cont19:
	lda	[%l2]%asi,%o5		! (4_0) hx = *(int*)px;
	sllx	%o3,52,%o3		! (3_0) sqrt_exp <<= 52;
	add	%o7,%i4,%g1		! (3_0) ind1 += bit;
	faddd	%f34,%f36,%f60		! (4_1) res += dexp_lo;

	fmuld	%f18,%f22,%f18		! (2_0) xx *= dtmp0;
	add	%l0,TBL,%l0		! (5_1) pind = (char*)TBL + ind1;
	stx	%o3,[%fp+tmp4]		! (3_0) dsqrt_exp = *(double*)&sqrt_exp;
	fand	%f10,DC0,%f50		! (4_0) res = vis_fand(res,DC0);

	fmuld	%f54,%f14,%f34		! (1_0) res *= xx;
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%l0+16],%f36		! (5_1) dexp_lo = ((double*)pind)[2];
	fpadd32	%f44,DC2,%f54		! (3_0) res_c = vis_fpadd32(res,DC2);

	fmuld	%f12,%f40,%f16		! (5_1) res *= xx;
	sra	%o5,21,%l1		! (4_0) sqrt_exp = hx >> 21;
	ldd	[%l0+8],%f40		! (5_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (0_0) res += A2;

	ldd	[%fp+tmp5],%f48		! (4_1) dsqrt_exp = *(double*)&sqrt_exp;
	cmp	%o5,_0x7ff00000		! (4_0) hx ? 0x7ff00000
	bge,pn	%icc,.update20		! (4_0) if ( hx >= 0x7ff00000 )
	faddd	%f60,%f24,%f60		! (4_1) res += dexp_hi;
.cont20:
	lda	[%l2]%asi,%f10		! (5_0) ((float*)&res)[0] = ((float*)px)[0];
	sra	%o5,15,%l0		! (4_0) bit = hx >> 15;
	add	%g1,TBL,%o7		! (3_0) pind = (char*)TBL + ind1
	for	%f50,A1,%f24		! (4_0) res = vis_for(res,A1);

	fmuld	A5,%f18,%f52		! (2_0) res = A5 * xx;
	sra	%o5,7,%o1		! (4_0) ind0 = hx >> 7;
	ldd	[%o7],%f22		! (3_0) dtmp0 = ((double*)pind)[0];
	fand	%f54,DC3,%f54		! (3_0) res_c = vis_fand(res_c,DC3);

	fmuld	%f20,%f42,%f20		! (0_0) res *= xx;
	and	%o1,_0x00001ff8,%o1	! (4_0) ind0 &= 0x1ff8;
	sub	%l1,512,%o3		! (4_0) sqrt_exp -= 512;
	faddd	%f34,A3,%f62		! (1_0) res += A3;

	lda	[%l2+4]%asi,%f11	! (5_0) ((float*)&res)[1] = ((float*)px)[1];
	add	%o1,32,%o1		! (4_0) ind0 += 32;
	fpadd32	%f48,%f60,%f12		! (4_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);
	fmuld	%f40,%f16,%f34		! (5_1) res = dexp_hi * res;

	and	%l0,32,%i4		! (4_0) bit &= 32;
	cmp	%o5,_0x00100000		! (4_0) hx ? 0x00100000
	bl,pn	%icc,.update21		! (4_0) if ( hx < 0x00100000 )
	fsubd	%f44,%f54,%f44		! (3_0) xx = (res - res_c);
.cont21:
	and	%o1,-64,%o1		! (4_0) ind0 &= -64;
	sub	counter,6,counter	! counter -= 6
	st	%f12,[%i3]		! (4_1) ((float*)py)[0] = ((float*)&dtmp0)[0];
	faddd	%f52,A4,%f54		! (2_0) res += A4;

	st	%f13,[%i3+4]		! (4_1) ((float*)py)[1] = ((float*)&dtmp0)[1];
	cmp	counter,6
	bge,pt	%icc,.main_loop
	add	%i3,stridey,%l0		! py += stridey

! Drain: finish the started elements one at a time.  Before each one,
! counter is decremented; when it goes negative control returns to
! .begin with the current py copied to %o4 in the delay slot.
.tail:
	subcc	counter,1,counter
	bneg	.begin
	or	%g0,%l0,%o4

	fmuld	%f62,%f14,%f52		! (1_1) res *= xx;
	add	%i1,TBL,%i1		! (0_1) pind = (char*)TBL + ind1;
	faddd	%f20,A1,%f12		! (0_1) res += A1;

	faddd	%f34,%f36,%f60		! (5_2) res += dexp_lo;

	fmuld	%f44,%f22,%f44		! (3_1) xx *= dtmp0;
	add	%l2,stridex,%l2		! px += stridex

	fmuld	%f54,%f18,%f34		! (2_1) res *= xx;
	ldd	[%i1+16],%f36		! (0_1) dexp_lo = ((double*)pind)[2];

	fmuld	%f12,%f42,%f12		! (0_1) res *= xx;
	ldd	[%i1+8],%f42		! (0_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (1_1) res += A2;

	ldd	[%fp+tmp0],%f48		! (5_2) dsqrt_exp = *(double*)&sqrt_exp;
	faddd	%f60,%f40,%f60		! (5_2) res += dexp_hi;

	fmuld	A5,%f44,%f52		! (3_1) res = A5 * xx;

	fmuld	%f20,%f14,%f20		! (1_1) res *= xx;
	faddd	%f34,A3,%f62		! (2_1) res += A3;

	fmuld	%f42,%f12,%f34		! (0_1) res = dexp_hi * res;
	fpadd32	%f48,%f60,%f12		! (5_2) dtmp0 = vis_fpadd32(dsqrt_exp,res);

	st	%f12,[%l0]		! (5_2) ((float*)py)[0] = ((float*)&dtmp0)[0];

	add	%l0,stridey,%i1		! py += stridey
	st	%f13,[%l0+4]		! (5_2) ((float*)py)[1] = ((float*)&dtmp0)[1];
	faddd	%f52,A4,%f54		! (3_1) res += A4;

	subcc	counter,1,counter
	bneg	.begin
	or	%g0,%i1,%o4

	fmuld	%f62,%f18,%f52		! (2_1) res *= xx;
	faddd	%f20,A1,%f12		! (1_1) res += A1;

	faddd	%f34,%f36,%f60		! (0_1) res += dexp_lo;

	add	%i2,TBL,%i2		! (1_1) pind = (char*)TBL + ind1;

	fmuld	%f54,%f44,%f34		! (3_1) res *= xx;
	add	%l2,stridex,%l2		! px += stridex
	ldd	[%i2+16],%f36		! (1_1) dexp_lo = ((double*)pind)[2];

	fmuld	%f12,%f14,%f12		! (1_1) res *= xx;
	ldd	[%i2+8],%f14		! (1_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (2_1) res += A2;

	ldd	[%fp+tmp1],%f48		! (0_1) dsqrt_exp = *(double*)&sqrt_exp;
	faddd	%f60,%f42,%f60		! (0_1) res += dexp_hi;

	fmuld	%f20,%f18,%f20		! (2_1) res *= xx;
	faddd	%f34,A3,%f62		! (3_1) res += A3;

	fmuld	%f14,%f12,%f34		! (1_1) res = dexp_hi * res;
	fpadd32	%f48,%f60,%f12		! (0_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);

	st	%f12,[%i1]		! (0_1) ((float*)py)[0] = ((float*)&dtmp0)[0];

	add	%i1,stridey,%i2		! py += stridey
	st	%f13,[%i1+4]		! (0_1) ((float*)py)[1] = ((float*)&dtmp0)[1];

	subcc	counter,1,counter
	bneg	.begin
	or	%g0,%i2,%o4

	fmuld	%f62,%f44,%f52		! (3_1) res *= xx;
	faddd	%f20,A1,%f12		! (2_1) res += A1;

	faddd	%f34,%f36,%f60		! (1_1) res += dexp_lo;

	add	%g5,TBL,%g5		! (2_1) pind = (char*)TBL + ind1;

	add	%l2,stridex,%l2		! px += stridex
	ldd	[%g5+16],%f36		! (2_1) dexp_lo = ((double*)pind)[2];

	fmuld	%f12,%f18,%f12		! (2_1) res *= xx;
	ldd	[%g5+8],%f18		! (2_1) dexp_hi = ((double*)pind)[1];
	faddd	%f52,A2,%f20		! (3_1) res += A2;

	ldd	[%fp+tmp2],%f48		! (1_1) dsqrt_exp = *(double*)&sqrt_exp;
	faddd	%f60,%f14,%f60		! (1_1) res += dexp_hi;

	fmuld	%f20,%f44,%f20		! (3_1) res *= xx;

	fmuld	%f18,%f12,%f34		! (2_1) res = dexp_hi * res;
	fpadd32	%f48,%f60,%f12		! (1_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);

	st	%f12,[%i2]		! (1_1) ((float*)py)[0] = ((float*)&dtmp0)[0];

	add	%i2,stridey,%g5		! py += stridey
	st	%f13,[%i2+4]		! (1_1) ((float*)py)[1] = ((float*)&dtmp0)[1];

	subcc	counter,1,counter
	bneg	.begin
	or	%g0,%g5,%o4

	faddd	%f20,A1,%f12		! (3_1) res += A1;

	faddd	%f34,%f36,%f60		! (2_1) res += dexp_lo;

	add	%g1,TBL,%g1		! (3_1) pind = (char*)TBL + ind1;

	add	%l2,stridex,%l2		! px += stridex
	ldd	[%g1+16],%f36		! (3_1) dexp_lo = ((double*)pind)[2];

	fmuld	%f12,%f44,%f12		! (3_1) res *= xx;
	ldd	[%g1+8],%f44		! (3_1) dexp_hi = ((double*)pind)[1];

	ldd	[%fp+tmp3],%f48		! (2_1) dsqrt_exp = *(double*)&sqrt_exp;
	faddd	%f60,%f18,%f60		! (2_1) res += dexp_hi;

	fmuld	%f44,%f12,%f34		! (3_1) res = dexp_hi * res;
	fpadd32	%f48,%f60,%f12		! (2_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);

	st	%f12,[%g5]		! (2_1) ((float*)py)[0] = ((float*)&dtmp0)[0];

	add	%g5,stridey,%g1		! py += stridey
	st	%f13,[%g5+4]		! (2_1) ((float*)py)[1] = ((float*)&dtmp0)[1];

	subcc	counter,1,counter
	bneg	.begin
	or	%g0,%g1,%o4

	faddd	%f34,%f36,%f60		! (3_1) res += dexp_lo;

	add	%l2,stridex,%l2		! px += stridex

	ldd	[%fp+tmp4],%f48		! (3_1) dsqrt_exp = *(double*)&sqrt_exp;
	faddd	%f60,%f44,%f60		! (3_1) res += dexp_hi;

	fpadd32	%f48,%f60,%f12		! (3_1) dtmp0 = vis_fpadd32(dsqrt_exp,res);

	st	%f12,[%g1]		! (3_1) ((float*)py)[0] = ((float*)&dtmp0)[0];

	add	%g1,stridey,%i3		! py += stridey
	st	%f13,[%g1+4]		! (3_1) ((float*)py)[1] = ((float*)&dtmp0)[1];

	ba	.begin
	or	%g0,%i3,%o4

! Special operand at the head of a pass (hx >= 0x7ff00000 or
! hx < 0x00100000): compute it with fsqrtd, store it, advance px and
! py, and resume at .begin1 with counter reduced by one.
	.align	16
.spec:
	fsqrtd	%f10,%f10
	add	%l2,stridex,%l2

	st	%f10,[%o4]
	st	%f11,[%o4+4]

	add	%o4,stridey,%o4
	ba	.begin1
	sub	counter,1,counter

! .updateN handlers.  Each is reached when the element most recently
! read needs the .spec path while k earlier elements are still in
! flight (k is the constant compared against counter).
!   counter <= k : that element is not among those this pass will
!                  store, so nothing is recorded.
!   otherwise    : px - stridex (the address of that element) goes to
!                  tmp_px, counter - k goes to tmp_counter, and counter
!                  is cut to k (in the delay slot of the branch back)
!                  so that the pass ends just before that element.
! The next trip through .begin then restarts at the saved address.
	.align	16
.update0:
	cmp	counter,1
	ble	.cont0
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,1,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont0
	or	%g0,1,counter

	.align	16
.update1:
	cmp	counter,1
	ble	.cont1
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,1,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont1
	or	%g0,1,counter

	.align	16
.update2:
	cmp	counter,2
	ble	.cont2
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,2,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont2
	or	%g0,2,counter

	.align	16
.update3:
	cmp	counter,2
	ble	.cont3
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,2,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont3
	or	%g0,2,counter

	.align	16
.update4:
	cmp	counter,3
	ble	.cont4
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,3,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont4
	or	%g0,3,counter

	.align	16
.update5:
	cmp	counter,3
	ble	.cont5
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,3,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont5
	or	%g0,3,counter

	.align	16
.update6:
	cmp	counter,4
	ble	.cont6
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,4,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont6
	or	%g0,4,counter

	.align	16
.update7:
	cmp	counter,4
	ble	.cont7
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,4,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont7
	or	%g0,4,counter

	.align	16
.update8:
	cmp	counter,5
	ble	.cont8
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,5,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont8
	or	%g0,5,counter

	.align	16
.update9:
	cmp	counter,5
	ble	.cont9
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,5,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont9
	or	%g0,5,counter

	.align	16
.update10:
	cmp	counter,6
	ble	.cont10
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,6,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont10
	or	%g0,6,counter

	.align	16
.update11:
	cmp	counter,6
	ble	.cont11
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,6,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont11
	or	%g0,6,counter

	.align	16
.update12:
	cmp	counter,7
	ble	.cont12
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,7,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont12
	or	%g0,7,counter

	.align	16
.update13:
	cmp	counter,7
	ble	.cont13
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,7,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont13
	or	%g0,7,counter

	.align	16
.update14:
	cmp	counter,8
	ble	.cont14
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,8,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont14
	or	%g0,8,counter

	.align	16
.update15:
	cmp	counter,8
	ble	.cont15
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,8,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont15
	or	%g0,8,counter

	.align	16
.update16:
	cmp	counter,9
	ble	.cont16
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,9,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont16
	or	%g0,9,counter

	.align	16
.update17:
	cmp	counter,9
	ble	.cont17
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,9,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont17
	or	%g0,9,counter

	.align	16
.update18:
	cmp	counter,10
	ble	.cont18
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,10,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont18
	or	%g0,10,counter

	.align	16
.update19:
	cmp	counter,10
	ble	.cont19
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,10,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont19
	or	%g0,10,counter

	.align	16
.update20:
	cmp	counter,11
	ble	.cont20
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,11,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont20
	or	%g0,11,counter

	.align	16
.update21:
	cmp	counter,11
	ble	.cont21
	nop

	sub	%l2,stridex,%i5
	stx	%i5,[%fp+tmp_px]

	sub	counter,11,counter
	st	counter,[%fp+tmp_counter]

	ba	.cont21
	or	%g0,11,counter

! Common exit: reached from .begin1 once no elements remain.
.exit:
	ret
	restore

	SET_SIZE(__vsqrt)
