1:
2: 3: 4: 5: 6: 7: 8: 9: 10: 11:
12:
13: 14: 15: 16: 17: 18: 19: 20: 21: 22: 23: 24: 25: 26: 27: 28: 29: 30: 31: 32: 33: 34: 35: 36: 37: 38: 39: 40: 41: 42: 43: 44: 45: 46: 47: 48: 49: 50: 51: 52: 53: 54: 55: 56: 57: 58: 59: 60: 61: 62: 63: 64: 65: 66: 67: 68: 69: 70: 71: 72: 73: 74: 75: 76: 77: 78: 79: 80: 81: 82: 83: 84: 85: 86: 87: 88: 89: 90: 91: 92: 93: 94: 95: 96: 97: 98: 99: 100: 101: 102: 103: 104: 105: 106: 107: 108: 109: 110: 111: 112:
113:
114:
115: 116: 117: 118: 119: 120: 121:
122:
123: #include <float.h>
124: #include <math.h>
125:
126: #include "math_private.h"
127:
/*
 * init_jk[]: initial value of the term count jk, indexed by the prec
 * argument of __kernel_rem_pio2() (jk = init_jk[prec]).  The table has four
 * entries, so only prec values 0..3 select a valid element.
 */
128: static const int init_jk[] = {2,3,4,6};
129:
130: 131: 132: 133: 134: 135: 136: 137: 138: 139: 140: 141:
/*
 * ipio2[]: table of integer digits, each written as six hex digits and
 * therefore below 2^24.  __kernel_rem_pio2() converts them to double and
 * multiplies them against the input chunks x[].
 *
 * The first entry, 0xA2F983, divided by 2^24 is about 0.63662, i.e. close
 * to 2/pi.  NOTE(review): the table presumably holds consecutive 24-bit
 * digits of 2/pi -- confirm against the program that generated it.
 *
 * The first 66 entries are always compiled in.  A further 624 entries are
 * added when LDBL_MAX_EXP > 1024, and the build is stopped with #error when
 * LDBL_MAX_EXP > 16384 because the table would then be too short.
 */
142: static const int32_t ipio2[] = {
143: 0xA2F983, 0x6E4E44, 0x1529FC, 0x2757D1, 0xF534DD, 0xC0DB62,
144: 0x95993C, 0x439041, 0xFE5163, 0xABDEBB, 0xC561B7, 0x246E3A,
145: 0x424DD2, 0xE00649, 0x2EEA09, 0xD1921C, 0xFE1DEB, 0x1CB129,
146: 0xA73EE8, 0x8235F5, 0x2EBB44, 0x84E99C, 0x7026B4, 0x5F7E41,
147: 0x3991D6, 0x398353, 0x39F49C, 0x845F8B, 0xBDF928, 0x3B1FF8,
148: 0x97FFDE, 0x05980F, 0xEF2F11, 0x8B5A0A, 0x6D1F6D, 0x367ECF,
149: 0x27CB09, 0xB74F46, 0x3F669E, 0x5FEA2D, 0x7527BA, 0xC7EBE5,
150: 0xF17B3D, 0x0739F7, 0x8A5292, 0xEA6BFB, 0x5FB11F, 0x8D5D08,
151: 0x560330, 0x46FC7B, 0x6BABF0, 0xCFBC20, 0x9AF436, 0x1DA9E3,
152: 0x91615E, 0xE61B08, 0x659985, 0x5F14A0, 0x68408D, 0xFFD880,
153: 0x4D7327, 0x310606, 0x1556CA, 0x73A8C9, 0x60E27B, 0xC08C6B,
154: /* the entries below are only compiled in when LDBL_MAX_EXP exceeds 1024 */
155: #if LDBL_MAX_EXP > 1024
156: #if LDBL_MAX_EXP > 16384
157: #error "ipio2 table needs to be expanded"
158: #endif
159: 0x47C419, 0xC367CD, 0xDCE809, 0x2A8359, 0xC4768B, 0x961CA6,
160: 0xDDAF44, 0xD15719, 0x053EA5, 0xFF0705, 0x3F7E33, 0xE832C2,
161: 0xDE4F98, 0x327DBB, 0xC33D26, 0xEF6B1E, 0x5EF89F, 0x3A1F35,
162: 0xCAF27F, 0x1D87F1, 0x21907C, 0x7C246A, 0xFA6ED5, 0x772D30,
163: 0x433B15, 0xC614B5, 0x9D19C3, 0xC2C4AD, 0x414D2C, 0x5D000C,
164: 0x467D86, 0x2D71E3, 0x9AC69B, 0x006233, 0x7CD2B4, 0x97A7B4,
165: 0xD55537, 0xF63ED7, 0x1810A3, 0xFC764D, 0x2A9D64, 0xABD770,
166: 0xF87C63, 0x57B07A, 0xE71517, 0x5649C0, 0xD9D63B, 0x3884A7,
167: 0xCB2324, 0x778AD6, 0x23545A, 0xB91F00, 0x1B0AF1, 0xDFCE19,
168: 0xFF319F, 0x6A1E66, 0x615799, 0x47FBAC, 0xD87F7E, 0xB76522,
169: 0x89E832, 0x60BFE6, 0xCDC4EF, 0x09366C, 0xD43F5D, 0xD7DE16,
170: 0xDE3B58, 0x929BDE, 0x2822D2, 0xE88628, 0x4D58E2, 0x32CAC6,
171: 0x16E308, 0xCB7DE0, 0x50C017, 0xA71DF3, 0x5BE018, 0x34132E,
172: 0x621283, 0x014883, 0x5B8EF5, 0x7FB0AD, 0xF2E91E, 0x434A48,
173: 0xD36710, 0xD8DDAA, 0x425FAE, 0xCE616A, 0xA4280A, 0xB499D3,
174: 0xF2A606, 0x7F775C, 0x83C2A3, 0x883C61, 0x78738A, 0x5A8CAF,
175: 0xBDD76F, 0x63A62D, 0xCBBFF4, 0xEF818D, 0x67C126, 0x45CA55,
176: 0x36D9CA, 0xD2A828, 0x8D61C2, 0x77C912, 0x142604, 0x9B4612,
177: 0xC459C4, 0x44C5C8, 0x91B24D, 0xF31700, 0xAD43D4, 0xE54929,
178: 0x10D5FD, 0xFCBE00, 0xCC941E, 0xEECE70, 0xF53E13, 0x80F1EC,
179: 0xC3E7B3, 0x28F8C7, 0x940593, 0x3E71C1, 0xB3092E, 0xF3450B,
180: 0x9C1288, 0x7B20AB, 0x9FB52E, 0xC29247, 0x2F327B, 0x6D550C,
181: 0x90A772, 0x1FE76B, 0x96CB31, 0x4A1679, 0xE27941, 0x89DFF4,
182: 0x9794E8, 0x84E6E2, 0x973199, 0x6BED88, 0x365F5F, 0x0EFDBB,
183: 0xB49A48, 0x6CA467, 0x427271, 0x325D8D, 0xB8159F, 0x09E5BC,
184: 0x25318D, 0x3974F7, 0x1C0530, 0x010C0D, 0x68084B, 0x58EE2C,
185: 0x90AA47, 0x02E774, 0x24D6BD, 0xA67DF7, 0x72486E, 0xEF169F,
186: 0xA6948E, 0xF691B4, 0x5153D1, 0xF20ACF, 0x339820, 0x7E4BF5,
187: 0x6863B2, 0x5F3EDD, 0x035D40, 0x7F8985, 0x295255, 0xC06437,
188: 0x10D86D, 0x324832, 0x754C5B, 0xD4714E, 0x6E5445, 0xC1090B,
189: 0x69F52A, 0xD56614, 0x9D0727, 0x50045D, 0xDB3BB4, 0xC576EA,
190: 0x17F987, 0x7D6B49, 0xBA271D, 0x296996, 0xACCCC6, 0x5414AD,
191: 0x6AE290, 0x89D988, 0x50722C, 0xBEA404, 0x940777, 0x7030F3,
192: 0x27FC00, 0xA871EA, 0x49C266, 0x3DE064, 0x83DD97, 0x973FA3,
193: 0xFD9443, 0x8C860D, 0xDE4131, 0x9D3992, 0x8C70DD, 0xE7B717,
194: 0x3BDF08, 0x2B3715, 0xA0805C, 0x93805A, 0x921110, 0xD8E80F,
195: 0xAF806C, 0x4BFFDB, 0x0F9038, 0x761859, 0x15A562, 0xBBCB61,
196: 0xB989C7, 0xBD4010, 0x04F2D2, 0x277549, 0xF6B6EB, 0xBB22DB,
197: 0xAA140A, 0x2F2689, 0x768364, 0x333B09, 0x1A940E, 0xAA3A51,
198: 0xC2A31D, 0xAEEDAF, 0x12265C, 0x4DC26D, 0x9C7A2D, 0x9756C0,
199: 0x833F03, 0xF6F009, 0x8C402B, 0x99316D, 0x07B439, 0x15200C,
200: 0x5BC3D8, 0xC492F5, 0x4BADC6, 0xA5CA4E, 0xCD37A7, 0x36A9E6,
201: 0x9492AB, 0x6842DD, 0xDE6319, 0xEF8C76, 0x528B68, 0x37DBFC,
202: 0xABA1AE, 0x3115DF, 0xA1AE00, 0xDAFB0C, 0x664D64, 0xB705ED,
203: 0x306529, 0xBF5657, 0x3AFF47, 0xB9F96A, 0xF3BE75, 0xDF9328,
204: 0x3080AB, 0xF68C66, 0x15CB04, 0x0622FA, 0x1DE4D9, 0xA4B33D,
205: 0x8F1B57, 0x09CD36, 0xE9424E, 0xA4BE13, 0xB52333, 0x1AAAF0,
206: 0xA8654F, 0xA5C1D2, 0x0F3F0B, 0xCD785B, 0x76F923, 0x048B7B,
207: 0x721789, 0x53A6C6, 0xE26E6F, 0x00EBEF, 0x584A9B, 0xB7DAC4,
208: 0xBA66AA, 0xCFCF76, 0x1D02D1, 0x2DF1B1, 0xC1998C, 0x77ADC3,
209: 0xDA4886, 0xA05DF7, 0xF480C6, 0x2FF0AC, 0x9AECDD, 0xBC5C3F,
210: 0x6DDED0, 0x1FC790, 0xB6DB2A, 0x3A25A3, 0x9AAF00, 0x9353AD,
211: 0x0457B6, 0xB42D29, 0x7E804B, 0xA707DA, 0x0EAA76, 0xA1597B,
212: 0x2A1216, 0x2DB7DC, 0xFDE5FA, 0xFEDB89, 0xFDBE89, 0x6C76E4,
213: 0xFCA906, 0x70803E, 0x156E85, 0xFF87FD, 0x073E28, 0x336761,
214: 0x86182A, 0xEABD4D, 0xAFE7B3, 0x6E6D8F, 0x396795, 0x5BBF31,
215: 0x48D784, 0x16DF30, 0x432DC7, 0x356125, 0xCE70C9, 0xB8CB30,
216: 0xFD6CBF, 0xA200A4, 0xE46C05, 0xA0DD5A, 0x476F21, 0xD21262,
217: 0x845CB9, 0x496170, 0xE0566B, 0x015299, 0x375550, 0xB7D51E,
218: 0xC4F133, 0x5F6E13, 0xE4305D, 0xA92E85, 0xC3B21D, 0x3632A1,
219: 0xA4B708, 0xD4B1EA, 0x21F716, 0xE4698F, 0x77FF27, 0x80030C,
220: 0x2D408D, 0xA0CD4F, 0x99A520, 0xD3A2B3, 0x0A5D2F, 0x42F9B4,
221: 0xCBDA11, 0xD0BE7D, 0xC1DB9B, 0xBD17AB, 0x81A2CA, 0x5C6A08,
222: 0x17552E, 0x550027, 0xF0147F, 0x8607E1, 0x640B14, 0x8D4196,
223: 0xDEBE87, 0x2AFDDA, 0xB6256B, 0x34897B, 0xFEF305, 0x9EBFB9,
224: 0x4F6A68, 0xA82A4A, 0x5AC44F, 0xBCF82D, 0x985AD7, 0x95C7F4,
225: 0x8D4D0D, 0xA63A20, 0x5F57A4, 0xB13F14, 0x953880, 0x0120CC,
226: 0x86DD71, 0xB6DEC9, 0xF560BF, 0x11654D, 0x6B0701, 0xACB08C,
227: 0xD0C0B2, 0x485551, 0x0EFB1E, 0xC37295, 0x3B06A3, 0x3540C0,
228: 0x7BDC06, 0xCC45E0, 0xFA294E, 0xC8CAD6, 0x41F3E8, 0xDE647C,
229: 0xD8649B, 0x31BED9, 0xC397A4, 0xD45877, 0xC5E369, 0x13DAF0,
230: 0x3C3ABA, 0x461846, 0x5F7555, 0xF5BDD2, 0xC6926E, 0x5D2EAC,
231: 0xED440E, 0x423E1C, 0x87C461, 0xE9FD29, 0xF3D6E7, 0xCA7C22,
232: 0x35916F, 0xC5E008, 0x8DD7FF, 0xE26A6E, 0xC6FDB0, 0xC10893,
233: 0x745D7C, 0xB2AD6B, 0x9D6ECD, 0x7B723E, 0x6A11C6, 0xA9CFF7,
234: 0xDF7329, 0xBAC9B5, 0x5100B7, 0x0DB2E2, 0x24BA74, 0x607DE5,
235: 0x8AD874, 0x2C150D, 0x0C1881, 0x94667E, 0x162901, 0x767A9F,
236: 0xBEFDFD, 0xEF4556, 0x367ED9, 0x13D9EC, 0xB9BA8B, 0xFC97C4,
237: 0x27A831, 0xC36EF1, 0x36C594, 0x56A8D8, 0xB5A8B4, 0x0ECCCF,
238: 0x2D8912, 0x34576F, 0x89562C, 0xE3CE99, 0xB920D6, 0xAA5E6B,
239: 0x9C2A3E, 0xCC5F11, 0x4A0BFD, 0xFBF4E1, 0x6D3B8E, 0x2C86E2,
240: 0x84D4E9, 0xA9B4FC, 0xD1EEEF, 0xC9352E, 0x61392F, 0x442138,
241: 0xC8D91B, 0x0AFC81, 0x6A4AFB, 0xD81C2F, 0x84B453, 0x8C994E,
242: 0xCC2254, 0xDC552A, 0xD6C6C0, 0x96190B, 0xB8701A, 0x649569,
243: 0x605A26, 0xEE523F, 0x0F117F, 0x11B5F4, 0xF5CBFC, 0x2DBC34,
244: 0xEEBC34, 0xCC5DE8, 0x605EDD, 0x9B8E67, 0xEF3392, 0xB817C9,
245: 0x9B5861, 0xBC57E1, 0xC68351, 0x103ED8, 0x4871DD, 0xDD1C2D,
246: 0xA118AF, 0x462C21, 0xD7F359, 0x987AD9, 0xC0549E, 0xFA864F,
247: 0xFC0656, 0xAE79E5, 0x362289, 0x22AD38, 0xDC9367, 0xAAE855,
248: 0x382682, 0x9BE7CA, 0xA40D51, 0xB13399, 0x0ED7A9, 0x480569,
249: 0xF0B265, 0xA7887F, 0x974C88, 0x36D1F9, 0xB39221, 0x4A827B,
250: 0x21CF98, 0xDC9F40, 0x5547DC, 0x3A74E1, 0x42EB67, 0xDF9DFE,
251: 0x5FD45E, 0xA4677B, 0x7AACBA, 0xA2F655, 0x23882B, 0x55BA41,
252: 0x086E59, 0x862A21, 0x834739, 0xE6E389, 0xD49EE5, 0x40FB49,
253: 0xE956FF, 0xCA0F1C, 0x8A59C5, 0x2BFA94, 0xC5C1D3, 0xCFC50F,
254: 0xAE5ADB, 0x86C547, 0x624385, 0x3B8621, 0x94792C, 0x876110,
255: 0x7B4C2A, 0x1A2C80, 0x12BF43, 0x902688, 0x893C78, 0xE4C4A8,
256: 0x7BDBE5, 0xC23AC4, 0xEAF426, 0x8A67F7, 0xBF920D, 0x2BA365,
257: 0xB1933D, 0x0B7CBD, 0xDC51A4, 0x63DD27, 0xDDE169, 0x19949A,
258: 0x9529A8, 0x28CE68, 0xB4ED09, 0x209F44, 0xCA984E, 0x638270,
259: 0x237C7E, 0x32B90F, 0x8EF5A7, 0xE75614, 0x08F121, 0x2A9DB5,
260: 0x4D7E6F, 0x5119A5, 0xABF9B5, 0xD6DF82, 0x61DD96, 0x023616,
261: 0x9F3AC4, 0xA1A283, 0x6DED72, 0x7A8D39, 0xA9B882, 0x5C326B,
262: 0x5B2746, 0xED3400, 0x7700D2, 0x55F4FC, 0x4D5901, 0x8071E0,
263: #endif
264:
265: };
266:
/*
 * PIo2[]: eight double constants of rapidly decreasing magnitude (each is
 * roughly seven decimal orders smaller than the one before).  Added
 * together they give approximately 1.5707963267948966, i.e. pi/2.
 * __kernel_rem_pio2() multiplies them against the fractional chunks q[] to
 * form fq[], using indices 0..jp only.
 */
267: static const double PIo2[] = {
268: 1.57079625129699707031e+00,
269: 7.54978941586159635335e-08,
270: 5.39030252995776476554e-15,
271: 3.28200341580791294123e-22,
272: 1.27065575308067607349e-29,
273: 1.22933308981111328932e-36,
274: 2.73370053816464559624e-44,
275: 2.16741683877804819444e-51,
276: };
277:
/*
 * Scalar constants used by __kernel_rem_pio2():
 *   zero   = 0.0
 *   one    = 1.0
 *   two24  = 16777216.0           (2^24, the radix of the iq[] chunks)
 *   twon24 = 5.9604644775390625e-08 (2^-24, the reciprocal of two24)
 */
278: static const double
279: zero = 0.0,
280: one = 1.0,
281: two24 = 1.67772160000000000000e+07,
282: twon24 = 5.96046447753906250000e-08;
283:
/*
 * __kernel_rem_pio2(x, y, e0, nx, prec)
 *
 * Forms the products q[i] = sum_j x[j]*f[jx+i-j], where f[] holds digits
 * taken from ipio2[], splits the result into an integer part n and a
 * fraction held as 24-bit chunks iq[], multiplies that fraction by the
 * PIo2[] constants, and stores the compressed result in y[].
 *
 * Parameters:
 *   x    - input array; elements x[0]..x[nx-1] are read.
 *          NOTE(review): presumably 24-bit chunks of a positive, non-zero
 *          argument -- confirm against the callers.
 *   y    - output array; y[0] is written for prec 0, y[0] and y[1] for
 *          prec 1 and 2, y[0]..y[2] for prec 3.
 *   e0   - binary exponent used to pick the first ipio2[] digit (jv) and
 *          the residual scale q0.  NOTE(review): presumably the exponent
 *          of x[0] -- confirm against the callers.
 *   nx   - number of elements of x[] to use.
 *   prec - index into init_jk[] and selector of the output layout; only
 *          0..3 are handled and no range check is performed.
 *
 * Returns n & 7, where n is the integer part (taken modulo 8) of the scaled
 * product, incremented by one when ih is non-zero.  When ih is non-zero the
 * fraction is replaced by its complement and every value stored in y[] is
 * negated.
 *
 * The work arrays f[], fq[], q[] and iq[] have 20 elements each and are
 * indexed without bounds checks.
 */
284: int
285: __kernel_rem_pio2(double *x, double *y, int e0, int nx, int prec)
286: {
287: int32_t jz,jx,jv,jp,jk,carry,n,iq[20],i,j,k,m,q0,ih;
288: double z,fw,f[20],fq[20],q[20];
289:
290: /* jk = initial term count selected by prec; jp caps the PIo2[] index used further down */
291: jk = init_jk[prec];
292: jp = jk;
293:
294: /* jx = last x[] index; jv = first ipio2[] digit index (clamped to >= 0); q0 = residual binary exponent */
295: jx = nx-1;
296: jv = (e0-3)/24; if(jv<0) jv=0;
297: q0 = e0-24*(jv+1);
298:
299: /* load f[0..jx+jk] from ipio2[jv-jx..jv+jk], using zero where the table index would be negative */
300: j = jv-jx; m = jx+jk;
301: for(i=0;i<=m;i++,j++) f[i] = (j<0)? zero : (double) ipio2[j];
302:
303: /* q[i] = sum over j = 0..jx of x[j]*f[jx+i-j], for i = 0..jk */
304: for (i=0;i<=jk;i++) {
305: for(j=0,fw=0.0;j<=jx;j++) fw += x[j]*f[jx+i-j]; q[i] = fw;
306: }
307:
308: jz = jk;
309: recompute:
310: /* walk q[jz] down to q[1]: keep the part below 2^24 in iq[0..jz-1], carry the rest (fw) into the next q[]; z ends as q[0] plus the last carry */
311: for(i=0,j=jz,z=q[jz];j>0;i++,j--) {
312: fw = (double)((int32_t)(twon24* z));
313: iq[i] = (int32_t)(z-two24*fw);
314: z = q[j-1]+fw;
315: }
316:
317: /* scale z by 2^q0, reduce it modulo 8, then split it into integer part n and fraction z */
318: z = scalbn(z,q0);
319: z -= 8.0*floor(z*0.125);
320: n = (int32_t) z;
321: z -= (double)n;
322: ih = 0;
323: if(q0>0) { /* the top q0 bits of iq[jz-1] still belong to the integer part */
324: i = (iq[jz-1]>>(24-q0)); n += i;
325: iq[jz-1] -= i<<(24-q0);
326: ih = iq[jz-1]>>(23-q0); /* next bit down: the one-half bit of the fraction */
327: }
328: else if(q0==0) ih = iq[jz-1]>>23; /* bit 23 of the leading chunk */
329: else if(z>=0.5) ih=2; /* the only place ih becomes 2 */
330:
331: if(ih>0) { /* non-zero ih: bump n and replace the fraction by its complement */
332: n += 1; carry = 0;
333: for(i=0;i<jz ;i++) { /* negate the base-2^24 digits: 2^24-j for the first non-zero digit, 2^24-1-j afterwards */
334: j = iq[i];
335: if(carry==0) {
336: if(j!=0) {
337: carry = 1; iq[i] = 0x1000000- j;
338: }
339: } else iq[i] = 0xffffff - j;
340: }
341: if(q0>0) { /* clear the top q0 bits of the leading chunk again; only q0 of 1 or 2 is handled */
342: switch(q0) {
343: case 1:
344: iq[jz-1] &= 0x7fffff; break;
345: case 2:
346: iq[jz-1] &= 0x3fffff; break;
347: }
348: }
349: if(ih==2) { /* complement the floating-point fraction as well */
350: z = one - z;
351: if(carry!=0) z -= scalbn(one,q0);
352: }
353: }
354:
355: /* if z is zero and iq[jk..jz-1] are all zero, more ipio2[] terms are needed */
356: if(z==zero) {
357: j = 0;
358: for (i=jz-1;i>=jk;i--) j |= iq[i];
359: if(j==0) {
360: for(k=1;iq[jk-k]==0;k++); /* k = 1 + count of zero chunks below iq[jk]; no lower bound, relies on a non-zero chunk existing */
361: /* append q[jz+1..jz+k] using the next k ipio2[] digits, then redo the distillation */
362: for(i=jz+1;i<=jz+k;i++) {
363: f[jx+i] = (double) ipio2[jv+i];
364: for(j=0,fw=0.0;j<=jx;j++) fw += x[j]*f[jx+i-j];
365: q[i] = fw;
366: }
367: jz += k;
368: goto recompute;
369: }
370: }
371:
372: /* z == 0: drop trailing zero chunks (24 bits of scale each); otherwise store z as one or two extra chunks */
373: if(z==0.0) {
374: jz -= 1; q0 -= 24;
375: while(iq[jz]==0) { jz--; q0-=24;} /* unbounded: relies on some iq[] being non-zero */
376: } else {
377: z = scalbn(z,-q0);
378: if(z>=two24) { /* z needs two chunks: low 24 bits in iq[jz], the rest in the new iq[jz] */
379: fw = (double)((int32_t)(twon24*z));
380: iq[jz] = (int32_t)(z-two24*fw);
381: jz += 1; q0 += 24;
382: iq[jz] = (int32_t) fw;
383: } else iq[jz] = (int32_t) z ;
384: }
385:
386: /* turn the integer chunks back into doubles: q[jz] = 2^q0*iq[jz], each lower index scaled by a further 2^-24 */
387: fw = scalbn(one,q0);
388: for(i=jz;i>=0;i--) {
389: q[i] = fw*(double)iq[i]; fw*=twon24;
390: }
391:
392: /* fq[jz-i] = sum over k = 0..min(jp, jz-i) of PIo2[k]*q[i+k] */
393: for(i=jz;i>=0;i--) {
394: for(fw=0.0,k=0;k<=jp&&k<=jz-i;k++) fw += PIo2[k]*q[i+k];
395: fq[jz-i] = fw;
396: }
397:
398: /* compress fq[] into y[] according to prec, negating when ih is non-zero; there is no default case */
399: switch(prec) {
400: case 0: /* single result: sum of all fq[], added from index jz down to 0 */
401: fw = 0.0;
402: for (i=jz;i>=0;i--) fw += fq[i];
403: y[0] = (ih==0)? fw: -fw;
404: break;
405: case 1:
406: case 2: /* two results: y[0] = total, y[1] = what is left after subtracting the total from the terms */
407: fw = 0.0;
408: for (i=jz;i>=0;i--) fw += fq[i];
409: STRICT_ASSIGN(double,fw,fw); /* macro not defined in this file; presumably forces fw to be rounded to double -- confirm in math_private.h */
410: y[0] = (ih==0)? fw: -fw;
411: fw = fq[0]-fw;
412: for (i=1;i<=jz;i++) fw += fq[i];
413: y[1] = (ih==0)? fw: -fw;
414: break;
415: case 3: /* three results: two passes move each pairwise sum down and leave its rounding error behind */
416: for (i=jz;i>0;i--) {
417: fw = fq[i-1]+fq[i];
418: fq[i] += fq[i-1]-fw;
419: fq[i-1] = fw;
420: }
421: for (i=jz;i>1;i--) {
422: fw = fq[i-1]+fq[i];
423: fq[i] += fq[i-1]-fw;
424: fq[i-1] = fw;
425: }
426: for (fw=0.0,i=jz;i>=2;i--) fw += fq[i]; /* y[2] collects fq[2..jz] */
427: if(ih==0) {
428: y[0] = fq[0]; y[1] = fq[1]; y[2] = fw;
429: } else {
430: y[0] = -fq[0]; y[1] = -fq[1]; y[2] = -fw;
431: }
432: }
433: return n&7;
434: }