erf_lgamma.c 7.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255
  /*
   * This file is part of the MicroPython project, http://micropython.org/
   *
   * These math functions are taken from newlib-nano-2, the newlib/libm/math
   * directory, available from https://github.com/32bitmicro/newlib-nano-2.
   *
   * Appropriate copyright headers are reproduced below.
   */
  /* erf_lgamma.c -- float version of er_lgamma.c.
   * Conversion to float by Ian Lance Taylor, Cygnus Support, ian@cygnus.com.
   */
  /*
   * ====================================================
   * Copyright (C) 1993 by Sun Microsystems, Inc. All rights reserved.
   *
   * Developed at SunPro, a Sun Microsystems, Inc. business.
   * Permission to use, copy, modify, and distribute this
   * software is freely granted, provided that this notice
   * is preserved.
   * ====================================================
   *
   */
  23. #include "fdlibm.h"
  /* The code below uses the fdlibm-internal name; route it to the libm logf. */
  #define __ieee754_logf logf

  /*
   * File-scope single-precision constants used by sin_pif() and
   * __ieee754_lgammaf_r().  The trailing comment on each entry is the
   * IEEE-754 bit pattern of the value.
   */

  /* General-purpose values. */
  static const float
      zero  = 0.0000000000e+00,
      half  = 5.0000000000e-01, /* 0x3f000000 */
      one   = 1.0000000000e+00, /* 0x3f800000 */
      two23 = 8.3886080000e+06, /* 0x4b000000 */
      pi    = 3.1415927410e+00; /* 0x40490fdb */

  /* a0..a11: polynomial used by "case 0" of the x < 2 path. */
  static const float
      a0  = 7.7215664089e-02, /* 0x3d9e233f */
      a1  = 3.2246702909e-01, /* 0x3ea51a66 */
      a2  = 6.7352302372e-02, /* 0x3d89f001 */
      a3  = 2.0580807701e-02, /* 0x3ca89915 */
      a4  = 7.3855509982e-03, /* 0x3bf2027e */
      a5  = 2.8905137442e-03, /* 0x3b3d6ec6 */
      a6  = 1.1927076848e-03, /* 0x3a9c54a1 */
      a7  = 5.1006977446e-04, /* 0x3a05b634 */
      a8  = 2.2086278477e-04, /* 0x39679767 */
      a9  = 1.0801156895e-04, /* 0x38e28445 */
      a10 = 2.5214456400e-05, /* 0x37d383a2 */
      a11 = 4.4864096708e-05; /* 0x383c2c75 */

  /*
   * tc, tf, tt and t0..t14: "case 1" of the x < 2 path, which works on
   * y = x - tc (or x - (tc - 1)) and adds tf to the polynomial result.
   */
  static const float
      tc  =  1.4616321325e+00, /* 0x3fbb16c3 */
      tf  = -1.2148628384e-01, /* 0xbdf8cdcd */
      /* tt = -(tail of tf) */
      tt  =  6.6971006518e-09, /* 0x31e61c52 */
      t0  =  4.8383611441e-01, /* 0x3ef7b95e */
      t1  = -1.4758771658e-01, /* 0xbe17213c */
      t2  =  6.4624942839e-02, /* 0x3d845a15 */
      t3  = -3.2788541168e-02, /* 0xbd064d47 */
      t4  =  1.7970675603e-02, /* 0x3c93373d */
      t5  = -1.0314224288e-02, /* 0xbc28fcfe */
      t6  =  6.1005386524e-03, /* 0x3bc7e707 */
      t7  = -3.6845202558e-03, /* 0xbb7177fe */
      t8  =  2.2596477065e-03, /* 0x3b141699 */
      t9  = -1.4034647029e-03, /* 0xbab7f476 */
      t10 =  8.8108185446e-04, /* 0x3a66f867 */
      t11 = -5.3859531181e-04, /* 0xba0d3085 */
      t12 =  3.1563205994e-04, /* 0x39a57b6b */
      t13 = -3.1275415677e-04, /* 0xb9a3f927 */
      t14 =  3.3552918467e-04; /* 0x39afe9f7 */

  /* u0..u5 (numerator) and v1..v5 (denominator): "case 2" of the x < 2 path. */
  static const float
      u0 = -7.7215664089e-02, /* 0xbd9e233f */
      u1 =  6.3282704353e-01, /* 0x3f2200f4 */
      u2 =  1.4549225569e+00, /* 0x3fba3ae7 */
      u3 =  9.7771751881e-01, /* 0x3f7a4bb2 */
      u4 =  2.2896373272e-01, /* 0x3e6a7578 */
      u5 =  1.3381091878e-02, /* 0x3c5b3c5e */
      v1 =  2.4559779167e+00, /* 0x401d2ebe */
      v2 =  2.1284897327e+00, /* 0x4008392d */
      v3 =  7.6928514242e-01, /* 0x3f44efdf */
      v4 =  1.0422264785e-01, /* 0x3dd572af */
      v5 =  3.2170924824e-03; /* 0x3b52d5db */

  /* s0..s6 (numerator) and r1..r6 (denominator): the 2 <= x < 8 path. */
  static const float
      s0 = -7.7215664089e-02, /* 0xbd9e233f */
      s1 =  2.1498242021e-01, /* 0x3e5c245a */
      s2 =  3.2577878237e-01, /* 0x3ea6cc7a */
      s3 =  1.4635047317e-01, /* 0x3e15dce6 */
      s4 =  2.6642270386e-02, /* 0x3cda40e4 */
      s5 =  1.8402845599e-03, /* 0x3af135b4 */
      s6 =  3.1947532989e-05, /* 0x3805ff67 */
      r1 =  1.3920053244e+00, /* 0x3fb22d3b */
      r2 =  7.2193557024e-01, /* 0x3f38d0c5 */
      r3 =  1.7193385959e-01, /* 0x3e300f6e */
      r4 =  1.8645919859e-02, /* 0x3c98bf54 */
      r5 =  7.7794247773e-04, /* 0x3a4beed6 */
      r6 =  7.3266842264e-06; /* 0x36f5d7bd */

  /* w0..w6: series in 1/x used by the 8 <= x < 2**58 path. */
  static const float
      w0 =  4.1893854737e-01, /* 0x3ed67f1d */
      w1 =  8.3333335817e-02, /* 0x3daaaaab */
      w2 = -2.7777778450e-03, /* 0xbb360b61 */
      w3 =  7.9365057172e-04, /* 0x3a500cfd */
      w4 = -5.9518753551e-04, /* 0xba1c065c */
      w5 =  8.3633989561e-04, /* 0x3a5b3dd2 */
      w6 = -1.6309292987e-03; /* 0xbad5c4e8 */
  101. #ifdef __STDC__
  102. static float sin_pif(float x)
  103. #else
  104. static float sin_pif(x)
  105. float x;
  106. #endif
  107. {
  108. float y,z;
  109. __int32_t n,ix;
  110. GET_FLOAT_WORD(ix,x);
  111. ix &= 0x7fffffff;
  112. if(ix<0x3e800000) return __kernel_sinf(pi*x,zero,0);
  113. y = -x; /* x is assume negative */
  114. /*
  115. * argument reduction, make sure inexact flag not raised if input
  116. * is an integer
  117. */
  118. z = floorf(y);
  119. if(z!=y) { /* inexact anyway */
  120. y *= (float)0.5;
  121. y = (float)2.0*(y - floorf(y)); /* y = |x| mod 2.0 */
  122. n = (__int32_t) (y*(float)4.0);
  123. } else {
  124. if(ix>=0x4b800000) {
  125. y = zero; n = 0; /* y must be even */
  126. } else {
  127. if(ix<0x4b000000) z = y+two23; /* exact */
  128. GET_FLOAT_WORD(n,z);
  129. n &= 1;
  130. y = n;
  131. n<<= 2;
  132. }
  133. }
  134. switch (n) {
  135. case 0: y = __kernel_sinf(pi*y,zero,0); break;
  136. case 1:
  137. case 2: y = __kernel_cosf(pi*((float)0.5-y),zero); break;
  138. case 3:
  139. case 4: y = __kernel_sinf(pi*(one-y),zero,0); break;
  140. case 5:
  141. case 6: y = -__kernel_cosf(pi*(y-(float)1.5),zero); break;
  142. default: y = __kernel_sinf(pi*(y-(float)2.0),zero,0); break;
  143. }
  144. return -y;
  145. }
  146. #ifdef __STDC__
  147. float __ieee754_lgammaf_r(float x, int *signgamp)
  148. #else
  149. float __ieee754_lgammaf_r(x,signgamp)
  150. float x; int *signgamp;
  151. #endif
  152. {
  153. float t,y,z,nadj = 0.0,p,p1,p2,p3,q,r,w;
  154. __int32_t i,hx,ix;
  155. GET_FLOAT_WORD(hx,x);
  156. /* purge off +-inf, NaN, +-0, and negative arguments */
  157. *signgamp = 1;
  158. ix = hx&0x7fffffff;
  159. if(ix>=0x7f800000) return x*x;
  160. if(ix==0) return one/zero;
  161. if(ix<0x1c800000) { /* |x|<2**-70, return -log(|x|) */
  162. if(hx<0) {
  163. *signgamp = -1;
  164. return -__ieee754_logf(-x);
  165. } else return -__ieee754_logf(x);
  166. }
  167. if(hx<0) {
  168. if(ix>=0x4b000000) /* |x|>=2**23, must be -integer */
  169. return one/zero;
  170. t = sin_pif(x);
  171. if(t==zero) return one/zero; /* -integer */
  172. nadj = __ieee754_logf(pi/fabsf(t*x));
  173. if(t<zero) *signgamp = -1;
  174. x = -x;
  175. }
  176. /* purge off 1 and 2 */
  177. if (ix==0x3f800000||ix==0x40000000) r = 0;
  178. /* for x < 2.0 */
  179. else if(ix<0x40000000) {
  180. if(ix<=0x3f666666) { /* lgamma(x) = lgamma(x+1)-log(x) */
  181. r = -__ieee754_logf(x);
  182. if(ix>=0x3f3b4a20) {y = one-x; i= 0;}
  183. else if(ix>=0x3e6d3308) {y= x-(tc-one); i=1;}
  184. else {y = x; i=2;}
  185. } else {
  186. r = zero;
  187. if(ix>=0x3fdda618) {y=(float)2.0-x;i=0;} /* [1.7316,2] */
  188. else if(ix>=0x3F9da620) {y=x-tc;i=1;} /* [1.23,1.73] */
  189. else {y=x-one;i=2;}
  190. }
  191. switch(i) {
  192. case 0:
  193. z = y*y;
  194. p1 = a0+z*(a2+z*(a4+z*(a6+z*(a8+z*a10))));
  195. p2 = z*(a1+z*(a3+z*(a5+z*(a7+z*(a9+z*a11)))));
  196. p = y*p1+p2;
  197. r += (p-(float)0.5*y); break;
  198. case 1:
  199. z = y*y;
  200. w = z*y;
  201. p1 = t0+w*(t3+w*(t6+w*(t9 +w*t12))); /* parallel comp */
  202. p2 = t1+w*(t4+w*(t7+w*(t10+w*t13)));
  203. p3 = t2+w*(t5+w*(t8+w*(t11+w*t14)));
  204. p = z*p1-(tt-w*(p2+y*p3));
  205. r += (tf + p); break;
  206. case 2:
  207. p1 = y*(u0+y*(u1+y*(u2+y*(u3+y*(u4+y*u5)))));
  208. p2 = one+y*(v1+y*(v2+y*(v3+y*(v4+y*v5))));
  209. r += (-(float)0.5*y + p1/p2);
  210. }
  211. }
  212. else if(ix<0x41000000) { /* x < 8.0 */
  213. i = (__int32_t)x;
  214. t = zero;
  215. y = x-(float)i;
  216. p = y*(s0+y*(s1+y*(s2+y*(s3+y*(s4+y*(s5+y*s6))))));
  217. q = one+y*(r1+y*(r2+y*(r3+y*(r4+y*(r5+y*r6)))));
  218. r = half*y+p/q;
  219. z = one; /* lgamma(1+s) = log(s) + lgamma(s) */
  220. switch(i) {
  221. case 7: z *= (y+(float)6.0); /* FALLTHRU */
  222. case 6: z *= (y+(float)5.0); /* FALLTHRU */
  223. case 5: z *= (y+(float)4.0); /* FALLTHRU */
  224. case 4: z *= (y+(float)3.0); /* FALLTHRU */
  225. case 3: z *= (y+(float)2.0); /* FALLTHRU */
  226. r += __ieee754_logf(z); break;
  227. }
  228. /* 8.0 <= x < 2**58 */
  229. } else if (ix < 0x5c800000) {
  230. t = __ieee754_logf(x);
  231. z = one/x;
  232. y = z*z;
  233. w = w0+z*(w1+y*(w2+y*(w3+y*(w4+y*(w5+y*w6)))));
  234. r = (x-half)*(t-one)+w;
  235. } else
  236. /* 2**58 <= x <= inf */
  237. r = x*(__ieee754_logf(x)-one);
  238. if(hx<0) r = nadj - r;
  239. return r;
  240. }