mpz.c 48 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687168816891690169116921693169416951696169716981699170017011702170317041705170617071708170917101711171217131714171517161717171817191720172117221723172417251726172717281729173017311732173317341735
  1. /*
  2. * This file is part of the MicroPython project, http://micropython.org/
  3. *
  4. * The MIT License (MIT)
  5. *
  6. * Copyright (c) 2013, 2014 Damien P. George
  7. *
  8. * Permission is hereby granted, free of charge, to any person obtaining a copy
  9. * of this software and associated documentation files (the "Software"), to deal
  10. * in the Software without restriction, including without limitation the rights
  11. * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  12. * copies of the Software, and to permit persons to whom the Software is
  13. * furnished to do so, subject to the following conditions:
  14. *
  15. * The above copyright notice and this permission notice shall be included in
  16. * all copies or substantial portions of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  21. * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  23. * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  24. * THE SOFTWARE.
  25. */
  26. #include <string.h>
  27. #include <assert.h>
  28. #include "py/mpz.h"
  29. #if MICROPY_LONGINT_IMPL == MICROPY_LONGINT_IMPL_MPZ
  30. #define DIG_SIZE (MPZ_DIG_SIZE)
  31. #define DIG_MASK ((MPZ_LONG_1 << DIG_SIZE) - 1)
  32. #define DIG_MSB (MPZ_LONG_1 << (DIG_SIZE - 1))
  33. #define DIG_BASE (MPZ_LONG_1 << DIG_SIZE)
  34. /*
  35. mpz is an arbitrary precision integer type with a public API.
  36. mpn functions act on non-negative integers represented by an array of generalised
  37. digits (eg a word per digit). You also need to specify separately the length of the
  38. array. There is no public API for mpn. Rather, the functions are used by mpz to
  39. implement its features.
  40. Integer values are stored little endian (first digit is first in memory).
  41. Definition of normalise: ?
  42. */
  43. STATIC size_t mpn_remove_trailing_zeros(mpz_dig_t *oidig, mpz_dig_t *idig) {
  44. for (--idig; idig >= oidig && *idig == 0; --idig) {
  45. }
  46. return idig + 1 - oidig;
  47. }
  48. /* compares i with j
  49. returns sign(i - j)
  50. assumes i, j are normalised
  51. */
  52. STATIC int mpn_cmp(const mpz_dig_t *idig, size_t ilen, const mpz_dig_t *jdig, size_t jlen) {
  53. if (ilen < jlen) { return -1; }
  54. if (ilen > jlen) { return 1; }
  55. for (idig += ilen, jdig += ilen; ilen > 0; --ilen) {
  56. mpz_dbl_dig_signed_t cmp = (mpz_dbl_dig_t)*(--idig) - (mpz_dbl_dig_t)*(--jdig);
  57. if (cmp < 0) { return -1; }
  58. if (cmp > 0) { return 1; }
  59. }
  60. return 0;
  61. }
  62. /* computes i = j << n
  63. returns number of digits in i
  64. assumes enough memory in i; assumes normalised j; assumes n > 0
  65. can have i, j pointing to same memory
  66. */
  67. STATIC size_t mpn_shl(mpz_dig_t *idig, mpz_dig_t *jdig, size_t jlen, mp_uint_t n) {
  68. mp_uint_t n_whole = (n + DIG_SIZE - 1) / DIG_SIZE;
  69. mp_uint_t n_part = n % DIG_SIZE;
  70. if (n_part == 0) {
  71. n_part = DIG_SIZE;
  72. }
  73. // start from the high end of the digit arrays
  74. idig += jlen + n_whole - 1;
  75. jdig += jlen - 1;
  76. // shift the digits
  77. mpz_dbl_dig_t d = 0;
  78. for (size_t i = jlen; i > 0; i--, idig--, jdig--) {
  79. d |= *jdig;
  80. *idig = (d >> (DIG_SIZE - n_part)) & DIG_MASK;
  81. d <<= DIG_SIZE;
  82. }
  83. // store remaining bits
  84. *idig = (d >> (DIG_SIZE - n_part)) & DIG_MASK;
  85. idig -= n_whole - 1;
  86. memset(idig, 0, (n_whole - 1) * sizeof(mpz_dig_t));
  87. // work out length of result
  88. jlen += n_whole;
  89. while (jlen != 0 && idig[jlen - 1] == 0) {
  90. jlen--;
  91. }
  92. // return length of result
  93. return jlen;
  94. }
  95. /* computes i = j >> n
  96. returns number of digits in i
  97. assumes enough memory in i; assumes normalised j; assumes n > 0
  98. can have i, j pointing to same memory
  99. */
  100. STATIC size_t mpn_shr(mpz_dig_t *idig, mpz_dig_t *jdig, size_t jlen, mp_uint_t n) {
  101. mp_uint_t n_whole = n / DIG_SIZE;
  102. mp_uint_t n_part = n % DIG_SIZE;
  103. if (n_whole >= jlen) {
  104. return 0;
  105. }
  106. jdig += n_whole;
  107. jlen -= n_whole;
  108. for (size_t i = jlen; i > 0; i--, idig++, jdig++) {
  109. mpz_dbl_dig_t d = *jdig;
  110. if (i > 1) {
  111. d |= (mpz_dbl_dig_t)jdig[1] << DIG_SIZE;
  112. }
  113. d >>= n_part;
  114. *idig = d & DIG_MASK;
  115. }
  116. if (idig[-1] == 0) {
  117. jlen--;
  118. }
  119. return jlen;
  120. }
  121. /* computes i = j + k
  122. returns number of digits in i
  123. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen
  124. can have i, j, k pointing to same memory
  125. */
  126. STATIC size_t mpn_add(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  127. mpz_dig_t *oidig = idig;
  128. mpz_dbl_dig_t carry = 0;
  129. jlen -= klen;
  130. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  131. carry += (mpz_dbl_dig_t)*jdig + (mpz_dbl_dig_t)*kdig;
  132. *idig = carry & DIG_MASK;
  133. carry >>= DIG_SIZE;
  134. }
  135. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  136. carry += *jdig;
  137. *idig = carry & DIG_MASK;
  138. carry >>= DIG_SIZE;
  139. }
  140. if (carry != 0) {
  141. *idig++ = carry;
  142. }
  143. return idig - oidig;
  144. }
  145. /* computes i = j - k
  146. returns number of digits in i
  147. assumes enough memory in i; assumes normalised j, k; assumes j >= k
  148. can have i, j, k pointing to same memory
  149. */
  150. STATIC size_t mpn_sub(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  151. mpz_dig_t *oidig = idig;
  152. mpz_dbl_dig_signed_t borrow = 0;
  153. jlen -= klen;
  154. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  155. borrow += (mpz_dbl_dig_t)*jdig - (mpz_dbl_dig_t)*kdig;
  156. *idig = borrow & DIG_MASK;
  157. borrow >>= DIG_SIZE;
  158. }
  159. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  160. borrow += *jdig;
  161. *idig = borrow & DIG_MASK;
  162. borrow >>= DIG_SIZE;
  163. }
  164. return mpn_remove_trailing_zeros(oidig, idig);
  165. }
  166. #if MICROPY_OPT_MPZ_BITWISE
  167. /* computes i = j & k
  168. returns number of digits in i
  169. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen (jlen argument not needed)
  170. can have i, j, k pointing to same memory
  171. */
  172. STATIC size_t mpn_and(mpz_dig_t *idig, const mpz_dig_t *jdig, const mpz_dig_t *kdig, size_t klen) {
  173. mpz_dig_t *oidig = idig;
  174. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  175. *idig = *jdig & *kdig;
  176. }
  177. return mpn_remove_trailing_zeros(oidig, idig);
  178. }
  179. #endif
  180. /* i = -((-j) & (-k)) = ~((~j + 1) & (~k + 1)) + 1
  181. i = (j & (-k)) = (j & (~k + 1)) = ( j & (~k + 1))
  182. i = ((-j) & k) = ((~j + 1) & k) = ((~j + 1) & k )
  183. computes general form:
  184. i = (im ^ (((j ^ jm) + jc) & ((k ^ km) + kc))) + ic where Xm = Xc == 0 ? 0 : DIG_MASK
  185. returns number of digits in i
  186. assumes enough memory in i; assumes normalised j, k; assumes length j >= length k
  187. can have i, j, k pointing to same memory
  188. */
  189. STATIC size_t mpn_and_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  190. mpz_dbl_dig_t carryi, mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  191. mpz_dig_t *oidig = idig;
  192. mpz_dig_t imask = (0 == carryi) ? 0 : DIG_MASK;
  193. mpz_dig_t jmask = (0 == carryj) ? 0 : DIG_MASK;
  194. mpz_dig_t kmask = (0 == carryk) ? 0 : DIG_MASK;
  195. for (; jlen > 0; ++idig, ++jdig) {
  196. carryj += *jdig ^ jmask;
  197. carryk += (--klen <= --jlen) ? (*kdig++ ^ kmask) : kmask;
  198. carryi += ((carryj & carryk) ^ imask) & DIG_MASK;
  199. *idig = carryi & DIG_MASK;
  200. carryk >>= DIG_SIZE;
  201. carryj >>= DIG_SIZE;
  202. carryi >>= DIG_SIZE;
  203. }
  204. if (0 != carryi) {
  205. *idig++ = carryi;
  206. }
  207. return mpn_remove_trailing_zeros(oidig, idig);
  208. }
  209. #if MICROPY_OPT_MPZ_BITWISE
  210. /* computes i = j | k
  211. returns number of digits in i
  212. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen
  213. can have i, j, k pointing to same memory
  214. */
  215. STATIC size_t mpn_or(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  216. mpz_dig_t *oidig = idig;
  217. jlen -= klen;
  218. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  219. *idig = *jdig | *kdig;
  220. }
  221. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  222. *idig = *jdig;
  223. }
  224. return idig - oidig;
  225. }
  226. #endif
  227. /* i = -((-j) | (-k)) = ~((~j + 1) | (~k + 1)) + 1
  228. i = -(j | (-k)) = -(j | (~k + 1)) = ~( j | (~k + 1)) + 1
  229. i = -((-j) | k) = -((~j + 1) | k) = ~((~j + 1) | k ) + 1
  230. computes general form:
  231. i = ~(((j ^ jm) + jc) | ((k ^ km) + kc)) + 1 where Xm = Xc == 0 ? 0 : DIG_MASK
  232. returns number of digits in i
  233. assumes enough memory in i; assumes normalised j, k; assumes length j >= length k
  234. can have i, j, k pointing to same memory
  235. */
  236. #if MICROPY_OPT_MPZ_BITWISE
  237. STATIC size_t mpn_or_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  238. mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  239. mpz_dig_t *oidig = idig;
  240. mpz_dbl_dig_t carryi = 1;
  241. mpz_dig_t jmask = (0 == carryj) ? 0 : DIG_MASK;
  242. mpz_dig_t kmask = (0 == carryk) ? 0 : DIG_MASK;
  243. for (; jlen > 0; ++idig, ++jdig) {
  244. carryj += *jdig ^ jmask;
  245. carryk += (--klen <= --jlen) ? (*kdig++ ^ kmask) : kmask;
  246. carryi += ((carryj | carryk) ^ DIG_MASK) & DIG_MASK;
  247. *idig = carryi & DIG_MASK;
  248. carryk >>= DIG_SIZE;
  249. carryj >>= DIG_SIZE;
  250. carryi >>= DIG_SIZE;
  251. }
  252. // At least one of j,k must be negative so the above for-loop runs at least
  253. // once. For carryi to be non-zero here it must be equal to 1 at the end of
  254. // each iteration of the loop. So the accumulation of carryi must overflow
  255. // each time, ie carryi += 0xff..ff. So carryj|carryk must be 0 in the
  256. // DIG_MASK bits on each iteration. But considering all cases of signs of
  257. // j,k one sees that this is not possible.
  258. assert(carryi == 0);
  259. return mpn_remove_trailing_zeros(oidig, idig);
  260. }
  261. #else
  262. STATIC size_t mpn_or_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  263. mpz_dbl_dig_t carryi, mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  264. mpz_dig_t *oidig = idig;
  265. mpz_dig_t imask = (0 == carryi) ? 0 : DIG_MASK;
  266. mpz_dig_t jmask = (0 == carryj) ? 0 : DIG_MASK;
  267. mpz_dig_t kmask = (0 == carryk) ? 0 : DIG_MASK;
  268. for (; jlen > 0; ++idig, ++jdig) {
  269. carryj += *jdig ^ jmask;
  270. carryk += (--klen <= --jlen) ? (*kdig++ ^ kmask) : kmask;
  271. carryi += ((carryj | carryk) ^ imask) & DIG_MASK;
  272. *idig = carryi & DIG_MASK;
  273. carryk >>= DIG_SIZE;
  274. carryj >>= DIG_SIZE;
  275. carryi >>= DIG_SIZE;
  276. }
  277. // See comment in above mpn_or_neg for why carryi must be 0.
  278. assert(carryi == 0);
  279. return mpn_remove_trailing_zeros(oidig, idig);
  280. }
  281. #endif
  282. #if MICROPY_OPT_MPZ_BITWISE
  283. /* computes i = j ^ k
  284. returns number of digits in i
  285. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen
  286. can have i, j, k pointing to same memory
  287. */
  288. STATIC size_t mpn_xor(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  289. mpz_dig_t *oidig = idig;
  290. jlen -= klen;
  291. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  292. *idig = *jdig ^ *kdig;
  293. }
  294. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  295. *idig = *jdig;
  296. }
  297. return mpn_remove_trailing_zeros(oidig, idig);
  298. }
  299. #endif
  300. /* i = (-j) ^ (-k) = ~(j - 1) ^ ~(k - 1) = (j - 1) ^ (k - 1)
  301. i = -(j ^ (-k)) = -(j ^ ~(k - 1)) = ~(j ^ ~(k - 1)) + 1 = (j ^ (k - 1)) + 1
  302. i = -((-j) ^ k) = -(~(j - 1) ^ k) = ~(~(j - 1) ^ k) + 1 = ((j - 1) ^ k) + 1
  303. computes general form:
  304. i = ((j - 1 + jc) ^ (k - 1 + kc)) + ic
  305. returns number of digits in i
  306. assumes enough memory in i; assumes normalised j, k; assumes length j >= length k
  307. can have i, j, k pointing to same memory
  308. */
  309. STATIC size_t mpn_xor_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  310. mpz_dbl_dig_t carryi, mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  311. mpz_dig_t *oidig = idig;
  312. for (; jlen > 0; ++idig, ++jdig) {
  313. carryj += *jdig + DIG_MASK;
  314. carryk += (--klen <= --jlen) ? (*kdig++ + DIG_MASK) : DIG_MASK;
  315. carryi += (carryj ^ carryk) & DIG_MASK;
  316. *idig = carryi & DIG_MASK;
  317. carryk >>= DIG_SIZE;
  318. carryj >>= DIG_SIZE;
  319. carryi >>= DIG_SIZE;
  320. }
  321. if (0 != carryi) {
  322. *idig++ = carryi;
  323. }
  324. return mpn_remove_trailing_zeros(oidig, idig);
  325. }
  326. /* computes i = i * d1 + d2
  327. returns number of digits in i
  328. assumes enough memory in i; assumes normalised i; assumes dmul != 0
  329. */
  330. STATIC size_t mpn_mul_dig_add_dig(mpz_dig_t *idig, size_t ilen, mpz_dig_t dmul, mpz_dig_t dadd) {
  331. mpz_dig_t *oidig = idig;
  332. mpz_dbl_dig_t carry = dadd;
  333. for (; ilen > 0; --ilen, ++idig) {
  334. carry += (mpz_dbl_dig_t)*idig * (mpz_dbl_dig_t)dmul; // will never overflow so long as DIG_SIZE <= 8*sizeof(mpz_dbl_dig_t)/2
  335. *idig = carry & DIG_MASK;
  336. carry >>= DIG_SIZE;
  337. }
  338. if (carry != 0) {
  339. *idig++ = carry;
  340. }
  341. return idig - oidig;
  342. }
  343. /* computes i = j * k
  344. returns number of digits in i
  345. assumes enough memory in i; assumes i is zeroed; assumes normalised j, k
  346. can have j, k point to same memory
  347. */
  348. STATIC size_t mpn_mul(mpz_dig_t *idig, mpz_dig_t *jdig, size_t jlen, mpz_dig_t *kdig, size_t klen) {
  349. mpz_dig_t *oidig = idig;
  350. size_t ilen = 0;
  351. for (; klen > 0; --klen, ++idig, ++kdig) {
  352. mpz_dig_t *id = idig;
  353. mpz_dbl_dig_t carry = 0;
  354. size_t jl = jlen;
  355. for (mpz_dig_t *jd = jdig; jl > 0; --jl, ++jd, ++id) {
  356. carry += (mpz_dbl_dig_t)*id + (mpz_dbl_dig_t)*jd * (mpz_dbl_dig_t)*kdig; // will never overflow so long as DIG_SIZE <= 8*sizeof(mpz_dbl_dig_t)/2
  357. *id = carry & DIG_MASK;
  358. carry >>= DIG_SIZE;
  359. }
  360. if (carry != 0) {
  361. *id++ = carry;
  362. }
  363. ilen = id - oidig;
  364. }
  365. return ilen;
  366. }
  367. /* natural_div - quo * den + new_num = old_num (ie num is replaced with rem)
  368. assumes den != 0
  369. assumes num_dig has enough memory to be extended by 1 digit
  370. assumes quo_dig has enough memory (as many digits as num)
  371. assumes quo_dig is filled with zeros
  372. */
  373. STATIC void mpn_div(mpz_dig_t *num_dig, size_t *num_len, const mpz_dig_t *den_dig, size_t den_len, mpz_dig_t *quo_dig, size_t *quo_len) {
  374. mpz_dig_t *orig_num_dig = num_dig;
  375. mpz_dig_t *orig_quo_dig = quo_dig;
  376. mpz_dig_t norm_shift = 0;
  377. mpz_dbl_dig_t lead_den_digit;
  378. // handle simple cases
  379. {
  380. int cmp = mpn_cmp(num_dig, *num_len, den_dig, den_len);
  381. if (cmp == 0) {
  382. *num_len = 0;
  383. quo_dig[0] = 1;
  384. *quo_len = 1;
  385. return;
  386. } else if (cmp < 0) {
  387. // numerator remains the same
  388. *quo_len = 0;
  389. return;
  390. }
  391. }
  392. // We need to normalise the denominator (leading bit of leading digit is 1)
  393. // so that the division routine works. Since the denominator memory is
  394. // read-only we do the normalisation on the fly, each time a digit of the
  395. // denominator is needed. We need to know is how many bits to shift by.
  396. // count number of leading zeros in leading digit of denominator
  397. {
  398. mpz_dig_t d = den_dig[den_len - 1];
  399. while ((d & DIG_MSB) == 0) {
  400. d <<= 1;
  401. ++norm_shift;
  402. }
  403. }
  404. // now need to shift numerator by same amount as denominator
  405. // first, increase length of numerator in case we need more room to shift
  406. num_dig[*num_len] = 0;
  407. ++(*num_len);
  408. for (mpz_dig_t *num = num_dig, carry = 0; num < num_dig + *num_len; ++num) {
  409. mpz_dig_t n = *num;
  410. *num = ((n << norm_shift) | carry) & DIG_MASK;
  411. carry = (mpz_dbl_dig_t)n >> (DIG_SIZE - norm_shift);
  412. }
  413. // cache the leading digit of the denominator
  414. lead_den_digit = (mpz_dbl_dig_t)den_dig[den_len - 1] << norm_shift;
  415. if (den_len >= 2) {
  416. lead_den_digit |= (mpz_dbl_dig_t)den_dig[den_len - 2] >> (DIG_SIZE - norm_shift);
  417. }
  418. // point num_dig to last digit in numerator
  419. num_dig += *num_len - 1;
  420. // calculate number of digits in quotient
  421. *quo_len = *num_len - den_len;
  422. // point to last digit to store for quotient
  423. quo_dig += *quo_len - 1;
  424. // keep going while we have enough digits to divide
  425. while (*num_len > den_len) {
  426. mpz_dbl_dig_t quo = ((mpz_dbl_dig_t)*num_dig << DIG_SIZE) | num_dig[-1];
  427. // get approximate quotient
  428. quo /= lead_den_digit;
  429. // Multiply quo by den and subtract from num to get remainder.
  430. // We have different code here to handle different compile-time
  431. // configurations of mpz:
  432. //
  433. // 1. DIG_SIZE is stricly less than half the number of bits
  434. // available in mpz_dbl_dig_t. In this case we can use a
  435. // slightly more optimal (in time and space) routine that
  436. // uses the extra bits in mpz_dbl_dig_signed_t to store a
  437. // sign bit.
  438. //
  439. // 2. DIG_SIZE is exactly half the number of bits available in
  440. // mpz_dbl_dig_t. In this (common) case we need to be careful
  441. // not to overflow the borrow variable. And the shifting of
  442. // borrow needs some special logic (it's a shift right with
  443. // round up).
  444. //
  445. const mpz_dig_t *d = den_dig;
  446. mpz_dbl_dig_t d_norm = 0;
  447. mpz_dbl_dig_t borrow = 0;
  448. for (mpz_dig_t *n = num_dig - den_len; n < num_dig; ++n, ++d) {
  449. d_norm = ((mpz_dbl_dig_t)*d << norm_shift) | (d_norm >> DIG_SIZE);
  450. mpz_dbl_dig_t x = (mpz_dbl_dig_t)quo * (d_norm & DIG_MASK);
  451. #if DIG_SIZE < MPZ_DBL_DIG_SIZE / 2
  452. borrow += (mpz_dbl_dig_t)*n - x; // will overflow if DIG_SIZE >= MPZ_DBL_DIG_SIZE/2
  453. *n = borrow & DIG_MASK;
  454. borrow = (mpz_dbl_dig_signed_t)borrow >> DIG_SIZE;
  455. #else // DIG_SIZE == MPZ_DBL_DIG_SIZE / 2
  456. if (x >= *n || *n - x <= borrow) {
  457. borrow += x - (mpz_dbl_dig_t)*n;
  458. *n = (-borrow) & DIG_MASK;
  459. borrow = (borrow >> DIG_SIZE) + ((borrow & DIG_MASK) == 0 ? 0 : 1); // shift-right with round-up
  460. } else {
  461. *n = ((mpz_dbl_dig_t)*n - x - borrow) & DIG_MASK;
  462. borrow = 0;
  463. }
  464. #endif
  465. }
  466. #if DIG_SIZE < MPZ_DBL_DIG_SIZE / 2
  467. // Borrow was negative in the above for-loop, make it positive for next if-block.
  468. borrow = -borrow;
  469. #endif
  470. // At this point we have either:
  471. //
  472. // 1. quo was the correct value and the most-sig-digit of num is exactly
  473. // cancelled by borrow (borrow == *num_dig). In this case there is
  474. // nothing more to do.
  475. //
  476. // 2. quo was too large, we subtracted too many den from num, and the
  477. // most-sig-digit of num is 1 less than borrow (borrow == *num_dig + 1).
  478. // In this case we must reduce quo and add back den to num until the
  479. // carry from this operation cancels out the borrow.
  480. //
  481. borrow -= *num_dig;
  482. for (; borrow != 0; --quo) {
  483. d = den_dig;
  484. d_norm = 0;
  485. mpz_dbl_dig_t carry = 0;
  486. for (mpz_dig_t *n = num_dig - den_len; n < num_dig; ++n, ++d) {
  487. d_norm = ((mpz_dbl_dig_t)*d << norm_shift) | (d_norm >> DIG_SIZE);
  488. carry += (mpz_dbl_dig_t)*n + (d_norm & DIG_MASK);
  489. *n = carry & DIG_MASK;
  490. carry >>= DIG_SIZE;
  491. }
  492. borrow -= carry;
  493. }
  494. // store this digit of the quotient
  495. *quo_dig = quo & DIG_MASK;
  496. --quo_dig;
  497. // move down to next digit of numerator
  498. --num_dig;
  499. --(*num_len);
  500. }
  501. // unnormalise numerator (remainder now)
  502. for (mpz_dig_t *num = orig_num_dig + *num_len - 1, carry = 0; num >= orig_num_dig; --num) {
  503. mpz_dig_t n = *num;
  504. *num = ((n >> norm_shift) | carry) & DIG_MASK;
  505. carry = (mpz_dbl_dig_t)n << (DIG_SIZE - norm_shift);
  506. }
  507. // strip trailing zeros
  508. while (*quo_len > 0 && orig_quo_dig[*quo_len - 1] == 0) {
  509. --(*quo_len);
  510. }
  511. while (*num_len > 0 && orig_num_dig[*num_len - 1] == 0) {
  512. --(*num_len);
  513. }
  514. }
  515. #define MIN_ALLOC (2)
  516. void mpz_init_zero(mpz_t *z) {
  517. z->neg = 0;
  518. z->fixed_dig = 0;
  519. z->alloc = 0;
  520. z->len = 0;
  521. z->dig = NULL;
  522. }
  523. void mpz_init_from_int(mpz_t *z, mp_int_t val) {
  524. mpz_init_zero(z);
  525. mpz_set_from_int(z, val);
  526. }
  527. void mpz_init_fixed_from_int(mpz_t *z, mpz_dig_t *dig, size_t alloc, mp_int_t val) {
  528. z->neg = 0;
  529. z->fixed_dig = 1;
  530. z->alloc = alloc;
  531. z->len = 0;
  532. z->dig = dig;
  533. mpz_set_from_int(z, val);
  534. }
  535. void mpz_deinit(mpz_t *z) {
  536. if (z != NULL && !z->fixed_dig) {
  537. m_del(mpz_dig_t, z->dig, z->alloc);
  538. }
  539. }
  540. #if 0
  541. these functions are unused
  542. mpz_t *mpz_zero(void) {
  543. mpz_t *z = m_new_obj(mpz_t);
  544. mpz_init_zero(z);
  545. return z;
  546. }
  547. mpz_t *mpz_from_int(mp_int_t val) {
  548. mpz_t *z = mpz_zero();
  549. mpz_set_from_int(z, val);
  550. return z;
  551. }
  552. mpz_t *mpz_from_ll(long long val, bool is_signed) {
  553. mpz_t *z = mpz_zero();
  554. mpz_set_from_ll(z, val, is_signed);
  555. return z;
  556. }
  557. #if MICROPY_PY_BUILTINS_FLOAT
  558. mpz_t *mpz_from_float(mp_float_t val) {
  559. mpz_t *z = mpz_zero();
  560. mpz_set_from_float(z, val);
  561. return z;
  562. }
  563. #endif
  564. mpz_t *mpz_from_str(const char *str, size_t len, bool neg, unsigned int base) {
  565. mpz_t *z = mpz_zero();
  566. mpz_set_from_str(z, str, len, neg, base);
  567. return z;
  568. }
  569. #endif
  570. STATIC void mpz_free(mpz_t *z) {
  571. if (z != NULL) {
  572. m_del(mpz_dig_t, z->dig, z->alloc);
  573. m_del_obj(mpz_t, z);
  574. }
  575. }
  576. STATIC void mpz_need_dig(mpz_t *z, size_t need) {
  577. if (need < MIN_ALLOC) {
  578. need = MIN_ALLOC;
  579. }
  580. if (z->dig == NULL || z->alloc < need) {
  581. // if z has fixed digit buffer there's not much we can do as the caller will
  582. // be expecting a buffer with at least "need" bytes (but it shouldn't happen)
  583. assert(!z->fixed_dig);
  584. z->dig = m_renew(mpz_dig_t, z->dig, z->alloc, need);
  585. z->alloc = need;
  586. }
  587. }
  588. STATIC mpz_t *mpz_clone(const mpz_t *src) {
  589. assert(src->alloc != 0);
  590. mpz_t *z = m_new_obj(mpz_t);
  591. z->neg = src->neg;
  592. z->fixed_dig = 0;
  593. z->alloc = src->alloc;
  594. z->len = src->len;
  595. z->dig = m_new(mpz_dig_t, z->alloc);
  596. memcpy(z->dig, src->dig, src->alloc * sizeof(mpz_dig_t));
  597. return z;
  598. }
  599. /* sets dest = src
  600. can have dest, src the same
  601. */
  602. void mpz_set(mpz_t *dest, const mpz_t *src) {
  603. mpz_need_dig(dest, src->len);
  604. dest->neg = src->neg;
  605. dest->len = src->len;
  606. memcpy(dest->dig, src->dig, src->len * sizeof(mpz_dig_t));
  607. }
  608. void mpz_set_from_int(mpz_t *z, mp_int_t val) {
  609. if (val == 0) {
  610. z->len = 0;
  611. return;
  612. }
  613. mpz_need_dig(z, MPZ_NUM_DIG_FOR_INT);
  614. mp_uint_t uval;
  615. if (val < 0) {
  616. z->neg = 1;
  617. uval = -val;
  618. } else {
  619. z->neg = 0;
  620. uval = val;
  621. }
  622. z->len = 0;
  623. while (uval > 0) {
  624. z->dig[z->len++] = uval & DIG_MASK;
  625. uval >>= DIG_SIZE;
  626. }
  627. }
  628. void mpz_set_from_ll(mpz_t *z, long long val, bool is_signed) {
  629. mpz_need_dig(z, MPZ_NUM_DIG_FOR_LL);
  630. unsigned long long uval;
  631. if (is_signed && val < 0) {
  632. z->neg = 1;
  633. uval = -val;
  634. } else {
  635. z->neg = 0;
  636. uval = val;
  637. }
  638. z->len = 0;
  639. while (uval > 0) {
  640. z->dig[z->len++] = uval & DIG_MASK;
  641. uval >>= DIG_SIZE;
  642. }
  643. }
  644. #if MICROPY_PY_BUILTINS_FLOAT
  645. void mpz_set_from_float(mpz_t *z, mp_float_t src) {
  646. #if MICROPY_FLOAT_IMPL == MICROPY_FLOAT_IMPL_DOUBLE
  647. typedef uint64_t mp_float_int_t;
  648. #elif MICROPY_FLOAT_IMPL == MICROPY_FLOAT_IMPL_FLOAT
  649. typedef uint32_t mp_float_int_t;
  650. #endif
  651. union {
  652. mp_float_t f;
  653. #if MP_ENDIANNESS_LITTLE
  654. struct { mp_float_int_t frc:MP_FLOAT_FRAC_BITS, exp:MP_FLOAT_EXP_BITS, sgn:1; } p;
  655. #else
  656. struct { mp_float_int_t sgn:1, exp:MP_FLOAT_EXP_BITS, frc:MP_FLOAT_FRAC_BITS; } p;
  657. #endif
  658. } u = {src};
  659. z->neg = u.p.sgn;
  660. if (u.p.exp == 0) {
  661. // value == 0 || value < 1
  662. mpz_set_from_int(z, 0);
  663. } else if (u.p.exp == ((1 << MP_FLOAT_EXP_BITS) - 1)) {
  664. // u.p.frc == 0 indicates inf, else NaN
  665. // should be handled by caller
  666. mpz_set_from_int(z, 0);
  667. } else {
  668. const int adj_exp = (int)u.p.exp - MP_FLOAT_EXP_BIAS;
  669. if (adj_exp < 0) {
  670. // value < 1 , truncates to 0
  671. mpz_set_from_int(z, 0);
  672. } else if (adj_exp == 0) {
  673. // 1 <= value < 2 , so truncates to 1
  674. mpz_set_from_int(z, 1);
  675. } else {
  676. // 2 <= value
  677. const int dig_cnt = (adj_exp + 1 + (DIG_SIZE - 1)) / DIG_SIZE;
  678. const unsigned int rem = adj_exp % DIG_SIZE;
  679. int dig_ind, shft;
  680. mp_float_int_t frc = u.p.frc | ((mp_float_int_t)1 << MP_FLOAT_FRAC_BITS);
  681. if (adj_exp < MP_FLOAT_FRAC_BITS) {
  682. shft = 0;
  683. dig_ind = 0;
  684. frc >>= MP_FLOAT_FRAC_BITS - adj_exp;
  685. } else {
  686. shft = (rem - MP_FLOAT_FRAC_BITS) % DIG_SIZE;
  687. dig_ind = (adj_exp - MP_FLOAT_FRAC_BITS) / DIG_SIZE;
  688. }
  689. mpz_need_dig(z, dig_cnt);
  690. z->len = dig_cnt;
  691. if (dig_ind != 0) {
  692. memset(z->dig, 0, dig_ind * sizeof(mpz_dig_t));
  693. }
  694. if (shft != 0) {
  695. z->dig[dig_ind++] = (frc << shft) & DIG_MASK;
  696. frc >>= DIG_SIZE - shft;
  697. }
  698. #if DIG_SIZE < (MP_FLOAT_FRAC_BITS + 1)
  699. while (dig_ind != dig_cnt) {
  700. z->dig[dig_ind++] = frc & DIG_MASK;
  701. frc >>= DIG_SIZE;
  702. }
  703. #else
  704. if (dig_ind != dig_cnt) {
  705. z->dig[dig_ind] = frc;
  706. }
  707. #endif
  708. }
  709. }
  710. }
  711. #endif
  712. // returns number of bytes from str that were processed
  713. size_t mpz_set_from_str(mpz_t *z, const char *str, size_t len, bool neg, unsigned int base) {
  714. assert(base <= 36);
  715. const char *cur = str;
  716. const char *top = str + len;
  717. mpz_need_dig(z, len * 8 / DIG_SIZE + 1);
  718. if (neg) {
  719. z->neg = 1;
  720. } else {
  721. z->neg = 0;
  722. }
  723. z->len = 0;
  724. for (; cur < top; ++cur) { // XXX UTF8 next char
  725. //mp_uint_t v = char_to_numeric(cur#); // XXX UTF8 get char
  726. mp_uint_t v = *cur;
  727. if ('0' <= v && v <= '9') {
  728. v -= '0';
  729. } else if ('A' <= v && v <= 'Z') {
  730. v -= 'A' - 10;
  731. } else if ('a' <= v && v <= 'z') {
  732. v -= 'a' - 10;
  733. } else {
  734. break;
  735. }
  736. if (v >= base) {
  737. break;
  738. }
  739. z->len = mpn_mul_dig_add_dig(z->dig, z->len, base, v);
  740. }
  741. return cur - str;
  742. }
  743. void mpz_set_from_bytes(mpz_t *z, bool big_endian, size_t len, const byte *buf) {
  744. int delta = 1;
  745. if (big_endian) {
  746. buf += len - 1;
  747. delta = -1;
  748. }
  749. mpz_need_dig(z, (len * 8 + DIG_SIZE - 1) / DIG_SIZE);
  750. mpz_dig_t d = 0;
  751. int num_bits = 0;
  752. z->neg = 0;
  753. z->len = 0;
  754. while (len) {
  755. while (len && num_bits < DIG_SIZE) {
  756. d |= *buf << num_bits;
  757. num_bits += 8;
  758. buf += delta;
  759. len--;
  760. }
  761. z->dig[z->len++] = d & DIG_MASK;
  762. // Need this #if because it's C undefined behavior to do: uint32_t >> 32
  763. #if DIG_SIZE != 8 && DIG_SIZE != 16 && DIG_SIZE != 32
  764. d >>= DIG_SIZE;
  765. #else
  766. d = 0;
  767. #endif
  768. num_bits -= DIG_SIZE;
  769. }
  770. z->len = mpn_remove_trailing_zeros(z->dig, z->dig + z->len);
  771. }
  772. #if 0
  773. these functions are unused
  774. bool mpz_is_pos(const mpz_t *z) {
  775. return z->len > 0 && z->neg == 0;
  776. }
  777. bool mpz_is_odd(const mpz_t *z) {
  778. return z->len > 0 && (z->dig[0] & 1) != 0;
  779. }
  780. bool mpz_is_even(const mpz_t *z) {
  781. return z->len == 0 || (z->dig[0] & 1) == 0;
  782. }
  783. #endif
  784. int mpz_cmp(const mpz_t *z1, const mpz_t *z2) {
  785. // to catch comparison of -0 with +0
  786. if (z1->len == 0 && z2->len == 0) {
  787. return 0;
  788. }
  789. int cmp = (int)z2->neg - (int)z1->neg;
  790. if (cmp != 0) {
  791. return cmp;
  792. }
  793. cmp = mpn_cmp(z1->dig, z1->len, z2->dig, z2->len);
  794. if (z1->neg != 0) {
  795. cmp = -cmp;
  796. }
  797. return cmp;
  798. }
  799. #if 0
  800. // obsolete
  801. // compares mpz with an integer that fits within DIG_SIZE bits
  802. mp_int_t mpz_cmp_sml_int(const mpz_t *z, mp_int_t sml_int) {
  803. mp_int_t cmp;
  804. if (z->neg == 0) {
  805. if (sml_int < 0) return 1;
  806. if (sml_int == 0) {
  807. if (z->len == 0) return 0;
  808. return 1;
  809. }
  810. if (z->len == 0) return -1;
  811. assert(sml_int < (1 << DIG_SIZE));
  812. if (z->len != 1) return 1;
  813. cmp = z->dig[0] - sml_int;
  814. } else {
  815. if (sml_int > 0) return -1;
  816. if (sml_int == 0) {
  817. if (z->len == 0) return 0;
  818. return -1;
  819. }
  820. if (z->len == 0) return 1;
  821. assert(sml_int > -(1 << DIG_SIZE));
  822. if (z->len != 1) return -1;
  823. cmp = -z->dig[0] - sml_int;
  824. }
  825. if (cmp < 0) return -1;
  826. if (cmp > 0) return 1;
  827. return 0;
  828. }
  829. #endif
  830. #if 0
  831. these functions are unused
  832. /* returns abs(z)
  833. */
  834. mpz_t *mpz_abs(const mpz_t *z) {
  835. // TODO: handle case of z->alloc=0
  836. mpz_t *z2 = mpz_clone(z);
  837. z2->neg = 0;
  838. return z2;
  839. }
  840. /* returns -z
  841. */
  842. mpz_t *mpz_neg(const mpz_t *z) {
  843. // TODO: handle case of z->alloc=0
  844. mpz_t *z2 = mpz_clone(z);
  845. z2->neg = 1 - z2->neg;
  846. return z2;
  847. }
  848. /* returns lhs + rhs
  849. can have lhs, rhs the same
  850. */
  851. mpz_t *mpz_add(const mpz_t *lhs, const mpz_t *rhs) {
  852. mpz_t *z = mpz_zero();
  853. mpz_add_inpl(z, lhs, rhs);
  854. return z;
  855. }
  856. /* returns lhs - rhs
  857. can have lhs, rhs the same
  858. */
  859. mpz_t *mpz_sub(const mpz_t *lhs, const mpz_t *rhs) {
  860. mpz_t *z = mpz_zero();
  861. mpz_sub_inpl(z, lhs, rhs);
  862. return z;
  863. }
  864. /* returns lhs * rhs
  865. can have lhs, rhs the same
  866. */
  867. mpz_t *mpz_mul(const mpz_t *lhs, const mpz_t *rhs) {
  868. mpz_t *z = mpz_zero();
  869. mpz_mul_inpl(z, lhs, rhs);
  870. return z;
  871. }
  872. /* returns lhs ** rhs
  873. can have lhs, rhs the same
  874. */
  875. mpz_t *mpz_pow(const mpz_t *lhs, const mpz_t *rhs) {
  876. mpz_t *z = mpz_zero();
  877. mpz_pow_inpl(z, lhs, rhs);
  878. return z;
  879. }
  880. /* computes new integers in quo and rem such that:
  881. quo * rhs + rem = lhs
  882. 0 <= rem < rhs
  883. can have lhs, rhs the same
  884. */
  885. void mpz_divmod(const mpz_t *lhs, const mpz_t *rhs, mpz_t **quo, mpz_t **rem) {
  886. *quo = mpz_zero();
  887. *rem = mpz_zero();
  888. mpz_divmod_inpl(*quo, *rem, lhs, rhs);
  889. }
  890. #endif
  891. /* computes dest = abs(z)
  892. can have dest, z the same
  893. */
  894. void mpz_abs_inpl(mpz_t *dest, const mpz_t *z) {
  895. if (dest != z) {
  896. mpz_set(dest, z);
  897. }
  898. dest->neg = 0;
  899. }
  900. /* computes dest = -z
  901. can have dest, z the same
  902. */
  903. void mpz_neg_inpl(mpz_t *dest, const mpz_t *z) {
  904. if (dest != z) {
  905. mpz_set(dest, z);
  906. }
  907. dest->neg = 1 - dest->neg;
  908. }
  909. /* computes dest = ~z (= -z - 1)
  910. can have dest, z the same
  911. */
  912. void mpz_not_inpl(mpz_t *dest, const mpz_t *z) {
  913. if (dest != z) {
  914. mpz_set(dest, z);
  915. }
  916. if (dest->len == 0) {
  917. mpz_need_dig(dest, 1);
  918. dest->dig[0] = 1;
  919. dest->len = 1;
  920. dest->neg = 1;
  921. } else if (dest->neg) {
  922. dest->neg = 0;
  923. mpz_dig_t k = 1;
  924. dest->len = mpn_sub(dest->dig, dest->dig, dest->len, &k, 1);
  925. } else {
  926. mpz_need_dig(dest, dest->len + 1);
  927. mpz_dig_t k = 1;
  928. dest->len = mpn_add(dest->dig, dest->dig, dest->len, &k, 1);
  929. dest->neg = 1;
  930. }
  931. }
  932. /* computes dest = lhs << rhs
  933. can have dest, lhs the same
  934. */
  935. void mpz_shl_inpl(mpz_t *dest, const mpz_t *lhs, mp_uint_t rhs) {
  936. if (lhs->len == 0 || rhs == 0) {
  937. mpz_set(dest, lhs);
  938. } else {
  939. mpz_need_dig(dest, lhs->len + (rhs + DIG_SIZE - 1) / DIG_SIZE);
  940. dest->len = mpn_shl(dest->dig, lhs->dig, lhs->len, rhs);
  941. dest->neg = lhs->neg;
  942. }
  943. }
  944. /* computes dest = lhs >> rhs
  945. can have dest, lhs the same
  946. */
  947. void mpz_shr_inpl(mpz_t *dest, const mpz_t *lhs, mp_uint_t rhs) {
  948. if (lhs->len == 0 || rhs == 0) {
  949. mpz_set(dest, lhs);
  950. } else {
  951. mpz_need_dig(dest, lhs->len);
  952. dest->len = mpn_shr(dest->dig, lhs->dig, lhs->len, rhs);
  953. dest->neg = lhs->neg;
  954. if (dest->neg) {
  955. // arithmetic shift right, rounding to negative infinity
  956. mp_uint_t n_whole = rhs / DIG_SIZE;
  957. mp_uint_t n_part = rhs % DIG_SIZE;
  958. mpz_dig_t round_up = 0;
  959. for (size_t i = 0; i < lhs->len && i < n_whole; i++) {
  960. if (lhs->dig[i] != 0) {
  961. round_up = 1;
  962. break;
  963. }
  964. }
  965. if (n_whole < lhs->len && (lhs->dig[n_whole] & ((1 << n_part) - 1)) != 0) {
  966. round_up = 1;
  967. }
  968. if (round_up) {
  969. if (dest->len == 0) {
  970. // dest == 0, so need to add 1 by hand (answer will be -1)
  971. dest->dig[0] = 1;
  972. dest->len = 1;
  973. } else {
  974. // dest > 0, so can use mpn_add to add 1
  975. dest->len = mpn_add(dest->dig, dest->dig, dest->len, &round_up, 1);
  976. }
  977. }
  978. }
  979. }
  980. }
  981. /* computes dest = lhs + rhs
  982. can have dest, lhs, rhs the same
  983. */
  984. void mpz_add_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  985. if (mpn_cmp(lhs->dig, lhs->len, rhs->dig, rhs->len) < 0) {
  986. const mpz_t *temp = lhs;
  987. lhs = rhs;
  988. rhs = temp;
  989. }
  990. if (lhs->neg == rhs->neg) {
  991. mpz_need_dig(dest, lhs->len + 1);
  992. dest->len = mpn_add(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  993. } else {
  994. mpz_need_dig(dest, lhs->len);
  995. dest->len = mpn_sub(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  996. }
  997. dest->neg = lhs->neg;
  998. }
  999. /* computes dest = lhs - rhs
  1000. can have dest, lhs, rhs the same
  1001. */
  1002. void mpz_sub_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1003. bool neg = false;
  1004. if (mpn_cmp(lhs->dig, lhs->len, rhs->dig, rhs->len) < 0) {
  1005. const mpz_t *temp = lhs;
  1006. lhs = rhs;
  1007. rhs = temp;
  1008. neg = true;
  1009. }
  1010. if (lhs->neg != rhs->neg) {
  1011. mpz_need_dig(dest, lhs->len + 1);
  1012. dest->len = mpn_add(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1013. } else {
  1014. mpz_need_dig(dest, lhs->len);
  1015. dest->len = mpn_sub(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1016. }
  1017. if (neg) {
  1018. dest->neg = 1 - lhs->neg;
  1019. } else {
  1020. dest->neg = lhs->neg;
  1021. }
  1022. }
  1023. /* computes dest = lhs & rhs
  1024. can have dest, lhs, rhs the same
  1025. */
  1026. void mpz_and_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1027. // make sure lhs has the most digits
  1028. if (lhs->len < rhs->len) {
  1029. const mpz_t *temp = lhs;
  1030. lhs = rhs;
  1031. rhs = temp;
  1032. }
  1033. #if MICROPY_OPT_MPZ_BITWISE
  1034. if ((0 == lhs->neg) && (0 == rhs->neg)) {
  1035. mpz_need_dig(dest, lhs->len);
  1036. dest->len = mpn_and(dest->dig, lhs->dig, rhs->dig, rhs->len);
  1037. dest->neg = 0;
  1038. } else {
  1039. mpz_need_dig(dest, lhs->len + 1);
  1040. dest->len = mpn_and_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1041. lhs->neg == rhs->neg, 0 != lhs->neg, 0 != rhs->neg);
  1042. dest->neg = lhs->neg & rhs->neg;
  1043. }
  1044. #else
  1045. mpz_need_dig(dest, lhs->len + (lhs->neg || rhs->neg));
  1046. dest->len = mpn_and_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1047. (lhs->neg == rhs->neg) ? lhs->neg : 0, lhs->neg, rhs->neg);
  1048. dest->neg = lhs->neg & rhs->neg;
  1049. #endif
  1050. }
  1051. /* computes dest = lhs | rhs
  1052. can have dest, lhs, rhs the same
  1053. */
  1054. void mpz_or_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1055. // make sure lhs has the most digits
  1056. if (lhs->len < rhs->len) {
  1057. const mpz_t *temp = lhs;
  1058. lhs = rhs;
  1059. rhs = temp;
  1060. }
  1061. #if MICROPY_OPT_MPZ_BITWISE
  1062. if ((0 == lhs->neg) && (0 == rhs->neg)) {
  1063. mpz_need_dig(dest, lhs->len);
  1064. dest->len = mpn_or(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1065. dest->neg = 0;
  1066. } else {
  1067. mpz_need_dig(dest, lhs->len + 1);
  1068. dest->len = mpn_or_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1069. 0 != lhs->neg, 0 != rhs->neg);
  1070. dest->neg = 1;
  1071. }
  1072. #else
  1073. mpz_need_dig(dest, lhs->len + (lhs->neg || rhs->neg));
  1074. dest->len = mpn_or_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1075. (lhs->neg || rhs->neg), lhs->neg, rhs->neg);
  1076. dest->neg = lhs->neg | rhs->neg;
  1077. #endif
  1078. }
  1079. /* computes dest = lhs ^ rhs
  1080. can have dest, lhs, rhs the same
  1081. */
  1082. void mpz_xor_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1083. // make sure lhs has the most digits
  1084. if (lhs->len < rhs->len) {
  1085. const mpz_t *temp = lhs;
  1086. lhs = rhs;
  1087. rhs = temp;
  1088. }
  1089. #if MICROPY_OPT_MPZ_BITWISE
  1090. if (lhs->neg == rhs->neg) {
  1091. mpz_need_dig(dest, lhs->len);
  1092. if (lhs->neg == 0) {
  1093. dest->len = mpn_xor(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1094. } else {
  1095. dest->len = mpn_xor_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len, 0, 0, 0);
  1096. }
  1097. dest->neg = 0;
  1098. } else {
  1099. mpz_need_dig(dest, lhs->len + 1);
  1100. dest->len = mpn_xor_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len, 1,
  1101. 0 == lhs->neg, 0 == rhs->neg);
  1102. dest->neg = 1;
  1103. }
  1104. #else
  1105. mpz_need_dig(dest, lhs->len + (lhs->neg || rhs->neg));
  1106. dest->len = mpn_xor_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1107. (lhs->neg != rhs->neg), 0 == lhs->neg, 0 == rhs->neg);
  1108. dest->neg = lhs->neg ^ rhs->neg;
  1109. #endif
  1110. }
  1111. /* computes dest = lhs * rhs
  1112. can have dest, lhs, rhs the same
  1113. */
  1114. void mpz_mul_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1115. if (lhs->len == 0 || rhs->len == 0) {
  1116. mpz_set_from_int(dest, 0);
  1117. return;
  1118. }
  1119. mpz_t *temp = NULL;
  1120. if (lhs == dest) {
  1121. lhs = temp = mpz_clone(lhs);
  1122. if (rhs == dest) {
  1123. rhs = lhs;
  1124. }
  1125. } else if (rhs == dest) {
  1126. rhs = temp = mpz_clone(rhs);
  1127. }
  1128. mpz_need_dig(dest, lhs->len + rhs->len); // min mem l+r-1, max mem l+r
  1129. memset(dest->dig, 0, dest->alloc * sizeof(mpz_dig_t));
  1130. dest->len = mpn_mul(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1131. if (lhs->neg == rhs->neg) {
  1132. dest->neg = 0;
  1133. } else {
  1134. dest->neg = 1;
  1135. }
  1136. mpz_free(temp);
  1137. }
  1138. /* computes dest = lhs ** rhs
  1139. can have dest, lhs, rhs the same
  1140. */
  1141. void mpz_pow_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1142. if (lhs->len == 0 || rhs->neg != 0) {
  1143. mpz_set_from_int(dest, 0);
  1144. return;
  1145. }
  1146. if (rhs->len == 0) {
  1147. mpz_set_from_int(dest, 1);
  1148. return;
  1149. }
  1150. mpz_t *x = mpz_clone(lhs);
  1151. mpz_t *n = mpz_clone(rhs);
  1152. mpz_set_from_int(dest, 1);
  1153. while (n->len > 0) {
  1154. if ((n->dig[0] & 1) != 0) {
  1155. mpz_mul_inpl(dest, dest, x);
  1156. }
  1157. n->len = mpn_shr(n->dig, n->dig, n->len, 1);
  1158. if (n->len == 0) {
  1159. break;
  1160. }
  1161. mpz_mul_inpl(x, x, x);
  1162. }
  1163. mpz_free(x);
  1164. mpz_free(n);
  1165. }
  1166. /* computes dest = (lhs ** rhs) % mod
  1167. can have dest, lhs, rhs the same; mod can't be the same as dest
  1168. */
  1169. void mpz_pow3_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs, const mpz_t *mod) {
  1170. if (lhs->len == 0 || rhs->neg != 0 || (mod->len == 1 && mod->dig[0] == 1)) {
  1171. mpz_set_from_int(dest, 0);
  1172. return;
  1173. }
  1174. mpz_set_from_int(dest, 1);
  1175. if (rhs->len == 0) {
  1176. return;
  1177. }
  1178. mpz_t *x = mpz_clone(lhs);
  1179. mpz_t *n = mpz_clone(rhs);
  1180. mpz_t quo; mpz_init_zero(&quo);
  1181. while (n->len > 0) {
  1182. if ((n->dig[0] & 1) != 0) {
  1183. mpz_mul_inpl(dest, dest, x);
  1184. mpz_divmod_inpl(&quo, dest, dest, mod);
  1185. }
  1186. n->len = mpn_shr(n->dig, n->dig, n->len, 1);
  1187. if (n->len == 0) {
  1188. break;
  1189. }
  1190. mpz_mul_inpl(x, x, x);
  1191. mpz_divmod_inpl(&quo, x, x, mod);
  1192. }
  1193. mpz_deinit(&quo);
  1194. mpz_free(x);
  1195. mpz_free(n);
  1196. }
  1197. #if 0
  1198. these functions are unused
  1199. /* computes gcd(z1, z2)
  1200. based on Knuth's modified gcd algorithm (I think?)
  1201. gcd(z1, z2) >= 0
  1202. gcd(0, 0) = 0
  1203. gcd(z, 0) = abs(z)
  1204. */
  1205. mpz_t *mpz_gcd(const mpz_t *z1, const mpz_t *z2) {
  1206. if (z1->len == 0) {
  1207. // TODO: handle case of z2->alloc=0
  1208. mpz_t *a = mpz_clone(z2);
  1209. a->neg = 0;
  1210. return a;
  1211. } else if (z2->len == 0) {
  1212. mpz_t *a = mpz_clone(z1);
  1213. a->neg = 0;
  1214. return a;
  1215. }
  1216. mpz_t *a = mpz_clone(z1);
  1217. mpz_t *b = mpz_clone(z2);
  1218. mpz_t c; mpz_init_zero(&c);
  1219. a->neg = 0;
  1220. b->neg = 0;
  1221. for (;;) {
  1222. if (mpz_cmp(a, b) < 0) {
  1223. if (a->len == 0) {
  1224. mpz_free(a);
  1225. mpz_deinit(&c);
  1226. return b;
  1227. }
  1228. mpz_t *t = a; a = b; b = t;
  1229. }
  1230. if (!(b->len >= 2 || (b->len == 1 && b->dig[0] > 1))) { // compute b > 0; could be mpz_cmp_small_int(b, 1) > 0
  1231. break;
  1232. }
  1233. mpz_set(&c, b);
  1234. do {
  1235. mpz_add_inpl(&c, &c, &c);
  1236. } while (mpz_cmp(&c, a) <= 0);
  1237. c.len = mpn_shr(c.dig, c.dig, c.len, 1);
  1238. mpz_sub_inpl(a, a, &c);
  1239. }
  1240. mpz_deinit(&c);
  1241. if (b->len == 1 && b->dig[0] == 1) { // compute b == 1; could be mpz_cmp_small_int(b, 1) == 0
  1242. mpz_free(a);
  1243. return b;
  1244. } else {
  1245. mpz_free(b);
  1246. return a;
  1247. }
  1248. }
  1249. /* computes lcm(z1, z2)
  1250. = abs(z1) / gcd(z1, z2) * abs(z2)
  1251. lcm(z1, z1) >= 0
  1252. lcm(0, 0) = 0
  1253. lcm(z, 0) = 0
  1254. */
  1255. mpz_t *mpz_lcm(const mpz_t *z1, const mpz_t *z2) {
  1256. if (z1->len == 0 || z2->len == 0) {
  1257. return mpz_zero();
  1258. }
  1259. mpz_t *gcd = mpz_gcd(z1, z2);
  1260. mpz_t *quo = mpz_zero();
  1261. mpz_t *rem = mpz_zero();
  1262. mpz_divmod_inpl(quo, rem, z1, gcd);
  1263. mpz_mul_inpl(rem, quo, z2);
  1264. mpz_free(gcd);
  1265. mpz_free(quo);
  1266. rem->neg = 0;
  1267. return rem;
  1268. }
  1269. #endif
  1270. /* computes new integers in quo and rem such that:
  1271. quo * rhs + rem = lhs
  1272. 0 <= rem < rhs
  1273. can have lhs, rhs the same
  1274. assumes rhs != 0 (undefined behaviour if it is)
  1275. */
  1276. void mpz_divmod_inpl(mpz_t *dest_quo, mpz_t *dest_rem, const mpz_t *lhs, const mpz_t *rhs) {
  1277. assert(!mpz_is_zero(rhs));
  1278. mpz_need_dig(dest_quo, lhs->len + 1); // +1 necessary?
  1279. memset(dest_quo->dig, 0, (lhs->len + 1) * sizeof(mpz_dig_t));
  1280. dest_quo->len = 0;
  1281. mpz_need_dig(dest_rem, lhs->len + 1); // +1 necessary?
  1282. mpz_set(dest_rem, lhs);
  1283. mpn_div(dest_rem->dig, &dest_rem->len, rhs->dig, rhs->len, dest_quo->dig, &dest_quo->len);
  1284. // check signs and do Python style modulo
  1285. if (lhs->neg != rhs->neg) {
  1286. dest_quo->neg = 1;
  1287. if (!mpz_is_zero(dest_rem)) {
  1288. mpz_t mpzone; mpz_init_from_int(&mpzone, -1);
  1289. mpz_add_inpl(dest_quo, dest_quo, &mpzone);
  1290. mpz_add_inpl(dest_rem, dest_rem, rhs);
  1291. }
  1292. }
  1293. }
  1294. #if 0
  1295. these functions are unused
  1296. /* computes floor(lhs / rhs)
  1297. can have lhs, rhs the same
  1298. */
  1299. mpz_t *mpz_div(const mpz_t *lhs, const mpz_t *rhs) {
  1300. mpz_t *quo = mpz_zero();
  1301. mpz_t rem; mpz_init_zero(&rem);
  1302. mpz_divmod_inpl(quo, &rem, lhs, rhs);
  1303. mpz_deinit(&rem);
  1304. return quo;
  1305. }
  1306. /* computes lhs % rhs ( >= 0)
  1307. can have lhs, rhs the same
  1308. */
  1309. mpz_t *mpz_mod(const mpz_t *lhs, const mpz_t *rhs) {
  1310. mpz_t quo; mpz_init_zero(&quo);
  1311. mpz_t *rem = mpz_zero();
  1312. mpz_divmod_inpl(&quo, rem, lhs, rhs);
  1313. mpz_deinit(&quo);
  1314. return rem;
  1315. }
  1316. #endif
  1317. // must return actual int value if it fits in mp_int_t
  1318. mp_int_t mpz_hash(const mpz_t *z) {
  1319. mp_uint_t val = 0;
  1320. mpz_dig_t *d = z->dig + z->len;
  1321. while (d-- > z->dig) {
  1322. val = (val << DIG_SIZE) | *d;
  1323. }
  1324. if (z->neg != 0) {
  1325. val = -val;
  1326. }
  1327. return val;
  1328. }
  1329. bool mpz_as_int_checked(const mpz_t *i, mp_int_t *value) {
  1330. mp_uint_t val = 0;
  1331. mpz_dig_t *d = i->dig + i->len;
  1332. while (d-- > i->dig) {
  1333. if (val > (~(WORD_MSBIT_HIGH) >> DIG_SIZE)) {
  1334. // will overflow
  1335. return false;
  1336. }
  1337. val = (val << DIG_SIZE) | *d;
  1338. }
  1339. if (i->neg != 0) {
  1340. val = -val;
  1341. }
  1342. *value = val;
  1343. return true;
  1344. }
  1345. bool mpz_as_uint_checked(const mpz_t *i, mp_uint_t *value) {
  1346. if (i->neg != 0) {
  1347. // can't represent signed values
  1348. return false;
  1349. }
  1350. mp_uint_t val = 0;
  1351. mpz_dig_t *d = i->dig + i->len;
  1352. while (d-- > i->dig) {
  1353. if (val > (~(WORD_MSBIT_HIGH) >> (DIG_SIZE - 1))) {
  1354. // will overflow
  1355. return false;
  1356. }
  1357. val = (val << DIG_SIZE) | *d;
  1358. }
  1359. *value = val;
  1360. return true;
  1361. }
  1362. // writes at most len bytes to buf (so buf should be zeroed before calling)
  1363. void mpz_as_bytes(const mpz_t *z, bool big_endian, size_t len, byte *buf) {
  1364. byte *b = buf;
  1365. if (big_endian) {
  1366. b += len;
  1367. }
  1368. mpz_dig_t *zdig = z->dig;
  1369. int bits = 0;
  1370. mpz_dbl_dig_t d = 0;
  1371. mpz_dbl_dig_t carry = 1;
  1372. for (size_t zlen = z->len; zlen > 0; --zlen) {
  1373. bits += DIG_SIZE;
  1374. d = (d << DIG_SIZE) | *zdig++;
  1375. for (; bits >= 8; bits -= 8, d >>= 8) {
  1376. mpz_dig_t val = d;
  1377. if (z->neg) {
  1378. val = (~val & 0xff) + carry;
  1379. carry = val >> 8;
  1380. }
  1381. if (big_endian) {
  1382. *--b = val;
  1383. if (b == buf) {
  1384. return;
  1385. }
  1386. } else {
  1387. *b++ = val;
  1388. if (b == buf + len) {
  1389. return;
  1390. }
  1391. }
  1392. }
  1393. }
  1394. }
  1395. #if MICROPY_PY_BUILTINS_FLOAT
  1396. mp_float_t mpz_as_float(const mpz_t *i) {
  1397. mp_float_t val = 0;
  1398. mpz_dig_t *d = i->dig + i->len;
  1399. while (d-- > i->dig) {
  1400. val = val * DIG_BASE + *d;
  1401. }
  1402. if (i->neg != 0) {
  1403. val = -val;
  1404. }
  1405. return val;
  1406. }
  1407. #endif
  1408. #if 0
  1409. this function is unused
  1410. char *mpz_as_str(const mpz_t *i, unsigned int base) {
  1411. char *s = m_new(char, mp_int_format_size(mpz_max_num_bits(i), base, NULL, '\0'));
  1412. mpz_as_str_inpl(i, base, NULL, 'a', '\0', s);
  1413. return s;
  1414. }
  1415. #endif
  1416. // assumes enough space in str as calculated by mp_int_format_size
  1417. // base must be between 2 and 32 inclusive
  1418. // returns length of string, not including null byte
  1419. size_t mpz_as_str_inpl(const mpz_t *i, unsigned int base, const char *prefix, char base_char, char comma, char *str) {
  1420. assert(str != NULL);
  1421. assert(2 <= base && base <= 32);
  1422. size_t ilen = i->len;
  1423. char *s = str;
  1424. if (ilen == 0) {
  1425. if (prefix) {
  1426. while (*prefix)
  1427. *s++ = *prefix++;
  1428. }
  1429. *s++ = '0';
  1430. *s = '\0';
  1431. return s - str;
  1432. }
  1433. // make a copy of mpz digits, so we can do the div/mod calculation
  1434. mpz_dig_t *dig = m_new(mpz_dig_t, ilen);
  1435. memcpy(dig, i->dig, ilen * sizeof(mpz_dig_t));
  1436. // convert
  1437. char *last_comma = str;
  1438. bool done;
  1439. do {
  1440. mpz_dig_t *d = dig + ilen;
  1441. mpz_dbl_dig_t a = 0;
  1442. // compute next remainder
  1443. while (--d >= dig) {
  1444. a = (a << DIG_SIZE) | *d;
  1445. *d = a / base;
  1446. a %= base;
  1447. }
  1448. // convert to character
  1449. a += '0';
  1450. if (a > '9') {
  1451. a += base_char - '9' - 1;
  1452. }
  1453. *s++ = a;
  1454. // check if number is zero
  1455. done = true;
  1456. for (d = dig; d < dig + ilen; ++d) {
  1457. if (*d != 0) {
  1458. done = false;
  1459. break;
  1460. }
  1461. }
  1462. if (comma && (s - last_comma) == 3) {
  1463. *s++ = comma;
  1464. last_comma = s;
  1465. }
  1466. }
  1467. while (!done);
  1468. // free the copy of the digits array
  1469. m_del(mpz_dig_t, dig, ilen);
  1470. if (prefix) {
  1471. const char *p = &prefix[strlen(prefix)];
  1472. while (p > prefix) {
  1473. *s++ = *--p;
  1474. }
  1475. }
  1476. if (i->neg != 0) {
  1477. *s++ = '-';
  1478. }
  1479. // reverse string
  1480. for (char *u = str, *v = s - 1; u < v; ++u, --v) {
  1481. char temp = *u;
  1482. *u = *v;
  1483. *v = temp;
  1484. }
  1485. *s = '\0'; // null termination
  1486. return s - str;
  1487. }
  1488. #endif // MICROPY_LONGINT_IMPL == MICROPY_LONGINT_IMPL_MPZ