mpz.c 47 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746
  1. /*
  2. * This file is part of the MicroPython project, http://micropython.org/
  3. *
  4. * The MIT License (MIT)
  5. *
  6. * Copyright (c) 2013, 2014 Damien P. George
  7. *
  8. * Permission is hereby granted, free of charge, to any person obtaining a copy
  9. * of this software and associated documentation files (the "Software"), to deal
  10. * in the Software without restriction, including without limitation the rights
  11. * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
  12. * copies of the Software, and to permit persons to whom the Software is
  13. * furnished to do so, subject to the following conditions:
  14. *
  15. * The above copyright notice and this permission notice shall be included in
  16. * all copies or substantial portions of the Software.
  17. *
  18. * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  19. * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  20. * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  21. * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  22. * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  23. * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
  24. * THE SOFTWARE.
  25. */
  26. #include <string.h>
  27. #include <assert.h>
  28. #include "py/mpz.h"
  29. #if MICROPY_LONGINT_IMPL == MICROPY_LONGINT_IMPL_MPZ
  30. #define DIG_SIZE (MPZ_DIG_SIZE)
  31. #define DIG_MASK ((MPZ_LONG_1 << DIG_SIZE) - 1)
  32. #define DIG_MSB (MPZ_LONG_1 << (DIG_SIZE - 1))
  33. #define DIG_BASE (MPZ_LONG_1 << DIG_SIZE)
  34. /*
  35. mpz is an arbitrary precision integer type with a public API.
  36. mpn functions act on non-negative integers represented by an array of generalised
  37. digits (eg a word per digit). You also need to specify separately the length of the
  38. array. There is no public API for mpn. Rather, the functions are used by mpz to
  39. implement its features.
  40. Integer values are stored little endian (first digit is first in memory).
  41. Definition of normalise: ?
  42. */
  43. static size_t mpn_remove_trailing_zeros(mpz_dig_t *oidig, mpz_dig_t *idig) {
  44. for (--idig; idig >= oidig && *idig == 0; --idig) {
  45. }
  46. return idig + 1 - oidig;
  47. }
  48. /* compares i with j
  49. returns sign(i - j)
  50. assumes i, j are normalised
  51. */
  52. static int mpn_cmp(const mpz_dig_t *idig, size_t ilen, const mpz_dig_t *jdig, size_t jlen) {
  53. if (ilen < jlen) {
  54. return -1;
  55. }
  56. if (ilen > jlen) {
  57. return 1;
  58. }
  59. for (idig += ilen, jdig += ilen; ilen > 0; --ilen) {
  60. mpz_dbl_dig_signed_t cmp = (mpz_dbl_dig_t)*(--idig) - (mpz_dbl_dig_t)*(--jdig);
  61. if (cmp < 0) {
  62. return -1;
  63. }
  64. if (cmp > 0) {
  65. return 1;
  66. }
  67. }
  68. return 0;
  69. }
  70. /* computes i = j << n
  71. returns number of digits in i
  72. assumes enough memory in i; assumes normalised j; assumes n > 0
  73. can have i, j pointing to same memory
  74. */
  75. static size_t mpn_shl(mpz_dig_t *idig, mpz_dig_t *jdig, size_t jlen, mp_uint_t n) {
  76. mp_uint_t n_whole = (n + DIG_SIZE - 1) / DIG_SIZE;
  77. mp_uint_t n_part = n % DIG_SIZE;
  78. if (n_part == 0) {
  79. n_part = DIG_SIZE;
  80. }
  81. // start from the high end of the digit arrays
  82. idig += jlen + n_whole - 1;
  83. jdig += jlen - 1;
  84. // shift the digits
  85. mpz_dbl_dig_t d = 0;
  86. for (size_t i = jlen; i > 0; i--, idig--, jdig--) {
  87. d |= *jdig;
  88. *idig = (d >> (DIG_SIZE - n_part)) & DIG_MASK;
  89. d <<= DIG_SIZE;
  90. }
  91. // store remaining bits
  92. *idig = (d >> (DIG_SIZE - n_part)) & DIG_MASK;
  93. idig -= n_whole - 1;
  94. memset(idig, 0, (n_whole - 1) * sizeof(mpz_dig_t));
  95. // work out length of result
  96. jlen += n_whole;
  97. while (jlen != 0 && idig[jlen - 1] == 0) {
  98. jlen--;
  99. }
  100. // return length of result
  101. return jlen;
  102. }
  103. /* computes i = j >> n
  104. returns number of digits in i
  105. assumes enough memory in i; assumes normalised j; assumes n > 0
  106. can have i, j pointing to same memory
  107. */
  108. static size_t mpn_shr(mpz_dig_t *idig, mpz_dig_t *jdig, size_t jlen, mp_uint_t n) {
  109. mp_uint_t n_whole = n / DIG_SIZE;
  110. mp_uint_t n_part = n % DIG_SIZE;
  111. if (n_whole >= jlen) {
  112. return 0;
  113. }
  114. jdig += n_whole;
  115. jlen -= n_whole;
  116. for (size_t i = jlen; i > 0; i--, idig++, jdig++) {
  117. mpz_dbl_dig_t d = *jdig;
  118. if (i > 1) {
  119. d |= (mpz_dbl_dig_t)jdig[1] << DIG_SIZE;
  120. }
  121. d >>= n_part;
  122. *idig = d & DIG_MASK;
  123. }
  124. if (idig[-1] == 0) {
  125. jlen--;
  126. }
  127. return jlen;
  128. }
  129. /* computes i = j + k
  130. returns number of digits in i
  131. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen
  132. can have i, j, k pointing to same memory
  133. */
  134. static size_t mpn_add(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  135. mpz_dig_t *oidig = idig;
  136. mpz_dbl_dig_t carry = 0;
  137. jlen -= klen;
  138. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  139. carry += (mpz_dbl_dig_t)*jdig + (mpz_dbl_dig_t)*kdig;
  140. *idig = carry & DIG_MASK;
  141. carry >>= DIG_SIZE;
  142. }
  143. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  144. carry += *jdig;
  145. *idig = carry & DIG_MASK;
  146. carry >>= DIG_SIZE;
  147. }
  148. if (carry != 0) {
  149. *idig++ = carry;
  150. }
  151. return idig - oidig;
  152. }
  153. /* computes i = j - k
  154. returns number of digits in i
  155. assumes enough memory in i; assumes normalised j, k; assumes j >= k
  156. can have i, j, k pointing to same memory
  157. */
  158. static size_t mpn_sub(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  159. mpz_dig_t *oidig = idig;
  160. mpz_dbl_dig_signed_t borrow = 0;
  161. jlen -= klen;
  162. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  163. borrow += (mpz_dbl_dig_t)*jdig - (mpz_dbl_dig_t)*kdig;
  164. *idig = borrow & DIG_MASK;
  165. borrow >>= DIG_SIZE;
  166. }
  167. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  168. borrow += *jdig;
  169. *idig = borrow & DIG_MASK;
  170. borrow >>= DIG_SIZE;
  171. }
  172. return mpn_remove_trailing_zeros(oidig, idig);
  173. }
  174. #if MICROPY_OPT_MPZ_BITWISE
  175. /* computes i = j & k
  176. returns number of digits in i
  177. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen (jlen argument not needed)
  178. can have i, j, k pointing to same memory
  179. */
  180. static size_t mpn_and(mpz_dig_t *idig, const mpz_dig_t *jdig, const mpz_dig_t *kdig, size_t klen) {
  181. mpz_dig_t *oidig = idig;
  182. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  183. *idig = *jdig & *kdig;
  184. }
  185. return mpn_remove_trailing_zeros(oidig, idig);
  186. }
  187. #endif
  188. /* i = -((-j) & (-k)) = ~((~j + 1) & (~k + 1)) + 1
  189. i = (j & (-k)) = (j & (~k + 1)) = ( j & (~k + 1))
  190. i = ((-j) & k) = ((~j + 1) & k) = ((~j + 1) & k )
  191. computes general form:
  192. i = (im ^ (((j ^ jm) + jc) & ((k ^ km) + kc))) + ic where Xm = Xc == 0 ? 0 : DIG_MASK
  193. returns number of digits in i
  194. assumes enough memory in i; assumes normalised j, k; assumes length j >= length k
  195. can have i, j, k pointing to same memory
  196. */
  197. static size_t mpn_and_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  198. mpz_dbl_dig_t carryi, mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  199. mpz_dig_t *oidig = idig;
  200. mpz_dig_t imask = (0 == carryi) ? 0 : DIG_MASK;
  201. mpz_dig_t jmask = (0 == carryj) ? 0 : DIG_MASK;
  202. mpz_dig_t kmask = (0 == carryk) ? 0 : DIG_MASK;
  203. for (; jlen > 0; ++idig, ++jdig) {
  204. carryj += *jdig ^ jmask;
  205. carryk += (--klen <= --jlen) ? (*kdig++ ^ kmask) : kmask;
  206. carryi += ((carryj & carryk) ^ imask) & DIG_MASK;
  207. *idig = carryi & DIG_MASK;
  208. carryk >>= DIG_SIZE;
  209. carryj >>= DIG_SIZE;
  210. carryi >>= DIG_SIZE;
  211. }
  212. if (0 != carryi) {
  213. *idig++ = carryi;
  214. }
  215. return mpn_remove_trailing_zeros(oidig, idig);
  216. }
  217. #if MICROPY_OPT_MPZ_BITWISE
  218. /* computes i = j | k
  219. returns number of digits in i
  220. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen
  221. can have i, j, k pointing to same memory
  222. */
  223. static size_t mpn_or(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  224. mpz_dig_t *oidig = idig;
  225. jlen -= klen;
  226. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  227. *idig = *jdig | *kdig;
  228. }
  229. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  230. *idig = *jdig;
  231. }
  232. return idig - oidig;
  233. }
  234. #endif
  235. /* i = -((-j) | (-k)) = ~((~j + 1) | (~k + 1)) + 1
  236. i = -(j | (-k)) = -(j | (~k + 1)) = ~( j | (~k + 1)) + 1
  237. i = -((-j) | k) = -((~j + 1) | k) = ~((~j + 1) | k ) + 1
  238. computes general form:
  239. i = ~(((j ^ jm) + jc) | ((k ^ km) + kc)) + 1 where Xm = Xc == 0 ? 0 : DIG_MASK
  240. returns number of digits in i
  241. assumes enough memory in i; assumes normalised j, k; assumes length j >= length k
  242. can have i, j, k pointing to same memory
  243. */
  244. #if MICROPY_OPT_MPZ_BITWISE
  245. static size_t mpn_or_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  246. mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  247. mpz_dig_t *oidig = idig;
  248. mpz_dbl_dig_t carryi = 1;
  249. mpz_dig_t jmask = (0 == carryj) ? 0 : DIG_MASK;
  250. mpz_dig_t kmask = (0 == carryk) ? 0 : DIG_MASK;
  251. for (; jlen > 0; ++idig, ++jdig) {
  252. carryj += *jdig ^ jmask;
  253. carryk += (--klen <= --jlen) ? (*kdig++ ^ kmask) : kmask;
  254. carryi += ((carryj | carryk) ^ DIG_MASK) & DIG_MASK;
  255. *idig = carryi & DIG_MASK;
  256. carryk >>= DIG_SIZE;
  257. carryj >>= DIG_SIZE;
  258. carryi >>= DIG_SIZE;
  259. }
  260. // At least one of j,k must be negative so the above for-loop runs at least
  261. // once. For carryi to be non-zero here it must be equal to 1 at the end of
  262. // each iteration of the loop. So the accumulation of carryi must overflow
  263. // each time, ie carryi += 0xff..ff. So carryj|carryk must be 0 in the
  264. // DIG_MASK bits on each iteration. But considering all cases of signs of
  265. // j,k one sees that this is not possible.
  266. assert(carryi == 0);
  267. return mpn_remove_trailing_zeros(oidig, idig);
  268. }
  269. #else
  270. static size_t mpn_or_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  271. mpz_dbl_dig_t carryi, mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  272. mpz_dig_t *oidig = idig;
  273. mpz_dig_t imask = (0 == carryi) ? 0 : DIG_MASK;
  274. mpz_dig_t jmask = (0 == carryj) ? 0 : DIG_MASK;
  275. mpz_dig_t kmask = (0 == carryk) ? 0 : DIG_MASK;
  276. for (; jlen > 0; ++idig, ++jdig) {
  277. carryj += *jdig ^ jmask;
  278. carryk += (--klen <= --jlen) ? (*kdig++ ^ kmask) : kmask;
  279. carryi += ((carryj | carryk) ^ imask) & DIG_MASK;
  280. *idig = carryi & DIG_MASK;
  281. carryk >>= DIG_SIZE;
  282. carryj >>= DIG_SIZE;
  283. carryi >>= DIG_SIZE;
  284. }
  285. // See comment in above mpn_or_neg for why carryi must be 0.
  286. assert(carryi == 0);
  287. return mpn_remove_trailing_zeros(oidig, idig);
  288. }
  289. #endif
  290. #if MICROPY_OPT_MPZ_BITWISE
  291. /* computes i = j ^ k
  292. returns number of digits in i
  293. assumes enough memory in i; assumes normalised j, k; assumes jlen >= klen
  294. can have i, j, k pointing to same memory
  295. */
  296. static size_t mpn_xor(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen) {
  297. mpz_dig_t *oidig = idig;
  298. jlen -= klen;
  299. for (; klen > 0; --klen, ++idig, ++jdig, ++kdig) {
  300. *idig = *jdig ^ *kdig;
  301. }
  302. for (; jlen > 0; --jlen, ++idig, ++jdig) {
  303. *idig = *jdig;
  304. }
  305. return mpn_remove_trailing_zeros(oidig, idig);
  306. }
  307. #endif
  308. /* i = (-j) ^ (-k) = ~(j - 1) ^ ~(k - 1) = (j - 1) ^ (k - 1)
  309. i = -(j ^ (-k)) = -(j ^ ~(k - 1)) = ~(j ^ ~(k - 1)) + 1 = (j ^ (k - 1)) + 1
  310. i = -((-j) ^ k) = -(~(j - 1) ^ k) = ~(~(j - 1) ^ k) + 1 = ((j - 1) ^ k) + 1
  311. computes general form:
  312. i = ((j - 1 + jc) ^ (k - 1 + kc)) + ic
  313. returns number of digits in i
  314. assumes enough memory in i; assumes normalised j, k; assumes length j >= length k
  315. can have i, j, k pointing to same memory
  316. */
  317. static size_t mpn_xor_neg(mpz_dig_t *idig, const mpz_dig_t *jdig, size_t jlen, const mpz_dig_t *kdig, size_t klen,
  318. mpz_dbl_dig_t carryi, mpz_dbl_dig_t carryj, mpz_dbl_dig_t carryk) {
  319. mpz_dig_t *oidig = idig;
  320. for (; jlen > 0; ++idig, ++jdig) {
  321. carryj += *jdig + DIG_MASK;
  322. carryk += (--klen <= --jlen) ? (*kdig++ + DIG_MASK) : DIG_MASK;
  323. carryi += (carryj ^ carryk) & DIG_MASK;
  324. *idig = carryi & DIG_MASK;
  325. carryk >>= DIG_SIZE;
  326. carryj >>= DIG_SIZE;
  327. carryi >>= DIG_SIZE;
  328. }
  329. if (0 != carryi) {
  330. *idig++ = carryi;
  331. }
  332. return mpn_remove_trailing_zeros(oidig, idig);
  333. }
  334. /* computes i = i * d1 + d2
  335. returns number of digits in i
  336. assumes enough memory in i; assumes normalised i; assumes dmul != 0
  337. */
  338. static size_t mpn_mul_dig_add_dig(mpz_dig_t *idig, size_t ilen, mpz_dig_t dmul, mpz_dig_t dadd) {
  339. mpz_dig_t *oidig = idig;
  340. mpz_dbl_dig_t carry = dadd;
  341. for (; ilen > 0; --ilen, ++idig) {
  342. carry += (mpz_dbl_dig_t)*idig * (mpz_dbl_dig_t)dmul; // will never overflow so long as DIG_SIZE <= 8*sizeof(mpz_dbl_dig_t)/2
  343. *idig = carry & DIG_MASK;
  344. carry >>= DIG_SIZE;
  345. }
  346. if (carry != 0) {
  347. *idig++ = carry;
  348. }
  349. return idig - oidig;
  350. }
  351. /* computes i = j * k
  352. returns number of digits in i
  353. assumes enough memory in i; assumes i is zeroed; assumes normalised j, k
  354. can have j, k point to same memory
  355. */
  356. static size_t mpn_mul(mpz_dig_t *idig, mpz_dig_t *jdig, size_t jlen, mpz_dig_t *kdig, size_t klen) {
  357. mpz_dig_t *oidig = idig;
  358. size_t ilen = 0;
  359. for (; klen > 0; --klen, ++idig, ++kdig) {
  360. mpz_dig_t *id = idig;
  361. mpz_dbl_dig_t carry = 0;
  362. size_t jl = jlen;
  363. for (mpz_dig_t *jd = jdig; jl > 0; --jl, ++jd, ++id) {
  364. carry += (mpz_dbl_dig_t)*id + (mpz_dbl_dig_t)*jd * (mpz_dbl_dig_t)*kdig; // will never overflow so long as DIG_SIZE <= 8*sizeof(mpz_dbl_dig_t)/2
  365. *id = carry & DIG_MASK;
  366. carry >>= DIG_SIZE;
  367. }
  368. if (carry != 0) {
  369. *id++ = carry;
  370. }
  371. ilen = id - oidig;
  372. }
  373. return ilen;
  374. }
  375. /* natural_div - quo * den + new_num = old_num (ie num is replaced with rem)
  376. assumes den != 0
  377. assumes num_dig has enough memory to be extended by 1 digit
  378. assumes quo_dig has enough memory (as many digits as num)
  379. assumes quo_dig is filled with zeros
  380. */
  381. static void mpn_div(mpz_dig_t *num_dig, size_t *num_len, const mpz_dig_t *den_dig, size_t den_len, mpz_dig_t *quo_dig, size_t *quo_len) {
  382. mpz_dig_t *orig_num_dig = num_dig;
  383. mpz_dig_t *orig_quo_dig = quo_dig;
  384. mpz_dig_t norm_shift = 0;
  385. mpz_dbl_dig_t lead_den_digit;
  386. // handle simple cases
  387. {
  388. int cmp = mpn_cmp(num_dig, *num_len, den_dig, den_len);
  389. if (cmp == 0) {
  390. *num_len = 0;
  391. quo_dig[0] = 1;
  392. *quo_len = 1;
  393. return;
  394. } else if (cmp < 0) {
  395. // numerator remains the same
  396. *quo_len = 0;
  397. return;
  398. }
  399. }
  400. // We need to normalise the denominator (leading bit of leading digit is 1)
  401. // so that the division routine works. Since the denominator memory is
  402. // read-only we do the normalisation on the fly, each time a digit of the
  403. // denominator is needed. We need to know is how many bits to shift by.
  404. // count number of leading zeros in leading digit of denominator
  405. {
  406. mpz_dig_t d = den_dig[den_len - 1];
  407. while ((d & DIG_MSB) == 0) {
  408. d <<= 1;
  409. ++norm_shift;
  410. }
  411. }
  412. // now need to shift numerator by same amount as denominator
  413. // first, increase length of numerator in case we need more room to shift
  414. num_dig[*num_len] = 0;
  415. ++(*num_len);
  416. for (mpz_dig_t *num = num_dig, carry = 0; num < num_dig + *num_len; ++num) {
  417. mpz_dig_t n = *num;
  418. *num = ((n << norm_shift) | carry) & DIG_MASK;
  419. carry = (mpz_dbl_dig_t)n >> (DIG_SIZE - norm_shift);
  420. }
  421. // cache the leading digit of the denominator
  422. lead_den_digit = (mpz_dbl_dig_t)den_dig[den_len - 1] << norm_shift;
  423. if (den_len >= 2) {
  424. lead_den_digit |= (mpz_dbl_dig_t)den_dig[den_len - 2] >> (DIG_SIZE - norm_shift);
  425. }
  426. // point num_dig to last digit in numerator
  427. num_dig += *num_len - 1;
  428. // calculate number of digits in quotient
  429. *quo_len = *num_len - den_len;
  430. // point to last digit to store for quotient
  431. quo_dig += *quo_len - 1;
  432. // keep going while we have enough digits to divide
  433. while (*num_len > den_len) {
  434. mpz_dbl_dig_t quo = ((mpz_dbl_dig_t)*num_dig << DIG_SIZE) | num_dig[-1];
  435. // get approximate quotient
  436. quo /= lead_den_digit;
  437. // Multiply quo by den and subtract from num to get remainder.
  438. // Must be careful with overflow of the borrow variable. Both
  439. // borrow and low_digs are signed values and need signed right-shift,
  440. // but x is unsigned and may take a full-range value.
  441. const mpz_dig_t *d = den_dig;
  442. mpz_dbl_dig_t d_norm = 0;
  443. mpz_dbl_dig_signed_t borrow = 0;
  444. for (mpz_dig_t *n = num_dig - den_len; n < num_dig; ++n, ++d) {
  445. // Get the next digit in (den).
  446. d_norm = ((mpz_dbl_dig_t)*d << norm_shift) | (d_norm >> DIG_SIZE);
  447. // Multiply the next digit in (quo * den).
  448. mpz_dbl_dig_t x = (mpz_dbl_dig_t)quo * (d_norm & DIG_MASK);
  449. // Compute the low DIG_MASK bits of the next digit in (num - quo * den)
  450. mpz_dbl_dig_signed_t low_digs = (borrow & DIG_MASK) + *n - (x & DIG_MASK);
  451. // Store the digit result for (num).
  452. *n = low_digs & DIG_MASK;
  453. // Compute the borrow, shifted right before summing to avoid overflow.
  454. borrow = (borrow >> DIG_SIZE) - (x >> DIG_SIZE) + (low_digs >> DIG_SIZE);
  455. }
  456. // At this point we have either:
  457. //
  458. // 1. quo was the correct value and the most-sig-digit of num is exactly
  459. // cancelled by borrow (borrow + *num_dig == 0). In this case there is
  460. // nothing more to do.
  461. //
  462. // 2. quo was too large, we subtracted too many den from num, and the
  463. // most-sig-digit of num is less than needed (borrow + *num_dig < 0).
  464. // In this case we must reduce quo and add back den to num until the
  465. // carry from this operation cancels out the borrow.
  466. //
  467. borrow += *num_dig;
  468. for (; borrow != 0; --quo) {
  469. d = den_dig;
  470. d_norm = 0;
  471. mpz_dbl_dig_t carry = 0;
  472. for (mpz_dig_t *n = num_dig - den_len; n < num_dig; ++n, ++d) {
  473. d_norm = ((mpz_dbl_dig_t)*d << norm_shift) | (d_norm >> DIG_SIZE);
  474. carry += (mpz_dbl_dig_t)*n + (d_norm & DIG_MASK);
  475. *n = carry & DIG_MASK;
  476. carry >>= DIG_SIZE;
  477. }
  478. borrow += carry;
  479. }
  480. // store this digit of the quotient
  481. *quo_dig = quo & DIG_MASK;
  482. --quo_dig;
  483. // move down to next digit of numerator
  484. --num_dig;
  485. --(*num_len);
  486. }
  487. // unnormalise numerator (remainder now)
  488. for (mpz_dig_t *num = orig_num_dig + *num_len - 1, carry = 0; num >= orig_num_dig; --num) {
  489. mpz_dig_t n = *num;
  490. *num = ((n >> norm_shift) | carry) & DIG_MASK;
  491. carry = (mpz_dbl_dig_t)n << (DIG_SIZE - norm_shift);
  492. }
  493. // strip trailing zeros
  494. while (*quo_len > 0 && orig_quo_dig[*quo_len - 1] == 0) {
  495. --(*quo_len);
  496. }
  497. while (*num_len > 0 && orig_num_dig[*num_len - 1] == 0) {
  498. --(*num_len);
  499. }
  500. }
  501. #define MIN_ALLOC (2)
  502. void mpz_init_zero(mpz_t *z) {
  503. z->neg = 0;
  504. z->fixed_dig = 0;
  505. z->alloc = 0;
  506. z->len = 0;
  507. z->dig = NULL;
  508. }
  509. void mpz_init_from_int(mpz_t *z, mp_int_t val) {
  510. mpz_init_zero(z);
  511. mpz_set_from_int(z, val);
  512. }
  513. void mpz_init_fixed_from_int(mpz_t *z, mpz_dig_t *dig, size_t alloc, mp_int_t val) {
  514. z->neg = 0;
  515. z->fixed_dig = 1;
  516. z->alloc = alloc;
  517. z->len = 0;
  518. z->dig = dig;
  519. mpz_set_from_int(z, val);
  520. }
  521. void mpz_deinit(mpz_t *z) {
  522. if (z != NULL && !z->fixed_dig) {
  523. m_del(mpz_dig_t, z->dig, z->alloc);
  524. }
  525. }
  526. #if 0
  527. these functions are unused
  528. mpz_t *mpz_zero(void) {
  529. mpz_t *z = m_new_obj(mpz_t);
  530. mpz_init_zero(z);
  531. return z;
  532. }
  533. mpz_t *mpz_from_int(mp_int_t val) {
  534. mpz_t *z = mpz_zero();
  535. mpz_set_from_int(z, val);
  536. return z;
  537. }
  538. mpz_t *mpz_from_ll(long long val, bool is_signed) {
  539. mpz_t *z = mpz_zero();
  540. mpz_set_from_ll(z, val, is_signed);
  541. return z;
  542. }
  543. #if MICROPY_PY_BUILTINS_FLOAT
  544. mpz_t *mpz_from_float(mp_float_t val) {
  545. mpz_t *z = mpz_zero();
  546. mpz_set_from_float(z, val);
  547. return z;
  548. }
  549. #endif
  550. mpz_t *mpz_from_str(const char *str, size_t len, bool neg, unsigned int base) {
  551. mpz_t *z = mpz_zero();
  552. mpz_set_from_str(z, str, len, neg, base);
  553. return z;
  554. }
  555. #endif
  556. static void mpz_free(mpz_t *z) {
  557. if (z != NULL) {
  558. m_del(mpz_dig_t, z->dig, z->alloc);
  559. m_del_obj(mpz_t, z);
  560. }
  561. }
  562. static void mpz_need_dig(mpz_t *z, size_t need) {
  563. if (need < MIN_ALLOC) {
  564. need = MIN_ALLOC;
  565. }
  566. if (z->dig == NULL || z->alloc < need) {
  567. // if z has fixed digit buffer there's not much we can do as the caller will
  568. // be expecting a buffer with at least "need" bytes (but it shouldn't happen)
  569. assert(!z->fixed_dig);
  570. z->dig = m_renew(mpz_dig_t, z->dig, z->alloc, need);
  571. z->alloc = need;
  572. }
  573. }
  574. static mpz_t *mpz_clone(const mpz_t *src) {
  575. assert(src->alloc != 0);
  576. mpz_t *z = m_new_obj(mpz_t);
  577. z->neg = src->neg;
  578. z->fixed_dig = 0;
  579. z->alloc = src->alloc;
  580. z->len = src->len;
  581. z->dig = m_new(mpz_dig_t, z->alloc);
  582. memcpy(z->dig, src->dig, src->alloc * sizeof(mpz_dig_t));
  583. return z;
  584. }
  585. /* sets dest = src
  586. can have dest, src the same
  587. */
  588. void mpz_set(mpz_t *dest, const mpz_t *src) {
  589. mpz_need_dig(dest, src->len);
  590. dest->neg = src->neg;
  591. dest->len = src->len;
  592. memcpy(dest->dig, src->dig, src->len * sizeof(mpz_dig_t));
  593. }
  594. void mpz_set_from_int(mpz_t *z, mp_int_t val) {
  595. if (val == 0) {
  596. z->neg = 0;
  597. z->len = 0;
  598. return;
  599. }
  600. mpz_need_dig(z, MPZ_NUM_DIG_FOR_INT);
  601. mp_uint_t uval;
  602. if (val < 0) {
  603. z->neg = 1;
  604. uval = -val;
  605. } else {
  606. z->neg = 0;
  607. uval = val;
  608. }
  609. z->len = 0;
  610. while (uval > 0) {
  611. z->dig[z->len++] = uval & DIG_MASK;
  612. uval >>= DIG_SIZE;
  613. }
  614. }
  615. void mpz_set_from_ll(mpz_t *z, long long val, bool is_signed) {
  616. mpz_need_dig(z, MPZ_NUM_DIG_FOR_LL);
  617. unsigned long long uval;
  618. if (is_signed && val < 0) {
  619. z->neg = 1;
  620. uval = -(unsigned long long)val;
  621. } else {
  622. z->neg = 0;
  623. uval = val;
  624. }
  625. z->len = 0;
  626. while (uval > 0) {
  627. z->dig[z->len++] = uval & DIG_MASK;
  628. uval >>= DIG_SIZE;
  629. }
  630. }
  631. #if MICROPY_PY_BUILTINS_FLOAT
  632. void mpz_set_from_float(mpz_t *z, mp_float_t src) {
  633. mp_float_union_t u = {src};
  634. z->neg = u.p.sgn;
  635. if (u.p.exp == 0) {
  636. // value == 0 || value < 1
  637. mpz_set_from_int(z, 0);
  638. } else if (u.p.exp == ((1 << MP_FLOAT_EXP_BITS) - 1)) {
  639. // u.p.frc == 0 indicates inf, else NaN
  640. // should be handled by caller
  641. mpz_set_from_int(z, 0);
  642. } else {
  643. const int adj_exp = (int)u.p.exp - MP_FLOAT_EXP_BIAS;
  644. if (adj_exp < 0) {
  645. // value < 1 , truncates to 0
  646. mpz_set_from_int(z, 0);
  647. } else if (adj_exp == 0) {
  648. // 1 <= value < 2 , so truncates to 1
  649. mpz_set_from_int(z, 1);
  650. } else {
  651. // 2 <= value
  652. const int dig_cnt = (adj_exp + 1 + (DIG_SIZE - 1)) / DIG_SIZE;
  653. const unsigned int rem = adj_exp % DIG_SIZE;
  654. int dig_ind, shft;
  655. mp_float_uint_t frc = u.p.frc | ((mp_float_uint_t)1 << MP_FLOAT_FRAC_BITS);
  656. if (adj_exp < MP_FLOAT_FRAC_BITS) {
  657. shft = 0;
  658. dig_ind = 0;
  659. frc >>= MP_FLOAT_FRAC_BITS - adj_exp;
  660. } else {
  661. shft = (rem - MP_FLOAT_FRAC_BITS) % DIG_SIZE;
  662. dig_ind = (adj_exp - MP_FLOAT_FRAC_BITS) / DIG_SIZE;
  663. }
  664. mpz_need_dig(z, dig_cnt);
  665. z->len = dig_cnt;
  666. if (dig_ind != 0) {
  667. memset(z->dig, 0, dig_ind * sizeof(mpz_dig_t));
  668. }
  669. if (shft != 0) {
  670. z->dig[dig_ind++] = (frc << shft) & DIG_MASK;
  671. frc >>= DIG_SIZE - shft;
  672. }
  673. #if DIG_SIZE < (MP_FLOAT_FRAC_BITS + 1)
  674. while (dig_ind != dig_cnt) {
  675. z->dig[dig_ind++] = frc & DIG_MASK;
  676. frc >>= DIG_SIZE;
  677. }
  678. #else
  679. if (dig_ind != dig_cnt) {
  680. z->dig[dig_ind] = frc;
  681. }
  682. #endif
  683. }
  684. }
  685. }
  686. #endif
  687. // returns number of bytes from str that were processed
  688. size_t mpz_set_from_str(mpz_t *z, const char *str, size_t len, bool neg, unsigned int base) {
  689. assert(base <= 36);
  690. const char *cur = str;
  691. const char *top = str + len;
  692. mpz_need_dig(z, len * 8 / DIG_SIZE + 1);
  693. if (neg) {
  694. z->neg = 1;
  695. } else {
  696. z->neg = 0;
  697. }
  698. z->len = 0;
  699. for (; cur < top; ++cur) { // XXX UTF8 next char
  700. // mp_uint_t v = char_to_numeric(cur#); // XXX UTF8 get char
  701. mp_uint_t v = *cur;
  702. if ('0' <= v && v <= '9') {
  703. v -= '0';
  704. } else if ('A' <= v && v <= 'Z') {
  705. v -= 'A' - 10;
  706. } else if ('a' <= v && v <= 'z') {
  707. v -= 'a' - 10;
  708. } else {
  709. break;
  710. }
  711. if (v >= base) {
  712. break;
  713. }
  714. z->len = mpn_mul_dig_add_dig(z->dig, z->len, base, v);
  715. }
  716. return cur - str;
  717. }
  718. void mpz_set_from_bytes(mpz_t *z, bool big_endian, size_t len, const byte *buf) {
  719. int delta = 1;
  720. if (big_endian) {
  721. buf += len - 1;
  722. delta = -1;
  723. }
  724. mpz_need_dig(z, (len * 8 + DIG_SIZE - 1) / DIG_SIZE);
  725. mpz_dig_t d = 0;
  726. int num_bits = 0;
  727. z->neg = 0;
  728. z->len = 0;
  729. while (len) {
  730. while (len && num_bits < DIG_SIZE) {
  731. d |= *buf << num_bits;
  732. num_bits += 8;
  733. buf += delta;
  734. len--;
  735. }
  736. z->dig[z->len++] = d & DIG_MASK;
  737. // Need this #if because it's C undefined behavior to do: uint32_t >> 32
  738. #if DIG_SIZE != 8 && DIG_SIZE != 16 && DIG_SIZE != 32
  739. d >>= DIG_SIZE;
  740. #else
  741. d = 0;
  742. #endif
  743. num_bits -= DIG_SIZE;
  744. }
  745. z->len = mpn_remove_trailing_zeros(z->dig, z->dig + z->len);
  746. }
  747. #if 0
  748. these functions are unused
  749. bool mpz_is_pos(const mpz_t *z) {
  750. return z->len > 0 && z->neg == 0;
  751. }
  752. bool mpz_is_odd(const mpz_t *z) {
  753. return z->len > 0 && (z->dig[0] & 1) != 0;
  754. }
  755. bool mpz_is_even(const mpz_t *z) {
  756. return z->len == 0 || (z->dig[0] & 1) == 0;
  757. }
  758. #endif
  759. int mpz_cmp(const mpz_t *z1, const mpz_t *z2) {
  760. int cmp = (int)z2->neg - (int)z1->neg;
  761. if (cmp != 0) {
  762. return cmp;
  763. }
  764. cmp = mpn_cmp(z1->dig, z1->len, z2->dig, z2->len);
  765. if (z1->neg != 0) {
  766. cmp = -cmp;
  767. }
  768. return cmp;
  769. }
  770. #if 0
  771. // obsolete
  772. // compares mpz with an integer that fits within DIG_SIZE bits
  773. mp_int_t mpz_cmp_sml_int(const mpz_t *z, mp_int_t sml_int) {
  774. mp_int_t cmp;
  775. if (z->neg == 0) {
  776. if (sml_int < 0) {
  777. return 1;
  778. }
  779. if (sml_int == 0) {
  780. if (z->len == 0) {
  781. return 0;
  782. }
  783. return 1;
  784. }
  785. if (z->len == 0) {
  786. return -1;
  787. }
  788. assert(sml_int < (1 << DIG_SIZE));
  789. if (z->len != 1) {
  790. return 1;
  791. }
  792. cmp = z->dig[0] - sml_int;
  793. } else {
  794. if (sml_int > 0) {
  795. return -1;
  796. }
  797. if (sml_int == 0) {
  798. if (z->len == 0) {
  799. return 0;
  800. }
  801. return -1;
  802. }
  803. if (z->len == 0) {
  804. return 1;
  805. }
  806. assert(sml_int > -(1 << DIG_SIZE));
  807. if (z->len != 1) {
  808. return -1;
  809. }
  810. cmp = -z->dig[0] - sml_int;
  811. }
  812. if (cmp < 0) {
  813. return -1;
  814. }
  815. if (cmp > 0) {
  816. return 1;
  817. }
  818. return 0;
  819. }
  820. #endif
  821. #if 0
  822. these functions are unused
  823. /* returns abs(z)
  824. */
  825. mpz_t *mpz_abs(const mpz_t *z) {
  826. // TODO: handle case of z->alloc=0
  827. mpz_t *z2 = mpz_clone(z);
  828. z2->neg = 0;
  829. return z2;
  830. }
  831. /* returns -z
  832. */
  833. mpz_t *mpz_neg(const mpz_t *z) {
  834. // TODO: handle case of z->alloc=0
  835. mpz_t *z2 = mpz_clone(z);
  836. z2->neg = 1 - z2->neg;
  837. return z2;
  838. }
  839. /* returns lhs + rhs
  840. can have lhs, rhs the same
  841. */
  842. mpz_t *mpz_add(const mpz_t *lhs, const mpz_t *rhs) {
  843. mpz_t *z = mpz_zero();
  844. mpz_add_inpl(z, lhs, rhs);
  845. return z;
  846. }
  847. /* returns lhs - rhs
  848. can have lhs, rhs the same
  849. */
  850. mpz_t *mpz_sub(const mpz_t *lhs, const mpz_t *rhs) {
  851. mpz_t *z = mpz_zero();
  852. mpz_sub_inpl(z, lhs, rhs);
  853. return z;
  854. }
  855. /* returns lhs * rhs
  856. can have lhs, rhs the same
  857. */
  858. mpz_t *mpz_mul(const mpz_t *lhs, const mpz_t *rhs) {
  859. mpz_t *z = mpz_zero();
  860. mpz_mul_inpl(z, lhs, rhs);
  861. return z;
  862. }
  863. /* returns lhs ** rhs
  864. can have lhs, rhs the same
  865. */
  866. mpz_t *mpz_pow(const mpz_t *lhs, const mpz_t *rhs) {
  867. mpz_t *z = mpz_zero();
  868. mpz_pow_inpl(z, lhs, rhs);
  869. return z;
  870. }
  871. /* computes new integers in quo and rem such that:
  872. quo * rhs + rem = lhs
  873. 0 <= rem < rhs
  874. can have lhs, rhs the same
  875. */
  876. void mpz_divmod(const mpz_t *lhs, const mpz_t *rhs, mpz_t **quo, mpz_t **rem) {
  877. *quo = mpz_zero();
  878. *rem = mpz_zero();
  879. mpz_divmod_inpl(*quo, *rem, lhs, rhs);
  880. }
  881. #endif
  882. /* computes dest = abs(z)
  883. can have dest, z the same
  884. */
  885. void mpz_abs_inpl(mpz_t *dest, const mpz_t *z) {
  886. if (dest != z) {
  887. mpz_set(dest, z);
  888. }
  889. dest->neg = 0;
  890. }
  891. /* computes dest = -z
  892. can have dest, z the same
  893. */
  894. void mpz_neg_inpl(mpz_t *dest, const mpz_t *z) {
  895. if (dest != z) {
  896. mpz_set(dest, z);
  897. }
  898. if (dest->len) {
  899. dest->neg = 1 - dest->neg;
  900. }
  901. }
  902. /* computes dest = ~z (= -z - 1)
  903. can have dest, z the same
  904. */
  905. void mpz_not_inpl(mpz_t *dest, const mpz_t *z) {
  906. if (dest != z) {
  907. mpz_set(dest, z);
  908. }
  909. if (dest->len == 0) {
  910. mpz_need_dig(dest, 1);
  911. dest->dig[0] = 1;
  912. dest->len = 1;
  913. dest->neg = 1;
  914. } else if (dest->neg) {
  915. dest->neg = 0;
  916. mpz_dig_t k = 1;
  917. dest->len = mpn_sub(dest->dig, dest->dig, dest->len, &k, 1);
  918. } else {
  919. mpz_need_dig(dest, dest->len + 1);
  920. mpz_dig_t k = 1;
  921. dest->len = mpn_add(dest->dig, dest->dig, dest->len, &k, 1);
  922. dest->neg = 1;
  923. }
  924. }
  925. /* computes dest = lhs << rhs
  926. can have dest, lhs the same
  927. */
  928. void mpz_shl_inpl(mpz_t *dest, const mpz_t *lhs, mp_uint_t rhs) {
  929. if (lhs->len == 0 || rhs == 0) {
  930. mpz_set(dest, lhs);
  931. } else {
  932. mpz_need_dig(dest, lhs->len + (rhs + DIG_SIZE - 1) / DIG_SIZE);
  933. dest->len = mpn_shl(dest->dig, lhs->dig, lhs->len, rhs);
  934. dest->neg = lhs->neg;
  935. }
  936. }
  937. /* computes dest = lhs >> rhs
  938. can have dest, lhs the same
  939. */
  940. void mpz_shr_inpl(mpz_t *dest, const mpz_t *lhs, mp_uint_t rhs) {
  941. if (lhs->len == 0 || rhs == 0) {
  942. mpz_set(dest, lhs);
  943. } else {
  944. mpz_need_dig(dest, lhs->len);
  945. dest->len = mpn_shr(dest->dig, lhs->dig, lhs->len, rhs);
  946. dest->neg = lhs->neg;
  947. if (dest->neg) {
  948. // arithmetic shift right, rounding to negative infinity
  949. mp_uint_t n_whole = rhs / DIG_SIZE;
  950. mp_uint_t n_part = rhs % DIG_SIZE;
  951. mpz_dig_t round_up = 0;
  952. for (size_t i = 0; i < lhs->len && i < n_whole; i++) {
  953. if (lhs->dig[i] != 0) {
  954. round_up = 1;
  955. break;
  956. }
  957. }
  958. if (n_whole < lhs->len && (lhs->dig[n_whole] & ((1 << n_part) - 1)) != 0) {
  959. round_up = 1;
  960. }
  961. if (round_up) {
  962. if (dest->len == 0) {
  963. // dest == 0, so need to add 1 by hand (answer will be -1)
  964. dest->dig[0] = 1;
  965. dest->len = 1;
  966. } else {
  967. // dest > 0, so can use mpn_add to add 1
  968. dest->len = mpn_add(dest->dig, dest->dig, dest->len, &round_up, 1);
  969. }
  970. }
  971. }
  972. }
  973. }
  974. /* computes dest = lhs + rhs
  975. can have dest, lhs, rhs the same
  976. */
  977. void mpz_add_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  978. if (mpn_cmp(lhs->dig, lhs->len, rhs->dig, rhs->len) < 0) {
  979. const mpz_t *temp = lhs;
  980. lhs = rhs;
  981. rhs = temp;
  982. }
  983. if (lhs->neg == rhs->neg) {
  984. mpz_need_dig(dest, lhs->len + 1);
  985. dest->len = mpn_add(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  986. } else {
  987. mpz_need_dig(dest, lhs->len);
  988. dest->len = mpn_sub(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  989. }
  990. dest->neg = lhs->neg & !!dest->len;
  991. }
  992. /* computes dest = lhs - rhs
  993. can have dest, lhs, rhs the same
  994. */
  995. void mpz_sub_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  996. bool neg = false;
  997. if (mpn_cmp(lhs->dig, lhs->len, rhs->dig, rhs->len) < 0) {
  998. const mpz_t *temp = lhs;
  999. lhs = rhs;
  1000. rhs = temp;
  1001. neg = true;
  1002. }
  1003. if (lhs->neg != rhs->neg) {
  1004. mpz_need_dig(dest, lhs->len + 1);
  1005. dest->len = mpn_add(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1006. } else {
  1007. mpz_need_dig(dest, lhs->len);
  1008. dest->len = mpn_sub(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1009. }
  1010. if (dest->len == 0) {
  1011. dest->neg = 0;
  1012. } else if (neg) {
  1013. dest->neg = 1 - lhs->neg;
  1014. } else {
  1015. dest->neg = lhs->neg;
  1016. }
  1017. }
  1018. /* computes dest = lhs & rhs
  1019. can have dest, lhs, rhs the same
  1020. */
  1021. void mpz_and_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1022. // make sure lhs has the most digits
  1023. if (lhs->len < rhs->len) {
  1024. const mpz_t *temp = lhs;
  1025. lhs = rhs;
  1026. rhs = temp;
  1027. }
  1028. #if MICROPY_OPT_MPZ_BITWISE
  1029. if ((0 == lhs->neg) && (0 == rhs->neg)) {
  1030. mpz_need_dig(dest, lhs->len);
  1031. dest->len = mpn_and(dest->dig, lhs->dig, rhs->dig, rhs->len);
  1032. dest->neg = 0;
  1033. } else {
  1034. mpz_need_dig(dest, lhs->len + 1);
  1035. dest->len = mpn_and_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1036. lhs->neg == rhs->neg, 0 != lhs->neg, 0 != rhs->neg);
  1037. dest->neg = lhs->neg & rhs->neg;
  1038. }
  1039. #else
  1040. mpz_need_dig(dest, lhs->len + (lhs->neg || rhs->neg));
  1041. dest->len = mpn_and_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1042. (lhs->neg == rhs->neg) ? lhs->neg : 0, lhs->neg, rhs->neg);
  1043. dest->neg = lhs->neg & rhs->neg;
  1044. #endif
  1045. }
  1046. /* computes dest = lhs | rhs
  1047. can have dest, lhs, rhs the same
  1048. */
  1049. void mpz_or_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1050. // make sure lhs has the most digits
  1051. if (lhs->len < rhs->len) {
  1052. const mpz_t *temp = lhs;
  1053. lhs = rhs;
  1054. rhs = temp;
  1055. }
  1056. #if MICROPY_OPT_MPZ_BITWISE
  1057. if ((0 == lhs->neg) && (0 == rhs->neg)) {
  1058. mpz_need_dig(dest, lhs->len);
  1059. dest->len = mpn_or(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1060. dest->neg = 0;
  1061. } else {
  1062. mpz_need_dig(dest, lhs->len + 1);
  1063. dest->len = mpn_or_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1064. 0 != lhs->neg, 0 != rhs->neg);
  1065. dest->neg = 1;
  1066. }
  1067. #else
  1068. mpz_need_dig(dest, lhs->len + (lhs->neg || rhs->neg));
  1069. dest->len = mpn_or_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1070. (lhs->neg || rhs->neg), lhs->neg, rhs->neg);
  1071. dest->neg = lhs->neg | rhs->neg;
  1072. #endif
  1073. }
  1074. /* computes dest = lhs ^ rhs
  1075. can have dest, lhs, rhs the same
  1076. */
  1077. void mpz_xor_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1078. // make sure lhs has the most digits
  1079. if (lhs->len < rhs->len) {
  1080. const mpz_t *temp = lhs;
  1081. lhs = rhs;
  1082. rhs = temp;
  1083. }
  1084. #if MICROPY_OPT_MPZ_BITWISE
  1085. if (lhs->neg == rhs->neg) {
  1086. mpz_need_dig(dest, lhs->len);
  1087. if (lhs->neg == 0) {
  1088. dest->len = mpn_xor(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1089. } else {
  1090. dest->len = mpn_xor_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len, 0, 0, 0);
  1091. }
  1092. dest->neg = 0;
  1093. } else {
  1094. mpz_need_dig(dest, lhs->len + 1);
  1095. dest->len = mpn_xor_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len, 1,
  1096. 0 == lhs->neg, 0 == rhs->neg);
  1097. dest->neg = 1;
  1098. }
  1099. #else
  1100. mpz_need_dig(dest, lhs->len + (lhs->neg || rhs->neg));
  1101. dest->len = mpn_xor_neg(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len,
  1102. (lhs->neg != rhs->neg), 0 == lhs->neg, 0 == rhs->neg);
  1103. dest->neg = lhs->neg ^ rhs->neg;
  1104. #endif
  1105. }
  1106. /* computes dest = lhs * rhs
  1107. can have dest, lhs, rhs the same
  1108. */
  1109. void mpz_mul_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1110. if (lhs->len == 0 || rhs->len == 0) {
  1111. mpz_set_from_int(dest, 0);
  1112. return;
  1113. }
  1114. mpz_t *temp = NULL;
  1115. if (lhs == dest) {
  1116. lhs = temp = mpz_clone(lhs);
  1117. if (rhs == dest) {
  1118. rhs = lhs;
  1119. }
  1120. } else if (rhs == dest) {
  1121. rhs = temp = mpz_clone(rhs);
  1122. }
  1123. mpz_need_dig(dest, lhs->len + rhs->len); // min mem l+r-1, max mem l+r
  1124. memset(dest->dig, 0, dest->alloc * sizeof(mpz_dig_t));
  1125. dest->len = mpn_mul(dest->dig, lhs->dig, lhs->len, rhs->dig, rhs->len);
  1126. if (lhs->neg == rhs->neg) {
  1127. dest->neg = 0;
  1128. } else {
  1129. dest->neg = 1;
  1130. }
  1131. mpz_free(temp);
  1132. }
  1133. /* computes dest = lhs ** rhs
  1134. can have dest, lhs, rhs the same
  1135. */
  1136. void mpz_pow_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs) {
  1137. if (lhs->len == 0 || rhs->neg != 0) {
  1138. mpz_set_from_int(dest, 0);
  1139. return;
  1140. }
  1141. if (rhs->len == 0) {
  1142. mpz_set_from_int(dest, 1);
  1143. return;
  1144. }
  1145. mpz_t *x = mpz_clone(lhs);
  1146. mpz_t *n = mpz_clone(rhs);
  1147. mpz_set_from_int(dest, 1);
  1148. while (n->len > 0) {
  1149. if ((n->dig[0] & 1) != 0) {
  1150. mpz_mul_inpl(dest, dest, x);
  1151. }
  1152. n->len = mpn_shr(n->dig, n->dig, n->len, 1);
  1153. if (n->len == 0) {
  1154. break;
  1155. }
  1156. mpz_mul_inpl(x, x, x);
  1157. }
  1158. mpz_free(x);
  1159. mpz_free(n);
  1160. }
  1161. /* computes dest = (lhs ** rhs) % mod
  1162. can have dest, lhs, rhs the same; mod can't be the same as dest
  1163. */
  1164. void mpz_pow3_inpl(mpz_t *dest, const mpz_t *lhs, const mpz_t *rhs, const mpz_t *mod) {
  1165. if (lhs->len == 0 || rhs->neg != 0 || (mod->len == 1 && mod->dig[0] == 1)) {
  1166. mpz_set_from_int(dest, 0);
  1167. return;
  1168. }
  1169. mpz_set_from_int(dest, 1);
  1170. if (rhs->len == 0) {
  1171. return;
  1172. }
  1173. mpz_t *x = mpz_clone(lhs);
  1174. mpz_t *n = mpz_clone(rhs);
  1175. mpz_t quo;
  1176. mpz_init_zero(&quo);
  1177. while (n->len > 0) {
  1178. if ((n->dig[0] & 1) != 0) {
  1179. mpz_mul_inpl(dest, dest, x);
  1180. mpz_divmod_inpl(&quo, dest, dest, mod);
  1181. }
  1182. n->len = mpn_shr(n->dig, n->dig, n->len, 1);
  1183. if (n->len == 0) {
  1184. break;
  1185. }
  1186. mpz_mul_inpl(x, x, x);
  1187. mpz_divmod_inpl(&quo, x, x, mod);
  1188. }
  1189. mpz_deinit(&quo);
  1190. mpz_free(x);
  1191. mpz_free(n);
  1192. }
  1193. #if 0
  1194. these functions are unused
  1195. /* computes gcd(z1, z2)
  1196. based on Knuth's modified gcd algorithm (I think?)
  1197. gcd(z1, z2) >= 0
  1198. gcd(0, 0) = 0
  1199. gcd(z, 0) = abs(z)
  1200. */
  1201. mpz_t *mpz_gcd(const mpz_t *z1, const mpz_t *z2) {
  1202. if (z1->len == 0) {
  1203. // TODO: handle case of z2->alloc=0
  1204. mpz_t *a = mpz_clone(z2);
  1205. a->neg = 0;
  1206. return a;
  1207. } else if (z2->len == 0) {
  1208. mpz_t *a = mpz_clone(z1);
  1209. a->neg = 0;
  1210. return a;
  1211. }
  1212. mpz_t *a = mpz_clone(z1);
  1213. mpz_t *b = mpz_clone(z2);
  1214. mpz_t c;
  1215. mpz_init_zero(&c);
  1216. a->neg = 0;
  1217. b->neg = 0;
  1218. for (;;) {
  1219. if (mpz_cmp(a, b) < 0) {
  1220. if (a->len == 0) {
  1221. mpz_free(a);
  1222. mpz_deinit(&c);
  1223. return b;
  1224. }
  1225. mpz_t *t = a;
  1226. a = b;
  1227. b = t;
  1228. }
  1229. if (!(b->len >= 2 || (b->len == 1 && b->dig[0] > 1))) { // compute b > 0; could be mpz_cmp_small_int(b, 1) > 0
  1230. break;
  1231. }
  1232. mpz_set(&c, b);
  1233. do {
  1234. mpz_add_inpl(&c, &c, &c);
  1235. } while (mpz_cmp(&c, a) <= 0);
  1236. c.len = mpn_shr(c.dig, c.dig, c.len, 1);
  1237. mpz_sub_inpl(a, a, &c);
  1238. }
  1239. mpz_deinit(&c);
  1240. if (b->len == 1 && b->dig[0] == 1) { // compute b == 1; could be mpz_cmp_small_int(b, 1) == 0
  1241. mpz_free(a);
  1242. return b;
  1243. } else {
  1244. mpz_free(b);
  1245. return a;
  1246. }
  1247. }
  1248. /* computes lcm(z1, z2)
  1249. = abs(z1) / gcd(z1, z2) * abs(z2)
  1250. lcm(z1, z1) >= 0
  1251. lcm(0, 0) = 0
  1252. lcm(z, 0) = 0
  1253. */
  1254. mpz_t *mpz_lcm(const mpz_t *z1, const mpz_t *z2) {
  1255. if (z1->len == 0 || z2->len == 0) {
  1256. return mpz_zero();
  1257. }
  1258. mpz_t *gcd = mpz_gcd(z1, z2);
  1259. mpz_t *quo = mpz_zero();
  1260. mpz_t *rem = mpz_zero();
  1261. mpz_divmod_inpl(quo, rem, z1, gcd);
  1262. mpz_mul_inpl(rem, quo, z2);
  1263. mpz_free(gcd);
  1264. mpz_free(quo);
  1265. rem->neg = 0;
  1266. return rem;
  1267. }
  1268. #endif
  1269. /* computes new integers in quo and rem such that:
  1270. quo * rhs + rem = lhs
  1271. 0 <= rem < rhs
  1272. can have lhs, rhs the same
  1273. assumes rhs != 0 (undefined behaviour if it is)
  1274. */
  1275. void mpz_divmod_inpl(mpz_t *dest_quo, mpz_t *dest_rem, const mpz_t *lhs, const mpz_t *rhs) {
  1276. assert(!mpz_is_zero(rhs));
  1277. mpz_need_dig(dest_quo, lhs->len + 1); // +1 necessary?
  1278. memset(dest_quo->dig, 0, (lhs->len + 1) * sizeof(mpz_dig_t));
  1279. dest_quo->neg = 0;
  1280. dest_quo->len = 0;
  1281. mpz_need_dig(dest_rem, lhs->len + 1); // +1 necessary?
  1282. mpz_set(dest_rem, lhs);
  1283. mpn_div(dest_rem->dig, &dest_rem->len, rhs->dig, rhs->len, dest_quo->dig, &dest_quo->len);
  1284. dest_rem->neg &= !!dest_rem->len;
  1285. // check signs and do Python style modulo
  1286. if (lhs->neg != rhs->neg) {
  1287. dest_quo->neg = !!dest_quo->len;
  1288. if (!mpz_is_zero(dest_rem)) {
  1289. mpz_t mpzone;
  1290. mpz_init_from_int(&mpzone, -1);
  1291. mpz_add_inpl(dest_quo, dest_quo, &mpzone);
  1292. mpz_add_inpl(dest_rem, dest_rem, rhs);
  1293. }
  1294. }
  1295. }
  1296. #if 0
  1297. these functions are unused
  1298. /* computes floor(lhs / rhs)
  1299. can have lhs, rhs the same
  1300. */
  1301. mpz_t *mpz_div(const mpz_t *lhs, const mpz_t *rhs) {
  1302. mpz_t *quo = mpz_zero();
  1303. mpz_t rem;
  1304. mpz_init_zero(&rem);
  1305. mpz_divmod_inpl(quo, &rem, lhs, rhs);
  1306. mpz_deinit(&rem);
  1307. return quo;
  1308. }
  1309. /* computes lhs % rhs ( >= 0)
  1310. can have lhs, rhs the same
  1311. */
  1312. mpz_t *mpz_mod(const mpz_t *lhs, const mpz_t *rhs) {
  1313. mpz_t quo;
  1314. mpz_init_zero(&quo);
  1315. mpz_t *rem = mpz_zero();
  1316. mpz_divmod_inpl(&quo, rem, lhs, rhs);
  1317. mpz_deinit(&quo);
  1318. return rem;
  1319. }
  1320. #endif
  1321. // must return actual int value if it fits in mp_int_t
  1322. mp_int_t mpz_hash(const mpz_t *z) {
  1323. mp_uint_t val = 0;
  1324. mpz_dig_t *d = z->dig + z->len;
  1325. while (d-- > z->dig) {
  1326. val = (val << DIG_SIZE) | *d;
  1327. }
  1328. if (z->neg != 0) {
  1329. val = -val;
  1330. }
  1331. return val;
  1332. }
  1333. bool mpz_as_int_checked(const mpz_t *i, mp_int_t *value) {
  1334. mp_uint_t val = 0;
  1335. mpz_dig_t *d = i->dig + i->len;
  1336. while (d-- > i->dig) {
  1337. if (val > (~(MP_OBJ_WORD_MSBIT_HIGH) >> DIG_SIZE)) {
  1338. // will overflow
  1339. return false;
  1340. }
  1341. val = (val << DIG_SIZE) | *d;
  1342. }
  1343. if (i->neg != 0) {
  1344. val = -val;
  1345. }
  1346. *value = val;
  1347. return true;
  1348. }
  1349. bool mpz_as_uint_checked(const mpz_t *i, mp_uint_t *value) {
  1350. if (i->neg != 0) {
  1351. // can't represent signed values
  1352. return false;
  1353. }
  1354. mp_uint_t val = 0;
  1355. mpz_dig_t *d = i->dig + i->len;
  1356. while (d-- > i->dig) {
  1357. if (val > (~(MP_OBJ_WORD_MSBIT_HIGH) >> (DIG_SIZE - 1))) {
  1358. // will overflow
  1359. return false;
  1360. }
  1361. val = (val << DIG_SIZE) | *d;
  1362. }
  1363. *value = val;
  1364. return true;
  1365. }
  1366. void mpz_as_bytes(const mpz_t *z, bool big_endian, size_t len, byte *buf) {
  1367. byte *b = buf;
  1368. if (big_endian) {
  1369. b += len;
  1370. }
  1371. mpz_dig_t *zdig = z->dig;
  1372. int bits = 0;
  1373. mpz_dbl_dig_t d = 0;
  1374. mpz_dbl_dig_t carry = 1;
  1375. for (size_t zlen = z->len; zlen > 0; --zlen) {
  1376. bits += DIG_SIZE;
  1377. d = (d << DIG_SIZE) | *zdig++;
  1378. for (; bits >= 8; bits -= 8, d >>= 8) {
  1379. mpz_dig_t val = d;
  1380. if (z->neg) {
  1381. val = (~val & 0xff) + carry;
  1382. carry = val >> 8;
  1383. }
  1384. if (big_endian) {
  1385. *--b = val;
  1386. if (b == buf) {
  1387. return;
  1388. }
  1389. } else {
  1390. *b++ = val;
  1391. if (b == buf + len) {
  1392. return;
  1393. }
  1394. }
  1395. }
  1396. }
  1397. // fill remainder of buf with zero/sign extension of the integer
  1398. if (big_endian) {
  1399. len = b - buf;
  1400. } else {
  1401. len = buf + len - b;
  1402. buf = b;
  1403. }
  1404. memset(buf, z->neg ? 0xff : 0x00, len);
  1405. }
  1406. #if MICROPY_PY_BUILTINS_FLOAT
  1407. mp_float_t mpz_as_float(const mpz_t *i) {
  1408. mp_float_t val = 0;
  1409. mpz_dig_t *d = i->dig + i->len;
  1410. while (d-- > i->dig) {
  1411. val = val * DIG_BASE + *d;
  1412. }
  1413. if (i->neg != 0) {
  1414. val = -val;
  1415. }
  1416. return val;
  1417. }
  1418. #endif
  1419. #if 0
  1420. this function is unused
  1421. char *mpz_as_str(const mpz_t *i, unsigned int base) {
  1422. char *s = m_new(char, mp_int_format_size(mpz_max_num_bits(i), base, NULL, '\0'));
  1423. mpz_as_str_inpl(i, base, NULL, 'a', '\0', s);
  1424. return s;
  1425. }
  1426. #endif
  1427. // assumes enough space in str as calculated by mp_int_format_size
  1428. // base must be between 2 and 32 inclusive
  1429. // returns length of string, not including null byte
  1430. size_t mpz_as_str_inpl(const mpz_t *i, unsigned int base, const char *prefix, char base_char, char comma, char *str) {
  1431. assert(str != NULL);
  1432. assert(2 <= base && base <= 32);
  1433. size_t ilen = i->len;
  1434. char *s = str;
  1435. if (ilen == 0) {
  1436. if (prefix) {
  1437. while (*prefix) {
  1438. *s++ = *prefix++;
  1439. }
  1440. }
  1441. *s++ = '0';
  1442. *s = '\0';
  1443. return s - str;
  1444. }
  1445. // make a copy of mpz digits, so we can do the div/mod calculation
  1446. mpz_dig_t *dig = m_new(mpz_dig_t, ilen);
  1447. memcpy(dig, i->dig, ilen * sizeof(mpz_dig_t));
  1448. // convert
  1449. char *last_comma = str;
  1450. bool done;
  1451. do {
  1452. mpz_dig_t *d = dig + ilen;
  1453. mpz_dbl_dig_t a = 0;
  1454. // compute next remainder
  1455. while (--d >= dig) {
  1456. a = (a << DIG_SIZE) | *d;
  1457. *d = a / base;
  1458. a %= base;
  1459. }
  1460. // convert to character
  1461. a += '0';
  1462. if (a > '9') {
  1463. a += base_char - '9' - 1;
  1464. }
  1465. *s++ = a;
  1466. // check if number is zero
  1467. done = true;
  1468. for (d = dig; d < dig + ilen; ++d) {
  1469. if (*d != 0) {
  1470. done = false;
  1471. break;
  1472. }
  1473. }
  1474. if (comma && (s - last_comma) == 3) {
  1475. *s++ = comma;
  1476. last_comma = s;
  1477. }
  1478. }
  1479. while (!done);
  1480. // free the copy of the digits array
  1481. m_del(mpz_dig_t, dig, ilen);
  1482. if (prefix) {
  1483. const char *p = &prefix[strlen(prefix)];
  1484. while (p > prefix) {
  1485. *s++ = *--p;
  1486. }
  1487. }
  1488. if (i->neg != 0) {
  1489. *s++ = '-';
  1490. }
  1491. // reverse string
  1492. for (char *u = str, *v = s - 1; u < v; ++u, --v) {
  1493. char temp = *u;
  1494. *u = *v;
  1495. *v = temp;
  1496. }
  1497. *s = '\0'; // null termination
  1498. return s - str;
  1499. }
  1500. #endif // MICROPY_LONGINT_IMPL == MICROPY_LONGINT_IMPL_MPZ