aboutsummaryrefslogtreecommitdiff
path: root/src/String/Inline/Mpi.h
diff options
context:
space:
mode:
Diffstat (limited to 'src/String/Inline/Mpi.h')
-rw-r--r--src/String/Inline/Mpi.h499
1 files changed, 499 insertions, 0 deletions
diff --git a/src/String/Inline/Mpi.h b/src/String/Inline/Mpi.h
new file mode 100644
index 0000000..efaa388
--- /dev/null
+++ b/src/String/Inline/Mpi.h
@@ -0,0 +1,499 @@
+/* Platform dependant definition */
+#ifndef BH_TWEAK_SHORT_BINT
+#define MPI_SIZE 40
+#define MPI_TYPE uint32_t
+#define MPI_TTYPE uint64_t
+#define MPI_BITS 32
+#define MPI_MASK 0xFFFFFFFFul
+#else
+#define MPI_SIZE 80
+#define MPI_TYPE uint16_t
+#define MPI_TTYPE uint32_t
+#define MPI_BITS 16
+#define MPI_MASK 0xFFFFu
+#endif
+
+
+typedef struct Mpi {
+ int size;
+ MPI_TYPE data[MPI_SIZE];
+} Mpi;
+
+
+static const uint8_t clzLookup[256] =
+{
+ 8, 7, 6, 6, 5, 5, 5, 5, 4, 4, 4, 4, 4, 4, 4, 4,
+ 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3,
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
+ 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0
+};
+
+
+#ifndef BH_TWEAK_SHORT_BINT
+static const Mpi BInt1 = {1, {0x00000001ul}};
+static const Mpi BInt53 = {2, {0x00000000ul, 0x00200000ul}};
+
+
+static const Mpi powLookup[] =
+{
+ {1, {0x0000000Aul}},
+ {1, {0x00000064ul}},
+ {1, {0x00002710ul}},
+ {1, {0x05F5E100ul}},
+ {2, {0x6FC10000ul, 0x002386F2ul}},
+ {4, {0x00000000ul, 0x85ACEF81ul, 0x2D6D415Bul, 0x000004EEul}},
+ {7, {0x00000000ul, 0x00000000ul, 0xBF6A1F01ul, 0x6E38ED64ul, 0xDAA797EDul,
+ 0xE93FF9F4ul, 0x00184F03ul}},
+ {14, {0x00000000ul, 0x00000000ul, 0x00000000ul, 0x00000000ul, 0x2E953E01ul,
+ 0x03DF9909ul, 0x0F1538FDul, 0x2374E42Ful, 0xD3CFF5ECul, 0xC404DC08ul,
+ 0xBCCDB0DAul, 0xA6337F19ul, 0xE91F2603ul, 0x0000024Eul}},
+ {27, {0x00000000ul, 0x00000000ul, 0x00000000ul, 0x00000000ul, 0x00000000ul,
+ 0x00000000ul, 0x00000000ul, 0x00000000ul, 0x982E7C01ul, 0xBED3875Bul,
+ 0xD8D99F72ul, 0x12152F87ul, 0x6BDE50C6ul, 0xCF4A6E70ul, 0xD595D80Ful,
+ 0x26B2716Eul, 0xADC666B0ul, 0x1D153624ul, 0x3C42D35Aul, 0x63FF540Eul,
+ 0xCC5573C0ul, 0x65F9EF17ul, 0x55BC28F2ul, 0x80DCC7F7ul, 0xF46EEDDCul,
+ 0x5FDCEFCEul, 0x000553F7ul}}
+};
+
+
+static int MpiClz(MPI_TYPE value)
+{
+ if (value & 0xFF000000ul)
+ return clzLookup[(value >> 24) & 0xFF];
+ else if (value & 0x00FF0000ul)
+ return 8 + clzLookup[(value >> 16) & 0xFF];
+ else if (value & 0x0000FF00ul)
+ return 16 + clzLookup[(value >> 8) & 0xFF];
+ else
+ return 24 + clzLookup[value & 0xFF];
+}
+#else
+static const Mpi BInt1 = {1, {0x0001u}};
+static const Mpi BInt53 = {4, {0x0000u, 0x0000u, 0x0000u, 0x0020u}};
+
+
+static const Mpi powLookup[] =
+{
+ {1, {0x000Au}},
+ {1, {0x0064u}},
+ {1, {0x2710u}},
+ {2, {0xE100u, 0x05F5u}},
+ {4, {0x0000u, 0x6FC1u, 0x86F2u, 0x0023u}},
+ {7, {0x0000u, 0x0000u, 0xEF81u, 0x85ACu, 0x415Bu, 0x2D6Du, 0x04EEu}},
+ {14, {0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x1F01u, 0xBF6Au, 0xED64u,
+ 0x6E38u, 0x97EDu, 0xDAA7u, 0xF9F4u, 0xE93Fu, 0x4F03u, 0x0018u}},
+ {27, {0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u,
+ 0x0000u, 0x3E01u, 0x2E95u, 0x9909u, 0x03DFu, 0x38FDu, 0x0F15u,
+ 0xE42Fu, 0x2374u, 0xF5ECu, 0xD3CFu, 0xDC08u, 0xC404u, 0xB0DAu,
+ 0xBCCDu, 0x7F19u, 0xA633u, 0x2603u, 0xE91Fu, 0x024Eu}},
+ {54, {0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u,
+ 0x0000u,
+ 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u, 0x0000u,
+ 0x0000u, 0x7C01u, 0x982Eu, 0x875Bu, 0xBED3u, 0x9F72u, 0xD8D9u,
+ 0x2F87u, 0x1215u, 0x50C6u, 0x6BDEu, 0x6E70u, 0xCF4Au, 0xD80Fu,
+ 0xD595u, 0x716Eu, 0x26B2u, 0x66B0u, 0xADC6u, 0x3624u, 0x1D15u,
+ 0xD35Au, 0x3C42u, 0x540Eu, 0x63FFu, 0x73C0u, 0xCC55u, 0xEF17u,
+ 0x65F9u, 0x28F2u, 0x55BCu, 0xC7F7u, 0x80DCu, 0xEDDCu, 0xF46Eu,
+ 0xEFCEu, 0x5FDCu, 0x53F7u, 0x0005u}}
+};
+
+
+static int MpiClz(MPI_TYPE value)
+{
+ if (value & 0xFF00)
+ return clzLookup[(value >> 8) & 0xFF];
+ else
+ return 8 + clzLookup[value & 0xFF];
+}
+#endif
+
+
+static int MpiLog2(const Mpi *in)
+{
+ /* Preconditions */
+ assert(in != NULL);
+ assert(in->size != 0);
+ assert(in->data[in->size - 1] != 0);
+
+ return (MPI_BITS - 1) - MpiClz(in->data[in->size - 1]) + MPI_BITS * (in->size - 1);
+}
+
+
+static void MpiTrim(Mpi *in)
+{
+ /* Preconditions */
+ assert(in != NULL);
+
+ while (in->size && !in->data[in->size - 1])
+ in->size--;
+}
+
+
+static int MpiCompare(const Mpi *a,
+ const Mpi *b)
+{
+ int i;
+
+ /* Preconditions */
+ assert(a != NULL && b != NULL);
+
+ /* Compare by lengths */
+ i = a->size - b->size;
+ if (a->size - b->size)
+ return a->size - b->size;
+
+ /* Compare by blocks */
+ for (i = a->size; i; i--)
+ {
+ if (a->data[i - 1] < b->data[i - 1])
+ return -1;
+ else if (a->data[i - 1] > b->data[i - 1])
+ return 1;
+ }
+
+ return 0;
+}
+
+
+static void MpiAdd(const Mpi *a,
+ const Mpi *b,
+ Mpi *out)
+{
+ MPI_TTYPE carry;
+ int i;
+
+ /* Preconditions */
+ assert(a != NULL && b != NULL && out != NULL);
+ assert(a->size + 1 <= MPI_SIZE);
+ assert(b->size + 1 <= MPI_SIZE);
+
+ /* Addition loop */
+ carry = 0;
+ for (i = 0; i < a->size || i < b->size; i++)
+ {
+ if (i < a->size)
+ carry += a->data[i];
+ if (i < b->size)
+ carry += b->data[i];
+
+ out->data[i] = carry & MPI_MASK;
+ carry = (carry >> MPI_BITS);
+ }
+
+ /* Handle new digit */
+ if (carry)
+ out->data[i++] = carry;
+
+ out->size = i;
+}
+
+
+static void MpiSub(const Mpi *a,
+ const Mpi *b,
+ Mpi *out)
+{
+ MPI_TTYPE carry;
+ int i;
+
+ /* Preconditions */
+ assert(a != NULL && b != NULL && out != NULL);
+ assert(MpiCompare(a, b) >= 0);
+
+ /* Main subtraction loop */
+ carry = 0;
+ for (i = 0; i < a->size || i < b->size; i++)
+ {
+ if (i < a->size)
+ carry += a->data[i];
+ if (i < b->size)
+ carry -= b->data[i];
+
+ out->data[i] = carry & MPI_MASK;
+ carry = carry >> MPI_BITS;
+ carry |= (carry << MPI_BITS);
+ }
+
+ /* Trim leading zeros */
+ out->size = a->size;
+ MpiTrim(out);
+}
+
+
+static void MpiMul(const Mpi *a,
+ const Mpi *b,
+ Mpi *out)
+{
+ MPI_TTYPE carry;
+ int i, j;
+
+ /* Preconditions */
+ assert(a != NULL && b != NULL && out != NULL);
+ assert(a->size + b->size <= MPI_SIZE);
+
+ /* Zero out the result */
+ memset(out->data, 0, sizeof(out->data));
+
+ /* Multiplication loop */
+ for (i = 0; i < a->size; i++)
+ {
+ carry = 0;
+ for (j = 0; j < b->size; j++)
+ {
+ carry += out->data[i + j];
+ carry += (MPI_TTYPE)a->data[i] * (MPI_TTYPE)b->data[j];
+ out->data[i + j] = carry & MPI_MASK;
+ carry = (carry >> MPI_BITS);
+ }
+ out->data[i + j] += carry;
+ }
+
+ /* Trim leading zeros */
+ out->size = a->size + b->size;
+ MpiTrim(out);
+}
+
+
+static void MpiMulDigit(const Mpi *a,
+ MPI_TYPE b,
+ Mpi *out)
+{
+ MPI_TTYPE carry;
+ int i;
+
+ /* Preconditions */
+ assert(a != NULL && out != NULL);
+ assert(a->size + 1 <= MPI_SIZE);
+
+ /* Multiplication loop */
+ carry = 0;
+ for (i = 0; i < a->size; i++)
+ {
+ carry += (MPI_TTYPE)a->data[i] * b;
+ out->data[i] = carry & MPI_MASK;
+ carry = (carry >> MPI_BITS);
+ }
+ out->data[i] = carry;
+
+ /* Trim leading zeros */
+ out->size = a->size + 1;
+ MpiTrim(out);
+}
+
+
+static void MpiPow10(const Mpi *in,
+ int exponent,
+ Mpi *out,
+ Mpi *tmp)
+{
+ int i, current;
+
+ /* Preconditions */
+ assert(in != NULL && out != NULL && tmp != NULL);
+ assert(exponent >= 0 && exponent < 512);
+
+ tmp[0] = *in;
+ for (current = 0, i = 0; exponent; i++, exponent >>= 1)
+ {
+ if (!(exponent & 0x1))
+ continue;
+
+ MpiMul(&tmp[current], &powLookup[i], &tmp[1 - current]);
+ current = 1 - current;
+ }
+ *out = tmp[current];
+}
+
+
+static void MpiLsh(const Mpi *in,
+ int amount,
+ Mpi *out)
+{
+ int blocks, bits, i;
+ MPI_TYPE low, high;
+
+ /* Preconditions */
+ assert(in != NULL && out != NULL);
+ assert(amount >= 0 && in->size + (amount + MPI_BITS - 1) / MPI_BITS <= MPI_SIZE);
+
+ blocks = amount / MPI_BITS;
+ bits = amount % MPI_BITS;
+ if (!in->size)
+ {
+ out->size = 0;
+ return;
+ }
+
+ /* Main shift loop */
+ if (bits)
+ {
+ high = 0;
+ for (i = in->size + blocks; i > blocks; i--)
+ {
+ low = in->data[i - blocks - 1] >> (MPI_BITS - bits);
+ out->data[i] = low | high;
+ high = in->data[i - blocks - 1] << bits;
+ }
+ out->data[i] = high;
+ out->size = in->size + blocks + 1;
+ }
+ else
+ {
+ for (i = in->size; i; i--)
+ out->data[i - 1 + blocks] = in->data[i - 1];
+ out->size = in->size + blocks;
+ }
+
+ /* Trim leading zeros and zero out lower blocks */
+ MpiTrim(out);
+ for (i = blocks; i; i--)
+ out->data[i - 1] = 0;
+}
+
+
+static void MpiRsh(const Mpi *in,
+ int amount,
+ Mpi *out)
+{
+ int blocks, bits, i;
+ MPI_TYPE low, high;
+
+ /* Preconditions */
+ assert(in != NULL && out != NULL);
+ assert(amount >= 0);
+
+ blocks = amount / MPI_BITS;
+ bits = amount % MPI_BITS;
+
+ /* Zero size input or shift is bigger then input */
+ if (in->size == 0 || in->size <= blocks)
+ {
+ out->size = 0;
+ return;
+ }
+
+ /* Shift and copy parts of two blocks */
+ if (bits)
+ {
+ low = in->data[blocks] >> bits;
+ high = 0;
+ for (i = 0; i < in->size - blocks - 1; i++)
+ {
+ high = in->data[i + blocks + 1] << (MPI_BITS - bits);
+ out->data[i] = low | high;
+ low = in->data[i + blocks + 1] >> bits;
+ }
+ out->data[in->size - blocks - 1] = low;
+ }
+ else
+ {
+ for (i = 0; i < in->size - blocks; i++)
+ out->data[i] = out->data[i + blocks];
+ }
+
+ /* Trim leading zeros */
+ out->size = in->size - blocks;
+ MpiTrim(out);
+}
+
+
+static MPI_TTYPE MpiGuess(const Mpi *a,
+ const Mpi *b)
+{
+ MPI_TTYPE tmp;
+
+ /* Preconditions */
+ assert(a != NULL && b != NULL);
+ assert(a->size > 0 && b->size > 0);
+ assert((a->size == b->size) || ((a->size != b->size) && a->size > 1));
+
+ if (MpiCompare(a, b) < 0)
+ return 0;
+
+ tmp = a->data[a->size - 1];
+ if (a->size != b->size)
+ tmp = (tmp << MPI_BITS) | a->data[a->size - 2];
+
+ return tmp / b->data[b->size - 1];
+}
+
+
+static void MpiDiv(const Mpi *a,
+ const Mpi *b,
+ Mpi *q,
+ Mpi *r,
+ Mpi *tmp)
+{
+ MPI_TTYPE digit;
+ int shift;
+
+ /* Preconditions */
+ assert(a != NULL && b != NULL && q != NULL && r != NULL && tmp != NULL);
+ assert(b->size != 0);
+
+ /* Handle case where a is less then b */
+ if (MpiCompare(a, b) < 0)
+ {
+ *r = *a;
+ q->size = 0;
+ return;
+ }
+
+ /* Normilize input to reduce tries */
+ shift = MpiClz(b->data[b->size - 1]);
+ MpiLsh(a, shift, &tmp[0]);
+ MpiLsh(b, shift, &tmp[1]);
+
+ /* Prepare first step of the division */
+ q->size = 0;
+ r->size = 0;
+ while (MpiCompare(r, &tmp[1]) < 0)
+ {
+ MpiLsh(r, MPI_BITS, r);
+ r->data[0] = tmp[0].data[--tmp[0].size];
+ r->size += !r->size;
+ }
+
+ while (1)
+ {
+ /* Make a guess and check */
+ digit = MpiGuess(r, &tmp[1]);
+ while (digit > MPI_MASK)
+ digit--;
+ MpiMulDigit(&tmp[1], digit, &tmp[2]);
+ while (MpiCompare(r, &tmp[2]) < 0)
+ {
+ --digit;
+ MpiSub(&tmp[2], &tmp[1], &tmp[2]);
+ }
+
+ /* Store digit in quotient */
+ MpiSub(r, &tmp[2], r);
+ MpiLsh(q, MPI_BITS, q);
+ q->data[0] = digit;
+ q->size += !q->size;
+
+ /* Fetch next digit or exit */
+ if (!tmp[0].size)
+ break;
+
+ MpiLsh(r, MPI_BITS, r);
+ r->data[0] = tmp[0].data[--tmp[0].size];
+ if (!r->size)
+ r->size = 1;
+ }
+
+ /* Normilize remainder */
+ MpiRsh(r, shift, r);
+}