about | summary | refs | log | tree | commit | diff
path: root/src/Specific/solinas64_2e256m2e32m977
diff options
context:
space:
mode:
Diffstat (limited to 'src/Specific/solinas64_2e256m2e32m977')
-rw-r--r-- src/Specific/solinas64_2e256m2e32m977/femul.c | 59
-rw-r--r-- src/Specific/solinas64_2e256m2e32m977/femul.h | 6
-rw-r--r-- src/Specific/solinas64_2e256m2e32m977/fesquare.c | 59
-rw-r--r-- src/Specific/solinas64_2e256m2e32m977/fesquare.h | 6
-rw-r--r-- src/Specific/solinas64_2e256m2e32m977/freeze.c | 25
-rw-r--r-- src/Specific/solinas64_2e256m2e32m977/freeze.h | 6
6 files changed, 161 insertions, 0 deletions
diff --git a/src/Specific/solinas64_2e256m2e32m977/femul.c b/src/Specific/solinas64_2e256m2e32m977/femul.c
new file mode 100644
index 000000000..b6759718f
--- /dev/null
+++ b/src/Specific/solinas64_2e256m2e32m977/femul.c
@@ -0,0 +1,59 @@
+#include <stdint.h>
+#include <stdbool.h>
+#include <x86intrin.h>
+#include "liblow.h"
+
+#include "femul.h"
+
+typedef unsigned int uint128_t __attribute__((mode(TI))); // unsigned integer widened via the GCC 'mode' attribute; TI is the 16-byte integer machine mode
+
+#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) // taken only for GCC proper (clang and ICC are excluded)
+// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
+#define _subborrow_u32 __builtin_ia32_sbb_u32 // alias the intrinsic name to the GCC builtin; not referenced by the code visible in this file
+#define _subborrow_u64 __builtin_ia32_sbb_u64 // 64-bit counterpart of the alias above
+#endif
+
+#undef force_inline
+#define force_inline __attribute__((always_inline)) // the #undef above drops any earlier definition (femul.h defines the same macro)
+
+void force_inline femul(uint64_t* out, uint64_t x10, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x18, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13) // Stores five words in out[0..4], built from products pairing one of {x5,x7,x9,x11,x10} with one of {x13,x15,x17,x19,x18}; presumably multiplication mod 2^256 - 2^32 - 977 per the directory name — confirm.
+{ uint128_t x20 = (((uint128_t)x5 * x18) + ((0x2 * ((uint128_t)x7 * x19)) + ((0x2 * ((uint128_t)x9 * x17)) + ((0x2 * ((uint128_t)x11 * x15)) + ((uint128_t)x10 * x13))))); // x20: 128-bit sum of five cross products, three of them doubled
+{ ℤ x21 = ((((uint128_t)x5 * x19) + ((0x2 * ((uint128_t)x7 * x17)) + ((0x2 * ((uint128_t)x9 * x15)) + ((uint128_t)x11 * x13)))) +ℤ ((0x3d1 * ((uint128_t)x10 * x18)) +ℤ (0x100000000 *ℤ ((uint128_t)x10 * x18)))); // NOTE(review): 'ℤ', '+ℤ' and '*ℤ' are not C tokens, so x21..x24 will not compile; they look like unbounded-integer placeholders left by the generator — confirm. 0x3d1 == 977, 0x100000000 == 2^32.
+{ ℤ x22 = ((((uint128_t)x5 * x17) + ((0x2 * ((uint128_t)x7 * x15)) + ((uint128_t)x9 * x13))) +ℤ ((0x3d1 * (((uint128_t)x11 * x18) + ((uint128_t)x10 * x19))) +ℤ (0x100000000 *ℤ (((uint128_t)x11 * x18) + ((uint128_t)x10 * x19)))));
+{ ℤ x23 = ((((uint128_t)x5 * x15) + ((uint128_t)x7 * x13)) +ℤ ((0x3d1 * (((uint128_t)x9 * x18) + (((uint128_t)x11 * x19) + ((uint128_t)x10 * x17)))) +ℤ (0x100000000 *ℤ (((uint128_t)x9 * x18) + (((uint128_t)x11 * x19) + ((uint128_t)x10 * x17))))));
+{ ℤ x24 = (((uint128_t)x5 * x13) +ℤ ((0x3d1 * ((0x2 * ((uint128_t)x7 * x18)) + ((0x2 * ((uint128_t)x9 * x19)) + ((0x2 * ((uint128_t)x11 * x17)) + (0x2 * ((uint128_t)x10 * x15)))))) +ℤ (0x100000000 *ℤ ((0x2 * ((uint128_t)x7 * x18)) + ((0x2 * ((uint128_t)x9 * x19)) + ((0x2 * ((uint128_t)x11 * x17)) + (0x2 * ((uint128_t)x10 * x15))))))));
+{ uint64_t x25 = (uint64_t) (x20 >> 0x33); // split x20 at bit 51 (0x33): x25 is the shifted-out part truncated to 64 bits, x26 (next line) the low 51 bits
+{ uint64_t x26 = ((uint64_t)x20 & 0x7ffffffffffff);
+{ uint128_t x27 = (((uint128_t)0x8000000000000 * x25) + x26); // recombine as x25 * 2^51 + x26
+{ uint64_t x28 = (uint64_t) (x27 >> 0x33); // the same split/recombine is repeated on x27, then x30 is split into x31 (high part) and x32 (low 51 bits)
+{ uint64_t x29 = ((uint64_t)x27 & 0x7ffffffffffff);
+{ uint128_t x30 = (((uint128_t)0x8000000000000 * x28) + x29);
+{ uint64_t x31 = (uint64_t) (x30 >> 0x33);
+{ uint64_t x32 = ((uint64_t)x30 & 0x7ffffffffffff);
+{ ℤ x33 = (x24 +ℤ (((uint128_t)0x3d1 * x31) + ((uint128_t)0x100000000 * x31))); // adds 0x3d1 * x31 and 0x100000000 * x31 to x24
+{ uint128_t x34 = (x33 >> 0x34); // split x33 at bit 52 (0x34): x34 is carried into x23 below, x35 keeps the low 52 bits
+{ uint64_t x35 = (x33 & 0xfffffffffffff);
+{ ℤ x36 = (x34 +ℤ x23); // carry chain: add the shifted-out part to the next accumulator, then split at bit 51; repeated for x23, x22 and x21
+{ uint128_t x37 = (x36 >> 0x33);
+{ uint64_t x38 = (x36 & 0x7ffffffffffff);
+{ ℤ x39 = (x37 +ℤ x22);
+{ uint128_t x40 = (x39 >> 0x33);
+{ uint64_t x41 = (x39 & 0x7ffffffffffff);
+{ ℤ x42 = (x40 +ℤ x21);
+{ uint128_t x43 = (x42 >> 0x33);
+{ uint64_t x44 = (x42 & 0x7ffffffffffff);
+{ uint128_t x45 = (x43 + x32); // add the last carry x43 to x32 (the low 51 bits of x30)
+{ uint64_t x46 = (uint64_t) (x45 >> 0x33);
+{ uint64_t x47 = ((uint64_t)x45 & 0x7ffffffffffff);
+{ uint128_t x48 = (x35 + ((0x3d1 * x46) + ((uint128_t)0x100000000 * x46))); // adds 0x3d1 * x46 and 0x100000000 * x46 to x35; the 0x3d1 term has no uint128_t cast, so that product is a 64-bit multiply
+{ uint64_t x49 = (uint64_t) (x48 >> 0x34);
+{ uint64_t x50 = ((uint64_t)x48 & 0xfffffffffffff);
+{ uint64_t x51 = (x50 >> 0x34); // x50 was just masked to its low 52 bits, so this shift by 52 always yields 0
+{ uint64_t x52 = (x50 & 0xfffffffffffff); // likewise this mask leaves x50 unchanged
+out[0] = x47;
+out[1] = x44;
+out[2] = x41;
+out[3] = x51 + x49 + x38; // x51 is always 0 (see its definition), so this equals x49 + x38
+out[4] = x52;
+}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}
+// caller: uint64_t out[5];
diff --git a/src/Specific/solinas64_2e256m2e32m977/femul.h b/src/Specific/solinas64_2e256m2e32m977/femul.h
new file mode 100644
index 000000000..0e096575c
--- /dev/null
+++ b/src/Specific/solinas64_2e256m2e32m977/femul.h
@@ -0,0 +1,6 @@
+#include <stdint.h>
+
+#undef force_inline
+#define force_inline __attribute__((always_inline)) // same expansion femul.c uses; the #undef above makes redefining it harmless
+
+void force_inline femul(uint64_t* out, uint64_t x10, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x18, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13); // prototype for the definition in femul.c, which writes out[0..4]
diff --git a/src/Specific/solinas64_2e256m2e32m977/fesquare.c b/src/Specific/solinas64_2e256m2e32m977/fesquare.c
new file mode 100644
index 000000000..5a7485a7c
--- /dev/null
+++ b/src/Specific/solinas64_2e256m2e32m977/fesquare.c
@@ -0,0 +1,59 @@
+#include <stdint.h>
+#include <stdbool.h>
+#include <x86intrin.h>
+#include "liblow.h"
+
+#include "fesquare.h"
+
+typedef unsigned int uint128_t __attribute__((mode(TI))); // unsigned integer widened via the GCC 'mode' attribute; TI is the 16-byte integer machine mode
+
+#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) // taken only for GCC proper (clang and ICC are excluded)
+// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
+#define _subborrow_u32 __builtin_ia32_sbb_u32 // alias the intrinsic name to the GCC builtin; not referenced by the code visible in this file
+#define _subborrow_u64 __builtin_ia32_sbb_u64 // 64-bit counterpart of the alias above
+#endif
+
+#undef force_inline
+#define force_inline __attribute__((always_inline)) // the #undef above drops any earlier definition (fesquare.h defines the same macro)
+
+void force_inline fesquare(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2) // Stores five words in out[0..4], built from products of the five inputs with each other; presumably squaring mod 2^256 - 2^32 - 977 per the directory name — confirm.
+{ uint128_t x9 = (((uint128_t)x2 * x7) + ((0x2 * ((uint128_t)x4 * x8)) + ((0x2 * ((uint128_t)x6 * x6)) + ((0x2 * ((uint128_t)x8 * x4)) + ((uint128_t)x7 * x2))))); // x9: 128-bit sum of five products of the inputs, three of them doubled
+{ ℤ x10 = ((((uint128_t)x2 * x8) + ((0x2 * ((uint128_t)x4 * x6)) + ((0x2 * ((uint128_t)x6 * x4)) + ((uint128_t)x8 * x2)))) +ℤ ((0x3d1 * ((uint128_t)x7 * x7)) +ℤ (0x100000000 *ℤ ((uint128_t)x7 * x7)))); // NOTE(review): 'ℤ', '+ℤ' and '*ℤ' are not C tokens, so x10..x13 will not compile; they look like unbounded-integer placeholders left by the generator — confirm. 0x3d1 == 977, 0x100000000 == 2^32.
+{ ℤ x11 = ((((uint128_t)x2 * x6) + ((0x2 * ((uint128_t)x4 * x4)) + ((uint128_t)x6 * x2))) +ℤ ((0x3d1 * (((uint128_t)x8 * x7) + ((uint128_t)x7 * x8))) +ℤ (0x100000000 *ℤ (((uint128_t)x8 * x7) + ((uint128_t)x7 * x8)))));
+{ ℤ x12 = ((((uint128_t)x2 * x4) + ((uint128_t)x4 * x2)) +ℤ ((0x3d1 * (((uint128_t)x6 * x7) + (((uint128_t)x8 * x8) + ((uint128_t)x7 * x6)))) +ℤ (0x100000000 *ℤ (((uint128_t)x6 * x7) + (((uint128_t)x8 * x8) + ((uint128_t)x7 * x6))))));
+{ ℤ x13 = (((uint128_t)x2 * x2) +ℤ ((0x3d1 * ((0x2 * ((uint128_t)x4 * x7)) + ((0x2 * ((uint128_t)x6 * x8)) + ((0x2 * ((uint128_t)x8 * x6)) + (0x2 * ((uint128_t)x7 * x4)))))) +ℤ (0x100000000 *ℤ ((0x2 * ((uint128_t)x4 * x7)) + ((0x2 * ((uint128_t)x6 * x8)) + ((0x2 * ((uint128_t)x8 * x6)) + (0x2 * ((uint128_t)x7 * x4))))))));
+{ uint64_t x14 = (uint64_t) (x9 >> 0x33); // split x9 at bit 51 (0x33): x14 is the shifted-out part truncated to 64 bits, x15 (next line) the low 51 bits
+{ uint64_t x15 = ((uint64_t)x9 & 0x7ffffffffffff);
+{ uint128_t x16 = (((uint128_t)0x8000000000000 * x14) + x15); // recombine as x14 * 2^51 + x15
+{ uint64_t x17 = (uint64_t) (x16 >> 0x33); // the same split/recombine is repeated on x16, then x19 is split into x20 (high part) and x21 (low 51 bits)
+{ uint64_t x18 = ((uint64_t)x16 & 0x7ffffffffffff);
+{ uint128_t x19 = (((uint128_t)0x8000000000000 * x17) + x18);
+{ uint64_t x20 = (uint64_t) (x19 >> 0x33);
+{ uint64_t x21 = ((uint64_t)x19 & 0x7ffffffffffff);
+{ ℤ x22 = (x13 +ℤ (((uint128_t)0x3d1 * x20) + ((uint128_t)0x100000000 * x20))); // adds 0x3d1 * x20 and 0x100000000 * x20 to x13
+{ uint128_t x23 = (x22 >> 0x34); // split x22 at bit 52 (0x34): x23 is carried into x12 below, x24 keeps the low 52 bits
+{ uint64_t x24 = (x22 & 0xfffffffffffff);
+{ ℤ x25 = (x23 +ℤ x12); // carry chain: add the shifted-out part to the next accumulator, then split at bit 51; repeated for x12, x11 and x10
+{ uint128_t x26 = (x25 >> 0x33);
+{ uint64_t x27 = (x25 & 0x7ffffffffffff);
+{ ℤ x28 = (x26 +ℤ x11);
+{ uint128_t x29 = (x28 >> 0x33);
+{ uint64_t x30 = (x28 & 0x7ffffffffffff);
+{ ℤ x31 = (x29 +ℤ x10);
+{ uint128_t x32 = (x31 >> 0x33);
+{ uint64_t x33 = (x31 & 0x7ffffffffffff);
+{ uint128_t x34 = (x32 + x21); // add the last carry x32 to x21 (the low 51 bits of x19)
+{ uint64_t x35 = (uint64_t) (x34 >> 0x33);
+{ uint64_t x36 = ((uint64_t)x34 & 0x7ffffffffffff);
+{ uint128_t x37 = (x24 + ((0x3d1 * x35) + ((uint128_t)0x100000000 * x35))); // adds 0x3d1 * x35 and 0x100000000 * x35 to x24; the 0x3d1 term has no uint128_t cast, so that product is a 64-bit multiply
+{ uint64_t x38 = (uint64_t) (x37 >> 0x34);
+{ uint64_t x39 = ((uint64_t)x37 & 0xfffffffffffff);
+{ uint64_t x40 = (x39 >> 0x34); // x39 was just masked to its low 52 bits, so this shift by 52 always yields 0
+{ uint64_t x41 = (x39 & 0xfffffffffffff); // likewise this mask leaves x39 unchanged
+out[0] = x36;
+out[1] = x33;
+out[2] = x30;
+out[3] = x40 + x38 + x27; // x40 is always 0 (see its definition), so this equals x38 + x27
+out[4] = x41;
+}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}
+// caller: uint64_t out[5];
diff --git a/src/Specific/solinas64_2e256m2e32m977/fesquare.h b/src/Specific/solinas64_2e256m2e32m977/fesquare.h
new file mode 100644
index 000000000..2cfd2d5a8
--- /dev/null
+++ b/src/Specific/solinas64_2e256m2e32m977/fesquare.h
@@ -0,0 +1,6 @@
+#include <stdint.h>
+
+#undef force_inline
+#define force_inline __attribute__((always_inline)) // same expansion fesquare.c uses; the #undef above makes redefining it harmless
+
+void force_inline fesquare(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2); // prototype for the definition in fesquare.c, which writes out[0..4]
diff --git a/src/Specific/solinas64_2e256m2e32m977/freeze.c b/src/Specific/solinas64_2e256m2e32m977/freeze.c
new file mode 100644
index 000000000..5c8088e2e
--- /dev/null
+++ b/src/Specific/solinas64_2e256m2e32m977/freeze.c
@@ -0,0 +1,25 @@
+#include <stdint.h>
+#include <stdbool.h>
+#include <x86intrin.h>
+#include "liblow.h"
+
+#include "freeze.h"
+
+typedef unsigned int uint128_t __attribute__((mode(TI))); // unsigned integer widened via the GCC 'mode' attribute; TI is the 16-byte integer machine mode
+
+#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) // taken only for GCC proper (clang and ICC are excluded)
+// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
+#define _subborrow_u32 __builtin_ia32_sbb_u32 // alias the intrinsic name to the GCC builtin; no call to it appears in the visible body of this file
+#define _subborrow_u64 __builtin_ia32_sbb_u64 // 64-bit counterpart of the alias above
+#endif
+
+#undef force_inline
+#define force_inline __attribute__((always_inline)) // the #undef above drops any earlier definition (freeze.h defines the same macro)
+
+void force_inline freeze(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2) // NOTE(review): no '{' opens a body before the statements below, although a '}' closes one — not valid C as written
+out[0] = uint64_t x10; // NOTE(review): a declaration ('uint64_t x10') appears where an expression is required, and x10 is never given a value
+out[1] = uint8_t x11 = Op Syntax.SubWithGetBorrow 52 Syntax.TWord 3 Syntax.TWord 6 Syntax.TWord 6 Syntax.TWord 6 Syntax.TWord 3 0x0; // NOTE(review): 'Op Syntax.SubWithGetBorrow ...' is not C; presumably untranslated generator output from a failed code-generation run — confirm and regenerate
+out[2] = x2; // copies the input x2 through unchanged
+out[3] = 0xffffefffffc2f;; // 0xffffefffffc2f == 2^52 - 2^32 - 977; the second ';' is an empty statement
+}
+// caller: uint64_t out[4];
diff --git a/src/Specific/solinas64_2e256m2e32m977/freeze.h b/src/Specific/solinas64_2e256m2e32m977/freeze.h
new file mode 100644
index 000000000..d296b2d57
--- /dev/null
+++ b/src/Specific/solinas64_2e256m2e32m977/freeze.h
@@ -0,0 +1,6 @@
+#include <stdint.h>
+
+#undef force_inline
+#define force_inline __attribute__((always_inline)) // same expansion freeze.c uses; the #undef above makes redefining it harmless
+
+void force_inline freeze(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2); // prototype for freeze in freeze.c; NOTE(review): that definition is not valid C as committed — confirm before relying on it