diff options
Diffstat (limited to 'src/Specific/solinas64_2e256m2e32m977')
-rw-r--r-- | src/Specific/solinas64_2e256m2e32m977/femul.c | 59 | ||||
-rw-r--r-- | src/Specific/solinas64_2e256m2e32m977/femul.h | 6 | ||||
-rw-r--r-- | src/Specific/solinas64_2e256m2e32m977/fesquare.c | 59 | ||||
-rw-r--r-- | src/Specific/solinas64_2e256m2e32m977/fesquare.h | 6 | ||||
-rw-r--r-- | src/Specific/solinas64_2e256m2e32m977/freeze.c | 25 | ||||
-rw-r--r-- | src/Specific/solinas64_2e256m2e32m977/freeze.h | 6 |
6 files changed, 161 insertions, 0 deletions
diff --git a/src/Specific/solinas64_2e256m2e32m977/femul.c b/src/Specific/solinas64_2e256m2e32m977/femul.c new file mode 100644 index 000000000..b6759718f --- /dev/null +++ b/src/Specific/solinas64_2e256m2e32m977/femul.c @@ -0,0 +1,59 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "femul.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline femul(uint64_t* out, uint64_t x10, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x18, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13) +{ uint128_t x20 = (((uint128_t)x5 * x18) + ((0x2 * ((uint128_t)x7 * x19)) + ((0x2 * ((uint128_t)x9 * x17)) + ((0x2 * ((uint128_t)x11 * x15)) + ((uint128_t)x10 * x13))))); +{ ℤ x21 = ((((uint128_t)x5 * x19) + ((0x2 * ((uint128_t)x7 * x17)) + ((0x2 * ((uint128_t)x9 * x15)) + ((uint128_t)x11 * x13)))) +ℤ ((0x3d1 * ((uint128_t)x10 * x18)) +ℤ (0x100000000 *ℤ ((uint128_t)x10 * x18)))); +{ ℤ x22 = ((((uint128_t)x5 * x17) + ((0x2 * ((uint128_t)x7 * x15)) + ((uint128_t)x9 * x13))) +ℤ ((0x3d1 * (((uint128_t)x11 * x18) + ((uint128_t)x10 * x19))) +ℤ (0x100000000 *ℤ (((uint128_t)x11 * x18) + ((uint128_t)x10 * x19))))); +{ ℤ x23 = ((((uint128_t)x5 * x15) + ((uint128_t)x7 * x13)) +ℤ ((0x3d1 * (((uint128_t)x9 * x18) + (((uint128_t)x11 * x19) + ((uint128_t)x10 * x17)))) +ℤ (0x100000000 *ℤ (((uint128_t)x9 * x18) + (((uint128_t)x11 * x19) + ((uint128_t)x10 * x17)))))); +{ ℤ x24 = (((uint128_t)x5 * x13) +ℤ ((0x3d1 * ((0x2 * ((uint128_t)x7 * x18)) + ((0x2 * ((uint128_t)x9 * x19)) + ((0x2 * ((uint128_t)x11 * x17)) + (0x2 * ((uint128_t)x10 * x15)))))) +ℤ (0x100000000 *ℤ ((0x2 * ((uint128_t)x7 * x18)) + ((0x2 * ((uint128_t)x9 * x19)) + ((0x2 * ((uint128_t)x11 * x17)) + (0x2 * ((uint128_t)x10 * x15)))))))); +{ uint64_t x25 = (uint64_t) (x20 >> 0x33); +{ uint64_t x26 = ((uint64_t)x20 & 0x7ffffffffffff); +{ uint128_t x27 = (((uint128_t)0x8000000000000 * x25) + x26); +{ uint64_t x28 = (uint64_t) (x27 >> 0x33); +{ uint64_t x29 = ((uint64_t)x27 & 0x7ffffffffffff); +{ uint128_t x30 = (((uint128_t)0x8000000000000 * x28) + x29); +{ uint64_t x31 = (uint64_t) (x30 >> 0x33); +{ uint64_t x32 = ((uint64_t)x30 & 0x7ffffffffffff); +{ ℤ x33 = (x24 +ℤ (((uint128_t)0x3d1 * x31) + ((uint128_t)0x100000000 * x31))); +{ uint128_t x34 = (x33 >> 0x34); +{ uint64_t x35 = (x33 & 0xfffffffffffff); +{ ℤ x36 = (x34 +ℤ x23); +{ uint128_t x37 = (x36 >> 0x33); +{ uint64_t x38 = (x36 & 0x7ffffffffffff); +{ ℤ x39 = (x37 +ℤ x22); +{ uint128_t x40 = (x39 >> 0x33); +{ uint64_t x41 = (x39 & 0x7ffffffffffff); +{ ℤ x42 = (x40 +ℤ x21); +{ uint128_t x43 = (x42 >> 0x33); +{ uint64_t x44 = (x42 & 0x7ffffffffffff); +{ uint128_t x45 = (x43 + x32); +{ uint64_t x46 = (uint64_t) (x45 >> 0x33); +{ uint64_t x47 = ((uint64_t)x45 & 0x7ffffffffffff); +{ uint128_t x48 = (x35 + ((0x3d1 * x46) + ((uint128_t)0x100000000 * x46))); +{ uint64_t x49 = (uint64_t) (x48 >> 0x34); +{ uint64_t x50 = ((uint64_t)x48 & 0xfffffffffffff); +{ uint64_t x51 = (x50 >> 0x34); +{ uint64_t x52 = (x50 & 0xfffffffffffff); +out[0] = x47; +out[1] = x44; +out[2] = x41; +out[3] = x51 + x49 + x38; +out[4] = x52; +}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}} +// caller: uint64_t out[5]; diff --git a/src/Specific/solinas64_2e256m2e32m977/femul.h b/src/Specific/solinas64_2e256m2e32m977/femul.h new file mode 100644 index 000000000..0e096575c --- /dev/null +++ b/src/Specific/solinas64_2e256m2e32m977/femul.h @@ -0,0 +1,6 @@ +#include <stdint.h> + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline femul(uint64_t* out, uint64_t x10, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x18, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13); diff --git a/src/Specific/solinas64_2e256m2e32m977/fesquare.c b/src/Specific/solinas64_2e256m2e32m977/fesquare.c new file mode 100644 index 000000000..5a7485a7c --- /dev/null +++ b/src/Specific/solinas64_2e256m2e32m977/fesquare.c @@ -0,0 +1,59 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "fesquare.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline fesquare(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2) +{ uint128_t x9 = (((uint128_t)x2 * x7) + ((0x2 * ((uint128_t)x4 * x8)) + ((0x2 * ((uint128_t)x6 * x6)) + ((0x2 * ((uint128_t)x8 * x4)) + ((uint128_t)x7 * x2))))); +{ ℤ x10 = ((((uint128_t)x2 * x8) + ((0x2 * ((uint128_t)x4 * x6)) + ((0x2 * ((uint128_t)x6 * x4)) + ((uint128_t)x8 * x2)))) +ℤ ((0x3d1 * ((uint128_t)x7 * x7)) +ℤ (0x100000000 *ℤ ((uint128_t)x7 * x7)))); +{ ℤ x11 = ((((uint128_t)x2 * x6) + ((0x2 * ((uint128_t)x4 * x4)) + ((uint128_t)x6 * x2))) +ℤ ((0x3d1 * (((uint128_t)x8 * x7) + ((uint128_t)x7 * x8))) +ℤ (0x100000000 *ℤ (((uint128_t)x8 * x7) + ((uint128_t)x7 * x8))))); +{ ℤ x12 = ((((uint128_t)x2 * x4) + ((uint128_t)x4 * x2)) +ℤ ((0x3d1 * (((uint128_t)x6 * x7) + (((uint128_t)x8 * x8) + ((uint128_t)x7 * x6)))) +ℤ (0x100000000 *ℤ (((uint128_t)x6 * x7) + (((uint128_t)x8 * x8) + ((uint128_t)x7 * x6)))))); +{ ℤ x13 = (((uint128_t)x2 * x2) +ℤ ((0x3d1 * ((0x2 * ((uint128_t)x4 * x7)) + ((0x2 * ((uint128_t)x6 * x8)) + ((0x2 * ((uint128_t)x8 * x6)) + (0x2 * ((uint128_t)x7 * x4)))))) +ℤ (0x100000000 *ℤ ((0x2 * ((uint128_t)x4 * x7)) + ((0x2 * ((uint128_t)x6 * x8)) + ((0x2 * ((uint128_t)x8 * x6)) + (0x2 * ((uint128_t)x7 * x4)))))))); +{ uint64_t x14 = (uint64_t) (x9 >> 0x33); +{ uint64_t x15 = ((uint64_t)x9 & 0x7ffffffffffff); +{ uint128_t x16 = (((uint128_t)0x8000000000000 * x14) + x15); +{ uint64_t x17 = (uint64_t) (x16 >> 0x33); +{ uint64_t x18 = ((uint64_t)x16 & 0x7ffffffffffff); +{ uint128_t x19 = (((uint128_t)0x8000000000000 * x17) + x18); +{ uint64_t x20 = (uint64_t) (x19 >> 0x33); +{ uint64_t x21 = ((uint64_t)x19 & 0x7ffffffffffff); +{ ℤ x22 = (x13 +ℤ (((uint128_t)0x3d1 * x20) + ((uint128_t)0x100000000 * x20))); +{ uint128_t x23 = (x22 >> 0x34); +{ uint64_t x24 = (x22 & 0xfffffffffffff); +{ ℤ x25 = (x23 +ℤ x12); +{ uint128_t x26 = (x25 >> 0x33); +{ uint64_t x27 = (x25 & 0x7ffffffffffff); +{ ℤ x28 = (x26 +ℤ x11); +{ uint128_t x29 = (x28 >> 0x33); +{ uint64_t x30 = (x28 & 0x7ffffffffffff); +{ ℤ x31 = (x29 +ℤ x10); +{ uint128_t x32 = (x31 >> 0x33); +{ uint64_t x33 = (x31 & 0x7ffffffffffff); +{ uint128_t x34 = (x32 + x21); +{ uint64_t x35 = (uint64_t) (x34 >> 0x33); +{ uint64_t x36 = ((uint64_t)x34 & 0x7ffffffffffff); +{ uint128_t x37 = (x24 + ((0x3d1 * x35) + ((uint128_t)0x100000000 * x35))); +{ uint64_t x38 = (uint64_t) (x37 >> 0x34); +{ uint64_t x39 = ((uint64_t)x37 & 0xfffffffffffff); +{ uint64_t x40 = (x39 >> 0x34); +{ uint64_t x41 = (x39 & 0xfffffffffffff); +out[0] = x36; +out[1] = x33; +out[2] = x30; +out[3] = x40 + x38 + x27; +out[4] = x41; +}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}} +// caller: uint64_t out[5]; diff --git a/src/Specific/solinas64_2e256m2e32m977/fesquare.h b/src/Specific/solinas64_2e256m2e32m977/fesquare.h new file mode 100644 index 000000000..2cfd2d5a8 --- /dev/null +++ b/src/Specific/solinas64_2e256m2e32m977/fesquare.h @@ -0,0 +1,6 @@ +#include <stdint.h> + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline fesquare(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2); diff --git a/src/Specific/solinas64_2e256m2e32m977/freeze.c b/src/Specific/solinas64_2e256m2e32m977/freeze.c new file mode 100644 index 000000000..5c8088e2e --- /dev/null +++ b/src/Specific/solinas64_2e256m2e32m977/freeze.c @@ -0,0 +1,25 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "freeze.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline freeze(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2) +out[0] = uint64_t x10; +out[1] = uint8_t x11 = Op Syntax.SubWithGetBorrow 52 Syntax.TWord 3 Syntax.TWord 6 Syntax.TWord 6 Syntax.TWord 6 Syntax.TWord 3 0x0; +out[2] = x2; +out[3] = 0xffffefffffc2f;; +} +// caller: uint64_t out[4]; diff --git a/src/Specific/solinas64_2e256m2e32m977/freeze.h b/src/Specific/solinas64_2e256m2e32m977/freeze.h new file mode 100644 index 000000000..d296b2d57 --- /dev/null +++ b/src/Specific/solinas64_2e256m2e32m977/freeze.h @@ -0,0 +1,6 @@ +#include <stdint.h> + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline freeze(uint64_t* out, uint64_t x7, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2); |