diff options
Diffstat (limited to 'src/Specific/solinas32_2e190m11/femul.c')
-rw-r--r-- | src/Specific/solinas32_2e190m11/femul.c | 61 |
1 files changed, 61 insertions, 0 deletions
diff --git a/src/Specific/solinas32_2e190m11/femul.c b/src/Specific/solinas32_2e190m11/femul.c new file mode 100644 index 000000000..8b6631bbf --- /dev/null +++ b/src/Specific/solinas32_2e190m11/femul.c @@ -0,0 +1,61 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "femul.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline femul(uint64_t* out, uint64_t x14, uint64_t x15, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x26, uint64_t x27, uint64_t x25, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17) +{ uint64_t x28 = (((uint64_t)x5 * x26) + ((0x2 * ((uint64_t)x7 * x27)) + ((0x2 * ((uint64_t)x9 * x25)) + ((0x2 * ((uint64_t)x11 * x23)) + ((0x2 * ((uint64_t)x13 * x21)) + ((0x2 * ((uint64_t)x15 * x19)) + ((uint64_t)x14 * x17))))))); +{ uint64_t x29 = ((((uint64_t)x5 * x27) + ((0x2 * ((uint64_t)x7 * x25)) + ((0x2 * ((uint64_t)x9 * x23)) + ((0x2 * ((uint64_t)x11 * x21)) + ((0x2 * ((uint64_t)x13 * x19)) + ((uint64_t)x15 * x17)))))) + (0xb * ((uint64_t)x14 * x26))); +{ uint64_t x30 = ((((uint64_t)x5 * x25) + ((0x2 * ((uint64_t)x7 * x23)) + ((0x2 * ((uint64_t)x9 * x21)) + ((0x2 * ((uint64_t)x11 * x19)) + ((uint64_t)x13 * x17))))) + (0xb * (((uint64_t)x15 * x26) + ((uint64_t)x14 * x27)))); +{ uint64_t x31 = ((((uint64_t)x5 * x23) + ((0x2 * ((uint64_t)x7 * x21)) + ((0x2 * ((uint64_t)x9 * x19)) + ((uint64_t)x11 * x17)))) + (0xb * (((uint64_t)x13 * x26) + (((uint64_t)x15 * x27) + ((uint64_t)x14 * x25))))); +{ uint64_t x32 = ((((uint64_t)x5 * x21) + ((0x2 * ((uint64_t)x7 * x19)) + ((uint64_t)x9 * x17))) + (0xb * (((uint64_t)x11 * x26) + (((uint64_t)x13 * x27) + (((uint64_t)x15 * x25) + ((uint64_t)x14 * x23)))))); +{ uint64_t x33 = ((((uint64_t)x5 * x19) + ((uint64_t)x7 * x17)) + (0xb * (((uint64_t)x9 * x26) + (((uint64_t)x11 * x27) + (((uint64_t)x13 * x25) + (((uint64_t)x15 * x23) + ((uint64_t)x14 * x21))))))); +{ ℤ x34 = (((uint64_t)x5 * x17) +ℤ (0xb *ℤ ((0x2 * ((uint64_t)x7 * x26)) + ((0x2 * ((uint64_t)x9 * x27)) + ((0x2 * ((uint64_t)x11 * x25)) + ((0x2 * ((uint64_t)x13 * x23)) + ((0x2 * ((uint64_t)x15 * x21)) + (0x2 * ((uint64_t)x14 * x19))))))))); +{ uint64_t x35 = (x34 >> 0x1c); +{ uint32_t x36 = (x34 & 0xfffffff); +{ uint64_t x37 = (x35 + x33); +{ uint64_t x38 = (x37 >> 0x1b); +{ uint32_t x39 = ((uint32_t)x37 & 0x7ffffff); +{ uint64_t x40 = (x38 + x32); +{ uint64_t x41 = (x40 >> 0x1b); +{ uint32_t x42 = ((uint32_t)x40 & 0x7ffffff); +{ uint64_t x43 = (x41 + x31); +{ uint64_t x44 = (x43 >> 0x1b); +{ uint32_t x45 = ((uint32_t)x43 & 0x7ffffff); +{ uint64_t x46 = (x44 + x30); +{ uint64_t x47 = (x46 >> 0x1b); +{ uint32_t x48 = ((uint32_t)x46 & 0x7ffffff); +{ uint64_t x49 = (x47 + x29); +{ uint64_t x50 = (x49 >> 0x1b); +{ uint32_t x51 = ((uint32_t)x49 & 0x7ffffff); +{ uint64_t x52 = (x50 + x28); +{ uint64_t x53 = (x52 >> 0x1b); +{ uint32_t x54 = ((uint32_t)x52 & 0x7ffffff); +{ uint64_t x55 = (x36 + (0xb * x53)); +{ uint32_t x56 = (uint32_t) (x55 >> 0x1c); +{ uint32_t x57 = ((uint32_t)x55 & 0xfffffff); +{ uint32_t x58 = (x56 + x39); +{ uint32_t x59 = (x58 >> 0x1b); +{ uint32_t x60 = (x58 & 0x7ffffff); +out[0] = x54; +out[1] = x51; +out[2] = x48; +out[3] = x45; +out[4] = x59 + x42; +out[5] = x60; +out[6] = x57; +}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}} +// caller: uint64_t out[7]; |