diff options
author | Jason Gross <jgross@mit.edu> | 2017-11-02 01:36:04 -0400 |
---|---|---|
committer | Jason Gross <jgross@mit.edu> | 2017-11-02 01:36:04 -0400 |
commit | 5b45aa93efa19d54e50299ff0df8ee46c60f891b (patch) | |
tree | 9cea98ab783f557b5cbca0456a4dc3b4498e43c5 /src/Specific/solinas32_2e322m2e161m1 | |
parent | e8bda9b779d5762c5868cd09c85142151655d5ca (diff) |
Update display logs and c files
Diffstat (limited to 'src/Specific/solinas32_2e322m2e161m1')
-rw-r--r-- | src/Specific/solinas32_2e322m2e161m1/femul.c | 119 | ||||
-rw-r--r-- | src/Specific/solinas32_2e322m2e161m1/femul.h | 6 | ||||
-rw-r--r-- | src/Specific/solinas32_2e322m2e161m1/fesquare.c | 119 | ||||
-rw-r--r-- | src/Specific/solinas32_2e322m2e161m1/fesquare.h | 6 | ||||
-rw-r--r-- | src/Specific/solinas32_2e322m2e161m1/freeze.c | 25 | ||||
-rw-r--r-- | src/Specific/solinas32_2e322m2e161m1/freeze.h | 6 |
6 files changed, 281 insertions, 0 deletions
diff --git a/src/Specific/solinas32_2e322m2e161m1/femul.c b/src/Specific/solinas32_2e322m2e161m1/femul.c new file mode 100644 index 000000000..7cfe5c54c --- /dev/null +++ b/src/Specific/solinas32_2e322m2e161m1/femul.c @@ -0,0 +1,119 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "femul.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline femul(uint64_t* out, uint64_t x28, uint64_t x29, uint64_t x27, uint64_t x25, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x54, uint64_t x55, uint64_t x53, uint64_t x51, uint64_t x49, uint64_t x47, uint64_t x45, uint64_t x43, uint64_t x41, uint64_t x39, uint64_t x37, uint64_t x35, uint64_t x33, uint64_t x31) +{ uint64_t x56 = (((uint64_t)(x17 + x28) * (x43 + x54)) - ((uint64_t)x17 * x43)); +{ uint64_t x57 = ((((uint64_t)(x15 + x29) * (x43 + x54)) + ((uint64_t)(x17 + x28) * (x41 + x55))) - (((uint64_t)x15 * x43) + ((uint64_t)x17 * x41))); +{ uint64_t x58 = ((((uint64_t)(x13 + x27) * (x43 + x54)) + (((uint64_t)(x15 + x29) * (x41 + x55)) + ((uint64_t)(x17 + x28) * (x39 + x53)))) - (((uint64_t)x13 * x43) + (((uint64_t)x15 * x41) + ((uint64_t)x17 * x39)))); +{ uint64_t x59 = ((((uint64_t)(x11 + x25) * (x43 + x54)) + (((uint64_t)(x13 + x27) * (x41 + x55)) + (((uint64_t)(x15 + x29) * (x39 + x53)) + ((uint64_t)(x17 + x28) * (x37 + x51))))) - (((uint64_t)x11 * x43) + (((uint64_t)x13 * x41) + (((uint64_t)x15 * x39) + ((uint64_t)x17 * x37))))); +{ uint64_t x60 = ((((uint64_t)(x9 + x23) * (x43 + x54)) + (((uint64_t)(x11 + x25) * (x41 + x55)) + (((uint64_t)(x13 + x27) * (x39 + x53)) + (((uint64_t)(x15 + x29) * (x37 + x51)) + ((uint64_t)(x17 + x28) * (x35 + x49)))))) - (((uint64_t)x9 * x43) + (((uint64_t)x11 * x41) + (((uint64_t)x13 * x39) + (((uint64_t)x15 * x37) + ((uint64_t)x17 * x35)))))); +{ uint64_t x61 = ((((uint64_t)(x7 + x21) * (x43 + x54)) + (((uint64_t)(x9 + x23) * (x41 + x55)) + (((uint64_t)(x11 + x25) * (x39 + x53)) + (((uint64_t)(x13 + x27) * (x37 + x51)) + (((uint64_t)(x15 + x29) * (x35 + x49)) + ((uint64_t)(x17 + x28) * (x33 + x47))))))) - (((uint64_t)x7 * x43) + (((uint64_t)x9 * x41) + (((uint64_t)x11 * x39) + (((uint64_t)x13 * x37) + (((uint64_t)x15 * x35) + ((uint64_t)x17 * x33))))))); +{ uint64_t x62 = ((((uint64_t)(x5 + x19) * (x43 + x54)) + (((uint64_t)(x7 + x21) * (x41 + x55)) + (((uint64_t)(x9 + x23) * (x39 + x53)) + (((uint64_t)(x11 + x25) * (x37 + x51)) + (((uint64_t)(x13 + x27) * (x35 + x49)) + (((uint64_t)(x15 + x29) * (x33 + x47)) + ((uint64_t)(x17 + x28) * (x31 + x45)))))))) - (((uint64_t)x5 * x43) + (((uint64_t)x7 * x41) + (((uint64_t)x9 * x39) + (((uint64_t)x11 * x37) + (((uint64_t)x13 * x35) + (((uint64_t)x15 * x33) + ((uint64_t)x17 * x31)))))))); +{ uint64_t x63 = ((((uint64_t)(x5 + x19) * (x41 + x55)) + (((uint64_t)(x7 + x21) * (x39 + x53)) + (((uint64_t)(x9 + x23) * (x37 + x51)) + (((uint64_t)(x11 + x25) * (x35 + x49)) + (((uint64_t)(x13 + x27) * (x33 + x47)) + ((uint64_t)(x15 + x29) * (x31 + x45))))))) - (((uint64_t)x5 * x41) + (((uint64_t)x7 * x39) + (((uint64_t)x9 * x37) + (((uint64_t)x11 * x35) + (((uint64_t)x13 * x33) + ((uint64_t)x15 * x31))))))); +{ uint64_t x64 = ((((uint64_t)(x5 + x19) * (x39 + x53)) + (((uint64_t)(x7 + x21) * (x37 + x51)) + (((uint64_t)(x9 + x23) * (x35 + x49)) + (((uint64_t)(x11 + x25) * (x33 + x47)) + ((uint64_t)(x13 + x27) * (x31 + x45)))))) - (((uint64_t)x5 * x39) + (((uint64_t)x7 * x37) + (((uint64_t)x9 * x35) + (((uint64_t)x11 * x33) + ((uint64_t)x13 * x31)))))); +{ uint64_t x65 = ((((uint64_t)(x5 + x19) * (x37 + x51)) + (((uint64_t)(x7 + x21) * (x35 + x49)) + (((uint64_t)(x9 + x23) * (x33 + x47)) + ((uint64_t)(x11 + x25) * (x31 + x45))))) - (((uint64_t)x5 * x37) + (((uint64_t)x7 * x35) + (((uint64_t)x9 * x33) + ((uint64_t)x11 * x31))))); +{ uint64_t x66 = ((((uint64_t)(x5 + x19) * (x35 + x49)) + (((uint64_t)(x7 + x21) * (x33 + x47)) + ((uint64_t)(x9 + x23) * (x31 + x45)))) - (((uint64_t)x5 * x35) + (((uint64_t)x7 * x33) + ((uint64_t)x9 * x31)))); +{ uint64_t x67 = ((((uint64_t)(x5 + x19) * (x33 + x47)) + ((uint64_t)(x7 + x21) * (x31 + x45))) - (((uint64_t)x5 * x33) + ((uint64_t)x7 * x31))); +{ uint64_t x68 = (((uint64_t)(x5 + x19) * (x31 + x45)) - ((uint64_t)x5 * x31)); +{ uint64_t x69 = (((((uint64_t)x17 * x43) + ((uint64_t)x28 * x54)) + x63) + x56); +{ uint64_t x70 = ((((((uint64_t)x15 * x43) + ((uint64_t)x17 * x41)) + (((uint64_t)x29 * x54) + ((uint64_t)x28 * x55))) + x64) + x57); +{ uint64_t x71 = ((((((uint64_t)x13 * x43) + (((uint64_t)x15 * x41) + ((uint64_t)x17 * x39))) + (((uint64_t)x27 * x54) + (((uint64_t)x29 * x55) + ((uint64_t)x28 * x53)))) + x65) + x58); +{ uint64_t x72 = ((((((uint64_t)x11 * x43) + (((uint64_t)x13 * x41) + (((uint64_t)x15 * x39) + ((uint64_t)x17 * x37)))) + (((uint64_t)x25 * x54) + (((uint64_t)x27 * x55) + (((uint64_t)x29 * x53) + ((uint64_t)x28 * x51))))) + x66) + x59); +{ uint64_t x73 = ((((((uint64_t)x9 * x43) + (((uint64_t)x11 * x41) + (((uint64_t)x13 * x39) + (((uint64_t)x15 * x37) + ((uint64_t)x17 * x35))))) + (((uint64_t)x23 * x54) + (((uint64_t)x25 * x55) + (((uint64_t)x27 * x53) + (((uint64_t)x29 * x51) + ((uint64_t)x28 * x49)))))) + x67) + x60); +{ uint64_t x74 = ((((((uint64_t)x7 * x43) + (((uint64_t)x9 * x41) + (((uint64_t)x11 * x39) + (((uint64_t)x13 * x37) + (((uint64_t)x15 * x35) + ((uint64_t)x17 * x33)))))) + (((uint64_t)x21 * x54) + (((uint64_t)x23 * x55) + (((uint64_t)x25 * x53) + (((uint64_t)x27 * x51) + (((uint64_t)x29 * x49) + ((uint64_t)x28 * x47))))))) + x68) + x61); +{ uint64_t x75 = ((((uint64_t)x5 * x43) + (((uint64_t)x7 * x41) + (((uint64_t)x9 * x39) + (((uint64_t)x11 * x37) + (((uint64_t)x13 * x35) + (((uint64_t)x15 * x33) + ((uint64_t)x17 * x31))))))) + (((uint64_t)x19 * x54) + (((uint64_t)x21 * x55) + (((uint64_t)x23 * x53) + (((uint64_t)x25 * x51) + (((uint64_t)x27 * x49) + (((uint64_t)x29 * x47) + ((uint64_t)x28 * x45)))))))); +{ uint64_t x76 = (((((uint64_t)x5 * x41) + (((uint64_t)x7 * x39) + (((uint64_t)x9 * x37) + (((uint64_t)x11 * x35) + (((uint64_t)x13 * x33) + ((uint64_t)x15 * x31)))))) + (((uint64_t)x19 * x55) + (((uint64_t)x21 * x53) + (((uint64_t)x23 * x51) + (((uint64_t)x25 * x49) + (((uint64_t)x27 * x47) + ((uint64_t)x29 * x45))))))) + x56); +{ uint64_t x77 = (((((uint64_t)x5 * x39) + (((uint64_t)x7 * x37) + (((uint64_t)x9 * x35) + (((uint64_t)x11 * x33) + ((uint64_t)x13 * x31))))) + (((uint64_t)x19 * x53) + (((uint64_t)x21 * x51) + (((uint64_t)x23 * x49) + (((uint64_t)x25 * x47) + ((uint64_t)x27 * x45)))))) + x57); +{ uint64_t x78 = (((((uint64_t)x5 * x37) + (((uint64_t)x7 * x35) + (((uint64_t)x9 * x33) + ((uint64_t)x11 * x31)))) + (((uint64_t)x19 * x51) + (((uint64_t)x21 * x49) + (((uint64_t)x23 * x47) + ((uint64_t)x25 * x45))))) + x58); +{ uint64_t x79 = (((((uint64_t)x5 * x35) + (((uint64_t)x7 * x33) + ((uint64_t)x9 * x31))) + (((uint64_t)x19 * x49) + (((uint64_t)x21 * x47) + ((uint64_t)x23 * x45)))) + x59); +{ uint64_t x80 = (((((uint64_t)x5 * x33) + ((uint64_t)x7 * x31)) + (((uint64_t)x19 * x47) + ((uint64_t)x21 * x45))) + x60); +{ uint64_t x81 = ((((uint64_t)x5 * x31) + ((uint64_t)x19 * x45)) + x61); +{ uint32_t x82 = (uint32_t) (x75 >> 0x17); +{ uint32_t x83 = ((uint32_t)x75 & 0x7fffff); +{ uint32_t x84 = (uint32_t) (x62 >> 0x17); +{ uint32_t x85 = ((uint32_t)x62 & 0x7fffff); +{ uint64_t x86 = (((uint64_t)0x800000 * x84) + x85); +{ uint32_t x87 = (uint32_t) (x86 >> 0x17); +{ uint32_t x88 = ((uint32_t)x86 & 0x7fffff); +{ uint64_t x89 = ((x82 + x74) + x87); +{ uint32_t x90 = (uint32_t) (x89 >> 0x17); +{ uint32_t x91 = ((uint32_t)x89 & 0x7fffff); +{ uint64_t x92 = (x81 + x87); +{ uint32_t x93 = (uint32_t) (x92 >> 0x17); +{ uint32_t x94 = ((uint32_t)x92 & 0x7fffff); +{ uint64_t x95 = (x90 + x73); +{ uint32_t x96 = (uint32_t) (x95 >> 0x17); +{ uint32_t x97 = ((uint32_t)x95 & 0x7fffff); +{ uint64_t x98 = (x93 + x80); +{ uint32_t x99 = (uint32_t) (x98 >> 0x17); +{ uint32_t x100 = ((uint32_t)x98 & 0x7fffff); +{ uint64_t x101 = (x96 + x72); +{ uint32_t x102 = (uint32_t) (x101 >> 0x17); +{ uint32_t x103 = ((uint32_t)x101 & 0x7fffff); +{ uint64_t x104 = (x99 + x79); +{ uint32_t x105 = (uint32_t) (x104 >> 0x17); +{ uint32_t x106 = ((uint32_t)x104 & 0x7fffff); +{ uint64_t x107 = (x102 + x71); +{ uint32_t x108 = (uint32_t) (x107 >> 0x17); +{ uint32_t x109 = ((uint32_t)x107 & 0x7fffff); +{ uint64_t x110 = (x105 + x78); +{ uint32_t x111 = (uint32_t) (x110 >> 0x17); +{ uint32_t x112 = ((uint32_t)x110 & 0x7fffff); +{ uint64_t x113 = (x108 + x70); +{ uint32_t x114 = (uint32_t) (x113 >> 0x17); +{ uint32_t x115 = ((uint32_t)x113 & 0x7fffff); +{ uint64_t x116 = (x111 + x77); +{ uint32_t x117 = (uint32_t) (x116 >> 0x17); +{ uint32_t x118 = ((uint32_t)x116 & 0x7fffff); +{ uint64_t x119 = (x114 + x69); +{ uint32_t x120 = (uint32_t) (x119 >> 0x17); +{ uint32_t x121 = ((uint32_t)x119 & 0x7fffff); +{ uint64_t x122 = (x117 + x76); +{ uint32_t x123 = (uint32_t) (x122 >> 0x17); +{ uint32_t x124 = ((uint32_t)x122 & 0x7fffff); +{ uint32_t x125 = (x120 + x88); +{ uint32_t x126 = (x125 >> 0x17); +{ uint32_t x127 = (x125 & 0x7fffff); +{ uint32_t x128 = (x123 + x83); +{ uint32_t x129 = (x128 >> 0x17); +{ uint32_t x130 = (x128 & 0x7fffff); +{ uint32_t x131 = ((0x800000 * x126) + x127); +{ uint32_t x132 = (x131 >> 0x17); +{ uint32_t x133 = (x131 & 0x7fffff); +{ uint32_t x134 = ((x129 + x91) + x132); +{ uint32_t x135 = (x134 >> 0x17); +{ uint32_t x136 = (x134 & 0x7fffff); +{ uint32_t x137 = (x94 + x132); +{ uint32_t x138 = (x137 >> 0x17); +{ uint32_t x139 = (x137 & 0x7fffff); +out[0] = x133; +out[1] = x121; +out[2] = x115; +out[3] = x109; +out[4] = x103; +out[5] = x135 + x97; +out[6] = x136; +out[7] = x130; +out[8] = x124; +out[9] = x118; +out[10] = x112; +out[11] = x106; +out[12] = x138 + x100; +out[13] = x139; +}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}} +// caller: uint64_t out[14]; diff --git a/src/Specific/solinas32_2e322m2e161m1/femul.h b/src/Specific/solinas32_2e322m2e161m1/femul.h new file mode 100644 index 000000000..6fdc2d29d --- /dev/null +++ b/src/Specific/solinas32_2e322m2e161m1/femul.h @@ -0,0 +1,6 @@ +#include <stdint.h> + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline femul(uint64_t* out, uint64_t x28, uint64_t x29, uint64_t x27, uint64_t x25, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x54, uint64_t x55, uint64_t x53, uint64_t x51, uint64_t x49, uint64_t x47, uint64_t x45, uint64_t x43, uint64_t x41, uint64_t x39, uint64_t x37, uint64_t x35, uint64_t x33, uint64_t x31); diff --git a/src/Specific/solinas32_2e322m2e161m1/fesquare.c b/src/Specific/solinas32_2e322m2e161m1/fesquare.c new file mode 100644 index 000000000..d745c603b --- /dev/null +++ b/src/Specific/solinas32_2e322m2e161m1/fesquare.c @@ -0,0 +1,119 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "fesquare.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline fesquare(uint64_t* out, uint64_t x25, uint64_t x26, uint64_t x24, uint64_t x22, uint64_t x20, uint64_t x18, uint64_t x16, uint64_t x14, uint64_t x12, uint64_t x10, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2) +{ uint64_t x27 = (((uint64_t)(x14 + x25) * (x14 + x25)) - ((uint64_t)x14 * x14)); +{ uint64_t x28 = ((((uint64_t)(x12 + x26) * (x14 + x25)) + ((uint64_t)(x14 + x25) * (x12 + x26))) - (((uint64_t)x12 * x14) + ((uint64_t)x14 * x12))); +{ uint64_t x29 = ((((uint64_t)(x10 + x24) * (x14 + x25)) + (((uint64_t)(x12 + x26) * (x12 + x26)) + ((uint64_t)(x14 + x25) * (x10 + x24)))) - (((uint64_t)x10 * x14) + (((uint64_t)x12 * x12) + ((uint64_t)x14 * x10)))); +{ uint64_t x30 = ((((uint64_t)(x8 + x22) * (x14 + x25)) + (((uint64_t)(x10 + x24) * (x12 + x26)) + (((uint64_t)(x12 + x26) * (x10 + x24)) + ((uint64_t)(x14 + x25) * (x8 + x22))))) - (((uint64_t)x8 * x14) + (((uint64_t)x10 * x12) + (((uint64_t)x12 * x10) + ((uint64_t)x14 * x8))))); +{ uint64_t x31 = ((((uint64_t)(x6 + x20) * (x14 + x25)) + (((uint64_t)(x8 + x22) * (x12 + x26)) + (((uint64_t)(x10 + x24) * (x10 + x24)) + (((uint64_t)(x12 + x26) * (x8 + x22)) + ((uint64_t)(x14 + x25) * (x6 + x20)))))) - (((uint64_t)x6 * x14) + (((uint64_t)x8 * x12) + (((uint64_t)x10 * x10) + (((uint64_t)x12 * x8) + ((uint64_t)x14 * x6)))))); +{ uint64_t x32 = ((((uint64_t)(x4 + x18) * (x14 + x25)) + (((uint64_t)(x6 + x20) * (x12 + x26)) + (((uint64_t)(x8 + x22) * (x10 + x24)) + (((uint64_t)(x10 + x24) * (x8 + x22)) + (((uint64_t)(x12 + x26) * (x6 + x20)) + ((uint64_t)(x14 + x25) * (x4 + x18))))))) - (((uint64_t)x4 * x14) + (((uint64_t)x6 * x12) + (((uint64_t)x8 * x10) + (((uint64_t)x10 * x8) + (((uint64_t)x12 * x6) + ((uint64_t)x14 * x4))))))); +{ uint64_t x33 = ((((uint64_t)(x2 + x16) * (x14 + x25)) + (((uint64_t)(x4 + x18) * (x12 + x26)) + (((uint64_t)(x6 + x20) * (x10 + x24)) + (((uint64_t)(x8 + x22) * (x8 + x22)) + (((uint64_t)(x10 + x24) * (x6 + x20)) + (((uint64_t)(x12 + x26) * (x4 + x18)) + ((uint64_t)(x14 + x25) * (x2 + x16)))))))) - (((uint64_t)x2 * x14) + (((uint64_t)x4 * x12) + (((uint64_t)x6 * x10) + (((uint64_t)x8 * x8) + (((uint64_t)x10 * x6) + (((uint64_t)x12 * x4) + ((uint64_t)x14 * x2)))))))); +{ uint64_t x34 = ((((uint64_t)(x2 + x16) * (x12 + x26)) + (((uint64_t)(x4 + x18) * (x10 + x24)) + (((uint64_t)(x6 + x20) * (x8 + x22)) + (((uint64_t)(x8 + x22) * (x6 + x20)) + (((uint64_t)(x10 + x24) * (x4 + x18)) + ((uint64_t)(x12 + x26) * (x2 + x16))))))) - (((uint64_t)x2 * x12) + (((uint64_t)x4 * x10) + (((uint64_t)x6 * x8) + (((uint64_t)x8 * x6) + (((uint64_t)x10 * x4) + ((uint64_t)x12 * x2))))))); +{ uint64_t x35 = ((((uint64_t)(x2 + x16) * (x10 + x24)) + (((uint64_t)(x4 + x18) * (x8 + x22)) + (((uint64_t)(x6 + x20) * (x6 + x20)) + (((uint64_t)(x8 + x22) * (x4 + x18)) + ((uint64_t)(x10 + x24) * (x2 + x16)))))) - (((uint64_t)x2 * x10) + (((uint64_t)x4 * x8) + (((uint64_t)x6 * x6) + (((uint64_t)x8 * x4) + ((uint64_t)x10 * x2)))))); +{ uint64_t x36 = ((((uint64_t)(x2 + x16) * (x8 + x22)) + (((uint64_t)(x4 + x18) * (x6 + x20)) + (((uint64_t)(x6 + x20) * (x4 + x18)) + ((uint64_t)(x8 + x22) * (x2 + x16))))) - (((uint64_t)x2 * x8) + (((uint64_t)x4 * x6) + (((uint64_t)x6 * x4) + ((uint64_t)x8 * x2))))); +{ uint64_t x37 = ((((uint64_t)(x2 + x16) * (x6 + x20)) + (((uint64_t)(x4 + x18) * (x4 + x18)) + ((uint64_t)(x6 + x20) * (x2 + x16)))) - (((uint64_t)x2 * x6) + (((uint64_t)x4 * x4) + ((uint64_t)x6 * x2)))); +{ uint64_t x38 = ((((uint64_t)(x2 + x16) * (x4 + x18)) + ((uint64_t)(x4 + x18) * (x2 + x16))) - (((uint64_t)x2 * x4) + ((uint64_t)x4 * x2))); +{ uint64_t x39 = (((uint64_t)(x2 + x16) * (x2 + x16)) - ((uint64_t)x2 * x2)); +{ uint64_t x40 = (((((uint64_t)x14 * x14) + ((uint64_t)x25 * x25)) + x34) + x27); +{ uint64_t x41 = ((((((uint64_t)x12 * x14) + ((uint64_t)x14 * x12)) + (((uint64_t)x26 * x25) + ((uint64_t)x25 * x26))) + x35) + x28); +{ uint64_t x42 = ((((((uint64_t)x10 * x14) + (((uint64_t)x12 * x12) + ((uint64_t)x14 * x10))) + (((uint64_t)x24 * x25) + (((uint64_t)x26 * x26) + ((uint64_t)x25 * x24)))) + x36) + x29); +{ uint64_t x43 = ((((((uint64_t)x8 * x14) + (((uint64_t)x10 * x12) + (((uint64_t)x12 * x10) + ((uint64_t)x14 * x8)))) + (((uint64_t)x22 * x25) + (((uint64_t)x24 * x26) + (((uint64_t)x26 * x24) + ((uint64_t)x25 * x22))))) + x37) + x30); +{ uint64_t x44 = ((((((uint64_t)x6 * x14) + (((uint64_t)x8 * x12) + (((uint64_t)x10 * x10) + (((uint64_t)x12 * x8) + ((uint64_t)x14 * x6))))) + (((uint64_t)x20 * x25) + (((uint64_t)x22 * x26) + (((uint64_t)x24 * x24) + (((uint64_t)x26 * x22) + ((uint64_t)x25 * x20)))))) + x38) + x31); +{ uint64_t x45 = ((((((uint64_t)x4 * x14) + (((uint64_t)x6 * x12) + (((uint64_t)x8 * x10) + (((uint64_t)x10 * x8) + (((uint64_t)x12 * x6) + ((uint64_t)x14 * x4)))))) + (((uint64_t)x18 * x25) + (((uint64_t)x20 * x26) + (((uint64_t)x22 * x24) + (((uint64_t)x24 * x22) + (((uint64_t)x26 * x20) + ((uint64_t)x25 * x18))))))) + x39) + x32); +{ uint64_t x46 = ((((uint64_t)x2 * x14) + (((uint64_t)x4 * x12) + (((uint64_t)x6 * x10) + (((uint64_t)x8 * x8) + (((uint64_t)x10 * x6) + (((uint64_t)x12 * x4) + ((uint64_t)x14 * x2))))))) + (((uint64_t)x16 * x25) + (((uint64_t)x18 * x26) + (((uint64_t)x20 * x24) + (((uint64_t)x22 * x22) + (((uint64_t)x24 * x20) + (((uint64_t)x26 * x18) + ((uint64_t)x25 * x16)))))))); +{ uint64_t x47 = (((((uint64_t)x2 * x12) + (((uint64_t)x4 * x10) + (((uint64_t)x6 * x8) + (((uint64_t)x8 * x6) + (((uint64_t)x10 * x4) + ((uint64_t)x12 * x2)))))) + (((uint64_t)x16 * x26) + (((uint64_t)x18 * x24) + (((uint64_t)x20 * x22) + (((uint64_t)x22 * x20) + (((uint64_t)x24 * x18) + ((uint64_t)x26 * x16))))))) + x27); +{ uint64_t x48 = (((((uint64_t)x2 * x10) + (((uint64_t)x4 * x8) + (((uint64_t)x6 * x6) + (((uint64_t)x8 * x4) + ((uint64_t)x10 * x2))))) + (((uint64_t)x16 * x24) + (((uint64_t)x18 * x22) + (((uint64_t)x20 * x20) + (((uint64_t)x22 * x18) + ((uint64_t)x24 * x16)))))) + x28); +{ uint64_t x49 = (((((uint64_t)x2 * x8) + (((uint64_t)x4 * x6) + (((uint64_t)x6 * x4) + ((uint64_t)x8 * x2)))) + (((uint64_t)x16 * x22) + (((uint64_t)x18 * x20) + (((uint64_t)x20 * x18) + ((uint64_t)x22 * x16))))) + x29); +{ uint64_t x50 = (((((uint64_t)x2 * x6) + (((uint64_t)x4 * x4) + ((uint64_t)x6 * x2))) + (((uint64_t)x16 * x20) + (((uint64_t)x18 * x18) + ((uint64_t)x20 * x16)))) + x30); +{ uint64_t x51 = (((((uint64_t)x2 * x4) + ((uint64_t)x4 * x2)) + (((uint64_t)x16 * x18) + ((uint64_t)x18 * x16))) + x31); +{ uint64_t x52 = ((((uint64_t)x2 * x2) + ((uint64_t)x16 * x16)) + x32); +{ uint32_t x53 = (uint32_t) (x46 >> 0x17); +{ uint32_t x54 = ((uint32_t)x46 & 0x7fffff); +{ uint32_t x55 = (uint32_t) (x33 >> 0x17); +{ uint32_t x56 = ((uint32_t)x33 & 0x7fffff); +{ uint64_t x57 = (((uint64_t)0x800000 * x55) + x56); +{ uint32_t x58 = (uint32_t) (x57 >> 0x17); +{ uint32_t x59 = ((uint32_t)x57 & 0x7fffff); +{ uint64_t x60 = ((x53 + x45) + x58); +{ uint32_t x61 = (uint32_t) (x60 >> 0x17); +{ uint32_t x62 = ((uint32_t)x60 & 0x7fffff); +{ uint64_t x63 = (x52 + x58); +{ uint32_t x64 = (uint32_t) (x63 >> 0x17); +{ uint32_t x65 = ((uint32_t)x63 & 0x7fffff); +{ uint64_t x66 = (x61 + x44); +{ uint32_t x67 = (uint32_t) (x66 >> 0x17); +{ uint32_t x68 = ((uint32_t)x66 & 0x7fffff); +{ uint64_t x69 = (x64 + x51); +{ uint32_t x70 = (uint32_t) (x69 >> 0x17); +{ uint32_t x71 = ((uint32_t)x69 & 0x7fffff); +{ uint64_t x72 = (x67 + x43); +{ uint32_t x73 = (uint32_t) (x72 >> 0x17); +{ uint32_t x74 = ((uint32_t)x72 & 0x7fffff); +{ uint64_t x75 = (x70 + x50); +{ uint32_t x76 = (uint32_t) (x75 >> 0x17); +{ uint32_t x77 = ((uint32_t)x75 & 0x7fffff); +{ uint64_t x78 = (x73 + x42); +{ uint32_t x79 = (uint32_t) (x78 >> 0x17); +{ uint32_t x80 = ((uint32_t)x78 & 0x7fffff); +{ uint64_t x81 = (x76 + x49); +{ uint32_t x82 = (uint32_t) (x81 >> 0x17); +{ uint32_t x83 = ((uint32_t)x81 & 0x7fffff); +{ uint64_t x84 = (x79 + x41); +{ uint32_t x85 = (uint32_t) (x84 >> 0x17); +{ uint32_t x86 = ((uint32_t)x84 & 0x7fffff); +{ uint64_t x87 = (x82 + x48); +{ uint32_t x88 = (uint32_t) (x87 >> 0x17); +{ uint32_t x89 = ((uint32_t)x87 & 0x7fffff); +{ uint64_t x90 = (x85 + x40); +{ uint32_t x91 = (uint32_t) (x90 >> 0x17); +{ uint32_t x92 = ((uint32_t)x90 & 0x7fffff); +{ uint64_t x93 = (x88 + x47); +{ uint32_t x94 = (uint32_t) (x93 >> 0x17); +{ uint32_t x95 = ((uint32_t)x93 & 0x7fffff); +{ uint32_t x96 = (x91 + x59); +{ uint32_t x97 = (x96 >> 0x17); +{ uint32_t x98 = (x96 & 0x7fffff); +{ uint32_t x99 = (x94 + x54); +{ uint32_t x100 = (x99 >> 0x17); +{ uint32_t x101 = (x99 & 0x7fffff); +{ uint32_t x102 = ((0x800000 * x97) + x98); +{ uint32_t x103 = (x102 >> 0x17); +{ uint32_t x104 = (x102 & 0x7fffff); +{ uint32_t x105 = ((x100 + x62) + x103); +{ uint32_t x106 = (x105 >> 0x17); +{ uint32_t x107 = (x105 & 0x7fffff); +{ uint32_t x108 = (x65 + x103); +{ uint32_t x109 = (x108 >> 0x17); +{ uint32_t x110 = (x108 & 0x7fffff); +out[0] = x104; +out[1] = x92; +out[2] = x86; +out[3] = x80; +out[4] = x74; +out[5] = x106 + x68; +out[6] = x107; +out[7] = x101; +out[8] = x95; +out[9] = x89; +out[10] = x83; +out[11] = x77; +out[12] = x109 + x71; +out[13] = x110; +}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}} +// caller: uint64_t out[14]; diff --git a/src/Specific/solinas32_2e322m2e161m1/fesquare.h b/src/Specific/solinas32_2e322m2e161m1/fesquare.h new file mode 100644 index 000000000..5c03beeab --- /dev/null +++ b/src/Specific/solinas32_2e322m2e161m1/fesquare.h @@ -0,0 +1,6 @@ +#include <stdint.h> + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline fesquare(uint64_t* out, uint64_t x25, uint64_t x26, uint64_t x24, uint64_t x22, uint64_t x20, uint64_t x18, uint64_t x16, uint64_t x14, uint64_t x12, uint64_t x10, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2); diff --git a/src/Specific/solinas32_2e322m2e161m1/freeze.c b/src/Specific/solinas32_2e322m2e161m1/freeze.c new file mode 100644 index 000000000..b157048ca --- /dev/null +++ b/src/Specific/solinas32_2e322m2e161m1/freeze.c @@ -0,0 +1,25 @@ +#include <stdint.h> +#include <stdbool.h> +#include <x86intrin.h> +#include "liblow.h" + +#include "freeze.h" + +typedef unsigned int uint128_t __attribute__((mode(TI))); + +#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) +// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 +#define _subborrow_u32 __builtin_ia32_sbb_u32 +#define _subborrow_u64 __builtin_ia32_sbb_u64 +#endif + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline freeze(uint64_t* out, uint64_t x25, uint64_t x26, uint64_t x24, uint64_t x22, uint64_t x20, uint64_t x18, uint64_t x16, uint64_t x14, uint64_t x12, uint64_t x10, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2) +out[0] = uint32_t x28; +out[1] = uint8_t x29 = Op Syntax.SubWithGetBorrow 23 Syntax.TWord 3 Syntax.TWord 5 Syntax.TWord 5 Syntax.TWord 5 Syntax.TWord 3 0x0; +out[2] = x2; +out[3] = 0x7fffff;; +} +// caller: uint64_t out[4]; diff --git a/src/Specific/solinas32_2e322m2e161m1/freeze.h b/src/Specific/solinas32_2e322m2e161m1/freeze.h new file mode 100644 index 000000000..0fda81e7a --- /dev/null +++ b/src/Specific/solinas32_2e322m2e161m1/freeze.h @@ -0,0 +1,6 @@ +#include <stdint.h> + +#undef force_inline +#define force_inline __attribute__((always_inline)) + +void force_inline freeze(uint64_t* out, uint64_t x25, uint64_t x26, uint64_t x24, uint64_t x22, uint64_t x20, uint64_t x18, uint64_t x16, uint64_t x14, uint64_t x12, uint64_t x10, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2); |