diff options
author | 2017-11-02 02:20:52 -0400 | |
---|---|---|
committer | 2017-11-02 02:20:52 -0400 | |
commit | 37a8b2a0c14082298d77f0a4858ab3402d9d1c6c (patch) | |
tree | bd1b4c8c34485332ff15d58272efb38468ea72e5 /src/Specific/montgomery64_2e196m15 | |
parent | 11144d2e698c4a263e59acb02226d383865f74e0 (diff) |
Update display logs and c files
Diffstat (limited to 'src/Specific/montgomery64_2e196m15')
-rw-r--r-- | src/Specific/montgomery64_2e196m15/feadd.c | 66 | ||||
-rw-r--r-- | src/Specific/montgomery64_2e196m15/femul.c | 166 | ||||
-rw-r--r-- | src/Specific/montgomery64_2e196m15/fenz.c | 36 | ||||
-rw-r--r-- | src/Specific/montgomery64_2e196m15/feopp.c | 62 | ||||
-rw-r--r-- | src/Specific/montgomery64_2e196m15/fesub.c | 66 |
5 files changed, 221 insertions, 175 deletions
diff --git a/src/Specific/montgomery64_2e196m15/feadd.c b/src/Specific/montgomery64_2e196m15/feadd.c index c70f970dc..07a03ff20 100644 --- a/src/Specific/montgomery64_2e196m15/feadd.c +++ b/src/Specific/montgomery64_2e196m15/feadd.c @@ -1,38 +1,28 @@ -#include <stdint.h> -#include <stdbool.h> -#include <x86intrin.h> -#include "liblow.h" - -#include "feadd.h" - -typedef unsigned int uint128_t __attribute__((mode(TI))); - -#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) -// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 -#define _subborrow_u32 __builtin_ia32_sbb_u32 -#define _subborrow_u64 __builtin_ia32_sbb_u64 -#endif - -#undef force_inline -#define force_inline __attribute__((always_inline)) - -void force_inline feadd(uint64_t* out, uint64_t x8, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x14, uint64_t x15, uint64_t x13, uint64_t x11) -{ uint64_t x17; uint8_t x18 = _addcarryx_u64(0x0, x5, x11, &x17); -{ uint64_t x20; uint8_t x21 = _addcarryx_u64(x18, x7, x13, &x20); -{ uint64_t x23; uint8_t x24 = _addcarryx_u64(x21, x9, x15, &x23); -{ uint64_t x26; uint8_t x27 = _addcarryx_u64(x24, x8, x14, &x26); -{ uint64_t x29; uint8_t x30 = _subborrow_u64(0x0, x17, 0xfffffffffffffff1L, &x29); -{ uint64_t x32; uint8_t x33 = _subborrow_u64(x30, x20, 0xffffffffffffffffL, &x32); -{ uint64_t x35; uint8_t x36 = _subborrow_u64(x33, x23, 0xffffffffffffffffL, &x35); -{ uint64_t x38; uint8_t x39 = _subborrow_u64(x36, x26, 0xf, &x38); -{ uint64_t _; uint8_t x42 = _subborrow_u64(x39, x27, 0x0, &_); -{ uint64_t x43 = cmovznz(x42, x38, x26); -{ uint64_t x44 = cmovznz(x42, x35, x23); -{ uint64_t x45 = cmovznz(x42, x32, x20); -{ uint64_t x46 = cmovznz(x42, x29, x17); -out[0] = x43; -out[1] = x44; -out[2] = x45; -out[3] = x46; -}}}}}}}}}}}}} -// caller: uint64_t out[4]; +static void feadd(uint64_t out[4], const uint64_t in1[4], const uint64_t in2[4]) { + { const uint64_t x8 = in1[3]; + { const uint64_t x9 = in1[2]; + { const uint64_t x7 = in1[1]; + { const uint64_t x5 = in1[0]; + { const uint64_t x14 = in2[3]; + { const uint64_t x15 = in2[2]; + { const uint64_t x13 = in2[1]; + { const uint64_t x11 = in2[0]; + { uint64_t x17; uint8_t x18 = _addcarryx_u64(0x0, x5, x11, &x17); + { uint64_t x20; uint8_t x21 = _addcarryx_u64(x18, x7, x13, &x20); + { uint64_t x23; uint8_t x24 = _addcarryx_u64(x21, x9, x15, &x23); + { uint64_t x26; uint8_t x27 = _addcarryx_u64(x24, x8, x14, &x26); + { uint64_t x29; uint8_t x30 = _subborrow_u64(0x0, x17, 0xfffffffffffffff1L, &x29); + { uint64_t x32; uint8_t x33 = _subborrow_u64(x30, x20, 0xffffffffffffffffL, &x32); + { uint64_t x35; uint8_t x36 = _subborrow_u64(x33, x23, 0xffffffffffffffffL, &x35); + { uint64_t x38; uint8_t x39 = _subborrow_u64(x36, x26, 0xf, &x38); + { uint64_t _; uint8_t x42 = _subborrow_u64(x39, x27, 0x0, &_); + { uint64_t x43 = cmovznz(x42, x38, x26); + { uint64_t x44 = cmovznz(x42, x35, x23); + { uint64_t x45 = cmovznz(x42, x32, x20); + { uint64_t x46 = cmovznz(x42, x29, x17); + out[0] = x46; + out[1] = x45; + out[2] = x44; + out[3] = x43; + }}}}}}}}}}}}}}}}}}}}} +} diff --git a/src/Specific/montgomery64_2e196m15/femul.c b/src/Specific/montgomery64_2e196m15/femul.c index 61ba1a7e2..0febcb70c 100644 --- a/src/Specific/montgomery64_2e196m15/femul.c +++ b/src/Specific/montgomery64_2e196m15/femul.c @@ -1,36 +1,130 @@ -#include <stdint.h> -#include <stdbool.h> -#include <x86intrin.h> -#include "liblow.h" - -#include "femul.h" - -typedef unsigned int uint128_t __attribute__((mode(TI))); - -#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) -// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 -#define _subborrow_u32 __builtin_ia32_sbb_u32 -#define _subborrow_u64 __builtin_ia32_sbb_u64 -#endif - -#undef force_inline -#define force_inline __attribute__((always_inline)) - -void force_inline femul(uint64_t* out, uint64_t x8, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x14, uint64_t x15, uint64_t x13, uint64_t x11) -{ uint64_t x18; uint64_t x17 = _mulx_u64(x5, x11, &x18); -{ uint64_t x21; uint64_t x20 = _mulx_u64(x5, x13, &x21); -{ uint64_t x24; uint64_t x23 = _mulx_u64(x5, x15, &x24); -{ uint64_t x27; uint64_t x26 = _mulx_u64(x5, x14, &x27); -{ uint64_t x29; uint8_t x30 = _addcarryx_u64(0x0, x18, x20, &x29); -{ uint64_t x32; uint8_t x33 = _addcarryx_u64(x30, x21, x23, &x32); -{ uint64_t x35; uint8_t x36 = _addcarryx_u64(x33, x24, x26, &x35); -{ uint64_t x38; uint8_t _ = _addcarryx_u64(0x0, x36, x27, &x38); -{ uint64_t _; uint64_t x41 = _mulx_u64(x17, 0xeeeeeeeeeeeeeeefL, &_); -{ uint64_t x45; uint64_t x44 = _mulx_u64(x41, 0xfffffffffffffff1L, &x45); -{ uint64_t x48; uint64_t x47 = _mulx_u64(x41, 0xffffffffffffffffL, &x48); -{ uint64_t x51; uint64_t x50 = _mulx_u64(x41, 0xffffffffffffffffL, &x51); -out[0] = uint64_t x53; -out[1] = uint8_t x54 = Op Syntax.MulSplit 64 Syntax.TWord 6 Syntax.TWord 3 Syntax.TWord 6 Syntax.TWord 3 x41; -out[2] = 0xf;; -}}}}}}}}}}}} -// caller: uint64_t out[3]; +static void femul(uint64_t out[4], const uint64_t in1[4], const uint64_t in2[4]) { + { const uint64_t x8 = in1[3]; + { const uint64_t x9 = in1[2]; + { const uint64_t x7 = in1[1]; + { const uint64_t x5 = in1[0]; + { const uint64_t x14 = in2[3]; + { const uint64_t x15 = in2[2]; + { const uint64_t x13 = in2[1]; + { const uint64_t x11 = in2[0]; + { uint64_t x18; uint64_t x17 = _mulx_u64(x5, x11, &x18); + { uint64_t x21; uint64_t x20 = _mulx_u64(x5, x13, &x21); + { uint64_t x24; uint64_t x23 = _mulx_u64(x5, x15, &x24); + { uint64_t x27; uint64_t x26 = _mulx_u64(x5, x14, &x27); + { uint64_t x29; uint8_t x30 = _addcarryx_u64(0x0, x18, x20, &x29); + { uint64_t x32; uint8_t x33 = _addcarryx_u64(x30, x21, x23, &x32); + { uint64_t x35; uint8_t x36 = _addcarryx_u64(x33, x24, x26, &x35); + { uint64_t x38; uint8_t _ = _addcarryx_u64(0x0, x36, x27, &x38); + { uint64_t _; uint64_t x41 = _mulx_u64(x17, 0xeeeeeeeeeeeeeeefL, &_); + { uint64_t x45; uint64_t x44 = _mulx_u64(x41, 0xfffffffffffffff1L, &x45); + { uint64_t x48; uint64_t x47 = _mulx_u64(x41, 0xffffffffffffffffL, &x48); + { uint64_t x51; uint64_t x50 = _mulx_u64(x41, 0xffffffffffffffffL, &x51); + { uint64_t x53, uint8_t x54 = Op (Syntax.MulSplit 64 (Syntax.TWord 6) (Syntax.TWord 3) (Syntax.TWord 6) (Syntax.TWord 3)) (Return x41, 0xf); + { uint64_t x56; uint8_t x57 = _addcarryx_u64(0x0, x45, x47, &x56); + { uint64_t x59; uint8_t x60 = _addcarryx_u64(x57, x48, x50, &x59); + { uint64_t x62; uint8_t x63 = _addcarryx_u64(x60, x51, x53, &x62); + { uint8_t x64 = (x63 + x54); + { uint64_t _; uint8_t x67 = _addcarryx_u64(0x0, x17, x44, &_); + { uint64_t x69; uint8_t x70 = _addcarryx_u64(x67, x29, x56, &x69); + { uint64_t x72; uint8_t x73 = _addcarryx_u64(x70, x32, x59, &x72); + { uint64_t x75; uint8_t x76 = _addcarryx_u64(x73, x35, x62, &x75); + { uint64_t x78; uint8_t x79 = _addcarryx_u64(x76, x38, x64, &x78); + { uint64_t x82; uint64_t x81 = _mulx_u64(x7, x11, &x82); + { uint64_t x85; uint64_t x84 = _mulx_u64(x7, x13, &x85); + { uint64_t x88; uint64_t x87 = _mulx_u64(x7, x15, &x88); + { uint64_t x91; uint64_t x90 = _mulx_u64(x7, x14, &x91); + { uint64_t x93; uint8_t x94 = _addcarryx_u64(0x0, x82, x84, &x93); + { uint64_t x96; uint8_t x97 = _addcarryx_u64(x94, x85, x87, &x96); + { uint64_t x99; uint8_t x100 = _addcarryx_u64(x97, x88, x90, &x99); + { uint64_t x102; uint8_t _ = _addcarryx_u64(0x0, x100, x91, &x102); + { uint64_t x105; uint8_t x106 = _addcarryx_u64(0x0, x69, x81, &x105); + { uint64_t x108; uint8_t x109 = _addcarryx_u64(x106, x72, x93, &x108); + { uint64_t x111; uint8_t x112 = _addcarryx_u64(x109, x75, x96, &x111); + { uint64_t x114; uint8_t x115 = _addcarryx_u64(x112, x78, x99, &x114); + { uint64_t x117; uint8_t x118 = _addcarryx_u64(x115, x79, x102, &x117); + { uint64_t _; uint64_t x120 = _mulx_u64(x105, 0xeeeeeeeeeeeeeeefL, &_); + { uint64_t x124; uint64_t x123 = _mulx_u64(x120, 0xfffffffffffffff1L, &x124); + { uint64_t x127; uint64_t x126 = _mulx_u64(x120, 0xffffffffffffffffL, &x127); + { uint64_t x130; uint64_t x129 = _mulx_u64(x120, 0xffffffffffffffffL, &x130); + { uint64_t x132, uint8_t x133 = Op (Syntax.MulSplit 64 (Syntax.TWord 6) (Syntax.TWord 3) (Syntax.TWord 6) (Syntax.TWord 3)) (Return x120, 0xf); + { uint64_t x135; uint8_t x136 = _addcarryx_u64(0x0, x124, x126, &x135); + { uint64_t x138; uint8_t x139 = _addcarryx_u64(x136, x127, x129, &x138); + { uint64_t x141; uint8_t x142 = _addcarryx_u64(x139, x130, x132, &x141); + { uint8_t x143 = (x142 + x133); + { uint64_t _; uint8_t x146 = _addcarryx_u64(0x0, x105, x123, &_); + { uint64_t x148; uint8_t x149 = _addcarryx_u64(x146, x108, x135, &x148); + { uint64_t x151; uint8_t x152 = _addcarryx_u64(x149, x111, x138, &x151); + { uint64_t x154; uint8_t x155 = _addcarryx_u64(x152, x114, x141, &x154); + { uint64_t x157; uint8_t x158 = _addcarryx_u64(x155, x117, x143, &x157); + { uint8_t x159 = (x158 + x118); + { uint64_t x162; uint64_t x161 = _mulx_u64(x9, x11, &x162); + { uint64_t x165; uint64_t x164 = _mulx_u64(x9, x13, &x165); + { uint64_t x168; uint64_t x167 = _mulx_u64(x9, x15, &x168); + { uint64_t x171; uint64_t x170 = _mulx_u64(x9, x14, &x171); + { uint64_t x173; uint8_t x174 = _addcarryx_u64(0x0, x162, x164, &x173); + { uint64_t x176; uint8_t x177 = _addcarryx_u64(x174, x165, x167, &x176); + { uint64_t x179; uint8_t x180 = _addcarryx_u64(x177, x168, x170, &x179); + { uint64_t x182; uint8_t _ = _addcarryx_u64(0x0, x180, x171, &x182); + { uint64_t x185; uint8_t x186 = _addcarryx_u64(0x0, x148, x161, &x185); + { uint64_t x188; uint8_t x189 = _addcarryx_u64(x186, x151, x173, &x188); + { uint64_t x191; uint8_t x192 = _addcarryx_u64(x189, x154, x176, &x191); + { uint64_t x194; uint8_t x195 = _addcarryx_u64(x192, x157, x179, &x194); + { uint64_t x197; uint8_t x198 = _addcarryx_u64(x195, x159, x182, &x197); + { uint64_t _; uint64_t x200 = _mulx_u64(x185, 0xeeeeeeeeeeeeeeefL, &_); + { uint64_t x204; uint64_t x203 = _mulx_u64(x200, 0xfffffffffffffff1L, &x204); + { uint64_t x207; uint64_t x206 = _mulx_u64(x200, 0xffffffffffffffffL, &x207); + { uint64_t x210; uint64_t x209 = _mulx_u64(x200, 0xffffffffffffffffL, &x210); + { uint64_t x212, uint8_t x213 = Op (Syntax.MulSplit 64 (Syntax.TWord 6) (Syntax.TWord 3) (Syntax.TWord 6) (Syntax.TWord 3)) (Return x200, 0xf); + { uint64_t x215; uint8_t x216 = _addcarryx_u64(0x0, x204, x206, &x215); + { uint64_t x218; uint8_t x219 = _addcarryx_u64(x216, x207, x209, &x218); + { uint64_t x221; uint8_t x222 = _addcarryx_u64(x219, x210, x212, &x221); + { uint8_t x223 = (x222 + x213); + { uint64_t _; uint8_t x226 = _addcarryx_u64(0x0, x185, x203, &_); + { uint64_t x228; uint8_t x229 = _addcarryx_u64(x226, x188, x215, &x228); + { uint64_t x231; uint8_t x232 = _addcarryx_u64(x229, x191, x218, &x231); + { uint64_t x234; uint8_t x235 = _addcarryx_u64(x232, x194, x221, &x234); + { uint64_t x237; uint8_t x238 = _addcarryx_u64(x235, x197, x223, &x237); + { uint8_t x239 = (x238 + x198); + { uint64_t x242; uint64_t x241 = _mulx_u64(x8, x11, &x242); + { uint64_t x245; uint64_t x244 = _mulx_u64(x8, x13, &x245); + { uint64_t x248; uint64_t x247 = _mulx_u64(x8, x15, &x248); + { uint64_t x251; uint64_t x250 = _mulx_u64(x8, x14, &x251); + { uint64_t x253; uint8_t x254 = _addcarryx_u64(0x0, x242, x244, &x253); + { uint64_t x256; uint8_t x257 = _addcarryx_u64(x254, x245, x247, &x256); + { uint64_t x259; uint8_t x260 = _addcarryx_u64(x257, x248, x250, &x259); + { uint64_t x262; uint8_t _ = _addcarryx_u64(0x0, x260, x251, &x262); + { uint64_t x265; uint8_t x266 = _addcarryx_u64(0x0, x228, x241, &x265); + { uint64_t x268; uint8_t x269 = _addcarryx_u64(x266, x231, x253, &x268); + { uint64_t x271; uint8_t x272 = _addcarryx_u64(x269, x234, x256, &x271); + { uint64_t x274; uint8_t x275 = _addcarryx_u64(x272, x237, x259, &x274); + { uint64_t x277; uint8_t x278 = _addcarryx_u64(x275, x239, x262, &x277); + { uint64_t _; uint64_t x280 = _mulx_u64(x265, 0xeeeeeeeeeeeeeeefL, &_); + { uint64_t x284; uint64_t x283 = _mulx_u64(x280, 0xfffffffffffffff1L, &x284); + { uint64_t x287; uint64_t x286 = _mulx_u64(x280, 0xffffffffffffffffL, &x287); + { uint64_t x290; uint64_t x289 = _mulx_u64(x280, 0xffffffffffffffffL, &x290); + { uint64_t x292, uint8_t x293 = Op (Syntax.MulSplit 64 (Syntax.TWord 6) (Syntax.TWord 3) (Syntax.TWord 6) (Syntax.TWord 3)) (Return x280, 0xf); + { uint64_t x295; uint8_t x296 = _addcarryx_u64(0x0, x284, x286, &x295); + { uint64_t x298; uint8_t x299 = _addcarryx_u64(x296, x287, x289, &x298); + { uint64_t x301; uint8_t x302 = _addcarryx_u64(x299, x290, x292, &x301); + { uint8_t x303 = (x302 + x293); + { uint64_t _; uint8_t x306 = _addcarryx_u64(0x0, x265, x283, &_); + { uint64_t x308; uint8_t x309 = _addcarryx_u64(x306, x268, x295, &x308); + { uint64_t x311; uint8_t x312 = _addcarryx_u64(x309, x271, x298, &x311); + { uint64_t x314; uint8_t x315 = _addcarryx_u64(x312, x274, x301, &x314); + { uint64_t x317; uint8_t x318 = _addcarryx_u64(x315, x277, x303, &x317); + { uint8_t x319 = (x318 + x278); + { uint64_t x321; uint8_t x322 = _subborrow_u64(0x0, x308, 0xfffffffffffffff1L, &x321); + { uint64_t x324; uint8_t x325 = _subborrow_u64(x322, x311, 0xffffffffffffffffL, &x324); + { uint64_t x327; uint8_t x328 = _subborrow_u64(x325, x314, 0xffffffffffffffffL, &x327); + { uint64_t x330; uint8_t x331 = _subborrow_u64(x328, x317, 0xf, &x330); + { uint64_t _; uint8_t x334 = _subborrow_u64(x331, x319, 0x0, &_); + { uint64_t x335 = cmovznz(x334, x330, x317); + { uint64_t x336 = cmovznz(x334, x327, x314); + { uint64_t x337 = cmovznz(x334, x324, x311); + { uint64_t x338 = cmovznz(x334, x321, x308); + out[0] = x338; + out[1] = x337; + out[2] = x336; + out[3] = x335; + }}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}} +} diff --git a/src/Specific/montgomery64_2e196m15/fenz.c b/src/Specific/montgomery64_2e196m15/fenz.c index 51bde0513..7541094ff 100644 --- a/src/Specific/montgomery64_2e196m15/fenz.c +++ b/src/Specific/montgomery64_2e196m15/fenz.c @@ -1,25 +1,11 @@ -#include <stdint.h> -#include <stdbool.h> -#include <x86intrin.h> -#include "liblow.h" - -#include "fenz.h" - -typedef unsigned int uint128_t __attribute__((mode(TI))); - -#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) -// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 -#define _subborrow_u32 __builtin_ia32_sbb_u32 -#define _subborrow_u64 __builtin_ia32_sbb_u64 -#endif - -#undef force_inline -#define force_inline __attribute__((always_inline)) - -void force_inline fenz(uint64_t* out, uint64_t x5, uint64_t x6, uint64_t x4, uint64_t x2) -{ uint64_t x7 = (x6 | x5); -{ uint64_t x8 = (x4 | x7); -{ uint64_t x9 = (x2 | x8); -out[0] = x9; -}}} -// caller: uint64_t out[1]; +static void fenz(ReturnType uint64_t out[1], const uint64_t in1[4]) { + { const uint64_t x5 = in1[3]; + { const uint64_t x6 = in1[2]; + { const uint64_t x4 = in1[1]; + { const uint64_t x2 = in1[0]; + { uint64_t x7 = (x6 | x5); + { uint64_t x8 = (x4 | x7); + { uint64_t x9 = (x2 | x8); + out[0] = x9; + }}}}}}} +} diff --git a/src/Specific/montgomery64_2e196m15/feopp.c b/src/Specific/montgomery64_2e196m15/feopp.c index c78613e0e..b8d1c31ca 100644 --- a/src/Specific/montgomery64_2e196m15/feopp.c +++ b/src/Specific/montgomery64_2e196m15/feopp.c @@ -1,38 +1,24 @@ -#include <stdint.h> -#include <stdbool.h> -#include <x86intrin.h> -#include "liblow.h" - -#include "feopp.h" - -typedef unsigned int uint128_t __attribute__((mode(TI))); - -#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) -// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 -#define _subborrow_u32 __builtin_ia32_sbb_u32 -#define _subborrow_u64 __builtin_ia32_sbb_u64 -#endif - -#undef force_inline -#define force_inline __attribute__((always_inline)) - -void force_inline feopp(uint64_t* out, uint64_t x5, uint64_t x6, uint64_t x4, uint64_t x2) -{ uint64_t x8; uint8_t x9 = _subborrow_u64(0x0, 0x0, x2, &x8); -{ uint64_t x11; uint8_t x12 = _subborrow_u64(x9, 0x0, x4, &x11); -{ uint64_t x14; uint8_t x15 = _subborrow_u64(x12, 0x0, x6, &x14); -{ uint64_t x17; uint8_t x18 = _subborrow_u64(x15, 0x0, x5, &x17); -{ uint64_t x19 = (uint64_t)cmovznz(x18, 0x0, 0xffffffffffffffffL); -{ uint64_t x20 = (x19 & 0xfffffffffffffff1L); -{ uint64_t x22; uint8_t x23 = _addcarryx_u64(0x0, x8, x20, &x22); -{ uint64_t x24 = (x19 & 0xffffffffffffffffL); -{ uint64_t x26; uint8_t x27 = _addcarryx_u64(x23, x11, x24, &x26); -{ uint64_t x28 = (x19 & 0xffffffffffffffffL); -{ uint64_t x30; uint8_t x31 = _addcarryx_u64(x27, x14, x28, &x30); -{ uint8_t x32 = ((uint8_t)x19 & 0xf); -{ uint64_t x34; uint8_t _ = _addcarryx_u64(x31, x17, x32, &x34); -out[0] = x34; -out[1] = x30; -out[2] = x26; -out[3] = x22; -}}}}}}}}}}}}} -// caller: uint64_t out[4]; +static void feopp(uint64_t out[4], const uint64_t in1[4]) { + { const uint64_t x5 = in1[3]; + { const uint64_t x6 = in1[2]; + { const uint64_t x4 = in1[1]; + { const uint64_t x2 = in1[0]; + { uint64_t x8; uint8_t x9 = _subborrow_u64(0x0, 0x0, x2, &x8); + { uint64_t x11; uint8_t x12 = _subborrow_u64(x9, 0x0, x4, &x11); + { uint64_t x14; uint8_t x15 = _subborrow_u64(x12, 0x0, x6, &x14); + { uint64_t x17; uint8_t x18 = _subborrow_u64(x15, 0x0, x5, &x17); + { uint64_t x19 = (uint64_t)cmovznz(x18, 0x0, 0xffffffffffffffffL); + { uint64_t x20 = (x19 & 0xfffffffffffffff1L); + { uint64_t x22; uint8_t x23 = _addcarryx_u64(0x0, x8, x20, &x22); + { uint64_t x24 = (x19 & 0xffffffffffffffffL); + { uint64_t x26; uint8_t x27 = _addcarryx_u64(x23, x11, x24, &x26); + { uint64_t x28 = (x19 & 0xffffffffffffffffL); + { uint64_t x30; uint8_t x31 = _addcarryx_u64(x27, x14, x28, &x30); + { uint8_t x32 = ((uint8_t)x19 & 0xf); + { uint64_t x34; uint8_t _ = _addcarryx_u64(x31, x17, x32, &x34); + out[0] = x22; + out[1] = x26; + out[2] = x30; + out[3] = x34; + }}}}}}}}}}}}}}}}} +} diff --git a/src/Specific/montgomery64_2e196m15/fesub.c b/src/Specific/montgomery64_2e196m15/fesub.c index 982a6ed70..c98c307bd 100644 --- a/src/Specific/montgomery64_2e196m15/fesub.c +++ b/src/Specific/montgomery64_2e196m15/fesub.c @@ -1,38 +1,28 @@ -#include <stdint.h> -#include <stdbool.h> -#include <x86intrin.h> -#include "liblow.h" - -#include "fesub.h" - -typedef unsigned int uint128_t __attribute__((mode(TI))); - -#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER)) -// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294 -#define _subborrow_u32 __builtin_ia32_sbb_u32 -#define _subborrow_u64 __builtin_ia32_sbb_u64 -#endif - -#undef force_inline -#define force_inline __attribute__((always_inline)) - -void force_inline fesub(uint64_t* out, uint64_t x8, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x14, uint64_t x15, uint64_t x13, uint64_t x11) -{ uint64_t x17; uint8_t x18 = _subborrow_u64(0x0, x5, x11, &x17); -{ uint64_t x20; uint8_t x21 = _subborrow_u64(x18, x7, x13, &x20); -{ uint64_t x23; uint8_t x24 = _subborrow_u64(x21, x9, x15, &x23); -{ uint64_t x26; uint8_t x27 = _subborrow_u64(x24, x8, x14, &x26); -{ uint64_t x28 = (uint64_t)cmovznz(x27, 0x0, 0xffffffffffffffffL); -{ uint64_t x29 = (x28 & 0xfffffffffffffff1L); -{ uint64_t x31; uint8_t x32 = _addcarryx_u64(0x0, x17, x29, &x31); -{ uint64_t x33 = (x28 & 0xffffffffffffffffL); -{ uint64_t x35; uint8_t x36 = _addcarryx_u64(x32, x20, x33, &x35); -{ uint64_t x37 = (x28 & 0xffffffffffffffffL); -{ uint64_t x39; uint8_t x40 = _addcarryx_u64(x36, x23, x37, &x39); -{ uint8_t x41 = ((uint8_t)x28 & 0xf); -{ uint64_t x43; uint8_t _ = _addcarryx_u64(x40, x26, x41, &x43); -out[0] = x43; -out[1] = x39; -out[2] = x35; -out[3] = x31; -}}}}}}}}}}}}} -// caller: uint64_t out[4]; +static void fesub(uint64_t out[4], const uint64_t in1[4], const uint64_t in2[4]) { + { const uint64_t x8 = in1[3]; + { const uint64_t x9 = in1[2]; + { const uint64_t x7 = in1[1]; + { const uint64_t x5 = in1[0]; + { const uint64_t x14 = in2[3]; + { const uint64_t x15 = in2[2]; + { const uint64_t x13 = in2[1]; + { const uint64_t x11 = in2[0]; + { uint64_t x17; uint8_t x18 = _subborrow_u64(0x0, x5, x11, &x17); + { uint64_t x20; uint8_t x21 = _subborrow_u64(x18, x7, x13, &x20); + { uint64_t x23; uint8_t x24 = _subborrow_u64(x21, x9, x15, &x23); + { uint64_t x26; uint8_t x27 = _subborrow_u64(x24, x8, x14, &x26); + { uint64_t x28 = (uint64_t)cmovznz(x27, 0x0, 0xffffffffffffffffL); + { uint64_t x29 = (x28 & 0xfffffffffffffff1L); + { uint64_t x31; uint8_t x32 = _addcarryx_u64(0x0, x17, x29, &x31); + { uint64_t x33 = (x28 & 0xffffffffffffffffL); + { uint64_t x35; uint8_t x36 = _addcarryx_u64(x32, x20, x33, &x35); + { uint64_t x37 = (x28 & 0xffffffffffffffffL); + { uint64_t x39; uint8_t x40 = _addcarryx_u64(x36, x23, x37, &x39); + { uint8_t x41 = ((uint8_t)x28 & 0xf); + { uint64_t x43; uint8_t _ = _addcarryx_u64(x40, x26, x41, &x43); + out[0] = x31; + out[1] = x35; + out[2] = x39; + out[3] = x43; + }}}}}}}}}}}}}}}}}}}}} +} |