diff options
author | 2017-11-02 01:36:04 -0400 | |
---|---|---|
committer | 2017-11-02 01:36:04 -0400 | |
commit | 5b45aa93efa19d54e50299ff0df8ee46c60f891b (patch) | |
tree | 9cea98ab783f557b5cbca0456a4dc3b4498e43c5 /src/Specific/montgomery32_2e369m25 | |
parent | e8bda9b779d5762c5868cd09c85142151655d5ca (diff) |
Update display logs and c files
Diffstat (limited to 'src/Specific/montgomery32_2e369m25')
-rw-r--r-- | src/Specific/montgomery32_2e369m25/feadd.c | 70 | ||||
-rw-r--r-- | src/Specific/montgomery32_2e369m25/feadd.h | 6 | ||||
-rw-r--r-- | src/Specific/montgomery32_2e369m25/fenz.c | 33 | ||||
-rw-r--r-- | src/Specific/montgomery32_2e369m25/fenz.h | 6 |
4 files changed, 115 insertions, 0 deletions
diff --git a/src/Specific/montgomery32_2e369m25/feadd.c b/src/Specific/montgomery32_2e369m25/feadd.c
new file mode 100644
index 000000000..340cf25c9
--- /dev/null
+++ b/src/Specific/montgomery32_2e369m25/feadd.c
@@ -0,0 +1,70 @@
+#include <stdint.h>
+#include <stdbool.h>
+#include <x86intrin.h>
+#include "liblow.h"
+
+#include "feadd.h"
+
+typedef unsigned int uint128_t __attribute__((mode(TI)));
+
+#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER))
+// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
+#define _subborrow_u32 __builtin_ia32_sbb_u32
+#define _subborrow_u64 __builtin_ia32_sbb_u64
+#endif
+
+#undef force_inline
+#define force_inline __attribute__((always_inline))
+
+void force_inline feadd(uint64_t* out, uint64_t x24, uint64_t x25, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x46, uint64_t x47, uint64_t x45, uint64_t x43, uint64_t x41, uint64_t x39, uint64_t x37, uint64_t x35, uint64_t x33, uint64_t x31, uint64_t x29, uint64_t x27)
+{ uint32_t x49; uint8_t x50 = _addcarryx_u32(0x0, x5, x27, &x49);
+{ uint32_t x52; uint8_t x53 = _addcarryx_u32(x50, x7, x29, &x52);
+{ uint32_t x55; uint8_t x56 = _addcarryx_u32(x53, x9, x31, &x55);
+{ uint32_t x58; uint8_t x59 = _addcarryx_u32(x56, x11, x33, &x58);
+{ uint32_t x61; uint8_t x62 = _addcarryx_u32(x59, x13, x35, &x61);
+{ uint32_t x64; uint8_t x65 = _addcarryx_u32(x62, x15, x37, &x64);
+{ uint32_t x67; uint8_t x68 = _addcarryx_u32(x65, x17, x39, &x67);
+{ uint32_t x70; uint8_t x71 = _addcarryx_u32(x68, x19, x41, &x70);
+{ uint32_t x73; uint8_t x74 = _addcarryx_u32(x71, x21, x43, &x73);
+{ uint32_t x76; uint8_t x77 = _addcarryx_u32(x74, x23, x45, &x76);
+{ uint32_t x79; uint8_t x80 = _addcarryx_u32(x77, x25, x47, &x79);
+{ uint32_t x82; uint8_t x83 = _addcarryx_u32(x80, x24, x46, &x82);
+{ uint32_t x85; uint8_t x86 = _subborrow_u32(0x0, x49, 0xffffffe7, &x85);
+{ uint32_t x88; uint8_t x89 = _subborrow_u32(x86, x52, 0xffffffff, &x88);
+{ uint32_t x91; uint8_t x92 = _subborrow_u32(x89, x55, 0xffffffff, &x91);
+{ uint32_t x94; uint8_t x95 = _subborrow_u32(x92, x58, 0xffffffff, &x94);
+{ uint32_t x97; uint8_t x98 = _subborrow_u32(x95, x61, 0xffffffff, &x97);
+{ uint32_t x100; uint8_t x101 = _subborrow_u32(x98, x64, 0xffffffff, &x100);
+{ uint32_t x103; uint8_t x104 = _subborrow_u32(x101, x67, 0xffffffff, &x103);
+{ uint32_t x106; uint8_t x107 = _subborrow_u32(x104, x70, 0xffffffff, &x106);
+{ uint32_t x109; uint8_t x110 = _subborrow_u32(x107, x73, 0xffffffff, &x109);
+{ uint32_t x112; uint8_t x113 = _subborrow_u32(x110, x76, 0xffffffff, &x112);
+{ uint32_t x115; uint8_t x116 = _subborrow_u32(x113, x79, 0xffffffff, &x115);
+{ uint32_t x118; uint8_t x119 = _subborrow_u32(x116, x82, 0x1ffff, &x118);
+{ uint32_t _; uint8_t x122 = _subborrow_u32(x119, x83, 0x0, &_);
+{ uint32_t x123 = cmovznz(x122, x118, x82);
+{ uint32_t x124 = cmovznz(x122, x115, x79);
+{ uint32_t x125 = cmovznz(x122, x112, x76);
+{ uint32_t x126 = cmovznz(x122, x109, x73);
+{ uint32_t x127 = cmovznz(x122, x106, x70);
+{ uint32_t x128 = cmovznz(x122, x103, x67);
+{ uint32_t x129 = cmovznz(x122, x100, x64);
+{ uint32_t x130 = cmovznz(x122, x97, x61);
+{ uint32_t x131 = cmovznz(x122, x94, x58);
+{ uint32_t x132 = cmovznz(x122, x91, x55);
+{ uint32_t x133 = cmovznz(x122, x88, x52);
+{ uint32_t x134 = cmovznz(x122, x85, x49);
+out[0] = x123;
+out[1] = x124;
+out[2] = x125;
+out[3] = x126;
+out[4] = x127;
+out[5] = x128;
+out[6] = x129;
+out[7] = x130;
+out[8] = x131;
+out[9] = x132;
+out[10] = x133;
+out[11] = x134;
+}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}
+// caller: uint64_t out[12];
diff --git a/src/Specific/montgomery32_2e369m25/feadd.h b/src/Specific/montgomery32_2e369m25/feadd.h
new file mode 100644
index 000000000..06344a9dc
--- /dev/null
+++ b/src/Specific/montgomery32_2e369m25/feadd.h
@@ -0,0 +1,6 @@
+#include <stdint.h>
+
+#undef force_inline
+#define force_inline __attribute__((always_inline))
+
+void force_inline feadd(uint64_t* out, uint64_t x24, uint64_t x25, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x46, uint64_t x47, uint64_t x45, uint64_t x43, uint64_t x41, uint64_t x39, uint64_t x37, uint64_t x35, uint64_t x33, uint64_t x31, uint64_t x29, uint64_t x27);
diff --git a/src/Specific/montgomery32_2e369m25/fenz.c b/src/Specific/montgomery32_2e369m25/fenz.c
new file mode 100644
index 000000000..047ff14c3
--- /dev/null
+++ b/src/Specific/montgomery32_2e369m25/fenz.c
@@ -0,0 +1,33 @@
+#include <stdint.h>
+#include <stdbool.h>
+#include <x86intrin.h>
+#include "liblow.h"
+
+#include "fenz.h"
+
+typedef unsigned int uint128_t __attribute__((mode(TI)));
+
+#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER))
+// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
+#define _subborrow_u32 __builtin_ia32_sbb_u32
+#define _subborrow_u64 __builtin_ia32_sbb_u64
+#endif
+
+#undef force_inline
+#define force_inline __attribute__((always_inline))
+
+void force_inline fenz(uint64_t* out, uint64_t x21, uint64_t x22, uint64_t x20, uint64_t x18, uint64_t x16, uint64_t x14, uint64_t x12, uint64_t x10, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2)
+{ uint32_t x23 = (x22 | x21);
+{ uint32_t x24 = (x20 | x23);
+{ uint32_t x25 = (x18 | x24);
+{ uint32_t x26 = (x16 | x25);
+{ uint32_t x27 = (x14 | x26);
+{ uint32_t x28 = (x12 | x27);
+{ uint32_t x29 = (x10 | x28);
+{ uint32_t x30 = (x8 | x29);
+{ uint32_t x31 = (x6 | x30);
+{ uint32_t x32 = (x4 | x31);
+{ uint32_t x33 = (x2 | x32);
+out[0] = x33;
+}}}}}}}}}}}
+// caller: uint64_t out[1];
diff --git a/src/Specific/montgomery32_2e369m25/fenz.h b/src/Specific/montgomery32_2e369m25/fenz.h
new file mode 100644
index 000000000..8d17e783b
--- /dev/null
+++ b/src/Specific/montgomery32_2e369m25/fenz.h
@@ -0,0 +1,6 @@
+#include <stdint.h>
+
+#undef force_inline
+#define force_inline __attribute__((always_inline))
+
+void force_inline fenz(uint64_t* out, uint64_t x21, uint64_t x22, uint64_t x20, uint64_t x18, uint64_t x16, uint64_t x14, uint64_t x12, uint64_t x10, uint64_t x8, uint64_t x6, uint64_t x4, uint64_t x2);