/*
 * path: root/src/Specific/montgomery32_2e383m187/feadd.c
 * blob: da64dfe0ced83de41e517141335197d430edeeaa
 */
#include <stdint.h>
#include <stdbool.h>
#include <x86intrin.h>
#include "liblow.h"

#include "feadd.h"

typedef unsigned int uint128_t __attribute__((mode(TI)));

#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER))
// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
#define _subborrow_u32 __builtin_ia32_sbb_u32
#define _subborrow_u64 __builtin_ia32_sbb_u64
#endif

#undef force_inline
#define force_inline __attribute__((always_inline))

void force_inline feadd(uint64_t* out, uint64_t x24, uint64_t x25, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17, uint64_t x15, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x46, uint64_t x47, uint64_t x45, uint64_t x43, uint64_t x41, uint64_t x39, uint64_t x37, uint64_t x35, uint64_t x33, uint64_t x31, uint64_t x29, uint64_t x27)
{  uint32_t x49; uint8_t x50 = _addcarryx_u32(0x0, x5, x27, &x49);
{  uint32_t x52; uint8_t x53 = _addcarryx_u32(x50, x7, x29, &x52);
{  uint32_t x55; uint8_t x56 = _addcarryx_u32(x53, x9, x31, &x55);
{  uint32_t x58; uint8_t x59 = _addcarryx_u32(x56, x11, x33, &x58);
{  uint32_t x61; uint8_t x62 = _addcarryx_u32(x59, x13, x35, &x61);
{  uint32_t x64; uint8_t x65 = _addcarryx_u32(x62, x15, x37, &x64);
{  uint32_t x67; uint8_t x68 = _addcarryx_u32(x65, x17, x39, &x67);
{  uint32_t x70; uint8_t x71 = _addcarryx_u32(x68, x19, x41, &x70);
{  uint32_t x73; uint8_t x74 = _addcarryx_u32(x71, x21, x43, &x73);
{  uint32_t x76; uint8_t x77 = _addcarryx_u32(x74, x23, x45, &x76);
{  uint32_t x79; uint8_t x80 = _addcarryx_u32(x77, x25, x47, &x79);
{  uint32_t x82; uint8_t x83 = _addcarryx_u32(x80, x24, x46, &x82);
{  uint32_t x85; uint8_t x86 = _subborrow_u32(0x0, x49, 0xffffff45, &x85);
{  uint32_t x88; uint8_t x89 = _subborrow_u32(x86, x52, 0xffffffff, &x88);
{  uint32_t x91; uint8_t x92 = _subborrow_u32(x89, x55, 0xffffffff, &x91);
{  uint32_t x94; uint8_t x95 = _subborrow_u32(x92, x58, 0xffffffff, &x94);
{  uint32_t x97; uint8_t x98 = _subborrow_u32(x95, x61, 0xffffffff, &x97);
{  uint32_t x100; uint8_t x101 = _subborrow_u32(x98, x64, 0xffffffff, &x100);
{  uint32_t x103; uint8_t x104 = _subborrow_u32(x101, x67, 0xffffffff, &x103);
{  uint32_t x106; uint8_t x107 = _subborrow_u32(x104, x70, 0xffffffff, &x106);
{  uint32_t x109; uint8_t x110 = _subborrow_u32(x107, x73, 0xffffffff, &x109);
{  uint32_t x112; uint8_t x113 = _subborrow_u32(x110, x76, 0xffffffff, &x112);
{  uint32_t x115; uint8_t x116 = _subborrow_u32(x113, x79, 0xffffffff, &x115);
{  uint32_t x118; uint8_t x119 = _subborrow_u32(x116, x82, 0x7fffffff, &x118);
{  uint32_t _; uint8_t x122 = _subborrow_u32(x119, x83, 0x0, &_);
{  uint32_t x123 = cmovznz(x122, x118, x82);
{  uint32_t x124 = cmovznz(x122, x115, x79);
{  uint32_t x125 = cmovznz(x122, x112, x76);
{  uint32_t x126 = cmovznz(x122, x109, x73);
{  uint32_t x127 = cmovznz(x122, x106, x70);
{  uint32_t x128 = cmovznz(x122, x103, x67);
{  uint32_t x129 = cmovznz(x122, x100, x64);
{  uint32_t x130 = cmovznz(x122, x97, x61);
{  uint32_t x131 = cmovznz(x122, x94, x58);
{  uint32_t x132 = cmovznz(x122, x91, x55);
{  uint32_t x133 = cmovznz(x122, x88, x52);
{  uint32_t x134 = cmovznz(x122, x85, x49);
out[0] = x123;
out[1] = x124;
out[2] = x125;
out[3] = x126;
out[4] = x127;
out[5] = x128;
out[6] = x129;
out[7] = x130;
out[8] = x131;
out[9] = x132;
out[10] = x133;
out[11] = x134;
}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}}
// caller: uint64_t out[12];