1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
|
#include <stdint.h>
#include <stdbool.h>
#include <x86intrin.h>
#include "liblow.h"
#include "femul.h"
// 128-bit unsigned integer type, declared through the compiler's TImode
// `mode` attribute extension. Not referenced by the code visible in this file section.
typedef unsigned int uint128_t __attribute__((mode(TI)));
// Only when building with GCC itself (clang and the Intel compiler are
// excluded): make the _subborrow_u32/_subborrow_u64 names expand directly to
// the compiler builtins instead of the header-provided intrinsics.
// NOTE(review): presumably a workaround for the GCC bug linked below; confirm
// it is still required for the compiler versions in use.
#if (defined(__GNUC__) || defined(__GNUG__)) && !(defined(__clang__)||defined(__INTEL_COMPILER))
// https://gcc.gnu.org/bugzilla/show_bug.cgi?id=81294
#define _subborrow_u32 __builtin_ia32_sbb_u32
#define _subborrow_u64 __builtin_ia32_sbb_u64
#endif
// Drop any earlier definition of force_inline (for example one coming from
// the headers included above) and redefine it as the always_inline attribute.
// Note that the expansion does not itself contain the `inline` keyword.
#undef force_inline
#define force_inline __attribute__((always_inline))
// femul: machine-generated multiplication routine operating on 64-bit words.
//
// Parameters:
//   out            - destination array written by the final statements.
//   x12 .. x5      - first operand, passed as six separate 64-bit words.
//                    Only x5 is read by the statements visible here; x12, x13,
//                    x11, x9 and x7 are unused in this body.
//   x22 .. x15     - second operand, six 64-bit words, all of which are
//                    multiplied by x5 below.
//
// NOTE(review): the tail of this function (the three `out[...]` lines) is not
// valid C. It looks like unprocessed code-generator output, so the function
// cannot compile as written and its intended result cannot be determined from
// this file alone. Regenerate it from the original source rather than
// patching it by hand.
//
// Each statement opens a new nested scope; the run of closing braces at the
// end closes all of them.
void force_inline femul(uint64_t* out, uint64_t x12, uint64_t x13, uint64_t x11, uint64_t x9, uint64_t x7, uint64_t x5, uint64_t x22, uint64_t x23, uint64_t x21, uint64_t x19, uint64_t x17, uint64_t x15)
// Six 64x64 -> 128-bit products of x5 with each word of the second operand.
// _mulx_u64 returns the low 64 bits and stores the high 64 bits through the
// pointer argument (low/high pairs: x25/x26, x28/x29, x31/x32, x34/x35,
// x37/x38, x40/x41).
{ uint64_t x26; uint64_t x25 = _mulx_u64(x5, x15, &x26);
{ uint64_t x29; uint64_t x28 = _mulx_u64(x5, x17, &x29);
{ uint64_t x32; uint64_t x31 = _mulx_u64(x5, x19, &x32);
{ uint64_t x35; uint64_t x34 = _mulx_u64(x5, x21, &x35);
{ uint64_t x38; uint64_t x37 = _mulx_u64(x5, x23, &x38);
{ uint64_t x41; uint64_t x40 = _mulx_u64(x5, x22, &x41);
// Carry chain: add the high half of each product to the low half of the next
// one, propagating the carry from step to step. Together, x25 and the sums
// x43, x46, x49, x52, x55, x58 are the seven words (least significant first)
// of x5 times the six-word second operand.
{ uint64_t x43; uint8_t x44 = _addcarryx_u64(0x0, x26, x28, &x43);
{ uint64_t x46; uint8_t x47 = _addcarryx_u64(x44, x29, x31, &x46);
{ uint64_t x49; uint8_t x50 = _addcarryx_u64(x47, x32, x34, &x49);
{ uint64_t x52; uint8_t x53 = _addcarryx_u64(x50, x35, x37, &x52);
{ uint64_t x55; uint8_t x56 = _addcarryx_u64(x53, x38, x40, &x55);
// Fold the last carry (x56) into the top high half (x41); the carry out of
// this addition is stored in `_` and never read.
{ uint64_t x58; uint8_t _ = _addcarryx_u64(0x0, x56, x41, &x58);
// Products of the lowest product word x25 with five 64-bit constants.
// NOTE(review): presumably these constants are words of the field modulus and
// this is the start of a Montgomery-style reduction; confirm against the
// generator input. None of these results are used by the visible statements,
// and only five constants appear although the operands have six words.
{ uint64_t x62; uint64_t x61 = _mulx_u64(x25, 0xffffffffffffffffL, &x62);
{ uint64_t x65; uint64_t x64 = _mulx_u64(x25, 0xffffffffffffffffL, &x65);
{ uint64_t x68; uint64_t x67 = _mulx_u64(x25, 0xfffffffdffffffffL, &x68);
{ uint64_t x71; uint64_t x70 = _mulx_u64(x25, 0xffffffffffffffffL, &x71);
{ uint64_t x74; uint64_t x73 = _mulx_u64(x25, 0xffffffffffffffffL, &x74);
// NOTE(review): the next three lines are NOT valid C. The first assigns a
// declaration, the second embeds a raw `Op Syntax.MulSplit ...` term that
// looks like the generator's internal syntax rather than emitted code, and
// the third stores the literal 0x3 followed by a stray empty statement.
// They are left untouched because the intended computation is not recoverable
// from this file.
out[0] = uint64_t x76;
out[1] = uint8_t x77 = Op Syntax.MulSplit 64 Syntax.TWord 6 Syntax.TWord 3 Syntax.TWord 6 Syntax.TWord 3 x25;
out[2] = 0x3;;
// Closes the 17 nested scopes opened above (the outermost is the function body).
}}}}}}}}}}}}}}}}}
// caller: uint64_t out[3];
|