1 #include "vec128.h"
2 
PQCLEAN_MCELIECE348864F_AVX_vec128_set1_16b(uint16_t a)3 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_set1_16b(uint16_t a) {
4     return _mm_set1_epi16(a);
5 }
6 
PQCLEAN_MCELIECE348864F_AVX_vec128_testz(vec128 a)7 int PQCLEAN_MCELIECE348864F_AVX_vec128_testz(vec128 a) {
8     return _mm_testz_si128(a, a);
9 }
10 
PQCLEAN_MCELIECE348864F_AVX_vec128_setzero(void)11 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_setzero(void) {
12     return _mm_setzero_si128();
13 }
14 
PQCLEAN_MCELIECE348864F_AVX_vec128_and(vec128 a,vec128 b)15 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_and(vec128 a, vec128 b) {
16     return _mm_and_si128(a, b);
17 }
18 
PQCLEAN_MCELIECE348864F_AVX_vec128_xor(vec128 a,vec128 b)19 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_xor(vec128 a, vec128 b) {
20     return _mm_xor_si128(a, b);
21 }
22 
PQCLEAN_MCELIECE348864F_AVX_vec128_or(vec128 a,vec128 b)23 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_or(vec128 a, vec128 b) {
24     return _mm_or_si128(a, b);
25 }
26 
PQCLEAN_MCELIECE348864F_AVX_vec128_sll_2x(vec128 a,int s)27 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_sll_2x(vec128 a, int s) {
28     return _mm_slli_epi64(a, s);
29 }
30 
PQCLEAN_MCELIECE348864F_AVX_vec128_srl_2x(vec128 a,int s)31 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_srl_2x(vec128 a, int s) {
32     return _mm_srli_epi64(a, s);
33 }
34 
PQCLEAN_MCELIECE348864F_AVX_vec128_set2x(uint64_t a0,uint64_t a1)35 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_set2x(uint64_t a0, uint64_t a1) {
36     return _mm_set_epi64x(a1, a0);
37 }
38 
PQCLEAN_MCELIECE348864F_AVX_vec128_unpack_low(vec128 a,vec128 b)39 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_unpack_low(vec128 a, vec128 b) {
40     return _mm_unpacklo_epi64(a, b);
41 }
42 
PQCLEAN_MCELIECE348864F_AVX_vec128_unpack_high(vec128 a,vec128 b)43 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_unpack_high(vec128 a, vec128 b) {
44     return _mm_unpackhi_epi64(a, b);
45 }
46 
PQCLEAN_MCELIECE348864F_AVX_vec128_setbits(uint64_t a)47 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_setbits(uint64_t a) {
48     return _mm_set1_epi64x(-a);
49 }
50 
PQCLEAN_MCELIECE348864F_AVX_vec128_copy(vec128 * dest,const vec128 * src)51 void PQCLEAN_MCELIECE348864F_AVX_vec128_copy(vec128 *dest, const vec128 *src) {
52     int i;
53 
54     for (i = 0; i < GFBITS; i++) {
55         dest[i] = src[i];
56     }
57 }
58 
PQCLEAN_MCELIECE348864F_AVX_vec128_add(vec128 * c,const vec128 * a,const vec128 * b)59 void PQCLEAN_MCELIECE348864F_AVX_vec128_add(vec128 *c, const vec128 *a, const vec128 *b) {
60     int i;
61 
62     for (i = 0; i < GFBITS; i++) {
63         c[i] = PQCLEAN_MCELIECE348864F_AVX_vec128_xor(a[i], b[i]);
64     }
65 }
66 
PQCLEAN_MCELIECE348864F_AVX_vec128_or_reduce(const vec128 * a)67 vec128 PQCLEAN_MCELIECE348864F_AVX_vec128_or_reduce(const vec128 *a) {
68     int i;
69     vec128 ret;
70 
71     ret = a[0];
72     for (i = 1; i < GFBITS; i++) {
73         ret = PQCLEAN_MCELIECE348864F_AVX_vec128_or(ret, a[i]);
74     }
75 
76     return ret;
77 }
78 
79 /* bitsliced field multiplications */
PQCLEAN_MCELIECE348864F_AVX_vec128_mul(vec128 * h,vec128 * f,const vec128 * g)80 void PQCLEAN_MCELIECE348864F_AVX_vec128_mul(vec128 *h, vec128 *f, const vec128 *g) {
81     PQCLEAN_MCELIECE348864F_AVX_vec128_mul_asm(h, f, g, 16);
82 }
83 
84