/* Autogenerated: src/ExtractionOCaml/word_by_word_montgomery --static p256 '2^256 - 2^224 + 2^192 + 2^96 - 1' 32 mul square add sub opp from_montgomery nonzero selectznz to_bytes from_bytes */
/* curve description: p256 */
/* requested operations: mul, square, add, sub, opp, from_montgomery, nonzero, selectznz, to_bytes, from_bytes */
/* m = 0xffffffff00000001000000000000000000000000ffffffffffffffffffffffff (from "2^256 - 2^224 + 2^192 + 2^96 - 1") */
/* machine_wordsize = 32 (from "32") */
/*                                                                    */
/* NOTE: In addition to the bounds specified above each function, all */
/*   functions synthesized for this Montgomery arithmetic require the */
/*   input to be strictly less than the prime modulus (m), and also   */
/*   require the input to be in the unique saturated representation.  */
/*   All functions also ensure that these two properties are true of  */
/*   return values.                                                   */
13 
#include <stdint.h>
/*
 * One-bit helper types used by the word-level primitives in this file.
 *   fiat_p256_uint1: carry / borrow / selector flag; the helpers document its
 *                    range as [0x0 ~> 0x1].
 *   fiat_p256_int1:  signed counterpart used for intermediate 0 / -1 values
 *                    (e.g. when turning a flag into an all-ones mask).
 */
typedef unsigned char fiat_p256_uint1;
typedef signed char fiat_p256_int1;

/*
 * Compile-time guard: -1 has both low bits set only in two's complement
 * (ones' complement yields 2, sign-magnitude yields 1), so the build is
 * rejected on any other signed representation.
 */
#if (-1 & 3) != 3
#error "This code only works on a two's complement system"
#endif
21 
22 
23 /*
24  * The function fiat_p256_addcarryx_u32 is an addition with carry.
25  * Postconditions:
26  *   out1 = (arg1 + arg2 + arg3) mod 2^32
27  *   out2 = ⌊(arg1 + arg2 + arg3) / 2^32⌋
28  *
29  * Input Bounds:
30  *   arg1: [0x0 ~> 0x1]
31  *   arg2: [0x0 ~> 0xffffffff]
32  *   arg3: [0x0 ~> 0xffffffff]
33  * Output Bounds:
34  *   out1: [0x0 ~> 0xffffffff]
35  *   out2: [0x0 ~> 0x1]
36  */
fiat_p256_addcarryx_u32(uint32_t * out1,fiat_p256_uint1 * out2,fiat_p256_uint1 arg1,uint32_t arg2,uint32_t arg3)37 static void fiat_p256_addcarryx_u32(uint32_t* out1, fiat_p256_uint1* out2, fiat_p256_uint1 arg1, uint32_t arg2, uint32_t arg3) {
38   uint64_t x1 = ((arg1 + (uint64_t)arg2) + arg3);
39   uint32_t x2 = (uint32_t)(x1 & UINT32_C(0xffffffff));
40   fiat_p256_uint1 x3 = (fiat_p256_uint1)(x1 >> 32);
41   *out1 = x2;
42   *out2 = x3;
43 }
44 
45 /*
46  * The function fiat_p256_subborrowx_u32 is a subtraction with borrow.
47  * Postconditions:
48  *   out1 = (-arg1 + arg2 + -arg3) mod 2^32
49  *   out2 = -⌊(-arg1 + arg2 + -arg3) / 2^32⌋
50  *
51  * Input Bounds:
52  *   arg1: [0x0 ~> 0x1]
53  *   arg2: [0x0 ~> 0xffffffff]
54  *   arg3: [0x0 ~> 0xffffffff]
55  * Output Bounds:
56  *   out1: [0x0 ~> 0xffffffff]
57  *   out2: [0x0 ~> 0x1]
58  */
fiat_p256_subborrowx_u32(uint32_t * out1,fiat_p256_uint1 * out2,fiat_p256_uint1 arg1,uint32_t arg2,uint32_t arg3)59 static void fiat_p256_subborrowx_u32(uint32_t* out1, fiat_p256_uint1* out2, fiat_p256_uint1 arg1, uint32_t arg2, uint32_t arg3) {
60   int64_t x1 = ((arg2 - (int64_t)arg1) - arg3);
61   fiat_p256_int1 x2 = (fiat_p256_int1)(x1 >> 32);
62   uint32_t x3 = (uint32_t)(x1 & UINT32_C(0xffffffff));
63   *out1 = x3;
64   *out2 = (fiat_p256_uint1)(0x0 - x2);
65 }
66 
/*
 * The function fiat_p256_mulx_u32 is a multiplication, returning the full double-width result.
 * Postconditions:
 *   out1 = (arg1 * arg2) mod 2^32
 *   out2 = ⌊arg1 * arg2 / 2^32⌋
 *
 * Input Bounds:
 *   arg1: [0x0 ~> 0xffffffff]
 *   arg2: [0x0 ~> 0xffffffff]
 * Output Bounds:
 *   out1: [0x0 ~> 0xffffffff]
 *   out2: [0x0 ~> 0xffffffff]
 */
static void fiat_p256_mulx_u32(uint32_t* out1, uint32_t* out2, uint32_t arg1, uint32_t arg2) {
  /* Widen one operand first so the product is computed in 64 bits. */
  uint64_t product = ((uint64_t)arg1 * arg2);
  /* Split the 64-bit product into its low and high 32-bit words. */
  *out1 = (uint32_t)(product & UINT32_C(0xffffffff));
  *out2 = (uint32_t)(product >> 32);
}
87 
88 /*
89  * The function fiat_p256_cmovznz_u32 is a single-word conditional move.
90  * Postconditions:
91  *   out1 = (if arg1 = 0 then arg2 else arg3)
92  *
93  * Input Bounds:
94  *   arg1: [0x0 ~> 0x1]
95  *   arg2: [0x0 ~> 0xffffffff]
96  *   arg3: [0x0 ~> 0xffffffff]
97  * Output Bounds:
98  *   out1: [0x0 ~> 0xffffffff]
99  */
fiat_p256_cmovznz_u32(uint32_t * out1,fiat_p256_uint1 arg1,uint32_t arg2,uint32_t arg3)100 static void fiat_p256_cmovznz_u32(uint32_t* out1, fiat_p256_uint1 arg1, uint32_t arg2, uint32_t arg3) {
101   fiat_p256_uint1 x1 = (!(!arg1));
102   uint32_t x2 = ((fiat_p256_int1)(0x0 - x1) & UINT32_C(0xffffffff));
103   // Note this line has been patched from the synthesized code to add value
104   // barriers.
105   //
106   // Clang recognizes this pattern as a select. While it usually transforms it
107   // to a cmov, it sometimes further transforms it into a branch, which we do
108   // not want.
109   uint32_t x3 = ((value_barrier_u32(x2) & arg3) | (value_barrier_u32(~x2) & arg2));
110   *out1 = x3;
111 }
112 
113 /*
114  * The function fiat_p256_mul multiplies two field elements in the Montgomery domain.
115  * Preconditions:
116  *   0 ≤ eval arg1 < m
117  *   0 ≤ eval arg2 < m
118  * Postconditions:
119  *   eval (from_montgomery out1) mod m = (eval (from_montgomery arg1) * eval (from_montgomery arg2)) mod m
120  *   0 ≤ eval out1 < m
121  *
122  * Input Bounds:
123  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
124  *   arg2: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
125  * Output Bounds:
126  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
127  */
fiat_p256_mul(uint32_t out1[8],const uint32_t arg1[8],const uint32_t arg2[8])128 static void fiat_p256_mul(uint32_t out1[8], const uint32_t arg1[8], const uint32_t arg2[8]) {
129   uint32_t x1 = (arg1[1]);
130   uint32_t x2 = (arg1[2]);
131   uint32_t x3 = (arg1[3]);
132   uint32_t x4 = (arg1[4]);
133   uint32_t x5 = (arg1[5]);
134   uint32_t x6 = (arg1[6]);
135   uint32_t x7 = (arg1[7]);
136   uint32_t x8 = (arg1[0]);
137   uint32_t x9;
138   uint32_t x10;
139   fiat_p256_mulx_u32(&x9, &x10, x8, (arg2[7]));
140   uint32_t x11;
141   uint32_t x12;
142   fiat_p256_mulx_u32(&x11, &x12, x8, (arg2[6]));
143   uint32_t x13;
144   uint32_t x14;
145   fiat_p256_mulx_u32(&x13, &x14, x8, (arg2[5]));
146   uint32_t x15;
147   uint32_t x16;
148   fiat_p256_mulx_u32(&x15, &x16, x8, (arg2[4]));
149   uint32_t x17;
150   uint32_t x18;
151   fiat_p256_mulx_u32(&x17, &x18, x8, (arg2[3]));
152   uint32_t x19;
153   uint32_t x20;
154   fiat_p256_mulx_u32(&x19, &x20, x8, (arg2[2]));
155   uint32_t x21;
156   uint32_t x22;
157   fiat_p256_mulx_u32(&x21, &x22, x8, (arg2[1]));
158   uint32_t x23;
159   uint32_t x24;
160   fiat_p256_mulx_u32(&x23, &x24, x8, (arg2[0]));
161   uint32_t x25;
162   fiat_p256_uint1 x26;
163   fiat_p256_addcarryx_u32(&x25, &x26, 0x0, x24, x21);
164   uint32_t x27;
165   fiat_p256_uint1 x28;
166   fiat_p256_addcarryx_u32(&x27, &x28, x26, x22, x19);
167   uint32_t x29;
168   fiat_p256_uint1 x30;
169   fiat_p256_addcarryx_u32(&x29, &x30, x28, x20, x17);
170   uint32_t x31;
171   fiat_p256_uint1 x32;
172   fiat_p256_addcarryx_u32(&x31, &x32, x30, x18, x15);
173   uint32_t x33;
174   fiat_p256_uint1 x34;
175   fiat_p256_addcarryx_u32(&x33, &x34, x32, x16, x13);
176   uint32_t x35;
177   fiat_p256_uint1 x36;
178   fiat_p256_addcarryx_u32(&x35, &x36, x34, x14, x11);
179   uint32_t x37;
180   fiat_p256_uint1 x38;
181   fiat_p256_addcarryx_u32(&x37, &x38, x36, x12, x9);
182   uint32_t x39 = (x38 + x10);
183   uint32_t x40;
184   uint32_t x41;
185   fiat_p256_mulx_u32(&x40, &x41, x23, UINT32_C(0xffffffff));
186   uint32_t x42;
187   uint32_t x43;
188   fiat_p256_mulx_u32(&x42, &x43, x23, UINT32_C(0xffffffff));
189   uint32_t x44;
190   uint32_t x45;
191   fiat_p256_mulx_u32(&x44, &x45, x23, UINT32_C(0xffffffff));
192   uint32_t x46;
193   uint32_t x47;
194   fiat_p256_mulx_u32(&x46, &x47, x23, UINT32_C(0xffffffff));
195   uint32_t x48;
196   fiat_p256_uint1 x49;
197   fiat_p256_addcarryx_u32(&x48, &x49, 0x0, x47, x44);
198   uint32_t x50;
199   fiat_p256_uint1 x51;
200   fiat_p256_addcarryx_u32(&x50, &x51, x49, x45, x42);
201   uint32_t x52 = (x51 + x43);
202   uint32_t x53;
203   fiat_p256_uint1 x54;
204   fiat_p256_addcarryx_u32(&x53, &x54, 0x0, x23, x46);
205   uint32_t x55;
206   fiat_p256_uint1 x56;
207   fiat_p256_addcarryx_u32(&x55, &x56, x54, x25, x48);
208   uint32_t x57;
209   fiat_p256_uint1 x58;
210   fiat_p256_addcarryx_u32(&x57, &x58, x56, x27, x50);
211   uint32_t x59;
212   fiat_p256_uint1 x60;
213   fiat_p256_addcarryx_u32(&x59, &x60, x58, x29, x52);
214   uint32_t x61;
215   fiat_p256_uint1 x62;
216   fiat_p256_addcarryx_u32(&x61, &x62, x60, x31, 0x0);
217   uint32_t x63;
218   fiat_p256_uint1 x64;
219   fiat_p256_addcarryx_u32(&x63, &x64, x62, x33, 0x0);
220   uint32_t x65;
221   fiat_p256_uint1 x66;
222   fiat_p256_addcarryx_u32(&x65, &x66, x64, x35, x23);
223   uint32_t x67;
224   fiat_p256_uint1 x68;
225   fiat_p256_addcarryx_u32(&x67, &x68, x66, x37, x40);
226   uint32_t x69;
227   fiat_p256_uint1 x70;
228   fiat_p256_addcarryx_u32(&x69, &x70, x68, x39, x41);
229   uint32_t x71;
230   uint32_t x72;
231   fiat_p256_mulx_u32(&x71, &x72, x1, (arg2[7]));
232   uint32_t x73;
233   uint32_t x74;
234   fiat_p256_mulx_u32(&x73, &x74, x1, (arg2[6]));
235   uint32_t x75;
236   uint32_t x76;
237   fiat_p256_mulx_u32(&x75, &x76, x1, (arg2[5]));
238   uint32_t x77;
239   uint32_t x78;
240   fiat_p256_mulx_u32(&x77, &x78, x1, (arg2[4]));
241   uint32_t x79;
242   uint32_t x80;
243   fiat_p256_mulx_u32(&x79, &x80, x1, (arg2[3]));
244   uint32_t x81;
245   uint32_t x82;
246   fiat_p256_mulx_u32(&x81, &x82, x1, (arg2[2]));
247   uint32_t x83;
248   uint32_t x84;
249   fiat_p256_mulx_u32(&x83, &x84, x1, (arg2[1]));
250   uint32_t x85;
251   uint32_t x86;
252   fiat_p256_mulx_u32(&x85, &x86, x1, (arg2[0]));
253   uint32_t x87;
254   fiat_p256_uint1 x88;
255   fiat_p256_addcarryx_u32(&x87, &x88, 0x0, x86, x83);
256   uint32_t x89;
257   fiat_p256_uint1 x90;
258   fiat_p256_addcarryx_u32(&x89, &x90, x88, x84, x81);
259   uint32_t x91;
260   fiat_p256_uint1 x92;
261   fiat_p256_addcarryx_u32(&x91, &x92, x90, x82, x79);
262   uint32_t x93;
263   fiat_p256_uint1 x94;
264   fiat_p256_addcarryx_u32(&x93, &x94, x92, x80, x77);
265   uint32_t x95;
266   fiat_p256_uint1 x96;
267   fiat_p256_addcarryx_u32(&x95, &x96, x94, x78, x75);
268   uint32_t x97;
269   fiat_p256_uint1 x98;
270   fiat_p256_addcarryx_u32(&x97, &x98, x96, x76, x73);
271   uint32_t x99;
272   fiat_p256_uint1 x100;
273   fiat_p256_addcarryx_u32(&x99, &x100, x98, x74, x71);
274   uint32_t x101 = (x100 + x72);
275   uint32_t x102;
276   fiat_p256_uint1 x103;
277   fiat_p256_addcarryx_u32(&x102, &x103, 0x0, x55, x85);
278   uint32_t x104;
279   fiat_p256_uint1 x105;
280   fiat_p256_addcarryx_u32(&x104, &x105, x103, x57, x87);
281   uint32_t x106;
282   fiat_p256_uint1 x107;
283   fiat_p256_addcarryx_u32(&x106, &x107, x105, x59, x89);
284   uint32_t x108;
285   fiat_p256_uint1 x109;
286   fiat_p256_addcarryx_u32(&x108, &x109, x107, x61, x91);
287   uint32_t x110;
288   fiat_p256_uint1 x111;
289   fiat_p256_addcarryx_u32(&x110, &x111, x109, x63, x93);
290   uint32_t x112;
291   fiat_p256_uint1 x113;
292   fiat_p256_addcarryx_u32(&x112, &x113, x111, x65, x95);
293   uint32_t x114;
294   fiat_p256_uint1 x115;
295   fiat_p256_addcarryx_u32(&x114, &x115, x113, x67, x97);
296   uint32_t x116;
297   fiat_p256_uint1 x117;
298   fiat_p256_addcarryx_u32(&x116, &x117, x115, x69, x99);
299   uint32_t x118;
300   fiat_p256_uint1 x119;
301   fiat_p256_addcarryx_u32(&x118, &x119, x117, x70, x101);
302   uint32_t x120;
303   uint32_t x121;
304   fiat_p256_mulx_u32(&x120, &x121, x102, UINT32_C(0xffffffff));
305   uint32_t x122;
306   uint32_t x123;
307   fiat_p256_mulx_u32(&x122, &x123, x102, UINT32_C(0xffffffff));
308   uint32_t x124;
309   uint32_t x125;
310   fiat_p256_mulx_u32(&x124, &x125, x102, UINT32_C(0xffffffff));
311   uint32_t x126;
312   uint32_t x127;
313   fiat_p256_mulx_u32(&x126, &x127, x102, UINT32_C(0xffffffff));
314   uint32_t x128;
315   fiat_p256_uint1 x129;
316   fiat_p256_addcarryx_u32(&x128, &x129, 0x0, x127, x124);
317   uint32_t x130;
318   fiat_p256_uint1 x131;
319   fiat_p256_addcarryx_u32(&x130, &x131, x129, x125, x122);
320   uint32_t x132 = (x131 + x123);
321   uint32_t x133;
322   fiat_p256_uint1 x134;
323   fiat_p256_addcarryx_u32(&x133, &x134, 0x0, x102, x126);
324   uint32_t x135;
325   fiat_p256_uint1 x136;
326   fiat_p256_addcarryx_u32(&x135, &x136, x134, x104, x128);
327   uint32_t x137;
328   fiat_p256_uint1 x138;
329   fiat_p256_addcarryx_u32(&x137, &x138, x136, x106, x130);
330   uint32_t x139;
331   fiat_p256_uint1 x140;
332   fiat_p256_addcarryx_u32(&x139, &x140, x138, x108, x132);
333   uint32_t x141;
334   fiat_p256_uint1 x142;
335   fiat_p256_addcarryx_u32(&x141, &x142, x140, x110, 0x0);
336   uint32_t x143;
337   fiat_p256_uint1 x144;
338   fiat_p256_addcarryx_u32(&x143, &x144, x142, x112, 0x0);
339   uint32_t x145;
340   fiat_p256_uint1 x146;
341   fiat_p256_addcarryx_u32(&x145, &x146, x144, x114, x102);
342   uint32_t x147;
343   fiat_p256_uint1 x148;
344   fiat_p256_addcarryx_u32(&x147, &x148, x146, x116, x120);
345   uint32_t x149;
346   fiat_p256_uint1 x150;
347   fiat_p256_addcarryx_u32(&x149, &x150, x148, x118, x121);
348   uint32_t x151 = ((uint32_t)x150 + x119);
349   uint32_t x152;
350   uint32_t x153;
351   fiat_p256_mulx_u32(&x152, &x153, x2, (arg2[7]));
352   uint32_t x154;
353   uint32_t x155;
354   fiat_p256_mulx_u32(&x154, &x155, x2, (arg2[6]));
355   uint32_t x156;
356   uint32_t x157;
357   fiat_p256_mulx_u32(&x156, &x157, x2, (arg2[5]));
358   uint32_t x158;
359   uint32_t x159;
360   fiat_p256_mulx_u32(&x158, &x159, x2, (arg2[4]));
361   uint32_t x160;
362   uint32_t x161;
363   fiat_p256_mulx_u32(&x160, &x161, x2, (arg2[3]));
364   uint32_t x162;
365   uint32_t x163;
366   fiat_p256_mulx_u32(&x162, &x163, x2, (arg2[2]));
367   uint32_t x164;
368   uint32_t x165;
369   fiat_p256_mulx_u32(&x164, &x165, x2, (arg2[1]));
370   uint32_t x166;
371   uint32_t x167;
372   fiat_p256_mulx_u32(&x166, &x167, x2, (arg2[0]));
373   uint32_t x168;
374   fiat_p256_uint1 x169;
375   fiat_p256_addcarryx_u32(&x168, &x169, 0x0, x167, x164);
376   uint32_t x170;
377   fiat_p256_uint1 x171;
378   fiat_p256_addcarryx_u32(&x170, &x171, x169, x165, x162);
379   uint32_t x172;
380   fiat_p256_uint1 x173;
381   fiat_p256_addcarryx_u32(&x172, &x173, x171, x163, x160);
382   uint32_t x174;
383   fiat_p256_uint1 x175;
384   fiat_p256_addcarryx_u32(&x174, &x175, x173, x161, x158);
385   uint32_t x176;
386   fiat_p256_uint1 x177;
387   fiat_p256_addcarryx_u32(&x176, &x177, x175, x159, x156);
388   uint32_t x178;
389   fiat_p256_uint1 x179;
390   fiat_p256_addcarryx_u32(&x178, &x179, x177, x157, x154);
391   uint32_t x180;
392   fiat_p256_uint1 x181;
393   fiat_p256_addcarryx_u32(&x180, &x181, x179, x155, x152);
394   uint32_t x182 = (x181 + x153);
395   uint32_t x183;
396   fiat_p256_uint1 x184;
397   fiat_p256_addcarryx_u32(&x183, &x184, 0x0, x135, x166);
398   uint32_t x185;
399   fiat_p256_uint1 x186;
400   fiat_p256_addcarryx_u32(&x185, &x186, x184, x137, x168);
401   uint32_t x187;
402   fiat_p256_uint1 x188;
403   fiat_p256_addcarryx_u32(&x187, &x188, x186, x139, x170);
404   uint32_t x189;
405   fiat_p256_uint1 x190;
406   fiat_p256_addcarryx_u32(&x189, &x190, x188, x141, x172);
407   uint32_t x191;
408   fiat_p256_uint1 x192;
409   fiat_p256_addcarryx_u32(&x191, &x192, x190, x143, x174);
410   uint32_t x193;
411   fiat_p256_uint1 x194;
412   fiat_p256_addcarryx_u32(&x193, &x194, x192, x145, x176);
413   uint32_t x195;
414   fiat_p256_uint1 x196;
415   fiat_p256_addcarryx_u32(&x195, &x196, x194, x147, x178);
416   uint32_t x197;
417   fiat_p256_uint1 x198;
418   fiat_p256_addcarryx_u32(&x197, &x198, x196, x149, x180);
419   uint32_t x199;
420   fiat_p256_uint1 x200;
421   fiat_p256_addcarryx_u32(&x199, &x200, x198, x151, x182);
422   uint32_t x201;
423   uint32_t x202;
424   fiat_p256_mulx_u32(&x201, &x202, x183, UINT32_C(0xffffffff));
425   uint32_t x203;
426   uint32_t x204;
427   fiat_p256_mulx_u32(&x203, &x204, x183, UINT32_C(0xffffffff));
428   uint32_t x205;
429   uint32_t x206;
430   fiat_p256_mulx_u32(&x205, &x206, x183, UINT32_C(0xffffffff));
431   uint32_t x207;
432   uint32_t x208;
433   fiat_p256_mulx_u32(&x207, &x208, x183, UINT32_C(0xffffffff));
434   uint32_t x209;
435   fiat_p256_uint1 x210;
436   fiat_p256_addcarryx_u32(&x209, &x210, 0x0, x208, x205);
437   uint32_t x211;
438   fiat_p256_uint1 x212;
439   fiat_p256_addcarryx_u32(&x211, &x212, x210, x206, x203);
440   uint32_t x213 = (x212 + x204);
441   uint32_t x214;
442   fiat_p256_uint1 x215;
443   fiat_p256_addcarryx_u32(&x214, &x215, 0x0, x183, x207);
444   uint32_t x216;
445   fiat_p256_uint1 x217;
446   fiat_p256_addcarryx_u32(&x216, &x217, x215, x185, x209);
447   uint32_t x218;
448   fiat_p256_uint1 x219;
449   fiat_p256_addcarryx_u32(&x218, &x219, x217, x187, x211);
450   uint32_t x220;
451   fiat_p256_uint1 x221;
452   fiat_p256_addcarryx_u32(&x220, &x221, x219, x189, x213);
453   uint32_t x222;
454   fiat_p256_uint1 x223;
455   fiat_p256_addcarryx_u32(&x222, &x223, x221, x191, 0x0);
456   uint32_t x224;
457   fiat_p256_uint1 x225;
458   fiat_p256_addcarryx_u32(&x224, &x225, x223, x193, 0x0);
459   uint32_t x226;
460   fiat_p256_uint1 x227;
461   fiat_p256_addcarryx_u32(&x226, &x227, x225, x195, x183);
462   uint32_t x228;
463   fiat_p256_uint1 x229;
464   fiat_p256_addcarryx_u32(&x228, &x229, x227, x197, x201);
465   uint32_t x230;
466   fiat_p256_uint1 x231;
467   fiat_p256_addcarryx_u32(&x230, &x231, x229, x199, x202);
468   uint32_t x232 = ((uint32_t)x231 + x200);
469   uint32_t x233;
470   uint32_t x234;
471   fiat_p256_mulx_u32(&x233, &x234, x3, (arg2[7]));
472   uint32_t x235;
473   uint32_t x236;
474   fiat_p256_mulx_u32(&x235, &x236, x3, (arg2[6]));
475   uint32_t x237;
476   uint32_t x238;
477   fiat_p256_mulx_u32(&x237, &x238, x3, (arg2[5]));
478   uint32_t x239;
479   uint32_t x240;
480   fiat_p256_mulx_u32(&x239, &x240, x3, (arg2[4]));
481   uint32_t x241;
482   uint32_t x242;
483   fiat_p256_mulx_u32(&x241, &x242, x3, (arg2[3]));
484   uint32_t x243;
485   uint32_t x244;
486   fiat_p256_mulx_u32(&x243, &x244, x3, (arg2[2]));
487   uint32_t x245;
488   uint32_t x246;
489   fiat_p256_mulx_u32(&x245, &x246, x3, (arg2[1]));
490   uint32_t x247;
491   uint32_t x248;
492   fiat_p256_mulx_u32(&x247, &x248, x3, (arg2[0]));
493   uint32_t x249;
494   fiat_p256_uint1 x250;
495   fiat_p256_addcarryx_u32(&x249, &x250, 0x0, x248, x245);
496   uint32_t x251;
497   fiat_p256_uint1 x252;
498   fiat_p256_addcarryx_u32(&x251, &x252, x250, x246, x243);
499   uint32_t x253;
500   fiat_p256_uint1 x254;
501   fiat_p256_addcarryx_u32(&x253, &x254, x252, x244, x241);
502   uint32_t x255;
503   fiat_p256_uint1 x256;
504   fiat_p256_addcarryx_u32(&x255, &x256, x254, x242, x239);
505   uint32_t x257;
506   fiat_p256_uint1 x258;
507   fiat_p256_addcarryx_u32(&x257, &x258, x256, x240, x237);
508   uint32_t x259;
509   fiat_p256_uint1 x260;
510   fiat_p256_addcarryx_u32(&x259, &x260, x258, x238, x235);
511   uint32_t x261;
512   fiat_p256_uint1 x262;
513   fiat_p256_addcarryx_u32(&x261, &x262, x260, x236, x233);
514   uint32_t x263 = (x262 + x234);
515   uint32_t x264;
516   fiat_p256_uint1 x265;
517   fiat_p256_addcarryx_u32(&x264, &x265, 0x0, x216, x247);
518   uint32_t x266;
519   fiat_p256_uint1 x267;
520   fiat_p256_addcarryx_u32(&x266, &x267, x265, x218, x249);
521   uint32_t x268;
522   fiat_p256_uint1 x269;
523   fiat_p256_addcarryx_u32(&x268, &x269, x267, x220, x251);
524   uint32_t x270;
525   fiat_p256_uint1 x271;
526   fiat_p256_addcarryx_u32(&x270, &x271, x269, x222, x253);
527   uint32_t x272;
528   fiat_p256_uint1 x273;
529   fiat_p256_addcarryx_u32(&x272, &x273, x271, x224, x255);
530   uint32_t x274;
531   fiat_p256_uint1 x275;
532   fiat_p256_addcarryx_u32(&x274, &x275, x273, x226, x257);
533   uint32_t x276;
534   fiat_p256_uint1 x277;
535   fiat_p256_addcarryx_u32(&x276, &x277, x275, x228, x259);
536   uint32_t x278;
537   fiat_p256_uint1 x279;
538   fiat_p256_addcarryx_u32(&x278, &x279, x277, x230, x261);
539   uint32_t x280;
540   fiat_p256_uint1 x281;
541   fiat_p256_addcarryx_u32(&x280, &x281, x279, x232, x263);
542   uint32_t x282;
543   uint32_t x283;
544   fiat_p256_mulx_u32(&x282, &x283, x264, UINT32_C(0xffffffff));
545   uint32_t x284;
546   uint32_t x285;
547   fiat_p256_mulx_u32(&x284, &x285, x264, UINT32_C(0xffffffff));
548   uint32_t x286;
549   uint32_t x287;
550   fiat_p256_mulx_u32(&x286, &x287, x264, UINT32_C(0xffffffff));
551   uint32_t x288;
552   uint32_t x289;
553   fiat_p256_mulx_u32(&x288, &x289, x264, UINT32_C(0xffffffff));
554   uint32_t x290;
555   fiat_p256_uint1 x291;
556   fiat_p256_addcarryx_u32(&x290, &x291, 0x0, x289, x286);
557   uint32_t x292;
558   fiat_p256_uint1 x293;
559   fiat_p256_addcarryx_u32(&x292, &x293, x291, x287, x284);
560   uint32_t x294 = (x293 + x285);
561   uint32_t x295;
562   fiat_p256_uint1 x296;
563   fiat_p256_addcarryx_u32(&x295, &x296, 0x0, x264, x288);
564   uint32_t x297;
565   fiat_p256_uint1 x298;
566   fiat_p256_addcarryx_u32(&x297, &x298, x296, x266, x290);
567   uint32_t x299;
568   fiat_p256_uint1 x300;
569   fiat_p256_addcarryx_u32(&x299, &x300, x298, x268, x292);
570   uint32_t x301;
571   fiat_p256_uint1 x302;
572   fiat_p256_addcarryx_u32(&x301, &x302, x300, x270, x294);
573   uint32_t x303;
574   fiat_p256_uint1 x304;
575   fiat_p256_addcarryx_u32(&x303, &x304, x302, x272, 0x0);
576   uint32_t x305;
577   fiat_p256_uint1 x306;
578   fiat_p256_addcarryx_u32(&x305, &x306, x304, x274, 0x0);
579   uint32_t x307;
580   fiat_p256_uint1 x308;
581   fiat_p256_addcarryx_u32(&x307, &x308, x306, x276, x264);
582   uint32_t x309;
583   fiat_p256_uint1 x310;
584   fiat_p256_addcarryx_u32(&x309, &x310, x308, x278, x282);
585   uint32_t x311;
586   fiat_p256_uint1 x312;
587   fiat_p256_addcarryx_u32(&x311, &x312, x310, x280, x283);
588   uint32_t x313 = ((uint32_t)x312 + x281);
589   uint32_t x314;
590   uint32_t x315;
591   fiat_p256_mulx_u32(&x314, &x315, x4, (arg2[7]));
592   uint32_t x316;
593   uint32_t x317;
594   fiat_p256_mulx_u32(&x316, &x317, x4, (arg2[6]));
595   uint32_t x318;
596   uint32_t x319;
597   fiat_p256_mulx_u32(&x318, &x319, x4, (arg2[5]));
598   uint32_t x320;
599   uint32_t x321;
600   fiat_p256_mulx_u32(&x320, &x321, x4, (arg2[4]));
601   uint32_t x322;
602   uint32_t x323;
603   fiat_p256_mulx_u32(&x322, &x323, x4, (arg2[3]));
604   uint32_t x324;
605   uint32_t x325;
606   fiat_p256_mulx_u32(&x324, &x325, x4, (arg2[2]));
607   uint32_t x326;
608   uint32_t x327;
609   fiat_p256_mulx_u32(&x326, &x327, x4, (arg2[1]));
610   uint32_t x328;
611   uint32_t x329;
612   fiat_p256_mulx_u32(&x328, &x329, x4, (arg2[0]));
613   uint32_t x330;
614   fiat_p256_uint1 x331;
615   fiat_p256_addcarryx_u32(&x330, &x331, 0x0, x329, x326);
616   uint32_t x332;
617   fiat_p256_uint1 x333;
618   fiat_p256_addcarryx_u32(&x332, &x333, x331, x327, x324);
619   uint32_t x334;
620   fiat_p256_uint1 x335;
621   fiat_p256_addcarryx_u32(&x334, &x335, x333, x325, x322);
622   uint32_t x336;
623   fiat_p256_uint1 x337;
624   fiat_p256_addcarryx_u32(&x336, &x337, x335, x323, x320);
625   uint32_t x338;
626   fiat_p256_uint1 x339;
627   fiat_p256_addcarryx_u32(&x338, &x339, x337, x321, x318);
628   uint32_t x340;
629   fiat_p256_uint1 x341;
630   fiat_p256_addcarryx_u32(&x340, &x341, x339, x319, x316);
631   uint32_t x342;
632   fiat_p256_uint1 x343;
633   fiat_p256_addcarryx_u32(&x342, &x343, x341, x317, x314);
634   uint32_t x344 = (x343 + x315);
635   uint32_t x345;
636   fiat_p256_uint1 x346;
637   fiat_p256_addcarryx_u32(&x345, &x346, 0x0, x297, x328);
638   uint32_t x347;
639   fiat_p256_uint1 x348;
640   fiat_p256_addcarryx_u32(&x347, &x348, x346, x299, x330);
641   uint32_t x349;
642   fiat_p256_uint1 x350;
643   fiat_p256_addcarryx_u32(&x349, &x350, x348, x301, x332);
644   uint32_t x351;
645   fiat_p256_uint1 x352;
646   fiat_p256_addcarryx_u32(&x351, &x352, x350, x303, x334);
647   uint32_t x353;
648   fiat_p256_uint1 x354;
649   fiat_p256_addcarryx_u32(&x353, &x354, x352, x305, x336);
650   uint32_t x355;
651   fiat_p256_uint1 x356;
652   fiat_p256_addcarryx_u32(&x355, &x356, x354, x307, x338);
653   uint32_t x357;
654   fiat_p256_uint1 x358;
655   fiat_p256_addcarryx_u32(&x357, &x358, x356, x309, x340);
656   uint32_t x359;
657   fiat_p256_uint1 x360;
658   fiat_p256_addcarryx_u32(&x359, &x360, x358, x311, x342);
659   uint32_t x361;
660   fiat_p256_uint1 x362;
661   fiat_p256_addcarryx_u32(&x361, &x362, x360, x313, x344);
662   uint32_t x363;
663   uint32_t x364;
664   fiat_p256_mulx_u32(&x363, &x364, x345, UINT32_C(0xffffffff));
665   uint32_t x365;
666   uint32_t x366;
667   fiat_p256_mulx_u32(&x365, &x366, x345, UINT32_C(0xffffffff));
668   uint32_t x367;
669   uint32_t x368;
670   fiat_p256_mulx_u32(&x367, &x368, x345, UINT32_C(0xffffffff));
671   uint32_t x369;
672   uint32_t x370;
673   fiat_p256_mulx_u32(&x369, &x370, x345, UINT32_C(0xffffffff));
674   uint32_t x371;
675   fiat_p256_uint1 x372;
676   fiat_p256_addcarryx_u32(&x371, &x372, 0x0, x370, x367);
677   uint32_t x373;
678   fiat_p256_uint1 x374;
679   fiat_p256_addcarryx_u32(&x373, &x374, x372, x368, x365);
680   uint32_t x375 = (x374 + x366);
681   uint32_t x376;
682   fiat_p256_uint1 x377;
683   fiat_p256_addcarryx_u32(&x376, &x377, 0x0, x345, x369);
684   uint32_t x378;
685   fiat_p256_uint1 x379;
686   fiat_p256_addcarryx_u32(&x378, &x379, x377, x347, x371);
687   uint32_t x380;
688   fiat_p256_uint1 x381;
689   fiat_p256_addcarryx_u32(&x380, &x381, x379, x349, x373);
690   uint32_t x382;
691   fiat_p256_uint1 x383;
692   fiat_p256_addcarryx_u32(&x382, &x383, x381, x351, x375);
693   uint32_t x384;
694   fiat_p256_uint1 x385;
695   fiat_p256_addcarryx_u32(&x384, &x385, x383, x353, 0x0);
696   uint32_t x386;
697   fiat_p256_uint1 x387;
698   fiat_p256_addcarryx_u32(&x386, &x387, x385, x355, 0x0);
699   uint32_t x388;
700   fiat_p256_uint1 x389;
701   fiat_p256_addcarryx_u32(&x388, &x389, x387, x357, x345);
702   uint32_t x390;
703   fiat_p256_uint1 x391;
704   fiat_p256_addcarryx_u32(&x390, &x391, x389, x359, x363);
705   uint32_t x392;
706   fiat_p256_uint1 x393;
707   fiat_p256_addcarryx_u32(&x392, &x393, x391, x361, x364);
708   uint32_t x394 = ((uint32_t)x393 + x362);
709   uint32_t x395;
710   uint32_t x396;
711   fiat_p256_mulx_u32(&x395, &x396, x5, (arg2[7]));
712   uint32_t x397;
713   uint32_t x398;
714   fiat_p256_mulx_u32(&x397, &x398, x5, (arg2[6]));
715   uint32_t x399;
716   uint32_t x400;
717   fiat_p256_mulx_u32(&x399, &x400, x5, (arg2[5]));
718   uint32_t x401;
719   uint32_t x402;
720   fiat_p256_mulx_u32(&x401, &x402, x5, (arg2[4]));
721   uint32_t x403;
722   uint32_t x404;
723   fiat_p256_mulx_u32(&x403, &x404, x5, (arg2[3]));
724   uint32_t x405;
725   uint32_t x406;
726   fiat_p256_mulx_u32(&x405, &x406, x5, (arg2[2]));
727   uint32_t x407;
728   uint32_t x408;
729   fiat_p256_mulx_u32(&x407, &x408, x5, (arg2[1]));
730   uint32_t x409;
731   uint32_t x410;
732   fiat_p256_mulx_u32(&x409, &x410, x5, (arg2[0]));
733   uint32_t x411;
734   fiat_p256_uint1 x412;
735   fiat_p256_addcarryx_u32(&x411, &x412, 0x0, x410, x407);
736   uint32_t x413;
737   fiat_p256_uint1 x414;
738   fiat_p256_addcarryx_u32(&x413, &x414, x412, x408, x405);
739   uint32_t x415;
740   fiat_p256_uint1 x416;
741   fiat_p256_addcarryx_u32(&x415, &x416, x414, x406, x403);
742   uint32_t x417;
743   fiat_p256_uint1 x418;
744   fiat_p256_addcarryx_u32(&x417, &x418, x416, x404, x401);
745   uint32_t x419;
746   fiat_p256_uint1 x420;
747   fiat_p256_addcarryx_u32(&x419, &x420, x418, x402, x399);
748   uint32_t x421;
749   fiat_p256_uint1 x422;
750   fiat_p256_addcarryx_u32(&x421, &x422, x420, x400, x397);
751   uint32_t x423;
752   fiat_p256_uint1 x424;
753   fiat_p256_addcarryx_u32(&x423, &x424, x422, x398, x395);
754   uint32_t x425 = (x424 + x396);
755   uint32_t x426;
756   fiat_p256_uint1 x427;
757   fiat_p256_addcarryx_u32(&x426, &x427, 0x0, x378, x409);
758   uint32_t x428;
759   fiat_p256_uint1 x429;
760   fiat_p256_addcarryx_u32(&x428, &x429, x427, x380, x411);
761   uint32_t x430;
762   fiat_p256_uint1 x431;
763   fiat_p256_addcarryx_u32(&x430, &x431, x429, x382, x413);
764   uint32_t x432;
765   fiat_p256_uint1 x433;
766   fiat_p256_addcarryx_u32(&x432, &x433, x431, x384, x415);
767   uint32_t x434;
768   fiat_p256_uint1 x435;
769   fiat_p256_addcarryx_u32(&x434, &x435, x433, x386, x417);
770   uint32_t x436;
771   fiat_p256_uint1 x437;
772   fiat_p256_addcarryx_u32(&x436, &x437, x435, x388, x419);
773   uint32_t x438;
774   fiat_p256_uint1 x439;
775   fiat_p256_addcarryx_u32(&x438, &x439, x437, x390, x421);
776   uint32_t x440;
777   fiat_p256_uint1 x441;
778   fiat_p256_addcarryx_u32(&x440, &x441, x439, x392, x423);
779   uint32_t x442;
780   fiat_p256_uint1 x443;
781   fiat_p256_addcarryx_u32(&x442, &x443, x441, x394, x425);
782   uint32_t x444;
783   uint32_t x445;
784   fiat_p256_mulx_u32(&x444, &x445, x426, UINT32_C(0xffffffff));
785   uint32_t x446;
786   uint32_t x447;
787   fiat_p256_mulx_u32(&x446, &x447, x426, UINT32_C(0xffffffff));
788   uint32_t x448;
789   uint32_t x449;
790   fiat_p256_mulx_u32(&x448, &x449, x426, UINT32_C(0xffffffff));
791   uint32_t x450;
792   uint32_t x451;
793   fiat_p256_mulx_u32(&x450, &x451, x426, UINT32_C(0xffffffff));
794   uint32_t x452;
795   fiat_p256_uint1 x453;
796   fiat_p256_addcarryx_u32(&x452, &x453, 0x0, x451, x448);
797   uint32_t x454;
798   fiat_p256_uint1 x455;
799   fiat_p256_addcarryx_u32(&x454, &x455, x453, x449, x446);
800   uint32_t x456 = (x455 + x447);
801   uint32_t x457;
802   fiat_p256_uint1 x458;
803   fiat_p256_addcarryx_u32(&x457, &x458, 0x0, x426, x450);
804   uint32_t x459;
805   fiat_p256_uint1 x460;
806   fiat_p256_addcarryx_u32(&x459, &x460, x458, x428, x452);
807   uint32_t x461;
808   fiat_p256_uint1 x462;
809   fiat_p256_addcarryx_u32(&x461, &x462, x460, x430, x454);
810   uint32_t x463;
811   fiat_p256_uint1 x464;
812   fiat_p256_addcarryx_u32(&x463, &x464, x462, x432, x456);
813   uint32_t x465;
814   fiat_p256_uint1 x466;
815   fiat_p256_addcarryx_u32(&x465, &x466, x464, x434, 0x0);
816   uint32_t x467;
817   fiat_p256_uint1 x468;
818   fiat_p256_addcarryx_u32(&x467, &x468, x466, x436, 0x0);
819   uint32_t x469;
820   fiat_p256_uint1 x470;
821   fiat_p256_addcarryx_u32(&x469, &x470, x468, x438, x426);
822   uint32_t x471;
823   fiat_p256_uint1 x472;
824   fiat_p256_addcarryx_u32(&x471, &x472, x470, x440, x444);
825   uint32_t x473;
826   fiat_p256_uint1 x474;
827   fiat_p256_addcarryx_u32(&x473, &x474, x472, x442, x445);
828   uint32_t x475 = ((uint32_t)x474 + x443);
829   uint32_t x476;
830   uint32_t x477;
831   fiat_p256_mulx_u32(&x476, &x477, x6, (arg2[7]));
832   uint32_t x478;
833   uint32_t x479;
834   fiat_p256_mulx_u32(&x478, &x479, x6, (arg2[6]));
835   uint32_t x480;
836   uint32_t x481;
837   fiat_p256_mulx_u32(&x480, &x481, x6, (arg2[5]));
838   uint32_t x482;
839   uint32_t x483;
840   fiat_p256_mulx_u32(&x482, &x483, x6, (arg2[4]));
841   uint32_t x484;
842   uint32_t x485;
843   fiat_p256_mulx_u32(&x484, &x485, x6, (arg2[3]));
844   uint32_t x486;
845   uint32_t x487;
846   fiat_p256_mulx_u32(&x486, &x487, x6, (arg2[2]));
847   uint32_t x488;
848   uint32_t x489;
849   fiat_p256_mulx_u32(&x488, &x489, x6, (arg2[1]));
850   uint32_t x490;
851   uint32_t x491;
852   fiat_p256_mulx_u32(&x490, &x491, x6, (arg2[0]));
853   uint32_t x492;
854   fiat_p256_uint1 x493;
855   fiat_p256_addcarryx_u32(&x492, &x493, 0x0, x491, x488);
856   uint32_t x494;
857   fiat_p256_uint1 x495;
858   fiat_p256_addcarryx_u32(&x494, &x495, x493, x489, x486);
859   uint32_t x496;
860   fiat_p256_uint1 x497;
861   fiat_p256_addcarryx_u32(&x496, &x497, x495, x487, x484);
862   uint32_t x498;
863   fiat_p256_uint1 x499;
864   fiat_p256_addcarryx_u32(&x498, &x499, x497, x485, x482);
865   uint32_t x500;
866   fiat_p256_uint1 x501;
867   fiat_p256_addcarryx_u32(&x500, &x501, x499, x483, x480);
868   uint32_t x502;
869   fiat_p256_uint1 x503;
870   fiat_p256_addcarryx_u32(&x502, &x503, x501, x481, x478);
871   uint32_t x504;
872   fiat_p256_uint1 x505;
873   fiat_p256_addcarryx_u32(&x504, &x505, x503, x479, x476);
874   uint32_t x506 = (x505 + x477);
875   uint32_t x507;
876   fiat_p256_uint1 x508;
877   fiat_p256_addcarryx_u32(&x507, &x508, 0x0, x459, x490);
878   uint32_t x509;
879   fiat_p256_uint1 x510;
880   fiat_p256_addcarryx_u32(&x509, &x510, x508, x461, x492);
881   uint32_t x511;
882   fiat_p256_uint1 x512;
883   fiat_p256_addcarryx_u32(&x511, &x512, x510, x463, x494);
884   uint32_t x513;
885   fiat_p256_uint1 x514;
886   fiat_p256_addcarryx_u32(&x513, &x514, x512, x465, x496);
887   uint32_t x515;
888   fiat_p256_uint1 x516;
889   fiat_p256_addcarryx_u32(&x515, &x516, x514, x467, x498);
890   uint32_t x517;
891   fiat_p256_uint1 x518;
892   fiat_p256_addcarryx_u32(&x517, &x518, x516, x469, x500);
893   uint32_t x519;
894   fiat_p256_uint1 x520;
895   fiat_p256_addcarryx_u32(&x519, &x520, x518, x471, x502);
896   uint32_t x521;
897   fiat_p256_uint1 x522;
898   fiat_p256_addcarryx_u32(&x521, &x522, x520, x473, x504);
899   uint32_t x523;
900   fiat_p256_uint1 x524;
901   fiat_p256_addcarryx_u32(&x523, &x524, x522, x475, x506);
902   uint32_t x525;
903   uint32_t x526;
904   fiat_p256_mulx_u32(&x525, &x526, x507, UINT32_C(0xffffffff));
905   uint32_t x527;
906   uint32_t x528;
907   fiat_p256_mulx_u32(&x527, &x528, x507, UINT32_C(0xffffffff));
908   uint32_t x529;
909   uint32_t x530;
910   fiat_p256_mulx_u32(&x529, &x530, x507, UINT32_C(0xffffffff));
911   uint32_t x531;
912   uint32_t x532;
913   fiat_p256_mulx_u32(&x531, &x532, x507, UINT32_C(0xffffffff));
914   uint32_t x533;
915   fiat_p256_uint1 x534;
916   fiat_p256_addcarryx_u32(&x533, &x534, 0x0, x532, x529);
917   uint32_t x535;
918   fiat_p256_uint1 x536;
919   fiat_p256_addcarryx_u32(&x535, &x536, x534, x530, x527);
920   uint32_t x537 = (x536 + x528);
921   uint32_t x538;
922   fiat_p256_uint1 x539;
923   fiat_p256_addcarryx_u32(&x538, &x539, 0x0, x507, x531);
924   uint32_t x540;
925   fiat_p256_uint1 x541;
926   fiat_p256_addcarryx_u32(&x540, &x541, x539, x509, x533);
927   uint32_t x542;
928   fiat_p256_uint1 x543;
929   fiat_p256_addcarryx_u32(&x542, &x543, x541, x511, x535);
930   uint32_t x544;
931   fiat_p256_uint1 x545;
932   fiat_p256_addcarryx_u32(&x544, &x545, x543, x513, x537);
933   uint32_t x546;
934   fiat_p256_uint1 x547;
935   fiat_p256_addcarryx_u32(&x546, &x547, x545, x515, 0x0);
936   uint32_t x548;
937   fiat_p256_uint1 x549;
938   fiat_p256_addcarryx_u32(&x548, &x549, x547, x517, 0x0);
939   uint32_t x550;
940   fiat_p256_uint1 x551;
941   fiat_p256_addcarryx_u32(&x550, &x551, x549, x519, x507);
942   uint32_t x552;
943   fiat_p256_uint1 x553;
944   fiat_p256_addcarryx_u32(&x552, &x553, x551, x521, x525);
945   uint32_t x554;
946   fiat_p256_uint1 x555;
947   fiat_p256_addcarryx_u32(&x554, &x555, x553, x523, x526);
948   uint32_t x556 = ((uint32_t)x555 + x524);
949   uint32_t x557;
950   uint32_t x558;
951   fiat_p256_mulx_u32(&x557, &x558, x7, (arg2[7]));
952   uint32_t x559;
953   uint32_t x560;
954   fiat_p256_mulx_u32(&x559, &x560, x7, (arg2[6]));
955   uint32_t x561;
956   uint32_t x562;
957   fiat_p256_mulx_u32(&x561, &x562, x7, (arg2[5]));
958   uint32_t x563;
959   uint32_t x564;
960   fiat_p256_mulx_u32(&x563, &x564, x7, (arg2[4]));
961   uint32_t x565;
962   uint32_t x566;
963   fiat_p256_mulx_u32(&x565, &x566, x7, (arg2[3]));
964   uint32_t x567;
965   uint32_t x568;
966   fiat_p256_mulx_u32(&x567, &x568, x7, (arg2[2]));
967   uint32_t x569;
968   uint32_t x570;
969   fiat_p256_mulx_u32(&x569, &x570, x7, (arg2[1]));
970   uint32_t x571;
971   uint32_t x572;
972   fiat_p256_mulx_u32(&x571, &x572, x7, (arg2[0]));
973   uint32_t x573;
974   fiat_p256_uint1 x574;
975   fiat_p256_addcarryx_u32(&x573, &x574, 0x0, x572, x569);
976   uint32_t x575;
977   fiat_p256_uint1 x576;
978   fiat_p256_addcarryx_u32(&x575, &x576, x574, x570, x567);
979   uint32_t x577;
980   fiat_p256_uint1 x578;
981   fiat_p256_addcarryx_u32(&x577, &x578, x576, x568, x565);
982   uint32_t x579;
983   fiat_p256_uint1 x580;
984   fiat_p256_addcarryx_u32(&x579, &x580, x578, x566, x563);
985   uint32_t x581;
986   fiat_p256_uint1 x582;
987   fiat_p256_addcarryx_u32(&x581, &x582, x580, x564, x561);
988   uint32_t x583;
989   fiat_p256_uint1 x584;
990   fiat_p256_addcarryx_u32(&x583, &x584, x582, x562, x559);
991   uint32_t x585;
992   fiat_p256_uint1 x586;
993   fiat_p256_addcarryx_u32(&x585, &x586, x584, x560, x557);
994   uint32_t x587 = (x586 + x558);
995   uint32_t x588;
996   fiat_p256_uint1 x589;
997   fiat_p256_addcarryx_u32(&x588, &x589, 0x0, x540, x571);
998   uint32_t x590;
999   fiat_p256_uint1 x591;
1000   fiat_p256_addcarryx_u32(&x590, &x591, x589, x542, x573);
1001   uint32_t x592;
1002   fiat_p256_uint1 x593;
1003   fiat_p256_addcarryx_u32(&x592, &x593, x591, x544, x575);
1004   uint32_t x594;
1005   fiat_p256_uint1 x595;
1006   fiat_p256_addcarryx_u32(&x594, &x595, x593, x546, x577);
1007   uint32_t x596;
1008   fiat_p256_uint1 x597;
1009   fiat_p256_addcarryx_u32(&x596, &x597, x595, x548, x579);
1010   uint32_t x598;
1011   fiat_p256_uint1 x599;
1012   fiat_p256_addcarryx_u32(&x598, &x599, x597, x550, x581);
1013   uint32_t x600;
1014   fiat_p256_uint1 x601;
1015   fiat_p256_addcarryx_u32(&x600, &x601, x599, x552, x583);
1016   uint32_t x602;
1017   fiat_p256_uint1 x603;
1018   fiat_p256_addcarryx_u32(&x602, &x603, x601, x554, x585);
1019   uint32_t x604;
1020   fiat_p256_uint1 x605;
1021   fiat_p256_addcarryx_u32(&x604, &x605, x603, x556, x587);
1022   uint32_t x606;
1023   uint32_t x607;
1024   fiat_p256_mulx_u32(&x606, &x607, x588, UINT32_C(0xffffffff));
1025   uint32_t x608;
1026   uint32_t x609;
1027   fiat_p256_mulx_u32(&x608, &x609, x588, UINT32_C(0xffffffff));
1028   uint32_t x610;
1029   uint32_t x611;
1030   fiat_p256_mulx_u32(&x610, &x611, x588, UINT32_C(0xffffffff));
1031   uint32_t x612;
1032   uint32_t x613;
1033   fiat_p256_mulx_u32(&x612, &x613, x588, UINT32_C(0xffffffff));
1034   uint32_t x614;
1035   fiat_p256_uint1 x615;
1036   fiat_p256_addcarryx_u32(&x614, &x615, 0x0, x613, x610);
1037   uint32_t x616;
1038   fiat_p256_uint1 x617;
1039   fiat_p256_addcarryx_u32(&x616, &x617, x615, x611, x608);
1040   uint32_t x618 = (x617 + x609);
1041   uint32_t x619;
1042   fiat_p256_uint1 x620;
1043   fiat_p256_addcarryx_u32(&x619, &x620, 0x0, x588, x612);
1044   uint32_t x621;
1045   fiat_p256_uint1 x622;
1046   fiat_p256_addcarryx_u32(&x621, &x622, x620, x590, x614);
1047   uint32_t x623;
1048   fiat_p256_uint1 x624;
1049   fiat_p256_addcarryx_u32(&x623, &x624, x622, x592, x616);
1050   uint32_t x625;
1051   fiat_p256_uint1 x626;
1052   fiat_p256_addcarryx_u32(&x625, &x626, x624, x594, x618);
1053   uint32_t x627;
1054   fiat_p256_uint1 x628;
1055   fiat_p256_addcarryx_u32(&x627, &x628, x626, x596, 0x0);
1056   uint32_t x629;
1057   fiat_p256_uint1 x630;
1058   fiat_p256_addcarryx_u32(&x629, &x630, x628, x598, 0x0);
1059   uint32_t x631;
1060   fiat_p256_uint1 x632;
1061   fiat_p256_addcarryx_u32(&x631, &x632, x630, x600, x588);
1062   uint32_t x633;
1063   fiat_p256_uint1 x634;
1064   fiat_p256_addcarryx_u32(&x633, &x634, x632, x602, x606);
1065   uint32_t x635;
1066   fiat_p256_uint1 x636;
1067   fiat_p256_addcarryx_u32(&x635, &x636, x634, x604, x607);
1068   uint32_t x637 = ((uint32_t)x636 + x605);
1069   uint32_t x638;
1070   fiat_p256_uint1 x639;
1071   fiat_p256_subborrowx_u32(&x638, &x639, 0x0, x621, UINT32_C(0xffffffff));
1072   uint32_t x640;
1073   fiat_p256_uint1 x641;
1074   fiat_p256_subborrowx_u32(&x640, &x641, x639, x623, UINT32_C(0xffffffff));
1075   uint32_t x642;
1076   fiat_p256_uint1 x643;
1077   fiat_p256_subborrowx_u32(&x642, &x643, x641, x625, UINT32_C(0xffffffff));
1078   uint32_t x644;
1079   fiat_p256_uint1 x645;
1080   fiat_p256_subborrowx_u32(&x644, &x645, x643, x627, 0x0);
1081   uint32_t x646;
1082   fiat_p256_uint1 x647;
1083   fiat_p256_subborrowx_u32(&x646, &x647, x645, x629, 0x0);
1084   uint32_t x648;
1085   fiat_p256_uint1 x649;
1086   fiat_p256_subborrowx_u32(&x648, &x649, x647, x631, 0x0);
1087   uint32_t x650;
1088   fiat_p256_uint1 x651;
1089   fiat_p256_subborrowx_u32(&x650, &x651, x649, x633, 0x1);
1090   uint32_t x652;
1091   fiat_p256_uint1 x653;
1092   fiat_p256_subborrowx_u32(&x652, &x653, x651, x635, UINT32_C(0xffffffff));
1093   uint32_t x654;
1094   fiat_p256_uint1 x655;
1095   fiat_p256_subborrowx_u32(&x654, &x655, x653, x637, 0x0);
1096   uint32_t x656;
1097   fiat_p256_cmovznz_u32(&x656, x655, x638, x621);
1098   uint32_t x657;
1099   fiat_p256_cmovznz_u32(&x657, x655, x640, x623);
1100   uint32_t x658;
1101   fiat_p256_cmovznz_u32(&x658, x655, x642, x625);
1102   uint32_t x659;
1103   fiat_p256_cmovznz_u32(&x659, x655, x644, x627);
1104   uint32_t x660;
1105   fiat_p256_cmovznz_u32(&x660, x655, x646, x629);
1106   uint32_t x661;
1107   fiat_p256_cmovznz_u32(&x661, x655, x648, x631);
1108   uint32_t x662;
1109   fiat_p256_cmovznz_u32(&x662, x655, x650, x633);
1110   uint32_t x663;
1111   fiat_p256_cmovznz_u32(&x663, x655, x652, x635);
1112   out1[0] = x656;
1113   out1[1] = x657;
1114   out1[2] = x658;
1115   out1[3] = x659;
1116   out1[4] = x660;
1117   out1[5] = x661;
1118   out1[6] = x662;
1119   out1[7] = x663;
1120 }
1121 
1122 /*
1123  * The function fiat_p256_square squares a field element in the Montgomery domain.
1124  * Preconditions:
1125  *   0 ≤ eval arg1 < m
1126  * Postconditions:
1127  *   eval (from_montgomery out1) mod m = (eval (from_montgomery arg1) * eval (from_montgomery arg1)) mod m
1128  *   0 ≤ eval out1 < m
1129  *
1130  * Input Bounds:
1131  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
1132  * Output Bounds:
1133  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
1134  */
fiat_p256_square(uint32_t out1[8],const uint32_t arg1[8])1135 static void fiat_p256_square(uint32_t out1[8], const uint32_t arg1[8]) {
1136   uint32_t x1 = (arg1[1]);
1137   uint32_t x2 = (arg1[2]);
1138   uint32_t x3 = (arg1[3]);
1139   uint32_t x4 = (arg1[4]);
1140   uint32_t x5 = (arg1[5]);
1141   uint32_t x6 = (arg1[6]);
1142   uint32_t x7 = (arg1[7]);
1143   uint32_t x8 = (arg1[0]);
1144   uint32_t x9;
1145   uint32_t x10;
1146   fiat_p256_mulx_u32(&x9, &x10, x8, (arg1[7]));
1147   uint32_t x11;
1148   uint32_t x12;
1149   fiat_p256_mulx_u32(&x11, &x12, x8, (arg1[6]));
1150   uint32_t x13;
1151   uint32_t x14;
1152   fiat_p256_mulx_u32(&x13, &x14, x8, (arg1[5]));
1153   uint32_t x15;
1154   uint32_t x16;
1155   fiat_p256_mulx_u32(&x15, &x16, x8, (arg1[4]));
1156   uint32_t x17;
1157   uint32_t x18;
1158   fiat_p256_mulx_u32(&x17, &x18, x8, (arg1[3]));
1159   uint32_t x19;
1160   uint32_t x20;
1161   fiat_p256_mulx_u32(&x19, &x20, x8, (arg1[2]));
1162   uint32_t x21;
1163   uint32_t x22;
1164   fiat_p256_mulx_u32(&x21, &x22, x8, (arg1[1]));
1165   uint32_t x23;
1166   uint32_t x24;
1167   fiat_p256_mulx_u32(&x23, &x24, x8, (arg1[0]));
1168   uint32_t x25;
1169   fiat_p256_uint1 x26;
1170   fiat_p256_addcarryx_u32(&x25, &x26, 0x0, x24, x21);
1171   uint32_t x27;
1172   fiat_p256_uint1 x28;
1173   fiat_p256_addcarryx_u32(&x27, &x28, x26, x22, x19);
1174   uint32_t x29;
1175   fiat_p256_uint1 x30;
1176   fiat_p256_addcarryx_u32(&x29, &x30, x28, x20, x17);
1177   uint32_t x31;
1178   fiat_p256_uint1 x32;
1179   fiat_p256_addcarryx_u32(&x31, &x32, x30, x18, x15);
1180   uint32_t x33;
1181   fiat_p256_uint1 x34;
1182   fiat_p256_addcarryx_u32(&x33, &x34, x32, x16, x13);
1183   uint32_t x35;
1184   fiat_p256_uint1 x36;
1185   fiat_p256_addcarryx_u32(&x35, &x36, x34, x14, x11);
1186   uint32_t x37;
1187   fiat_p256_uint1 x38;
1188   fiat_p256_addcarryx_u32(&x37, &x38, x36, x12, x9);
1189   uint32_t x39 = (x38 + x10);
1190   uint32_t x40;
1191   uint32_t x41;
1192   fiat_p256_mulx_u32(&x40, &x41, x23, UINT32_C(0xffffffff));
1193   uint32_t x42;
1194   uint32_t x43;
1195   fiat_p256_mulx_u32(&x42, &x43, x23, UINT32_C(0xffffffff));
1196   uint32_t x44;
1197   uint32_t x45;
1198   fiat_p256_mulx_u32(&x44, &x45, x23, UINT32_C(0xffffffff));
1199   uint32_t x46;
1200   uint32_t x47;
1201   fiat_p256_mulx_u32(&x46, &x47, x23, UINT32_C(0xffffffff));
1202   uint32_t x48;
1203   fiat_p256_uint1 x49;
1204   fiat_p256_addcarryx_u32(&x48, &x49, 0x0, x47, x44);
1205   uint32_t x50;
1206   fiat_p256_uint1 x51;
1207   fiat_p256_addcarryx_u32(&x50, &x51, x49, x45, x42);
1208   uint32_t x52 = (x51 + x43);
1209   uint32_t x53;
1210   fiat_p256_uint1 x54;
1211   fiat_p256_addcarryx_u32(&x53, &x54, 0x0, x23, x46);
1212   uint32_t x55;
1213   fiat_p256_uint1 x56;
1214   fiat_p256_addcarryx_u32(&x55, &x56, x54, x25, x48);
1215   uint32_t x57;
1216   fiat_p256_uint1 x58;
1217   fiat_p256_addcarryx_u32(&x57, &x58, x56, x27, x50);
1218   uint32_t x59;
1219   fiat_p256_uint1 x60;
1220   fiat_p256_addcarryx_u32(&x59, &x60, x58, x29, x52);
1221   uint32_t x61;
1222   fiat_p256_uint1 x62;
1223   fiat_p256_addcarryx_u32(&x61, &x62, x60, x31, 0x0);
1224   uint32_t x63;
1225   fiat_p256_uint1 x64;
1226   fiat_p256_addcarryx_u32(&x63, &x64, x62, x33, 0x0);
1227   uint32_t x65;
1228   fiat_p256_uint1 x66;
1229   fiat_p256_addcarryx_u32(&x65, &x66, x64, x35, x23);
1230   uint32_t x67;
1231   fiat_p256_uint1 x68;
1232   fiat_p256_addcarryx_u32(&x67, &x68, x66, x37, x40);
1233   uint32_t x69;
1234   fiat_p256_uint1 x70;
1235   fiat_p256_addcarryx_u32(&x69, &x70, x68, x39, x41);
1236   uint32_t x71;
1237   uint32_t x72;
1238   fiat_p256_mulx_u32(&x71, &x72, x1, (arg1[7]));
1239   uint32_t x73;
1240   uint32_t x74;
1241   fiat_p256_mulx_u32(&x73, &x74, x1, (arg1[6]));
1242   uint32_t x75;
1243   uint32_t x76;
1244   fiat_p256_mulx_u32(&x75, &x76, x1, (arg1[5]));
1245   uint32_t x77;
1246   uint32_t x78;
1247   fiat_p256_mulx_u32(&x77, &x78, x1, (arg1[4]));
1248   uint32_t x79;
1249   uint32_t x80;
1250   fiat_p256_mulx_u32(&x79, &x80, x1, (arg1[3]));
1251   uint32_t x81;
1252   uint32_t x82;
1253   fiat_p256_mulx_u32(&x81, &x82, x1, (arg1[2]));
1254   uint32_t x83;
1255   uint32_t x84;
1256   fiat_p256_mulx_u32(&x83, &x84, x1, (arg1[1]));
1257   uint32_t x85;
1258   uint32_t x86;
1259   fiat_p256_mulx_u32(&x85, &x86, x1, (arg1[0]));
1260   uint32_t x87;
1261   fiat_p256_uint1 x88;
1262   fiat_p256_addcarryx_u32(&x87, &x88, 0x0, x86, x83);
1263   uint32_t x89;
1264   fiat_p256_uint1 x90;
1265   fiat_p256_addcarryx_u32(&x89, &x90, x88, x84, x81);
1266   uint32_t x91;
1267   fiat_p256_uint1 x92;
1268   fiat_p256_addcarryx_u32(&x91, &x92, x90, x82, x79);
1269   uint32_t x93;
1270   fiat_p256_uint1 x94;
1271   fiat_p256_addcarryx_u32(&x93, &x94, x92, x80, x77);
1272   uint32_t x95;
1273   fiat_p256_uint1 x96;
1274   fiat_p256_addcarryx_u32(&x95, &x96, x94, x78, x75);
1275   uint32_t x97;
1276   fiat_p256_uint1 x98;
1277   fiat_p256_addcarryx_u32(&x97, &x98, x96, x76, x73);
1278   uint32_t x99;
1279   fiat_p256_uint1 x100;
1280   fiat_p256_addcarryx_u32(&x99, &x100, x98, x74, x71);
1281   uint32_t x101 = (x100 + x72);
1282   uint32_t x102;
1283   fiat_p256_uint1 x103;
1284   fiat_p256_addcarryx_u32(&x102, &x103, 0x0, x55, x85);
1285   uint32_t x104;
1286   fiat_p256_uint1 x105;
1287   fiat_p256_addcarryx_u32(&x104, &x105, x103, x57, x87);
1288   uint32_t x106;
1289   fiat_p256_uint1 x107;
1290   fiat_p256_addcarryx_u32(&x106, &x107, x105, x59, x89);
1291   uint32_t x108;
1292   fiat_p256_uint1 x109;
1293   fiat_p256_addcarryx_u32(&x108, &x109, x107, x61, x91);
1294   uint32_t x110;
1295   fiat_p256_uint1 x111;
1296   fiat_p256_addcarryx_u32(&x110, &x111, x109, x63, x93);
1297   uint32_t x112;
1298   fiat_p256_uint1 x113;
1299   fiat_p256_addcarryx_u32(&x112, &x113, x111, x65, x95);
1300   uint32_t x114;
1301   fiat_p256_uint1 x115;
1302   fiat_p256_addcarryx_u32(&x114, &x115, x113, x67, x97);
1303   uint32_t x116;
1304   fiat_p256_uint1 x117;
1305   fiat_p256_addcarryx_u32(&x116, &x117, x115, x69, x99);
1306   uint32_t x118;
1307   fiat_p256_uint1 x119;
1308   fiat_p256_addcarryx_u32(&x118, &x119, x117, x70, x101);
1309   uint32_t x120;
1310   uint32_t x121;
1311   fiat_p256_mulx_u32(&x120, &x121, x102, UINT32_C(0xffffffff));
1312   uint32_t x122;
1313   uint32_t x123;
1314   fiat_p256_mulx_u32(&x122, &x123, x102, UINT32_C(0xffffffff));
1315   uint32_t x124;
1316   uint32_t x125;
1317   fiat_p256_mulx_u32(&x124, &x125, x102, UINT32_C(0xffffffff));
1318   uint32_t x126;
1319   uint32_t x127;
1320   fiat_p256_mulx_u32(&x126, &x127, x102, UINT32_C(0xffffffff));
1321   uint32_t x128;
1322   fiat_p256_uint1 x129;
1323   fiat_p256_addcarryx_u32(&x128, &x129, 0x0, x127, x124);
1324   uint32_t x130;
1325   fiat_p256_uint1 x131;
1326   fiat_p256_addcarryx_u32(&x130, &x131, x129, x125, x122);
1327   uint32_t x132 = (x131 + x123);
1328   uint32_t x133;
1329   fiat_p256_uint1 x134;
1330   fiat_p256_addcarryx_u32(&x133, &x134, 0x0, x102, x126);
1331   uint32_t x135;
1332   fiat_p256_uint1 x136;
1333   fiat_p256_addcarryx_u32(&x135, &x136, x134, x104, x128);
1334   uint32_t x137;
1335   fiat_p256_uint1 x138;
1336   fiat_p256_addcarryx_u32(&x137, &x138, x136, x106, x130);
1337   uint32_t x139;
1338   fiat_p256_uint1 x140;
1339   fiat_p256_addcarryx_u32(&x139, &x140, x138, x108, x132);
1340   uint32_t x141;
1341   fiat_p256_uint1 x142;
1342   fiat_p256_addcarryx_u32(&x141, &x142, x140, x110, 0x0);
1343   uint32_t x143;
1344   fiat_p256_uint1 x144;
1345   fiat_p256_addcarryx_u32(&x143, &x144, x142, x112, 0x0);
1346   uint32_t x145;
1347   fiat_p256_uint1 x146;
1348   fiat_p256_addcarryx_u32(&x145, &x146, x144, x114, x102);
1349   uint32_t x147;
1350   fiat_p256_uint1 x148;
1351   fiat_p256_addcarryx_u32(&x147, &x148, x146, x116, x120);
1352   uint32_t x149;
1353   fiat_p256_uint1 x150;
1354   fiat_p256_addcarryx_u32(&x149, &x150, x148, x118, x121);
1355   uint32_t x151 = ((uint32_t)x150 + x119);
1356   uint32_t x152;
1357   uint32_t x153;
1358   fiat_p256_mulx_u32(&x152, &x153, x2, (arg1[7]));
1359   uint32_t x154;
1360   uint32_t x155;
1361   fiat_p256_mulx_u32(&x154, &x155, x2, (arg1[6]));
1362   uint32_t x156;
1363   uint32_t x157;
1364   fiat_p256_mulx_u32(&x156, &x157, x2, (arg1[5]));
1365   uint32_t x158;
1366   uint32_t x159;
1367   fiat_p256_mulx_u32(&x158, &x159, x2, (arg1[4]));
1368   uint32_t x160;
1369   uint32_t x161;
1370   fiat_p256_mulx_u32(&x160, &x161, x2, (arg1[3]));
1371   uint32_t x162;
1372   uint32_t x163;
1373   fiat_p256_mulx_u32(&x162, &x163, x2, (arg1[2]));
1374   uint32_t x164;
1375   uint32_t x165;
1376   fiat_p256_mulx_u32(&x164, &x165, x2, (arg1[1]));
1377   uint32_t x166;
1378   uint32_t x167;
1379   fiat_p256_mulx_u32(&x166, &x167, x2, (arg1[0]));
1380   uint32_t x168;
1381   fiat_p256_uint1 x169;
1382   fiat_p256_addcarryx_u32(&x168, &x169, 0x0, x167, x164);
1383   uint32_t x170;
1384   fiat_p256_uint1 x171;
1385   fiat_p256_addcarryx_u32(&x170, &x171, x169, x165, x162);
1386   uint32_t x172;
1387   fiat_p256_uint1 x173;
1388   fiat_p256_addcarryx_u32(&x172, &x173, x171, x163, x160);
1389   uint32_t x174;
1390   fiat_p256_uint1 x175;
1391   fiat_p256_addcarryx_u32(&x174, &x175, x173, x161, x158);
1392   uint32_t x176;
1393   fiat_p256_uint1 x177;
1394   fiat_p256_addcarryx_u32(&x176, &x177, x175, x159, x156);
1395   uint32_t x178;
1396   fiat_p256_uint1 x179;
1397   fiat_p256_addcarryx_u32(&x178, &x179, x177, x157, x154);
1398   uint32_t x180;
1399   fiat_p256_uint1 x181;
1400   fiat_p256_addcarryx_u32(&x180, &x181, x179, x155, x152);
1401   uint32_t x182 = (x181 + x153);
1402   uint32_t x183;
1403   fiat_p256_uint1 x184;
1404   fiat_p256_addcarryx_u32(&x183, &x184, 0x0, x135, x166);
1405   uint32_t x185;
1406   fiat_p256_uint1 x186;
1407   fiat_p256_addcarryx_u32(&x185, &x186, x184, x137, x168);
1408   uint32_t x187;
1409   fiat_p256_uint1 x188;
1410   fiat_p256_addcarryx_u32(&x187, &x188, x186, x139, x170);
1411   uint32_t x189;
1412   fiat_p256_uint1 x190;
1413   fiat_p256_addcarryx_u32(&x189, &x190, x188, x141, x172);
1414   uint32_t x191;
1415   fiat_p256_uint1 x192;
1416   fiat_p256_addcarryx_u32(&x191, &x192, x190, x143, x174);
1417   uint32_t x193;
1418   fiat_p256_uint1 x194;
1419   fiat_p256_addcarryx_u32(&x193, &x194, x192, x145, x176);
1420   uint32_t x195;
1421   fiat_p256_uint1 x196;
1422   fiat_p256_addcarryx_u32(&x195, &x196, x194, x147, x178);
1423   uint32_t x197;
1424   fiat_p256_uint1 x198;
1425   fiat_p256_addcarryx_u32(&x197, &x198, x196, x149, x180);
1426   uint32_t x199;
1427   fiat_p256_uint1 x200;
1428   fiat_p256_addcarryx_u32(&x199, &x200, x198, x151, x182);
1429   uint32_t x201;
1430   uint32_t x202;
1431   fiat_p256_mulx_u32(&x201, &x202, x183, UINT32_C(0xffffffff));
1432   uint32_t x203;
1433   uint32_t x204;
1434   fiat_p256_mulx_u32(&x203, &x204, x183, UINT32_C(0xffffffff));
1435   uint32_t x205;
1436   uint32_t x206;
1437   fiat_p256_mulx_u32(&x205, &x206, x183, UINT32_C(0xffffffff));
1438   uint32_t x207;
1439   uint32_t x208;
1440   fiat_p256_mulx_u32(&x207, &x208, x183, UINT32_C(0xffffffff));
1441   uint32_t x209;
1442   fiat_p256_uint1 x210;
1443   fiat_p256_addcarryx_u32(&x209, &x210, 0x0, x208, x205);
1444   uint32_t x211;
1445   fiat_p256_uint1 x212;
1446   fiat_p256_addcarryx_u32(&x211, &x212, x210, x206, x203);
1447   uint32_t x213 = (x212 + x204);
1448   uint32_t x214;
1449   fiat_p256_uint1 x215;
1450   fiat_p256_addcarryx_u32(&x214, &x215, 0x0, x183, x207);
1451   uint32_t x216;
1452   fiat_p256_uint1 x217;
1453   fiat_p256_addcarryx_u32(&x216, &x217, x215, x185, x209);
1454   uint32_t x218;
1455   fiat_p256_uint1 x219;
1456   fiat_p256_addcarryx_u32(&x218, &x219, x217, x187, x211);
1457   uint32_t x220;
1458   fiat_p256_uint1 x221;
1459   fiat_p256_addcarryx_u32(&x220, &x221, x219, x189, x213);
1460   uint32_t x222;
1461   fiat_p256_uint1 x223;
1462   fiat_p256_addcarryx_u32(&x222, &x223, x221, x191, 0x0);
1463   uint32_t x224;
1464   fiat_p256_uint1 x225;
1465   fiat_p256_addcarryx_u32(&x224, &x225, x223, x193, 0x0);
1466   uint32_t x226;
1467   fiat_p256_uint1 x227;
1468   fiat_p256_addcarryx_u32(&x226, &x227, x225, x195, x183);
1469   uint32_t x228;
1470   fiat_p256_uint1 x229;
1471   fiat_p256_addcarryx_u32(&x228, &x229, x227, x197, x201);
1472   uint32_t x230;
1473   fiat_p256_uint1 x231;
1474   fiat_p256_addcarryx_u32(&x230, &x231, x229, x199, x202);
1475   uint32_t x232 = ((uint32_t)x231 + x200);
1476   uint32_t x233;
1477   uint32_t x234;
1478   fiat_p256_mulx_u32(&x233, &x234, x3, (arg1[7]));
1479   uint32_t x235;
1480   uint32_t x236;
1481   fiat_p256_mulx_u32(&x235, &x236, x3, (arg1[6]));
1482   uint32_t x237;
1483   uint32_t x238;
1484   fiat_p256_mulx_u32(&x237, &x238, x3, (arg1[5]));
1485   uint32_t x239;
1486   uint32_t x240;
1487   fiat_p256_mulx_u32(&x239, &x240, x3, (arg1[4]));
1488   uint32_t x241;
1489   uint32_t x242;
1490   fiat_p256_mulx_u32(&x241, &x242, x3, (arg1[3]));
1491   uint32_t x243;
1492   uint32_t x244;
1493   fiat_p256_mulx_u32(&x243, &x244, x3, (arg1[2]));
1494   uint32_t x245;
1495   uint32_t x246;
1496   fiat_p256_mulx_u32(&x245, &x246, x3, (arg1[1]));
1497   uint32_t x247;
1498   uint32_t x248;
1499   fiat_p256_mulx_u32(&x247, &x248, x3, (arg1[0]));
1500   uint32_t x249;
1501   fiat_p256_uint1 x250;
1502   fiat_p256_addcarryx_u32(&x249, &x250, 0x0, x248, x245);
1503   uint32_t x251;
1504   fiat_p256_uint1 x252;
1505   fiat_p256_addcarryx_u32(&x251, &x252, x250, x246, x243);
1506   uint32_t x253;
1507   fiat_p256_uint1 x254;
1508   fiat_p256_addcarryx_u32(&x253, &x254, x252, x244, x241);
1509   uint32_t x255;
1510   fiat_p256_uint1 x256;
1511   fiat_p256_addcarryx_u32(&x255, &x256, x254, x242, x239);
1512   uint32_t x257;
1513   fiat_p256_uint1 x258;
1514   fiat_p256_addcarryx_u32(&x257, &x258, x256, x240, x237);
1515   uint32_t x259;
1516   fiat_p256_uint1 x260;
1517   fiat_p256_addcarryx_u32(&x259, &x260, x258, x238, x235);
1518   uint32_t x261;
1519   fiat_p256_uint1 x262;
1520   fiat_p256_addcarryx_u32(&x261, &x262, x260, x236, x233);
1521   uint32_t x263 = (x262 + x234);
1522   uint32_t x264;
1523   fiat_p256_uint1 x265;
1524   fiat_p256_addcarryx_u32(&x264, &x265, 0x0, x216, x247);
1525   uint32_t x266;
1526   fiat_p256_uint1 x267;
1527   fiat_p256_addcarryx_u32(&x266, &x267, x265, x218, x249);
1528   uint32_t x268;
1529   fiat_p256_uint1 x269;
1530   fiat_p256_addcarryx_u32(&x268, &x269, x267, x220, x251);
1531   uint32_t x270;
1532   fiat_p256_uint1 x271;
1533   fiat_p256_addcarryx_u32(&x270, &x271, x269, x222, x253);
1534   uint32_t x272;
1535   fiat_p256_uint1 x273;
1536   fiat_p256_addcarryx_u32(&x272, &x273, x271, x224, x255);
1537   uint32_t x274;
1538   fiat_p256_uint1 x275;
1539   fiat_p256_addcarryx_u32(&x274, &x275, x273, x226, x257);
1540   uint32_t x276;
1541   fiat_p256_uint1 x277;
1542   fiat_p256_addcarryx_u32(&x276, &x277, x275, x228, x259);
1543   uint32_t x278;
1544   fiat_p256_uint1 x279;
1545   fiat_p256_addcarryx_u32(&x278, &x279, x277, x230, x261);
1546   uint32_t x280;
1547   fiat_p256_uint1 x281;
1548   fiat_p256_addcarryx_u32(&x280, &x281, x279, x232, x263);
1549   uint32_t x282;
1550   uint32_t x283;
1551   fiat_p256_mulx_u32(&x282, &x283, x264, UINT32_C(0xffffffff));
1552   uint32_t x284;
1553   uint32_t x285;
1554   fiat_p256_mulx_u32(&x284, &x285, x264, UINT32_C(0xffffffff));
1555   uint32_t x286;
1556   uint32_t x287;
1557   fiat_p256_mulx_u32(&x286, &x287, x264, UINT32_C(0xffffffff));
1558   uint32_t x288;
1559   uint32_t x289;
1560   fiat_p256_mulx_u32(&x288, &x289, x264, UINT32_C(0xffffffff));
1561   uint32_t x290;
1562   fiat_p256_uint1 x291;
1563   fiat_p256_addcarryx_u32(&x290, &x291, 0x0, x289, x286);
1564   uint32_t x292;
1565   fiat_p256_uint1 x293;
1566   fiat_p256_addcarryx_u32(&x292, &x293, x291, x287, x284);
1567   uint32_t x294 = (x293 + x285);
1568   uint32_t x295;
1569   fiat_p256_uint1 x296;
1570   fiat_p256_addcarryx_u32(&x295, &x296, 0x0, x264, x288);
1571   uint32_t x297;
1572   fiat_p256_uint1 x298;
1573   fiat_p256_addcarryx_u32(&x297, &x298, x296, x266, x290);
1574   uint32_t x299;
1575   fiat_p256_uint1 x300;
1576   fiat_p256_addcarryx_u32(&x299, &x300, x298, x268, x292);
1577   uint32_t x301;
1578   fiat_p256_uint1 x302;
1579   fiat_p256_addcarryx_u32(&x301, &x302, x300, x270, x294);
1580   uint32_t x303;
1581   fiat_p256_uint1 x304;
1582   fiat_p256_addcarryx_u32(&x303, &x304, x302, x272, 0x0);
1583   uint32_t x305;
1584   fiat_p256_uint1 x306;
1585   fiat_p256_addcarryx_u32(&x305, &x306, x304, x274, 0x0);
1586   uint32_t x307;
1587   fiat_p256_uint1 x308;
1588   fiat_p256_addcarryx_u32(&x307, &x308, x306, x276, x264);
1589   uint32_t x309;
1590   fiat_p256_uint1 x310;
1591   fiat_p256_addcarryx_u32(&x309, &x310, x308, x278, x282);
1592   uint32_t x311;
1593   fiat_p256_uint1 x312;
1594   fiat_p256_addcarryx_u32(&x311, &x312, x310, x280, x283);
1595   uint32_t x313 = ((uint32_t)x312 + x281);
1596   uint32_t x314;
1597   uint32_t x315;
1598   fiat_p256_mulx_u32(&x314, &x315, x4, (arg1[7]));
1599   uint32_t x316;
1600   uint32_t x317;
1601   fiat_p256_mulx_u32(&x316, &x317, x4, (arg1[6]));
1602   uint32_t x318;
1603   uint32_t x319;
1604   fiat_p256_mulx_u32(&x318, &x319, x4, (arg1[5]));
1605   uint32_t x320;
1606   uint32_t x321;
1607   fiat_p256_mulx_u32(&x320, &x321, x4, (arg1[4]));
1608   uint32_t x322;
1609   uint32_t x323;
1610   fiat_p256_mulx_u32(&x322, &x323, x4, (arg1[3]));
1611   uint32_t x324;
1612   uint32_t x325;
1613   fiat_p256_mulx_u32(&x324, &x325, x4, (arg1[2]));
1614   uint32_t x326;
1615   uint32_t x327;
1616   fiat_p256_mulx_u32(&x326, &x327, x4, (arg1[1]));
1617   uint32_t x328;
1618   uint32_t x329;
1619   fiat_p256_mulx_u32(&x328, &x329, x4, (arg1[0]));
1620   uint32_t x330;
1621   fiat_p256_uint1 x331;
1622   fiat_p256_addcarryx_u32(&x330, &x331, 0x0, x329, x326);
1623   uint32_t x332;
1624   fiat_p256_uint1 x333;
1625   fiat_p256_addcarryx_u32(&x332, &x333, x331, x327, x324);
1626   uint32_t x334;
1627   fiat_p256_uint1 x335;
1628   fiat_p256_addcarryx_u32(&x334, &x335, x333, x325, x322);
1629   uint32_t x336;
1630   fiat_p256_uint1 x337;
1631   fiat_p256_addcarryx_u32(&x336, &x337, x335, x323, x320);
1632   uint32_t x338;
1633   fiat_p256_uint1 x339;
1634   fiat_p256_addcarryx_u32(&x338, &x339, x337, x321, x318);
1635   uint32_t x340;
1636   fiat_p256_uint1 x341;
1637   fiat_p256_addcarryx_u32(&x340, &x341, x339, x319, x316);
1638   uint32_t x342;
1639   fiat_p256_uint1 x343;
1640   fiat_p256_addcarryx_u32(&x342, &x343, x341, x317, x314);
1641   uint32_t x344 = (x343 + x315);
1642   uint32_t x345;
1643   fiat_p256_uint1 x346;
1644   fiat_p256_addcarryx_u32(&x345, &x346, 0x0, x297, x328);
1645   uint32_t x347;
1646   fiat_p256_uint1 x348;
1647   fiat_p256_addcarryx_u32(&x347, &x348, x346, x299, x330);
1648   uint32_t x349;
1649   fiat_p256_uint1 x350;
1650   fiat_p256_addcarryx_u32(&x349, &x350, x348, x301, x332);
1651   uint32_t x351;
1652   fiat_p256_uint1 x352;
1653   fiat_p256_addcarryx_u32(&x351, &x352, x350, x303, x334);
1654   uint32_t x353;
1655   fiat_p256_uint1 x354;
1656   fiat_p256_addcarryx_u32(&x353, &x354, x352, x305, x336);
1657   uint32_t x355;
1658   fiat_p256_uint1 x356;
1659   fiat_p256_addcarryx_u32(&x355, &x356, x354, x307, x338);
1660   uint32_t x357;
1661   fiat_p256_uint1 x358;
1662   fiat_p256_addcarryx_u32(&x357, &x358, x356, x309, x340);
1663   uint32_t x359;
1664   fiat_p256_uint1 x360;
1665   fiat_p256_addcarryx_u32(&x359, &x360, x358, x311, x342);
1666   uint32_t x361;
1667   fiat_p256_uint1 x362;
1668   fiat_p256_addcarryx_u32(&x361, &x362, x360, x313, x344);
1669   uint32_t x363;
1670   uint32_t x364;
1671   fiat_p256_mulx_u32(&x363, &x364, x345, UINT32_C(0xffffffff));
1672   uint32_t x365;
1673   uint32_t x366;
1674   fiat_p256_mulx_u32(&x365, &x366, x345, UINT32_C(0xffffffff));
1675   uint32_t x367;
1676   uint32_t x368;
1677   fiat_p256_mulx_u32(&x367, &x368, x345, UINT32_C(0xffffffff));
1678   uint32_t x369;
1679   uint32_t x370;
1680   fiat_p256_mulx_u32(&x369, &x370, x345, UINT32_C(0xffffffff));
1681   uint32_t x371;
1682   fiat_p256_uint1 x372;
1683   fiat_p256_addcarryx_u32(&x371, &x372, 0x0, x370, x367);
1684   uint32_t x373;
1685   fiat_p256_uint1 x374;
1686   fiat_p256_addcarryx_u32(&x373, &x374, x372, x368, x365);
1687   uint32_t x375 = (x374 + x366);
1688   uint32_t x376;
1689   fiat_p256_uint1 x377;
1690   fiat_p256_addcarryx_u32(&x376, &x377, 0x0, x345, x369);
1691   uint32_t x378;
1692   fiat_p256_uint1 x379;
1693   fiat_p256_addcarryx_u32(&x378, &x379, x377, x347, x371);
1694   uint32_t x380;
1695   fiat_p256_uint1 x381;
1696   fiat_p256_addcarryx_u32(&x380, &x381, x379, x349, x373);
1697   uint32_t x382;
1698   fiat_p256_uint1 x383;
1699   fiat_p256_addcarryx_u32(&x382, &x383, x381, x351, x375);
1700   uint32_t x384;
1701   fiat_p256_uint1 x385;
1702   fiat_p256_addcarryx_u32(&x384, &x385, x383, x353, 0x0);
1703   uint32_t x386;
1704   fiat_p256_uint1 x387;
1705   fiat_p256_addcarryx_u32(&x386, &x387, x385, x355, 0x0);
1706   uint32_t x388;
1707   fiat_p256_uint1 x389;
1708   fiat_p256_addcarryx_u32(&x388, &x389, x387, x357, x345);
1709   uint32_t x390;
1710   fiat_p256_uint1 x391;
1711   fiat_p256_addcarryx_u32(&x390, &x391, x389, x359, x363);
1712   uint32_t x392;
1713   fiat_p256_uint1 x393;
1714   fiat_p256_addcarryx_u32(&x392, &x393, x391, x361, x364);
1715   uint32_t x394 = ((uint32_t)x393 + x362);
1716   uint32_t x395;
1717   uint32_t x396;
1718   fiat_p256_mulx_u32(&x395, &x396, x5, (arg1[7]));
1719   uint32_t x397;
1720   uint32_t x398;
1721   fiat_p256_mulx_u32(&x397, &x398, x5, (arg1[6]));
1722   uint32_t x399;
1723   uint32_t x400;
1724   fiat_p256_mulx_u32(&x399, &x400, x5, (arg1[5]));
1725   uint32_t x401;
1726   uint32_t x402;
1727   fiat_p256_mulx_u32(&x401, &x402, x5, (arg1[4]));
1728   uint32_t x403;
1729   uint32_t x404;
1730   fiat_p256_mulx_u32(&x403, &x404, x5, (arg1[3]));
1731   uint32_t x405;
1732   uint32_t x406;
1733   fiat_p256_mulx_u32(&x405, &x406, x5, (arg1[2]));
1734   uint32_t x407;
1735   uint32_t x408;
1736   fiat_p256_mulx_u32(&x407, &x408, x5, (arg1[1]));
1737   uint32_t x409;
1738   uint32_t x410;
1739   fiat_p256_mulx_u32(&x409, &x410, x5, (arg1[0]));
1740   uint32_t x411;
1741   fiat_p256_uint1 x412;
1742   fiat_p256_addcarryx_u32(&x411, &x412, 0x0, x410, x407);
1743   uint32_t x413;
1744   fiat_p256_uint1 x414;
1745   fiat_p256_addcarryx_u32(&x413, &x414, x412, x408, x405);
1746   uint32_t x415;
1747   fiat_p256_uint1 x416;
1748   fiat_p256_addcarryx_u32(&x415, &x416, x414, x406, x403);
1749   uint32_t x417;
1750   fiat_p256_uint1 x418;
1751   fiat_p256_addcarryx_u32(&x417, &x418, x416, x404, x401);
1752   uint32_t x419;
1753   fiat_p256_uint1 x420;
1754   fiat_p256_addcarryx_u32(&x419, &x420, x418, x402, x399);
1755   uint32_t x421;
1756   fiat_p256_uint1 x422;
1757   fiat_p256_addcarryx_u32(&x421, &x422, x420, x400, x397);
1758   uint32_t x423;
1759   fiat_p256_uint1 x424;
1760   fiat_p256_addcarryx_u32(&x423, &x424, x422, x398, x395);
1761   uint32_t x425 = (x424 + x396);
1762   uint32_t x426;
1763   fiat_p256_uint1 x427;
1764   fiat_p256_addcarryx_u32(&x426, &x427, 0x0, x378, x409);
1765   uint32_t x428;
1766   fiat_p256_uint1 x429;
1767   fiat_p256_addcarryx_u32(&x428, &x429, x427, x380, x411);
1768   uint32_t x430;
1769   fiat_p256_uint1 x431;
1770   fiat_p256_addcarryx_u32(&x430, &x431, x429, x382, x413);
1771   uint32_t x432;
1772   fiat_p256_uint1 x433;
1773   fiat_p256_addcarryx_u32(&x432, &x433, x431, x384, x415);
1774   uint32_t x434;
1775   fiat_p256_uint1 x435;
1776   fiat_p256_addcarryx_u32(&x434, &x435, x433, x386, x417);
1777   uint32_t x436;
1778   fiat_p256_uint1 x437;
1779   fiat_p256_addcarryx_u32(&x436, &x437, x435, x388, x419);
1780   uint32_t x438;
1781   fiat_p256_uint1 x439;
1782   fiat_p256_addcarryx_u32(&x438, &x439, x437, x390, x421);
1783   uint32_t x440;
1784   fiat_p256_uint1 x441;
1785   fiat_p256_addcarryx_u32(&x440, &x441, x439, x392, x423);
1786   uint32_t x442;
1787   fiat_p256_uint1 x443;
1788   fiat_p256_addcarryx_u32(&x442, &x443, x441, x394, x425);
1789   uint32_t x444;
1790   uint32_t x445;
1791   fiat_p256_mulx_u32(&x444, &x445, x426, UINT32_C(0xffffffff));
1792   uint32_t x446;
1793   uint32_t x447;
1794   fiat_p256_mulx_u32(&x446, &x447, x426, UINT32_C(0xffffffff));
1795   uint32_t x448;
1796   uint32_t x449;
1797   fiat_p256_mulx_u32(&x448, &x449, x426, UINT32_C(0xffffffff));
1798   uint32_t x450;
1799   uint32_t x451;
1800   fiat_p256_mulx_u32(&x450, &x451, x426, UINT32_C(0xffffffff));
1801   uint32_t x452;
1802   fiat_p256_uint1 x453;
1803   fiat_p256_addcarryx_u32(&x452, &x453, 0x0, x451, x448);
1804   uint32_t x454;
1805   fiat_p256_uint1 x455;
1806   fiat_p256_addcarryx_u32(&x454, &x455, x453, x449, x446);
1807   uint32_t x456 = (x455 + x447);
1808   uint32_t x457;
1809   fiat_p256_uint1 x458;
1810   fiat_p256_addcarryx_u32(&x457, &x458, 0x0, x426, x450);
1811   uint32_t x459;
1812   fiat_p256_uint1 x460;
1813   fiat_p256_addcarryx_u32(&x459, &x460, x458, x428, x452);
1814   uint32_t x461;
1815   fiat_p256_uint1 x462;
1816   fiat_p256_addcarryx_u32(&x461, &x462, x460, x430, x454);
1817   uint32_t x463;
1818   fiat_p256_uint1 x464;
1819   fiat_p256_addcarryx_u32(&x463, &x464, x462, x432, x456);
1820   uint32_t x465;
1821   fiat_p256_uint1 x466;
1822   fiat_p256_addcarryx_u32(&x465, &x466, x464, x434, 0x0);
1823   uint32_t x467;
1824   fiat_p256_uint1 x468;
1825   fiat_p256_addcarryx_u32(&x467, &x468, x466, x436, 0x0);
1826   uint32_t x469;
1827   fiat_p256_uint1 x470;
1828   fiat_p256_addcarryx_u32(&x469, &x470, x468, x438, x426);
1829   uint32_t x471;
1830   fiat_p256_uint1 x472;
1831   fiat_p256_addcarryx_u32(&x471, &x472, x470, x440, x444);
1832   uint32_t x473;
1833   fiat_p256_uint1 x474;
1834   fiat_p256_addcarryx_u32(&x473, &x474, x472, x442, x445);
1835   uint32_t x475 = ((uint32_t)x474 + x443);
1836   uint32_t x476;
1837   uint32_t x477;
1838   fiat_p256_mulx_u32(&x476, &x477, x6, (arg1[7]));
1839   uint32_t x478;
1840   uint32_t x479;
1841   fiat_p256_mulx_u32(&x478, &x479, x6, (arg1[6]));
1842   uint32_t x480;
1843   uint32_t x481;
1844   fiat_p256_mulx_u32(&x480, &x481, x6, (arg1[5]));
1845   uint32_t x482;
1846   uint32_t x483;
1847   fiat_p256_mulx_u32(&x482, &x483, x6, (arg1[4]));
1848   uint32_t x484;
1849   uint32_t x485;
1850   fiat_p256_mulx_u32(&x484, &x485, x6, (arg1[3]));
1851   uint32_t x486;
1852   uint32_t x487;
1853   fiat_p256_mulx_u32(&x486, &x487, x6, (arg1[2]));
1854   uint32_t x488;
1855   uint32_t x489;
1856   fiat_p256_mulx_u32(&x488, &x489, x6, (arg1[1]));
1857   uint32_t x490;
1858   uint32_t x491;
1859   fiat_p256_mulx_u32(&x490, &x491, x6, (arg1[0]));
1860   uint32_t x492;
1861   fiat_p256_uint1 x493;
1862   fiat_p256_addcarryx_u32(&x492, &x493, 0x0, x491, x488);
1863   uint32_t x494;
1864   fiat_p256_uint1 x495;
1865   fiat_p256_addcarryx_u32(&x494, &x495, x493, x489, x486);
1866   uint32_t x496;
1867   fiat_p256_uint1 x497;
1868   fiat_p256_addcarryx_u32(&x496, &x497, x495, x487, x484);
1869   uint32_t x498;
1870   fiat_p256_uint1 x499;
1871   fiat_p256_addcarryx_u32(&x498, &x499, x497, x485, x482);
1872   uint32_t x500;
1873   fiat_p256_uint1 x501;
1874   fiat_p256_addcarryx_u32(&x500, &x501, x499, x483, x480);
1875   uint32_t x502;
1876   fiat_p256_uint1 x503;
1877   fiat_p256_addcarryx_u32(&x502, &x503, x501, x481, x478);
1878   uint32_t x504;
1879   fiat_p256_uint1 x505;
1880   fiat_p256_addcarryx_u32(&x504, &x505, x503, x479, x476);
1881   uint32_t x506 = (x505 + x477);
1882   uint32_t x507;
1883   fiat_p256_uint1 x508;
1884   fiat_p256_addcarryx_u32(&x507, &x508, 0x0, x459, x490);
1885   uint32_t x509;
1886   fiat_p256_uint1 x510;
1887   fiat_p256_addcarryx_u32(&x509, &x510, x508, x461, x492);
1888   uint32_t x511;
1889   fiat_p256_uint1 x512;
1890   fiat_p256_addcarryx_u32(&x511, &x512, x510, x463, x494);
1891   uint32_t x513;
1892   fiat_p256_uint1 x514;
1893   fiat_p256_addcarryx_u32(&x513, &x514, x512, x465, x496);
1894   uint32_t x515;
1895   fiat_p256_uint1 x516;
1896   fiat_p256_addcarryx_u32(&x515, &x516, x514, x467, x498);
1897   uint32_t x517;
1898   fiat_p256_uint1 x518;
1899   fiat_p256_addcarryx_u32(&x517, &x518, x516, x469, x500);
1900   uint32_t x519;
1901   fiat_p256_uint1 x520;
1902   fiat_p256_addcarryx_u32(&x519, &x520, x518, x471, x502);
1903   uint32_t x521;
1904   fiat_p256_uint1 x522;
1905   fiat_p256_addcarryx_u32(&x521, &x522, x520, x473, x504);
1906   uint32_t x523;
1907   fiat_p256_uint1 x524;
1908   fiat_p256_addcarryx_u32(&x523, &x524, x522, x475, x506);
1909   uint32_t x525;
1910   uint32_t x526;
1911   fiat_p256_mulx_u32(&x525, &x526, x507, UINT32_C(0xffffffff));
1912   uint32_t x527;
1913   uint32_t x528;
1914   fiat_p256_mulx_u32(&x527, &x528, x507, UINT32_C(0xffffffff));
1915   uint32_t x529;
1916   uint32_t x530;
1917   fiat_p256_mulx_u32(&x529, &x530, x507, UINT32_C(0xffffffff));
1918   uint32_t x531;
1919   uint32_t x532;
1920   fiat_p256_mulx_u32(&x531, &x532, x507, UINT32_C(0xffffffff));
1921   uint32_t x533;
1922   fiat_p256_uint1 x534;
1923   fiat_p256_addcarryx_u32(&x533, &x534, 0x0, x532, x529);
1924   uint32_t x535;
1925   fiat_p256_uint1 x536;
1926   fiat_p256_addcarryx_u32(&x535, &x536, x534, x530, x527);
1927   uint32_t x537 = (x536 + x528);
1928   uint32_t x538;
1929   fiat_p256_uint1 x539;
1930   fiat_p256_addcarryx_u32(&x538, &x539, 0x0, x507, x531);
1931   uint32_t x540;
1932   fiat_p256_uint1 x541;
1933   fiat_p256_addcarryx_u32(&x540, &x541, x539, x509, x533);
1934   uint32_t x542;
1935   fiat_p256_uint1 x543;
1936   fiat_p256_addcarryx_u32(&x542, &x543, x541, x511, x535);
1937   uint32_t x544;
1938   fiat_p256_uint1 x545;
1939   fiat_p256_addcarryx_u32(&x544, &x545, x543, x513, x537);
1940   uint32_t x546;
1941   fiat_p256_uint1 x547;
1942   fiat_p256_addcarryx_u32(&x546, &x547, x545, x515, 0x0);
1943   uint32_t x548;
1944   fiat_p256_uint1 x549;
1945   fiat_p256_addcarryx_u32(&x548, &x549, x547, x517, 0x0);
1946   uint32_t x550;
1947   fiat_p256_uint1 x551;
1948   fiat_p256_addcarryx_u32(&x550, &x551, x549, x519, x507);
1949   uint32_t x552;
1950   fiat_p256_uint1 x553;
1951   fiat_p256_addcarryx_u32(&x552, &x553, x551, x521, x525);
1952   uint32_t x554;
1953   fiat_p256_uint1 x555;
1954   fiat_p256_addcarryx_u32(&x554, &x555, x553, x523, x526);
1955   uint32_t x556 = ((uint32_t)x555 + x524);
1956   uint32_t x557;
1957   uint32_t x558;
1958   fiat_p256_mulx_u32(&x557, &x558, x7, (arg1[7]));
1959   uint32_t x559;
1960   uint32_t x560;
1961   fiat_p256_mulx_u32(&x559, &x560, x7, (arg1[6]));
1962   uint32_t x561;
1963   uint32_t x562;
1964   fiat_p256_mulx_u32(&x561, &x562, x7, (arg1[5]));
1965   uint32_t x563;
1966   uint32_t x564;
1967   fiat_p256_mulx_u32(&x563, &x564, x7, (arg1[4]));
1968   uint32_t x565;
1969   uint32_t x566;
1970   fiat_p256_mulx_u32(&x565, &x566, x7, (arg1[3]));
1971   uint32_t x567;
1972   uint32_t x568;
1973   fiat_p256_mulx_u32(&x567, &x568, x7, (arg1[2]));
1974   uint32_t x569;
1975   uint32_t x570;
1976   fiat_p256_mulx_u32(&x569, &x570, x7, (arg1[1]));
1977   uint32_t x571;
1978   uint32_t x572;
1979   fiat_p256_mulx_u32(&x571, &x572, x7, (arg1[0]));
1980   uint32_t x573;
1981   fiat_p256_uint1 x574;
1982   fiat_p256_addcarryx_u32(&x573, &x574, 0x0, x572, x569);
1983   uint32_t x575;
1984   fiat_p256_uint1 x576;
1985   fiat_p256_addcarryx_u32(&x575, &x576, x574, x570, x567);
1986   uint32_t x577;
1987   fiat_p256_uint1 x578;
1988   fiat_p256_addcarryx_u32(&x577, &x578, x576, x568, x565);
1989   uint32_t x579;
1990   fiat_p256_uint1 x580;
1991   fiat_p256_addcarryx_u32(&x579, &x580, x578, x566, x563);
1992   uint32_t x581;
1993   fiat_p256_uint1 x582;
1994   fiat_p256_addcarryx_u32(&x581, &x582, x580, x564, x561);
1995   uint32_t x583;
1996   fiat_p256_uint1 x584;
1997   fiat_p256_addcarryx_u32(&x583, &x584, x582, x562, x559);
1998   uint32_t x585;
1999   fiat_p256_uint1 x586;
2000   fiat_p256_addcarryx_u32(&x585, &x586, x584, x560, x557);
2001   uint32_t x587 = (x586 + x558);
2002   uint32_t x588;
2003   fiat_p256_uint1 x589;
2004   fiat_p256_addcarryx_u32(&x588, &x589, 0x0, x540, x571);
2005   uint32_t x590;
2006   fiat_p256_uint1 x591;
2007   fiat_p256_addcarryx_u32(&x590, &x591, x589, x542, x573);
2008   uint32_t x592;
2009   fiat_p256_uint1 x593;
2010   fiat_p256_addcarryx_u32(&x592, &x593, x591, x544, x575);
2011   uint32_t x594;
2012   fiat_p256_uint1 x595;
2013   fiat_p256_addcarryx_u32(&x594, &x595, x593, x546, x577);
2014   uint32_t x596;
2015   fiat_p256_uint1 x597;
2016   fiat_p256_addcarryx_u32(&x596, &x597, x595, x548, x579);
2017   uint32_t x598;
2018   fiat_p256_uint1 x599;
2019   fiat_p256_addcarryx_u32(&x598, &x599, x597, x550, x581);
2020   uint32_t x600;
2021   fiat_p256_uint1 x601;
2022   fiat_p256_addcarryx_u32(&x600, &x601, x599, x552, x583);
2023   uint32_t x602;
2024   fiat_p256_uint1 x603;
2025   fiat_p256_addcarryx_u32(&x602, &x603, x601, x554, x585);
2026   uint32_t x604;
2027   fiat_p256_uint1 x605;
2028   fiat_p256_addcarryx_u32(&x604, &x605, x603, x556, x587);
2029   uint32_t x606;
2030   uint32_t x607;
2031   fiat_p256_mulx_u32(&x606, &x607, x588, UINT32_C(0xffffffff));
2032   uint32_t x608;
2033   uint32_t x609;
2034   fiat_p256_mulx_u32(&x608, &x609, x588, UINT32_C(0xffffffff));
2035   uint32_t x610;
2036   uint32_t x611;
2037   fiat_p256_mulx_u32(&x610, &x611, x588, UINT32_C(0xffffffff));
2038   uint32_t x612;
2039   uint32_t x613;
2040   fiat_p256_mulx_u32(&x612, &x613, x588, UINT32_C(0xffffffff));
2041   uint32_t x614;
2042   fiat_p256_uint1 x615;
2043   fiat_p256_addcarryx_u32(&x614, &x615, 0x0, x613, x610);
2044   uint32_t x616;
2045   fiat_p256_uint1 x617;
2046   fiat_p256_addcarryx_u32(&x616, &x617, x615, x611, x608);
2047   uint32_t x618 = (x617 + x609);
2048   uint32_t x619;
2049   fiat_p256_uint1 x620;
2050   fiat_p256_addcarryx_u32(&x619, &x620, 0x0, x588, x612);
2051   uint32_t x621;
2052   fiat_p256_uint1 x622;
2053   fiat_p256_addcarryx_u32(&x621, &x622, x620, x590, x614);
2054   uint32_t x623;
2055   fiat_p256_uint1 x624;
2056   fiat_p256_addcarryx_u32(&x623, &x624, x622, x592, x616);
2057   uint32_t x625;
2058   fiat_p256_uint1 x626;
2059   fiat_p256_addcarryx_u32(&x625, &x626, x624, x594, x618);
2060   uint32_t x627;
2061   fiat_p256_uint1 x628;
2062   fiat_p256_addcarryx_u32(&x627, &x628, x626, x596, 0x0);
2063   uint32_t x629;
2064   fiat_p256_uint1 x630;
2065   fiat_p256_addcarryx_u32(&x629, &x630, x628, x598, 0x0);
2066   uint32_t x631;
2067   fiat_p256_uint1 x632;
2068   fiat_p256_addcarryx_u32(&x631, &x632, x630, x600, x588);
2069   uint32_t x633;
2070   fiat_p256_uint1 x634;
2071   fiat_p256_addcarryx_u32(&x633, &x634, x632, x602, x606);
2072   uint32_t x635;
2073   fiat_p256_uint1 x636;
2074   fiat_p256_addcarryx_u32(&x635, &x636, x634, x604, x607);
2075   uint32_t x637 = ((uint32_t)x636 + x605);
2076   uint32_t x638;
2077   fiat_p256_uint1 x639;
2078   fiat_p256_subborrowx_u32(&x638, &x639, 0x0, x621, UINT32_C(0xffffffff));
2079   uint32_t x640;
2080   fiat_p256_uint1 x641;
2081   fiat_p256_subborrowx_u32(&x640, &x641, x639, x623, UINT32_C(0xffffffff));
2082   uint32_t x642;
2083   fiat_p256_uint1 x643;
2084   fiat_p256_subborrowx_u32(&x642, &x643, x641, x625, UINT32_C(0xffffffff));
2085   uint32_t x644;
2086   fiat_p256_uint1 x645;
2087   fiat_p256_subborrowx_u32(&x644, &x645, x643, x627, 0x0);
2088   uint32_t x646;
2089   fiat_p256_uint1 x647;
2090   fiat_p256_subborrowx_u32(&x646, &x647, x645, x629, 0x0);
2091   uint32_t x648;
2092   fiat_p256_uint1 x649;
2093   fiat_p256_subborrowx_u32(&x648, &x649, x647, x631, 0x0);
2094   uint32_t x650;
2095   fiat_p256_uint1 x651;
2096   fiat_p256_subborrowx_u32(&x650, &x651, x649, x633, 0x1);
2097   uint32_t x652;
2098   fiat_p256_uint1 x653;
2099   fiat_p256_subborrowx_u32(&x652, &x653, x651, x635, UINT32_C(0xffffffff));
2100   uint32_t x654;
2101   fiat_p256_uint1 x655;
2102   fiat_p256_subborrowx_u32(&x654, &x655, x653, x637, 0x0);
2103   uint32_t x656;
2104   fiat_p256_cmovznz_u32(&x656, x655, x638, x621);
2105   uint32_t x657;
2106   fiat_p256_cmovznz_u32(&x657, x655, x640, x623);
2107   uint32_t x658;
2108   fiat_p256_cmovznz_u32(&x658, x655, x642, x625);
2109   uint32_t x659;
2110   fiat_p256_cmovznz_u32(&x659, x655, x644, x627);
2111   uint32_t x660;
2112   fiat_p256_cmovznz_u32(&x660, x655, x646, x629);
2113   uint32_t x661;
2114   fiat_p256_cmovznz_u32(&x661, x655, x648, x631);
2115   uint32_t x662;
2116   fiat_p256_cmovznz_u32(&x662, x655, x650, x633);
2117   uint32_t x663;
2118   fiat_p256_cmovznz_u32(&x663, x655, x652, x635);
2119   out1[0] = x656;
2120   out1[1] = x657;
2121   out1[2] = x658;
2122   out1[3] = x659;
2123   out1[4] = x660;
2124   out1[5] = x661;
2125   out1[6] = x662;
2126   out1[7] = x663;
2127 }
2128 
2129 /*
2130  * The function fiat_p256_add adds two field elements in the Montgomery domain.
2131  * Preconditions:
2132  *   0 ≤ eval arg1 < m
2133  *   0 ≤ eval arg2 < m
2134  * Postconditions:
2135  *   eval (from_montgomery out1) mod m = (eval (from_montgomery arg1) + eval (from_montgomery arg2)) mod m
2136  *   0 ≤ eval out1 < m
2137  *
2138  * Input Bounds:
2139  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2140  *   arg2: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2141  * Output Bounds:
2142  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2143  */
fiat_p256_add(uint32_t out1[8],const uint32_t arg1[8],const uint32_t arg2[8])2144 static void fiat_p256_add(uint32_t out1[8], const uint32_t arg1[8], const uint32_t arg2[8]) {
2145   uint32_t x1;
2146   fiat_p256_uint1 x2;
2147   fiat_p256_addcarryx_u32(&x1, &x2, 0x0, (arg1[0]), (arg2[0]));
2148   uint32_t x3;
2149   fiat_p256_uint1 x4;
2150   fiat_p256_addcarryx_u32(&x3, &x4, x2, (arg1[1]), (arg2[1]));
2151   uint32_t x5;
2152   fiat_p256_uint1 x6;
2153   fiat_p256_addcarryx_u32(&x5, &x6, x4, (arg1[2]), (arg2[2]));
2154   uint32_t x7;
2155   fiat_p256_uint1 x8;
2156   fiat_p256_addcarryx_u32(&x7, &x8, x6, (arg1[3]), (arg2[3]));
2157   uint32_t x9;
2158   fiat_p256_uint1 x10;
2159   fiat_p256_addcarryx_u32(&x9, &x10, x8, (arg1[4]), (arg2[4]));
2160   uint32_t x11;
2161   fiat_p256_uint1 x12;
2162   fiat_p256_addcarryx_u32(&x11, &x12, x10, (arg1[5]), (arg2[5]));
2163   uint32_t x13;
2164   fiat_p256_uint1 x14;
2165   fiat_p256_addcarryx_u32(&x13, &x14, x12, (arg1[6]), (arg2[6]));
2166   uint32_t x15;
2167   fiat_p256_uint1 x16;
2168   fiat_p256_addcarryx_u32(&x15, &x16, x14, (arg1[7]), (arg2[7]));
2169   uint32_t x17;
2170   fiat_p256_uint1 x18;
2171   fiat_p256_subborrowx_u32(&x17, &x18, 0x0, x1, UINT32_C(0xffffffff));
2172   uint32_t x19;
2173   fiat_p256_uint1 x20;
2174   fiat_p256_subborrowx_u32(&x19, &x20, x18, x3, UINT32_C(0xffffffff));
2175   uint32_t x21;
2176   fiat_p256_uint1 x22;
2177   fiat_p256_subborrowx_u32(&x21, &x22, x20, x5, UINT32_C(0xffffffff));
2178   uint32_t x23;
2179   fiat_p256_uint1 x24;
2180   fiat_p256_subborrowx_u32(&x23, &x24, x22, x7, 0x0);
2181   uint32_t x25;
2182   fiat_p256_uint1 x26;
2183   fiat_p256_subborrowx_u32(&x25, &x26, x24, x9, 0x0);
2184   uint32_t x27;
2185   fiat_p256_uint1 x28;
2186   fiat_p256_subborrowx_u32(&x27, &x28, x26, x11, 0x0);
2187   uint32_t x29;
2188   fiat_p256_uint1 x30;
2189   fiat_p256_subborrowx_u32(&x29, &x30, x28, x13, 0x1);
2190   uint32_t x31;
2191   fiat_p256_uint1 x32;
2192   fiat_p256_subborrowx_u32(&x31, &x32, x30, x15, UINT32_C(0xffffffff));
2193   uint32_t x33;
2194   fiat_p256_uint1 x34;
2195   fiat_p256_subborrowx_u32(&x33, &x34, x32, x16, 0x0);
2196   uint32_t x35;
2197   fiat_p256_cmovznz_u32(&x35, x34, x17, x1);
2198   uint32_t x36;
2199   fiat_p256_cmovznz_u32(&x36, x34, x19, x3);
2200   uint32_t x37;
2201   fiat_p256_cmovznz_u32(&x37, x34, x21, x5);
2202   uint32_t x38;
2203   fiat_p256_cmovznz_u32(&x38, x34, x23, x7);
2204   uint32_t x39;
2205   fiat_p256_cmovznz_u32(&x39, x34, x25, x9);
2206   uint32_t x40;
2207   fiat_p256_cmovznz_u32(&x40, x34, x27, x11);
2208   uint32_t x41;
2209   fiat_p256_cmovznz_u32(&x41, x34, x29, x13);
2210   uint32_t x42;
2211   fiat_p256_cmovznz_u32(&x42, x34, x31, x15);
2212   out1[0] = x35;
2213   out1[1] = x36;
2214   out1[2] = x37;
2215   out1[3] = x38;
2216   out1[4] = x39;
2217   out1[5] = x40;
2218   out1[6] = x41;
2219   out1[7] = x42;
2220 }
2221 
2222 /*
2223  * The function fiat_p256_sub subtracts two field elements in the Montgomery domain.
2224  * Preconditions:
2225  *   0 ≤ eval arg1 < m
2226  *   0 ≤ eval arg2 < m
2227  * Postconditions:
2228  *   eval (from_montgomery out1) mod m = (eval (from_montgomery arg1) - eval (from_montgomery arg2)) mod m
2229  *   0 ≤ eval out1 < m
2230  *
2231  * Input Bounds:
2232  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2233  *   arg2: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2234  * Output Bounds:
2235  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2236  */
fiat_p256_sub(uint32_t out1[8],const uint32_t arg1[8],const uint32_t arg2[8])2237 static void fiat_p256_sub(uint32_t out1[8], const uint32_t arg1[8], const uint32_t arg2[8]) {
2238   uint32_t x1;
2239   fiat_p256_uint1 x2;
2240   fiat_p256_subborrowx_u32(&x1, &x2, 0x0, (arg1[0]), (arg2[0]));
2241   uint32_t x3;
2242   fiat_p256_uint1 x4;
2243   fiat_p256_subborrowx_u32(&x3, &x4, x2, (arg1[1]), (arg2[1]));
2244   uint32_t x5;
2245   fiat_p256_uint1 x6;
2246   fiat_p256_subborrowx_u32(&x5, &x6, x4, (arg1[2]), (arg2[2]));
2247   uint32_t x7;
2248   fiat_p256_uint1 x8;
2249   fiat_p256_subborrowx_u32(&x7, &x8, x6, (arg1[3]), (arg2[3]));
2250   uint32_t x9;
2251   fiat_p256_uint1 x10;
2252   fiat_p256_subborrowx_u32(&x9, &x10, x8, (arg1[4]), (arg2[4]));
2253   uint32_t x11;
2254   fiat_p256_uint1 x12;
2255   fiat_p256_subborrowx_u32(&x11, &x12, x10, (arg1[5]), (arg2[5]));
2256   uint32_t x13;
2257   fiat_p256_uint1 x14;
2258   fiat_p256_subborrowx_u32(&x13, &x14, x12, (arg1[6]), (arg2[6]));
2259   uint32_t x15;
2260   fiat_p256_uint1 x16;
2261   fiat_p256_subborrowx_u32(&x15, &x16, x14, (arg1[7]), (arg2[7]));
2262   uint32_t x17;
2263   fiat_p256_cmovznz_u32(&x17, x16, 0x0, UINT32_C(0xffffffff));
2264   uint32_t x18;
2265   fiat_p256_uint1 x19;
2266   fiat_p256_addcarryx_u32(&x18, &x19, 0x0, x1, (x17 & UINT32_C(0xffffffff)));
2267   uint32_t x20;
2268   fiat_p256_uint1 x21;
2269   fiat_p256_addcarryx_u32(&x20, &x21, x19, x3, (x17 & UINT32_C(0xffffffff)));
2270   uint32_t x22;
2271   fiat_p256_uint1 x23;
2272   fiat_p256_addcarryx_u32(&x22, &x23, x21, x5, (x17 & UINT32_C(0xffffffff)));
2273   uint32_t x24;
2274   fiat_p256_uint1 x25;
2275   fiat_p256_addcarryx_u32(&x24, &x25, x23, x7, 0x0);
2276   uint32_t x26;
2277   fiat_p256_uint1 x27;
2278   fiat_p256_addcarryx_u32(&x26, &x27, x25, x9, 0x0);
2279   uint32_t x28;
2280   fiat_p256_uint1 x29;
2281   fiat_p256_addcarryx_u32(&x28, &x29, x27, x11, 0x0);
2282   uint32_t x30;
2283   fiat_p256_uint1 x31;
2284   fiat_p256_addcarryx_u32(&x30, &x31, x29, x13, (fiat_p256_uint1)(x17 & 0x1));
2285   uint32_t x32;
2286   fiat_p256_uint1 x33;
2287   fiat_p256_addcarryx_u32(&x32, &x33, x31, x15, (x17 & UINT32_C(0xffffffff)));
2288   out1[0] = x18;
2289   out1[1] = x20;
2290   out1[2] = x22;
2291   out1[3] = x24;
2292   out1[4] = x26;
2293   out1[5] = x28;
2294   out1[6] = x30;
2295   out1[7] = x32;
2296 }
2297 
2298 /*
2299  * The function fiat_p256_opp negates a field element in the Montgomery domain.
2300  * Preconditions:
2301  *   0 ≤ eval arg1 < m
2302  * Postconditions:
2303  *   eval (from_montgomery out1) mod m = -eval (from_montgomery arg1) mod m
2304  *   0 ≤ eval out1 < m
2305  *
2306  * Input Bounds:
2307  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2308  * Output Bounds:
2309  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2310  */
fiat_p256_opp(uint32_t out1[8],const uint32_t arg1[8])2311 static void fiat_p256_opp(uint32_t out1[8], const uint32_t arg1[8]) {
2312   uint32_t x1;
2313   fiat_p256_uint1 x2;
2314   fiat_p256_subborrowx_u32(&x1, &x2, 0x0, 0x0, (arg1[0]));
2315   uint32_t x3;
2316   fiat_p256_uint1 x4;
2317   fiat_p256_subborrowx_u32(&x3, &x4, x2, 0x0, (arg1[1]));
2318   uint32_t x5;
2319   fiat_p256_uint1 x6;
2320   fiat_p256_subborrowx_u32(&x5, &x6, x4, 0x0, (arg1[2]));
2321   uint32_t x7;
2322   fiat_p256_uint1 x8;
2323   fiat_p256_subborrowx_u32(&x7, &x8, x6, 0x0, (arg1[3]));
2324   uint32_t x9;
2325   fiat_p256_uint1 x10;
2326   fiat_p256_subborrowx_u32(&x9, &x10, x8, 0x0, (arg1[4]));
2327   uint32_t x11;
2328   fiat_p256_uint1 x12;
2329   fiat_p256_subborrowx_u32(&x11, &x12, x10, 0x0, (arg1[5]));
2330   uint32_t x13;
2331   fiat_p256_uint1 x14;
2332   fiat_p256_subborrowx_u32(&x13, &x14, x12, 0x0, (arg1[6]));
2333   uint32_t x15;
2334   fiat_p256_uint1 x16;
2335   fiat_p256_subborrowx_u32(&x15, &x16, x14, 0x0, (arg1[7]));
2336   uint32_t x17;
2337   fiat_p256_cmovznz_u32(&x17, x16, 0x0, UINT32_C(0xffffffff));
2338   uint32_t x18;
2339   fiat_p256_uint1 x19;
2340   fiat_p256_addcarryx_u32(&x18, &x19, 0x0, x1, (x17 & UINT32_C(0xffffffff)));
2341   uint32_t x20;
2342   fiat_p256_uint1 x21;
2343   fiat_p256_addcarryx_u32(&x20, &x21, x19, x3, (x17 & UINT32_C(0xffffffff)));
2344   uint32_t x22;
2345   fiat_p256_uint1 x23;
2346   fiat_p256_addcarryx_u32(&x22, &x23, x21, x5, (x17 & UINT32_C(0xffffffff)));
2347   uint32_t x24;
2348   fiat_p256_uint1 x25;
2349   fiat_p256_addcarryx_u32(&x24, &x25, x23, x7, 0x0);
2350   uint32_t x26;
2351   fiat_p256_uint1 x27;
2352   fiat_p256_addcarryx_u32(&x26, &x27, x25, x9, 0x0);
2353   uint32_t x28;
2354   fiat_p256_uint1 x29;
2355   fiat_p256_addcarryx_u32(&x28, &x29, x27, x11, 0x0);
2356   uint32_t x30;
2357   fiat_p256_uint1 x31;
2358   fiat_p256_addcarryx_u32(&x30, &x31, x29, x13, (fiat_p256_uint1)(x17 & 0x1));
2359   uint32_t x32;
2360   fiat_p256_uint1 x33;
2361   fiat_p256_addcarryx_u32(&x32, &x33, x31, x15, (x17 & UINT32_C(0xffffffff)));
2362   out1[0] = x18;
2363   out1[1] = x20;
2364   out1[2] = x22;
2365   out1[3] = x24;
2366   out1[4] = x26;
2367   out1[5] = x28;
2368   out1[6] = x30;
2369   out1[7] = x32;
2370 }
2371 
2372 /*
2373  * The function fiat_p256_from_montgomery translates a field element out of the Montgomery domain.
2374  * Preconditions:
2375  *   0 ≤ eval arg1 < m
2376  * Postconditions:
2377  *   eval out1 mod m = (eval arg1 * ((2^32)⁻¹ mod m)^8) mod m
2378  *   0 ≤ eval out1 < m
2379  *
2380  * Input Bounds:
2381  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2382  * Output Bounds:
2383  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2384  */
fiat_p256_from_montgomery(uint32_t out1[8],const uint32_t arg1[8])2385 static void fiat_p256_from_montgomery(uint32_t out1[8], const uint32_t arg1[8]) {
2386   uint32_t x1 = (arg1[0]);
2387   uint32_t x2;
2388   uint32_t x3;
2389   fiat_p256_mulx_u32(&x2, &x3, x1, UINT32_C(0xffffffff));
2390   uint32_t x4;
2391   uint32_t x5;
2392   fiat_p256_mulx_u32(&x4, &x5, x1, UINT32_C(0xffffffff));
2393   uint32_t x6;
2394   uint32_t x7;
2395   fiat_p256_mulx_u32(&x6, &x7, x1, UINT32_C(0xffffffff));
2396   uint32_t x8;
2397   uint32_t x9;
2398   fiat_p256_mulx_u32(&x8, &x9, x1, UINT32_C(0xffffffff));
2399   uint32_t x10;
2400   fiat_p256_uint1 x11;
2401   fiat_p256_addcarryx_u32(&x10, &x11, 0x0, x9, x6);
2402   uint32_t x12;
2403   fiat_p256_uint1 x13;
2404   fiat_p256_addcarryx_u32(&x12, &x13, x11, x7, x4);
2405   uint32_t x14;
2406   fiat_p256_uint1 x15;
2407   fiat_p256_addcarryx_u32(&x14, &x15, 0x0, x1, x8);
2408   uint32_t x16;
2409   fiat_p256_uint1 x17;
2410   fiat_p256_addcarryx_u32(&x16, &x17, x15, 0x0, x10);
2411   uint32_t x18;
2412   fiat_p256_uint1 x19;
2413   fiat_p256_addcarryx_u32(&x18, &x19, x17, 0x0, x12);
2414   uint32_t x20;
2415   fiat_p256_uint1 x21;
2416   fiat_p256_addcarryx_u32(&x20, &x21, x19, 0x0, (x13 + x5));
2417   uint32_t x22;
2418   fiat_p256_uint1 x23;
2419   fiat_p256_addcarryx_u32(&x22, &x23, 0x0, x16, (arg1[1]));
2420   uint32_t x24;
2421   fiat_p256_uint1 x25;
2422   fiat_p256_addcarryx_u32(&x24, &x25, x23, x18, 0x0);
2423   uint32_t x26;
2424   fiat_p256_uint1 x27;
2425   fiat_p256_addcarryx_u32(&x26, &x27, x25, x20, 0x0);
2426   uint32_t x28;
2427   uint32_t x29;
2428   fiat_p256_mulx_u32(&x28, &x29, x22, UINT32_C(0xffffffff));
2429   uint32_t x30;
2430   uint32_t x31;
2431   fiat_p256_mulx_u32(&x30, &x31, x22, UINT32_C(0xffffffff));
2432   uint32_t x32;
2433   uint32_t x33;
2434   fiat_p256_mulx_u32(&x32, &x33, x22, UINT32_C(0xffffffff));
2435   uint32_t x34;
2436   uint32_t x35;
2437   fiat_p256_mulx_u32(&x34, &x35, x22, UINT32_C(0xffffffff));
2438   uint32_t x36;
2439   fiat_p256_uint1 x37;
2440   fiat_p256_addcarryx_u32(&x36, &x37, 0x0, x35, x32);
2441   uint32_t x38;
2442   fiat_p256_uint1 x39;
2443   fiat_p256_addcarryx_u32(&x38, &x39, x37, x33, x30);
2444   uint32_t x40;
2445   fiat_p256_uint1 x41;
2446   fiat_p256_addcarryx_u32(&x40, &x41, 0x0, x22, x34);
2447   uint32_t x42;
2448   fiat_p256_uint1 x43;
2449   fiat_p256_addcarryx_u32(&x42, &x43, x41, x24, x36);
2450   uint32_t x44;
2451   fiat_p256_uint1 x45;
2452   fiat_p256_addcarryx_u32(&x44, &x45, x43, x26, x38);
2453   uint32_t x46;
2454   fiat_p256_uint1 x47;
2455   fiat_p256_addcarryx_u32(&x46, &x47, x45, ((uint32_t)x27 + x21), (x39 + x31));
2456   uint32_t x48;
2457   fiat_p256_uint1 x49;
2458   fiat_p256_addcarryx_u32(&x48, &x49, 0x0, x2, x22);
2459   uint32_t x50;
2460   fiat_p256_uint1 x51;
2461   fiat_p256_addcarryx_u32(&x50, &x51, x49, x3, x28);
2462   uint32_t x52;
2463   fiat_p256_uint1 x53;
2464   fiat_p256_addcarryx_u32(&x52, &x53, 0x0, x42, (arg1[2]));
2465   uint32_t x54;
2466   fiat_p256_uint1 x55;
2467   fiat_p256_addcarryx_u32(&x54, &x55, x53, x44, 0x0);
2468   uint32_t x56;
2469   fiat_p256_uint1 x57;
2470   fiat_p256_addcarryx_u32(&x56, &x57, x55, x46, 0x0);
2471   uint32_t x58;
2472   uint32_t x59;
2473   fiat_p256_mulx_u32(&x58, &x59, x52, UINT32_C(0xffffffff));
2474   uint32_t x60;
2475   uint32_t x61;
2476   fiat_p256_mulx_u32(&x60, &x61, x52, UINT32_C(0xffffffff));
2477   uint32_t x62;
2478   uint32_t x63;
2479   fiat_p256_mulx_u32(&x62, &x63, x52, UINT32_C(0xffffffff));
2480   uint32_t x64;
2481   uint32_t x65;
2482   fiat_p256_mulx_u32(&x64, &x65, x52, UINT32_C(0xffffffff));
2483   uint32_t x66;
2484   fiat_p256_uint1 x67;
2485   fiat_p256_addcarryx_u32(&x66, &x67, 0x0, x65, x62);
2486   uint32_t x68;
2487   fiat_p256_uint1 x69;
2488   fiat_p256_addcarryx_u32(&x68, &x69, x67, x63, x60);
2489   uint32_t x70;
2490   fiat_p256_uint1 x71;
2491   fiat_p256_addcarryx_u32(&x70, &x71, 0x0, x52, x64);
2492   uint32_t x72;
2493   fiat_p256_uint1 x73;
2494   fiat_p256_addcarryx_u32(&x72, &x73, x71, x54, x66);
2495   uint32_t x74;
2496   fiat_p256_uint1 x75;
2497   fiat_p256_addcarryx_u32(&x74, &x75, x73, x56, x68);
2498   uint32_t x76;
2499   fiat_p256_uint1 x77;
2500   fiat_p256_addcarryx_u32(&x76, &x77, x75, ((uint32_t)x57 + x47), (x69 + x61));
2501   uint32_t x78;
2502   fiat_p256_uint1 x79;
2503   fiat_p256_addcarryx_u32(&x78, &x79, x77, x1, 0x0);
2504   uint32_t x80;
2505   fiat_p256_uint1 x81;
2506   fiat_p256_addcarryx_u32(&x80, &x81, x79, x48, 0x0);
2507   uint32_t x82;
2508   fiat_p256_uint1 x83;
2509   fiat_p256_addcarryx_u32(&x82, &x83, x81, x50, x52);
2510   uint32_t x84;
2511   fiat_p256_uint1 x85;
2512   fiat_p256_addcarryx_u32(&x84, &x85, x83, (x51 + x29), x58);
2513   uint32_t x86;
2514   fiat_p256_uint1 x87;
2515   fiat_p256_addcarryx_u32(&x86, &x87, 0x0, x72, (arg1[3]));
2516   uint32_t x88;
2517   fiat_p256_uint1 x89;
2518   fiat_p256_addcarryx_u32(&x88, &x89, x87, x74, 0x0);
2519   uint32_t x90;
2520   fiat_p256_uint1 x91;
2521   fiat_p256_addcarryx_u32(&x90, &x91, x89, x76, 0x0);
2522   uint32_t x92;
2523   fiat_p256_uint1 x93;
2524   fiat_p256_addcarryx_u32(&x92, &x93, x91, x78, 0x0);
2525   uint32_t x94;
2526   fiat_p256_uint1 x95;
2527   fiat_p256_addcarryx_u32(&x94, &x95, x93, x80, 0x0);
2528   uint32_t x96;
2529   fiat_p256_uint1 x97;
2530   fiat_p256_addcarryx_u32(&x96, &x97, x95, x82, 0x0);
2531   uint32_t x98;
2532   fiat_p256_uint1 x99;
2533   fiat_p256_addcarryx_u32(&x98, &x99, x97, x84, 0x0);
2534   uint32_t x100;
2535   fiat_p256_uint1 x101;
2536   fiat_p256_addcarryx_u32(&x100, &x101, x99, (x85 + x59), 0x0);
2537   uint32_t x102;
2538   uint32_t x103;
2539   fiat_p256_mulx_u32(&x102, &x103, x86, UINT32_C(0xffffffff));
2540   uint32_t x104;
2541   uint32_t x105;
2542   fiat_p256_mulx_u32(&x104, &x105, x86, UINT32_C(0xffffffff));
2543   uint32_t x106;
2544   uint32_t x107;
2545   fiat_p256_mulx_u32(&x106, &x107, x86, UINT32_C(0xffffffff));
2546   uint32_t x108;
2547   uint32_t x109;
2548   fiat_p256_mulx_u32(&x108, &x109, x86, UINT32_C(0xffffffff));
2549   uint32_t x110;
2550   fiat_p256_uint1 x111;
2551   fiat_p256_addcarryx_u32(&x110, &x111, 0x0, x109, x106);
2552   uint32_t x112;
2553   fiat_p256_uint1 x113;
2554   fiat_p256_addcarryx_u32(&x112, &x113, x111, x107, x104);
2555   uint32_t x114;
2556   fiat_p256_uint1 x115;
2557   fiat_p256_addcarryx_u32(&x114, &x115, 0x0, x86, x108);
2558   uint32_t x116;
2559   fiat_p256_uint1 x117;
2560   fiat_p256_addcarryx_u32(&x116, &x117, x115, x88, x110);
2561   uint32_t x118;
2562   fiat_p256_uint1 x119;
2563   fiat_p256_addcarryx_u32(&x118, &x119, x117, x90, x112);
2564   uint32_t x120;
2565   fiat_p256_uint1 x121;
2566   fiat_p256_addcarryx_u32(&x120, &x121, x119, x92, (x113 + x105));
2567   uint32_t x122;
2568   fiat_p256_uint1 x123;
2569   fiat_p256_addcarryx_u32(&x122, &x123, x121, x94, 0x0);
2570   uint32_t x124;
2571   fiat_p256_uint1 x125;
2572   fiat_p256_addcarryx_u32(&x124, &x125, x123, x96, 0x0);
2573   uint32_t x126;
2574   fiat_p256_uint1 x127;
2575   fiat_p256_addcarryx_u32(&x126, &x127, x125, x98, x86);
2576   uint32_t x128;
2577   fiat_p256_uint1 x129;
2578   fiat_p256_addcarryx_u32(&x128, &x129, x127, x100, x102);
2579   uint32_t x130;
2580   fiat_p256_uint1 x131;
2581   fiat_p256_addcarryx_u32(&x130, &x131, x129, x101, x103);
2582   uint32_t x132;
2583   fiat_p256_uint1 x133;
2584   fiat_p256_addcarryx_u32(&x132, &x133, 0x0, x116, (arg1[4]));
2585   uint32_t x134;
2586   fiat_p256_uint1 x135;
2587   fiat_p256_addcarryx_u32(&x134, &x135, x133, x118, 0x0);
2588   uint32_t x136;
2589   fiat_p256_uint1 x137;
2590   fiat_p256_addcarryx_u32(&x136, &x137, x135, x120, 0x0);
2591   uint32_t x138;
2592   fiat_p256_uint1 x139;
2593   fiat_p256_addcarryx_u32(&x138, &x139, x137, x122, 0x0);
2594   uint32_t x140;
2595   fiat_p256_uint1 x141;
2596   fiat_p256_addcarryx_u32(&x140, &x141, x139, x124, 0x0);
2597   uint32_t x142;
2598   fiat_p256_uint1 x143;
2599   fiat_p256_addcarryx_u32(&x142, &x143, x141, x126, 0x0);
2600   uint32_t x144;
2601   fiat_p256_uint1 x145;
2602   fiat_p256_addcarryx_u32(&x144, &x145, x143, x128, 0x0);
2603   uint32_t x146;
2604   fiat_p256_uint1 x147;
2605   fiat_p256_addcarryx_u32(&x146, &x147, x145, x130, 0x0);
2606   uint32_t x148;
2607   uint32_t x149;
2608   fiat_p256_mulx_u32(&x148, &x149, x132, UINT32_C(0xffffffff));
2609   uint32_t x150;
2610   uint32_t x151;
2611   fiat_p256_mulx_u32(&x150, &x151, x132, UINT32_C(0xffffffff));
2612   uint32_t x152;
2613   uint32_t x153;
2614   fiat_p256_mulx_u32(&x152, &x153, x132, UINT32_C(0xffffffff));
2615   uint32_t x154;
2616   uint32_t x155;
2617   fiat_p256_mulx_u32(&x154, &x155, x132, UINT32_C(0xffffffff));
2618   uint32_t x156;
2619   fiat_p256_uint1 x157;
2620   fiat_p256_addcarryx_u32(&x156, &x157, 0x0, x155, x152);
2621   uint32_t x158;
2622   fiat_p256_uint1 x159;
2623   fiat_p256_addcarryx_u32(&x158, &x159, x157, x153, x150);
2624   uint32_t x160;
2625   fiat_p256_uint1 x161;
2626   fiat_p256_addcarryx_u32(&x160, &x161, 0x0, x132, x154);
2627   uint32_t x162;
2628   fiat_p256_uint1 x163;
2629   fiat_p256_addcarryx_u32(&x162, &x163, x161, x134, x156);
2630   uint32_t x164;
2631   fiat_p256_uint1 x165;
2632   fiat_p256_addcarryx_u32(&x164, &x165, x163, x136, x158);
2633   uint32_t x166;
2634   fiat_p256_uint1 x167;
2635   fiat_p256_addcarryx_u32(&x166, &x167, x165, x138, (x159 + x151));
2636   uint32_t x168;
2637   fiat_p256_uint1 x169;
2638   fiat_p256_addcarryx_u32(&x168, &x169, x167, x140, 0x0);
2639   uint32_t x170;
2640   fiat_p256_uint1 x171;
2641   fiat_p256_addcarryx_u32(&x170, &x171, x169, x142, 0x0);
2642   uint32_t x172;
2643   fiat_p256_uint1 x173;
2644   fiat_p256_addcarryx_u32(&x172, &x173, x171, x144, x132);
2645   uint32_t x174;
2646   fiat_p256_uint1 x175;
2647   fiat_p256_addcarryx_u32(&x174, &x175, x173, x146, x148);
2648   uint32_t x176;
2649   fiat_p256_uint1 x177;
2650   fiat_p256_addcarryx_u32(&x176, &x177, x175, ((uint32_t)x147 + x131), x149);
2651   uint32_t x178;
2652   fiat_p256_uint1 x179;
2653   fiat_p256_addcarryx_u32(&x178, &x179, 0x0, x162, (arg1[5]));
2654   uint32_t x180;
2655   fiat_p256_uint1 x181;
2656   fiat_p256_addcarryx_u32(&x180, &x181, x179, x164, 0x0);
2657   uint32_t x182;
2658   fiat_p256_uint1 x183;
2659   fiat_p256_addcarryx_u32(&x182, &x183, x181, x166, 0x0);
2660   uint32_t x184;
2661   fiat_p256_uint1 x185;
2662   fiat_p256_addcarryx_u32(&x184, &x185, x183, x168, 0x0);
2663   uint32_t x186;
2664   fiat_p256_uint1 x187;
2665   fiat_p256_addcarryx_u32(&x186, &x187, x185, x170, 0x0);
2666   uint32_t x188;
2667   fiat_p256_uint1 x189;
2668   fiat_p256_addcarryx_u32(&x188, &x189, x187, x172, 0x0);
2669   uint32_t x190;
2670   fiat_p256_uint1 x191;
2671   fiat_p256_addcarryx_u32(&x190, &x191, x189, x174, 0x0);
2672   uint32_t x192;
2673   fiat_p256_uint1 x193;
2674   fiat_p256_addcarryx_u32(&x192, &x193, x191, x176, 0x0);
2675   uint32_t x194;
2676   uint32_t x195;
2677   fiat_p256_mulx_u32(&x194, &x195, x178, UINT32_C(0xffffffff));
2678   uint32_t x196;
2679   uint32_t x197;
2680   fiat_p256_mulx_u32(&x196, &x197, x178, UINT32_C(0xffffffff));
2681   uint32_t x198;
2682   uint32_t x199;
2683   fiat_p256_mulx_u32(&x198, &x199, x178, UINT32_C(0xffffffff));
2684   uint32_t x200;
2685   uint32_t x201;
2686   fiat_p256_mulx_u32(&x200, &x201, x178, UINT32_C(0xffffffff));
2687   uint32_t x202;
2688   fiat_p256_uint1 x203;
2689   fiat_p256_addcarryx_u32(&x202, &x203, 0x0, x201, x198);
2690   uint32_t x204;
2691   fiat_p256_uint1 x205;
2692   fiat_p256_addcarryx_u32(&x204, &x205, x203, x199, x196);
2693   uint32_t x206;
2694   fiat_p256_uint1 x207;
2695   fiat_p256_addcarryx_u32(&x206, &x207, 0x0, x178, x200);
2696   uint32_t x208;
2697   fiat_p256_uint1 x209;
2698   fiat_p256_addcarryx_u32(&x208, &x209, x207, x180, x202);
2699   uint32_t x210;
2700   fiat_p256_uint1 x211;
2701   fiat_p256_addcarryx_u32(&x210, &x211, x209, x182, x204);
2702   uint32_t x212;
2703   fiat_p256_uint1 x213;
2704   fiat_p256_addcarryx_u32(&x212, &x213, x211, x184, (x205 + x197));
2705   uint32_t x214;
2706   fiat_p256_uint1 x215;
2707   fiat_p256_addcarryx_u32(&x214, &x215, x213, x186, 0x0);
2708   uint32_t x216;
2709   fiat_p256_uint1 x217;
2710   fiat_p256_addcarryx_u32(&x216, &x217, x215, x188, 0x0);
2711   uint32_t x218;
2712   fiat_p256_uint1 x219;
2713   fiat_p256_addcarryx_u32(&x218, &x219, x217, x190, x178);
2714   uint32_t x220;
2715   fiat_p256_uint1 x221;
2716   fiat_p256_addcarryx_u32(&x220, &x221, x219, x192, x194);
2717   uint32_t x222;
2718   fiat_p256_uint1 x223;
2719   fiat_p256_addcarryx_u32(&x222, &x223, x221, ((uint32_t)x193 + x177), x195);
2720   uint32_t x224;
2721   fiat_p256_uint1 x225;
2722   fiat_p256_addcarryx_u32(&x224, &x225, 0x0, x208, (arg1[6]));
2723   uint32_t x226;
2724   fiat_p256_uint1 x227;
2725   fiat_p256_addcarryx_u32(&x226, &x227, x225, x210, 0x0);
2726   uint32_t x228;
2727   fiat_p256_uint1 x229;
2728   fiat_p256_addcarryx_u32(&x228, &x229, x227, x212, 0x0);
2729   uint32_t x230;
2730   fiat_p256_uint1 x231;
2731   fiat_p256_addcarryx_u32(&x230, &x231, x229, x214, 0x0);
2732   uint32_t x232;
2733   fiat_p256_uint1 x233;
2734   fiat_p256_addcarryx_u32(&x232, &x233, x231, x216, 0x0);
2735   uint32_t x234;
2736   fiat_p256_uint1 x235;
2737   fiat_p256_addcarryx_u32(&x234, &x235, x233, x218, 0x0);
2738   uint32_t x236;
2739   fiat_p256_uint1 x237;
2740   fiat_p256_addcarryx_u32(&x236, &x237, x235, x220, 0x0);
2741   uint32_t x238;
2742   fiat_p256_uint1 x239;
2743   fiat_p256_addcarryx_u32(&x238, &x239, x237, x222, 0x0);
2744   uint32_t x240;
2745   uint32_t x241;
2746   fiat_p256_mulx_u32(&x240, &x241, x224, UINT32_C(0xffffffff));
2747   uint32_t x242;
2748   uint32_t x243;
2749   fiat_p256_mulx_u32(&x242, &x243, x224, UINT32_C(0xffffffff));
2750   uint32_t x244;
2751   uint32_t x245;
2752   fiat_p256_mulx_u32(&x244, &x245, x224, UINT32_C(0xffffffff));
2753   uint32_t x246;
2754   uint32_t x247;
2755   fiat_p256_mulx_u32(&x246, &x247, x224, UINT32_C(0xffffffff));
2756   uint32_t x248;
2757   fiat_p256_uint1 x249;
2758   fiat_p256_addcarryx_u32(&x248, &x249, 0x0, x247, x244);
2759   uint32_t x250;
2760   fiat_p256_uint1 x251;
2761   fiat_p256_addcarryx_u32(&x250, &x251, x249, x245, x242);
2762   uint32_t x252;
2763   fiat_p256_uint1 x253;
2764   fiat_p256_addcarryx_u32(&x252, &x253, 0x0, x224, x246);
2765   uint32_t x254;
2766   fiat_p256_uint1 x255;
2767   fiat_p256_addcarryx_u32(&x254, &x255, x253, x226, x248);
2768   uint32_t x256;
2769   fiat_p256_uint1 x257;
2770   fiat_p256_addcarryx_u32(&x256, &x257, x255, x228, x250);
2771   uint32_t x258;
2772   fiat_p256_uint1 x259;
2773   fiat_p256_addcarryx_u32(&x258, &x259, x257, x230, (x251 + x243));
2774   uint32_t x260;
2775   fiat_p256_uint1 x261;
2776   fiat_p256_addcarryx_u32(&x260, &x261, x259, x232, 0x0);
2777   uint32_t x262;
2778   fiat_p256_uint1 x263;
2779   fiat_p256_addcarryx_u32(&x262, &x263, x261, x234, 0x0);
2780   uint32_t x264;
2781   fiat_p256_uint1 x265;
2782   fiat_p256_addcarryx_u32(&x264, &x265, x263, x236, x224);
2783   uint32_t x266;
2784   fiat_p256_uint1 x267;
2785   fiat_p256_addcarryx_u32(&x266, &x267, x265, x238, x240);
2786   uint32_t x268;
2787   fiat_p256_uint1 x269;
2788   fiat_p256_addcarryx_u32(&x268, &x269, x267, ((uint32_t)x239 + x223), x241);
2789   uint32_t x270;
2790   fiat_p256_uint1 x271;
2791   fiat_p256_addcarryx_u32(&x270, &x271, 0x0, x254, (arg1[7]));
2792   uint32_t x272;
2793   fiat_p256_uint1 x273;
2794   fiat_p256_addcarryx_u32(&x272, &x273, x271, x256, 0x0);
2795   uint32_t x274;
2796   fiat_p256_uint1 x275;
2797   fiat_p256_addcarryx_u32(&x274, &x275, x273, x258, 0x0);
2798   uint32_t x276;
2799   fiat_p256_uint1 x277;
2800   fiat_p256_addcarryx_u32(&x276, &x277, x275, x260, 0x0);
2801   uint32_t x278;
2802   fiat_p256_uint1 x279;
2803   fiat_p256_addcarryx_u32(&x278, &x279, x277, x262, 0x0);
2804   uint32_t x280;
2805   fiat_p256_uint1 x281;
2806   fiat_p256_addcarryx_u32(&x280, &x281, x279, x264, 0x0);
2807   uint32_t x282;
2808   fiat_p256_uint1 x283;
2809   fiat_p256_addcarryx_u32(&x282, &x283, x281, x266, 0x0);
2810   uint32_t x284;
2811   fiat_p256_uint1 x285;
2812   fiat_p256_addcarryx_u32(&x284, &x285, x283, x268, 0x0);
2813   uint32_t x286;
2814   uint32_t x287;
2815   fiat_p256_mulx_u32(&x286, &x287, x270, UINT32_C(0xffffffff));
2816   uint32_t x288;
2817   uint32_t x289;
2818   fiat_p256_mulx_u32(&x288, &x289, x270, UINT32_C(0xffffffff));
2819   uint32_t x290;
2820   uint32_t x291;
2821   fiat_p256_mulx_u32(&x290, &x291, x270, UINT32_C(0xffffffff));
2822   uint32_t x292;
2823   uint32_t x293;
2824   fiat_p256_mulx_u32(&x292, &x293, x270, UINT32_C(0xffffffff));
2825   uint32_t x294;
2826   fiat_p256_uint1 x295;
2827   fiat_p256_addcarryx_u32(&x294, &x295, 0x0, x293, x290);
2828   uint32_t x296;
2829   fiat_p256_uint1 x297;
2830   fiat_p256_addcarryx_u32(&x296, &x297, x295, x291, x288);
2831   uint32_t x298;
2832   fiat_p256_uint1 x299;
2833   fiat_p256_addcarryx_u32(&x298, &x299, 0x0, x270, x292);
2834   uint32_t x300;
2835   fiat_p256_uint1 x301;
2836   fiat_p256_addcarryx_u32(&x300, &x301, x299, x272, x294);
2837   uint32_t x302;
2838   fiat_p256_uint1 x303;
2839   fiat_p256_addcarryx_u32(&x302, &x303, x301, x274, x296);
2840   uint32_t x304;
2841   fiat_p256_uint1 x305;
2842   fiat_p256_addcarryx_u32(&x304, &x305, x303, x276, (x297 + x289));
2843   uint32_t x306;
2844   fiat_p256_uint1 x307;
2845   fiat_p256_addcarryx_u32(&x306, &x307, x305, x278, 0x0);
2846   uint32_t x308;
2847   fiat_p256_uint1 x309;
2848   fiat_p256_addcarryx_u32(&x308, &x309, x307, x280, 0x0);
2849   uint32_t x310;
2850   fiat_p256_uint1 x311;
2851   fiat_p256_addcarryx_u32(&x310, &x311, x309, x282, x270);
2852   uint32_t x312;
2853   fiat_p256_uint1 x313;
2854   fiat_p256_addcarryx_u32(&x312, &x313, x311, x284, x286);
2855   uint32_t x314;
2856   fiat_p256_uint1 x315;
2857   fiat_p256_addcarryx_u32(&x314, &x315, x313, ((uint32_t)x285 + x269), x287);
2858   uint32_t x316;
2859   fiat_p256_uint1 x317;
2860   fiat_p256_subborrowx_u32(&x316, &x317, 0x0, x300, UINT32_C(0xffffffff));
2861   uint32_t x318;
2862   fiat_p256_uint1 x319;
2863   fiat_p256_subborrowx_u32(&x318, &x319, x317, x302, UINT32_C(0xffffffff));
2864   uint32_t x320;
2865   fiat_p256_uint1 x321;
2866   fiat_p256_subborrowx_u32(&x320, &x321, x319, x304, UINT32_C(0xffffffff));
2867   uint32_t x322;
2868   fiat_p256_uint1 x323;
2869   fiat_p256_subborrowx_u32(&x322, &x323, x321, x306, 0x0);
2870   uint32_t x324;
2871   fiat_p256_uint1 x325;
2872   fiat_p256_subborrowx_u32(&x324, &x325, x323, x308, 0x0);
2873   uint32_t x326;
2874   fiat_p256_uint1 x327;
2875   fiat_p256_subborrowx_u32(&x326, &x327, x325, x310, 0x0);
2876   uint32_t x328;
2877   fiat_p256_uint1 x329;
2878   fiat_p256_subborrowx_u32(&x328, &x329, x327, x312, 0x1);
2879   uint32_t x330;
2880   fiat_p256_uint1 x331;
2881   fiat_p256_subborrowx_u32(&x330, &x331, x329, x314, UINT32_C(0xffffffff));
2882   uint32_t x332;
2883   fiat_p256_uint1 x333;
2884   fiat_p256_subborrowx_u32(&x332, &x333, x331, x315, 0x0);
2885   uint32_t x334;
2886   fiat_p256_cmovznz_u32(&x334, x333, x316, x300);
2887   uint32_t x335;
2888   fiat_p256_cmovznz_u32(&x335, x333, x318, x302);
2889   uint32_t x336;
2890   fiat_p256_cmovznz_u32(&x336, x333, x320, x304);
2891   uint32_t x337;
2892   fiat_p256_cmovznz_u32(&x337, x333, x322, x306);
2893   uint32_t x338;
2894   fiat_p256_cmovznz_u32(&x338, x333, x324, x308);
2895   uint32_t x339;
2896   fiat_p256_cmovznz_u32(&x339, x333, x326, x310);
2897   uint32_t x340;
2898   fiat_p256_cmovznz_u32(&x340, x333, x328, x312);
2899   uint32_t x341;
2900   fiat_p256_cmovznz_u32(&x341, x333, x330, x314);
2901   out1[0] = x334;
2902   out1[1] = x335;
2903   out1[2] = x336;
2904   out1[3] = x337;
2905   out1[4] = x338;
2906   out1[5] = x339;
2907   out1[6] = x340;
2908   out1[7] = x341;
2909 }
2910 
/*
 * The function fiat_p256_nonzero reduces an eight-limb value to one word
 * that is zero exactly when every limb of the input is zero.
 * The word is the bitwise OR of all eight limbs, so any set bit in any limb
 * survives into the result.
 * Preconditions:
 *   0 ≤ eval arg1 < m
 * Postconditions:
 *   out1 = 0 ↔ eval (from_montgomery arg1) mod m = 0
 *
 * Input Bounds:
 *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
 * Output Bounds:
 *   out1: [0x0 ~> 0xffffffff]
 */
static void fiat_p256_nonzero(uint32_t* out1, const uint32_t arg1[8]) {
  uint32_t acc = (uint32_t)0x0;
  int limb;
  /* Fold the limbs together; every limb is read before out1 is written. */
  for (limb = 7; limb >= 0; limb--) {
    acc |= arg1[limb];
  }
  *out1 = acc;
}
2927 
2928 /*
2929  * The function fiat_p256_selectznz is a multi-limb conditional select.
2930  * Postconditions:
2931  *   eval out1 = (if arg1 = 0 then eval arg2 else eval arg3)
2932  *
2933  * Input Bounds:
2934  *   arg1: [0x0 ~> 0x1]
2935  *   arg2: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2936  *   arg3: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2937  * Output Bounds:
2938  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2939  */
fiat_p256_selectznz(uint32_t out1[8],fiat_p256_uint1 arg1,const uint32_t arg2[8],const uint32_t arg3[8])2940 static void fiat_p256_selectznz(uint32_t out1[8], fiat_p256_uint1 arg1, const uint32_t arg2[8], const uint32_t arg3[8]) {
2941   uint32_t x1;
2942   fiat_p256_cmovznz_u32(&x1, arg1, (arg2[0]), (arg3[0]));
2943   uint32_t x2;
2944   fiat_p256_cmovznz_u32(&x2, arg1, (arg2[1]), (arg3[1]));
2945   uint32_t x3;
2946   fiat_p256_cmovznz_u32(&x3, arg1, (arg2[2]), (arg3[2]));
2947   uint32_t x4;
2948   fiat_p256_cmovznz_u32(&x4, arg1, (arg2[3]), (arg3[3]));
2949   uint32_t x5;
2950   fiat_p256_cmovznz_u32(&x5, arg1, (arg2[4]), (arg3[4]));
2951   uint32_t x6;
2952   fiat_p256_cmovznz_u32(&x6, arg1, (arg2[5]), (arg3[5]));
2953   uint32_t x7;
2954   fiat_p256_cmovznz_u32(&x7, arg1, (arg2[6]), (arg3[6]));
2955   uint32_t x8;
2956   fiat_p256_cmovznz_u32(&x8, arg1, (arg2[7]), (arg3[7]));
2957   out1[0] = x1;
2958   out1[1] = x2;
2959   out1[2] = x3;
2960   out1[3] = x4;
2961   out1[4] = x5;
2962   out1[5] = x6;
2963   out1[6] = x7;
2964   out1[7] = x8;
2965 }
2966 
2967 /*
2968  * The function fiat_p256_to_bytes serializes a field element in the Montgomery domain to bytes in little-endian order.
2969  * Preconditions:
2970  *   0 ≤ eval arg1 < m
2971  * Postconditions:
2972  *   out1 = map (λ x, ⌊((eval arg1 mod m) mod 2^(8 * (x + 1))) / 2^(8 * x)⌋) [0..31]
2973  *
2974  * Input Bounds:
2975  *   arg1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
2976  * Output Bounds:
2977  *   out1: [[0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff]]
2978  */
fiat_p256_to_bytes(uint8_t out1[32],const uint32_t arg1[8])2979 static void fiat_p256_to_bytes(uint8_t out1[32], const uint32_t arg1[8]) {
2980   uint32_t x1 = (arg1[7]);
2981   uint32_t x2 = (arg1[6]);
2982   uint32_t x3 = (arg1[5]);
2983   uint32_t x4 = (arg1[4]);
2984   uint32_t x5 = (arg1[3]);
2985   uint32_t x6 = (arg1[2]);
2986   uint32_t x7 = (arg1[1]);
2987   uint32_t x8 = (arg1[0]);
2988   uint32_t x9 = (x8 >> 8);
2989   uint8_t x10 = (uint8_t)(x8 & UINT8_C(0xff));
2990   uint32_t x11 = (x9 >> 8);
2991   uint8_t x12 = (uint8_t)(x9 & UINT8_C(0xff));
2992   uint8_t x13 = (uint8_t)(x11 >> 8);
2993   uint8_t x14 = (uint8_t)(x11 & UINT8_C(0xff));
2994   uint8_t x15 = (uint8_t)(x13 & UINT8_C(0xff));
2995   uint32_t x16 = (x7 >> 8);
2996   uint8_t x17 = (uint8_t)(x7 & UINT8_C(0xff));
2997   uint32_t x18 = (x16 >> 8);
2998   uint8_t x19 = (uint8_t)(x16 & UINT8_C(0xff));
2999   uint8_t x20 = (uint8_t)(x18 >> 8);
3000   uint8_t x21 = (uint8_t)(x18 & UINT8_C(0xff));
3001   uint8_t x22 = (uint8_t)(x20 & UINT8_C(0xff));
3002   uint32_t x23 = (x6 >> 8);
3003   uint8_t x24 = (uint8_t)(x6 & UINT8_C(0xff));
3004   uint32_t x25 = (x23 >> 8);
3005   uint8_t x26 = (uint8_t)(x23 & UINT8_C(0xff));
3006   uint8_t x27 = (uint8_t)(x25 >> 8);
3007   uint8_t x28 = (uint8_t)(x25 & UINT8_C(0xff));
3008   uint8_t x29 = (uint8_t)(x27 & UINT8_C(0xff));
3009   uint32_t x30 = (x5 >> 8);
3010   uint8_t x31 = (uint8_t)(x5 & UINT8_C(0xff));
3011   uint32_t x32 = (x30 >> 8);
3012   uint8_t x33 = (uint8_t)(x30 & UINT8_C(0xff));
3013   uint8_t x34 = (uint8_t)(x32 >> 8);
3014   uint8_t x35 = (uint8_t)(x32 & UINT8_C(0xff));
3015   uint8_t x36 = (uint8_t)(x34 & UINT8_C(0xff));
3016   uint32_t x37 = (x4 >> 8);
3017   uint8_t x38 = (uint8_t)(x4 & UINT8_C(0xff));
3018   uint32_t x39 = (x37 >> 8);
3019   uint8_t x40 = (uint8_t)(x37 & UINT8_C(0xff));
3020   uint8_t x41 = (uint8_t)(x39 >> 8);
3021   uint8_t x42 = (uint8_t)(x39 & UINT8_C(0xff));
3022   uint8_t x43 = (uint8_t)(x41 & UINT8_C(0xff));
3023   uint32_t x44 = (x3 >> 8);
3024   uint8_t x45 = (uint8_t)(x3 & UINT8_C(0xff));
3025   uint32_t x46 = (x44 >> 8);
3026   uint8_t x47 = (uint8_t)(x44 & UINT8_C(0xff));
3027   uint8_t x48 = (uint8_t)(x46 >> 8);
3028   uint8_t x49 = (uint8_t)(x46 & UINT8_C(0xff));
3029   uint8_t x50 = (uint8_t)(x48 & UINT8_C(0xff));
3030   uint32_t x51 = (x2 >> 8);
3031   uint8_t x52 = (uint8_t)(x2 & UINT8_C(0xff));
3032   uint32_t x53 = (x51 >> 8);
3033   uint8_t x54 = (uint8_t)(x51 & UINT8_C(0xff));
3034   uint8_t x55 = (uint8_t)(x53 >> 8);
3035   uint8_t x56 = (uint8_t)(x53 & UINT8_C(0xff));
3036   uint8_t x57 = (uint8_t)(x55 & UINT8_C(0xff));
3037   uint32_t x58 = (x1 >> 8);
3038   uint8_t x59 = (uint8_t)(x1 & UINT8_C(0xff));
3039   uint32_t x60 = (x58 >> 8);
3040   uint8_t x61 = (uint8_t)(x58 & UINT8_C(0xff));
3041   uint8_t x62 = (uint8_t)(x60 >> 8);
3042   uint8_t x63 = (uint8_t)(x60 & UINT8_C(0xff));
3043   out1[0] = x10;
3044   out1[1] = x12;
3045   out1[2] = x14;
3046   out1[3] = x15;
3047   out1[4] = x17;
3048   out1[5] = x19;
3049   out1[6] = x21;
3050   out1[7] = x22;
3051   out1[8] = x24;
3052   out1[9] = x26;
3053   out1[10] = x28;
3054   out1[11] = x29;
3055   out1[12] = x31;
3056   out1[13] = x33;
3057   out1[14] = x35;
3058   out1[15] = x36;
3059   out1[16] = x38;
3060   out1[17] = x40;
3061   out1[18] = x42;
3062   out1[19] = x43;
3063   out1[20] = x45;
3064   out1[21] = x47;
3065   out1[22] = x49;
3066   out1[23] = x50;
3067   out1[24] = x52;
3068   out1[25] = x54;
3069   out1[26] = x56;
3070   out1[27] = x57;
3071   out1[28] = x59;
3072   out1[29] = x61;
3073   out1[30] = x63;
3074   out1[31] = x62;
3075 }
3076 
3077 /*
3078  * The function fiat_p256_from_bytes deserializes a field element in the Montgomery domain from bytes in little-endian order.
3079  * Preconditions:
3080  *   0 ≤ bytes_eval arg1 < m
3081  * Postconditions:
3082  *   eval out1 mod m = bytes_eval arg1 mod m
3083  *   0 ≤ eval out1 < m
3084  *
3085  * Input Bounds:
3086  *   arg1: [[0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff], [0x0 ~> 0xff]]
3087  * Output Bounds:
3088  *   out1: [[0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff], [0x0 ~> 0xffffffff]]
3089  */
fiat_p256_from_bytes(uint32_t out1[8],const uint8_t arg1[32])3090 static void fiat_p256_from_bytes(uint32_t out1[8], const uint8_t arg1[32]) {
3091   uint32_t x1 = ((uint32_t)(arg1[31]) << 24);
3092   uint32_t x2 = ((uint32_t)(arg1[30]) << 16);
3093   uint32_t x3 = ((uint32_t)(arg1[29]) << 8);
3094   uint8_t x4 = (arg1[28]);
3095   uint32_t x5 = ((uint32_t)(arg1[27]) << 24);
3096   uint32_t x6 = ((uint32_t)(arg1[26]) << 16);
3097   uint32_t x7 = ((uint32_t)(arg1[25]) << 8);
3098   uint8_t x8 = (arg1[24]);
3099   uint32_t x9 = ((uint32_t)(arg1[23]) << 24);
3100   uint32_t x10 = ((uint32_t)(arg1[22]) << 16);
3101   uint32_t x11 = ((uint32_t)(arg1[21]) << 8);
3102   uint8_t x12 = (arg1[20]);
3103   uint32_t x13 = ((uint32_t)(arg1[19]) << 24);
3104   uint32_t x14 = ((uint32_t)(arg1[18]) << 16);
3105   uint32_t x15 = ((uint32_t)(arg1[17]) << 8);
3106   uint8_t x16 = (arg1[16]);
3107   uint32_t x17 = ((uint32_t)(arg1[15]) << 24);
3108   uint32_t x18 = ((uint32_t)(arg1[14]) << 16);
3109   uint32_t x19 = ((uint32_t)(arg1[13]) << 8);
3110   uint8_t x20 = (arg1[12]);
3111   uint32_t x21 = ((uint32_t)(arg1[11]) << 24);
3112   uint32_t x22 = ((uint32_t)(arg1[10]) << 16);
3113   uint32_t x23 = ((uint32_t)(arg1[9]) << 8);
3114   uint8_t x24 = (arg1[8]);
3115   uint32_t x25 = ((uint32_t)(arg1[7]) << 24);
3116   uint32_t x26 = ((uint32_t)(arg1[6]) << 16);
3117   uint32_t x27 = ((uint32_t)(arg1[5]) << 8);
3118   uint8_t x28 = (arg1[4]);
3119   uint32_t x29 = ((uint32_t)(arg1[3]) << 24);
3120   uint32_t x30 = ((uint32_t)(arg1[2]) << 16);
3121   uint32_t x31 = ((uint32_t)(arg1[1]) << 8);
3122   uint8_t x32 = (arg1[0]);
3123   uint32_t x33 = (x32 + (x31 + (x30 + x29)));
3124   uint32_t x34 = (x33 & UINT32_C(0xffffffff));
3125   uint32_t x35 = (x4 + (x3 + (x2 + x1)));
3126   uint32_t x36 = (x8 + (x7 + (x6 + x5)));
3127   uint32_t x37 = (x12 + (x11 + (x10 + x9)));
3128   uint32_t x38 = (x16 + (x15 + (x14 + x13)));
3129   uint32_t x39 = (x20 + (x19 + (x18 + x17)));
3130   uint32_t x40 = (x24 + (x23 + (x22 + x21)));
3131   uint32_t x41 = (x28 + (x27 + (x26 + x25)));
3132   uint32_t x42 = (x41 & UINT32_C(0xffffffff));
3133   uint32_t x43 = (x40 & UINT32_C(0xffffffff));
3134   uint32_t x44 = (x39 & UINT32_C(0xffffffff));
3135   uint32_t x45 = (x38 & UINT32_C(0xffffffff));
3136   uint32_t x46 = (x37 & UINT32_C(0xffffffff));
3137   uint32_t x47 = (x36 & UINT32_C(0xffffffff));
3138   out1[0] = x34;
3139   out1[1] = x42;
3140   out1[2] = x43;
3141   out1[3] = x44;
3142   out1[4] = x45;
3143   out1[5] = x46;
3144   out1[6] = x47;
3145   out1[7] = x35;
3146 }
3147 
3148