xref: /aosp_15_r20/external/mbedtls/3rdparty/everest/library/Hacl_Curve25519.c (revision 62c56f9862f102b96d72393aff6076c951fb8148)
/* Copyright (c) INRIA and Microsoft Corporation. All rights reserved.
   Licensed under the Apache 2.0 License. */

/* This file was generated by KreMLin <https://github.com/FStarLang/kremlin>
 * KreMLin invocation: /mnt/e/everest/verify/kremlin/krml -fc89 -fparentheses -fno-shadow -header /mnt/e/everest/verify/hdrcLh -minimal -fbuiltin-uint128 -fc89 -fparentheses -fno-shadow -header /mnt/e/everest/verify/hdrcLh -minimal -I /mnt/e/everest/verify/hacl-star/code/lib/kremlin -I /mnt/e/everest/verify/kremlin/kremlib/compat -I /mnt/e/everest/verify/hacl-star/specs -I /mnt/e/everest/verify/hacl-star/specs/old -I . -ccopt -march=native -verbose -ldopt -flto -tmpdir x25519-c -I ../bignum -bundle Hacl.Curve25519=* -minimal -add-include "kremlib.h" -skip-compilation x25519-c/out.krml -o x25519-c/Hacl_Curve25519.c
 * F* version: 059db0c8
 * KreMLin version: 916c37ac
 */
9*62c56f98SSadaf Ebrahimi 
10*62c56f98SSadaf Ebrahimi 
11*62c56f98SSadaf Ebrahimi #include "Hacl_Curve25519.h"
12*62c56f98SSadaf Ebrahimi 
13*62c56f98SSadaf Ebrahimi extern uint64_t FStar_UInt64_eq_mask(uint64_t x0, uint64_t x1);
14*62c56f98SSadaf Ebrahimi 
15*62c56f98SSadaf Ebrahimi extern uint64_t FStar_UInt64_gte_mask(uint64_t x0, uint64_t x1);
16*62c56f98SSadaf Ebrahimi 
17*62c56f98SSadaf Ebrahimi extern uint128_t FStar_UInt128_add(uint128_t x0, uint128_t x1);
18*62c56f98SSadaf Ebrahimi 
19*62c56f98SSadaf Ebrahimi extern uint128_t FStar_UInt128_add_mod(uint128_t x0, uint128_t x1);
20*62c56f98SSadaf Ebrahimi 
21*62c56f98SSadaf Ebrahimi extern uint128_t FStar_UInt128_logand(uint128_t x0, uint128_t x1);
22*62c56f98SSadaf Ebrahimi 
23*62c56f98SSadaf Ebrahimi extern uint128_t FStar_UInt128_shift_right(uint128_t x0, uint32_t x1);
24*62c56f98SSadaf Ebrahimi 
25*62c56f98SSadaf Ebrahimi extern uint128_t FStar_UInt128_uint64_to_uint128(uint64_t x0);
26*62c56f98SSadaf Ebrahimi 
27*62c56f98SSadaf Ebrahimi extern uint64_t FStar_UInt128_uint128_to_uint64(uint128_t x0);
28*62c56f98SSadaf Ebrahimi 
29*62c56f98SSadaf Ebrahimi extern uint128_t FStar_UInt128_mul_wide(uint64_t x0, uint64_t x1);
30*62c56f98SSadaf Ebrahimi 
/*
 * Fold the high part of limb 4 back into limb 0.
 *
 * b: array of at least 5 limbs, updated in place.
 *
 * b[4] is truncated to its low 51 bits and 19 times the removed part
 * (b[4] >> 51) is added to b[0]; limbs 1..3 are not touched. With five
 * 51-bit limbs this matches a reduction step modulo 2^255 - 19.
 */
static void Hacl_Bignum_Modulo_carry_top(uint64_t *b)
{
  uint64_t top = b[4U];
  uint64_t low = b[0U];
  uint64_t overflow = top >> (uint32_t)51U;
  b[4U] = top & (uint64_t)0x7ffffffffffffU;
  b[0U] = low + (uint64_t)19U * overflow;
}
40*62c56f98SSadaf Ebrahimi 
/*
 * Narrow five 128-bit limbs to 64-bit limbs.
 *
 * output: receives 5 limbs.
 * input:  5 wide limbs, read only.
 *
 * Each output[i] is input[i] converted to uint64_t, so any bits above the
 * low 64 are dropped by the conversion.
 */
inline static void Hacl_Bignum_Fproduct_copy_from_wide_(uint64_t *output, uint128_t *input)
{
  uint32_t i;
  for (i = (uint32_t)0U; i < (uint32_t)5U; i = i + (uint32_t)1U)
  {
    output[i] = (uint64_t)input[i];
  }
}
50*62c56f98SSadaf Ebrahimi 
51*62c56f98SSadaf Ebrahimi inline static void
Hacl_Bignum_Fproduct_sum_scalar_multiplication_(uint128_t * output,uint64_t * input,uint64_t s)52*62c56f98SSadaf Ebrahimi Hacl_Bignum_Fproduct_sum_scalar_multiplication_(uint128_t *output, uint64_t *input, uint64_t s)
53*62c56f98SSadaf Ebrahimi {
54*62c56f98SSadaf Ebrahimi   uint32_t i;
55*62c56f98SSadaf Ebrahimi   for (i = (uint32_t)0U; i < (uint32_t)5U; i = i + (uint32_t)1U)
56*62c56f98SSadaf Ebrahimi   {
57*62c56f98SSadaf Ebrahimi     uint128_t xi = output[i];
58*62c56f98SSadaf Ebrahimi     uint64_t yi = input[i];
59*62c56f98SSadaf Ebrahimi     output[i] = xi + (uint128_t)yi * s;
60*62c56f98SSadaf Ebrahimi   }
61*62c56f98SSadaf Ebrahimi }
62*62c56f98SSadaf Ebrahimi 
/*
 * Propagate carries through limbs 0..3 of a wide 5-limb value.
 *
 * tmp: 5 wide limbs, updated in place.
 *
 * For i = 0..3 in order: tmp[i] keeps only the low 51 bits of its low
 * 64-bit half, and tmp[i] >> 51 is added to tmp[i + 1]. Limb 4 only
 * receives a carry; it is not reduced here.
 */
inline static void Hacl_Bignum_Fproduct_carry_wide_(uint128_t *tmp)
{
  uint32_t i;
  for (i = (uint32_t)0U; i < (uint32_t)4U; i = i + (uint32_t)1U)
  {
    uint128_t limb = tmp[i];
    uint128_t next = tmp[i + (uint32_t)1U];
    uint64_t kept = (uint64_t)limb & (uint64_t)0x7ffffffffffffU;
    uint128_t carry = limb >> (uint32_t)51U;
    tmp[i] = (uint128_t)kept;
    tmp[i + (uint32_t)1U] = next + carry;
  }
}
77*62c56f98SSadaf Ebrahimi 
/*
 * Rotate a 5-limb value up by one limb, scaling the wrapped limb by 19.
 *
 * output: 5 limbs, updated in place.
 *
 * Afterwards output[i] holds the old output[i - 1] for i = 1..4 and
 * output[0] holds 19 times the old output[4] (64-bit wrapping multiply).
 */
inline static void Hacl_Bignum_Fmul_shift_reduce(uint64_t *output)
{
  uint64_t wrapped = output[4U];
  uint32_t pos;
  /* Move from the top down so no limb is overwritten before it is read. */
  for (pos = (uint32_t)4U; pos > (uint32_t)0U; pos = pos - (uint32_t)1U)
  {
    output[pos] = output[pos - (uint32_t)1U];
  }
  output[0U] = (uint64_t)19U * wrapped;
}
95*62c56f98SSadaf Ebrahimi 
96*62c56f98SSadaf Ebrahimi static void
Hacl_Bignum_Fmul_mul_shift_reduce_(uint128_t * output,uint64_t * input,uint64_t * input2)97*62c56f98SSadaf Ebrahimi Hacl_Bignum_Fmul_mul_shift_reduce_(uint128_t *output, uint64_t *input, uint64_t *input2)
98*62c56f98SSadaf Ebrahimi {
99*62c56f98SSadaf Ebrahimi   uint32_t i;
100*62c56f98SSadaf Ebrahimi   uint64_t input2i;
101*62c56f98SSadaf Ebrahimi   {
102*62c56f98SSadaf Ebrahimi     uint32_t i0;
103*62c56f98SSadaf Ebrahimi     for (i0 = (uint32_t)0U; i0 < (uint32_t)4U; i0 = i0 + (uint32_t)1U)
104*62c56f98SSadaf Ebrahimi     {
105*62c56f98SSadaf Ebrahimi       uint64_t input2i0 = input2[i0];
106*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fproduct_sum_scalar_multiplication_(output, input, input2i0);
107*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fmul_shift_reduce(input);
108*62c56f98SSadaf Ebrahimi     }
109*62c56f98SSadaf Ebrahimi   }
110*62c56f98SSadaf Ebrahimi   i = (uint32_t)4U;
111*62c56f98SSadaf Ebrahimi   input2i = input2[i];
112*62c56f98SSadaf Ebrahimi   Hacl_Bignum_Fproduct_sum_scalar_multiplication_(output, input, input2i);
113*62c56f98SSadaf Ebrahimi }
114*62c56f98SSadaf Ebrahimi 
Hacl_Bignum_Fmul_fmul(uint64_t * output,uint64_t * input,uint64_t * input2)115*62c56f98SSadaf Ebrahimi inline static void Hacl_Bignum_Fmul_fmul(uint64_t *output, uint64_t *input, uint64_t *input2)
116*62c56f98SSadaf Ebrahimi {
117*62c56f98SSadaf Ebrahimi   uint64_t tmp[5U] = { 0U };
118*62c56f98SSadaf Ebrahimi   memcpy(tmp, input, (uint32_t)5U * sizeof input[0U]);
119*62c56f98SSadaf Ebrahimi   KRML_CHECK_SIZE(sizeof (uint128_t), (uint32_t)5U);
120*62c56f98SSadaf Ebrahimi   {
121*62c56f98SSadaf Ebrahimi     uint128_t t[5U];
122*62c56f98SSadaf Ebrahimi     {
123*62c56f98SSadaf Ebrahimi       uint32_t _i;
124*62c56f98SSadaf Ebrahimi       for (_i = 0U; _i < (uint32_t)5U; ++_i)
125*62c56f98SSadaf Ebrahimi         t[_i] = (uint128_t)(uint64_t)0U;
126*62c56f98SSadaf Ebrahimi     }
127*62c56f98SSadaf Ebrahimi     {
128*62c56f98SSadaf Ebrahimi       uint128_t b4;
129*62c56f98SSadaf Ebrahimi       uint128_t b0;
130*62c56f98SSadaf Ebrahimi       uint128_t b4_;
131*62c56f98SSadaf Ebrahimi       uint128_t b0_;
132*62c56f98SSadaf Ebrahimi       uint64_t i0;
133*62c56f98SSadaf Ebrahimi       uint64_t i1;
134*62c56f98SSadaf Ebrahimi       uint64_t i0_;
135*62c56f98SSadaf Ebrahimi       uint64_t i1_;
136*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fmul_mul_shift_reduce_(t, tmp, input2);
137*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fproduct_carry_wide_(t);
138*62c56f98SSadaf Ebrahimi       b4 = t[4U];
139*62c56f98SSadaf Ebrahimi       b0 = t[0U];
140*62c56f98SSadaf Ebrahimi       b4_ = b4 & (uint128_t)(uint64_t)0x7ffffffffffffU;
141*62c56f98SSadaf Ebrahimi       b0_ = b0 + (uint128_t)(uint64_t)19U * (uint64_t)(b4 >> (uint32_t)51U);
142*62c56f98SSadaf Ebrahimi       t[4U] = b4_;
143*62c56f98SSadaf Ebrahimi       t[0U] = b0_;
144*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fproduct_copy_from_wide_(output, t);
145*62c56f98SSadaf Ebrahimi       i0 = output[0U];
146*62c56f98SSadaf Ebrahimi       i1 = output[1U];
147*62c56f98SSadaf Ebrahimi       i0_ = i0 & (uint64_t)0x7ffffffffffffU;
148*62c56f98SSadaf Ebrahimi       i1_ = i1 + (i0 >> (uint32_t)51U);
149*62c56f98SSadaf Ebrahimi       output[0U] = i0_;
150*62c56f98SSadaf Ebrahimi       output[1U] = i1_;
151*62c56f98SSadaf Ebrahimi     }
152*62c56f98SSadaf Ebrahimi   }
153*62c56f98SSadaf Ebrahimi }
154*62c56f98SSadaf Ebrahimi 
/*
 * Compute the unreduced wide limbs of the square of a 5-limb value.
 *
 * tmp:    receives 5 wide limbs.
 * output: 5 limbs holding the value to square; read only here.
 *
 * Cross terms are doubled once up front (d0, d1, d2, d4) and the terms that
 * wrap past limb 4 carry a factor of 19. The pre-scaled 64-bit factors
 * (d0, d1, d2, d419, d4, r3 * 19) are computed in 64-bit arithmetic before
 * being widened, exactly as in the generated code.
 */
inline static void Hacl_Bignum_Fsquare_fsquare__(uint128_t *tmp, uint64_t *output)
{
  uint64_t r0 = output[0U];
  uint64_t r1 = output[1U];
  uint64_t r2 = output[2U];
  uint64_t r3 = output[3U];
  uint64_t r4 = output[4U];
  uint64_t d0 = r0 * (uint64_t)2U;
  uint64_t d1 = r1 * (uint64_t)2U;
  uint64_t d2 = r2 * (uint64_t)2U * (uint64_t)19U;
  uint64_t d419 = r4 * (uint64_t)19U;
  uint64_t d4 = d419 * (uint64_t)2U;
  tmp[0U] = (uint128_t)r0 * r0 + (uint128_t)d4 * r1 + (uint128_t)d2 * r3;
  tmp[1U] = (uint128_t)d0 * r1 + (uint128_t)d4 * r2 + (uint128_t)(r3 * (uint64_t)19U) * r3;
  tmp[2U] = (uint128_t)d0 * r2 + (uint128_t)r1 * r1 + (uint128_t)d4 * r3;
  tmp[3U] = (uint128_t)d0 * r3 + (uint128_t)d1 * r2 + (uint128_t)r4 * d419;
  tmp[4U] = (uint128_t)d0 * r4 + (uint128_t)d1 * r3 + (uint128_t)r2 * r2;
}
178*62c56f98SSadaf Ebrahimi 
/*
 * Square a 5-limb value in place, using a caller-supplied wide scratch area.
 *
 * tmp:    5 wide limbs of scratch; overwritten.
 * output: 5 limbs; holds the operand on entry and the reduced square on
 *         return.
 *
 * Same reduction sequence as the multiplication routine: carry limbs 0..3,
 * fold the part of limb 4 above bit 51 into limb 0 (times 19), narrow to
 * 64 bits, then carry limb 0 into limb 1.
 */
inline static void Hacl_Bignum_Fsquare_fsquare_(uint128_t *tmp, uint64_t *output)
{
  uint128_t b4;
  uint128_t b0;
  uint64_t i0;
  uint64_t i1;
  Hacl_Bignum_Fsquare_fsquare__(tmp, output);
  Hacl_Bignum_Fproduct_carry_wide_(tmp);
  b4 = tmp[4U];
  b0 = tmp[0U];
  tmp[4U] = b4 & (uint128_t)(uint64_t)0x7ffffffffffffU;
  tmp[0U] = b0 + (uint128_t)(uint64_t)19U * (uint64_t)(b4 >> (uint32_t)51U);
  Hacl_Bignum_Fproduct_copy_from_wide_(output, tmp);
  i0 = output[0U];
  i1 = output[1U];
  output[0U] = i0 & (uint64_t)0x7ffffffffffffU;
  output[1U] = i1 + (i0 >> (uint32_t)51U);
}
205*62c56f98SSadaf Ebrahimi 
206*62c56f98SSadaf Ebrahimi static void
Hacl_Bignum_Fsquare_fsquare_times_(uint64_t * input,uint128_t * tmp,uint32_t count1)207*62c56f98SSadaf Ebrahimi Hacl_Bignum_Fsquare_fsquare_times_(uint64_t *input, uint128_t *tmp, uint32_t count1)
208*62c56f98SSadaf Ebrahimi {
209*62c56f98SSadaf Ebrahimi   uint32_t i;
210*62c56f98SSadaf Ebrahimi   Hacl_Bignum_Fsquare_fsquare_(tmp, input);
211*62c56f98SSadaf Ebrahimi   for (i = (uint32_t)1U; i < count1; i = i + (uint32_t)1U)
212*62c56f98SSadaf Ebrahimi     Hacl_Bignum_Fsquare_fsquare_(tmp, input);
213*62c56f98SSadaf Ebrahimi }
214*62c56f98SSadaf Ebrahimi 
215*62c56f98SSadaf Ebrahimi inline static void
Hacl_Bignum_Fsquare_fsquare_times(uint64_t * output,uint64_t * input,uint32_t count1)216*62c56f98SSadaf Ebrahimi Hacl_Bignum_Fsquare_fsquare_times(uint64_t *output, uint64_t *input, uint32_t count1)
217*62c56f98SSadaf Ebrahimi {
218*62c56f98SSadaf Ebrahimi   KRML_CHECK_SIZE(sizeof (uint128_t), (uint32_t)5U);
219*62c56f98SSadaf Ebrahimi   {
220*62c56f98SSadaf Ebrahimi     uint128_t t[5U];
221*62c56f98SSadaf Ebrahimi     {
222*62c56f98SSadaf Ebrahimi       uint32_t _i;
223*62c56f98SSadaf Ebrahimi       for (_i = 0U; _i < (uint32_t)5U; ++_i)
224*62c56f98SSadaf Ebrahimi         t[_i] = (uint128_t)(uint64_t)0U;
225*62c56f98SSadaf Ebrahimi     }
226*62c56f98SSadaf Ebrahimi     memcpy(output, input, (uint32_t)5U * sizeof input[0U]);
227*62c56f98SSadaf Ebrahimi     Hacl_Bignum_Fsquare_fsquare_times_(output, t, count1);
228*62c56f98SSadaf Ebrahimi   }
229*62c56f98SSadaf Ebrahimi }
230*62c56f98SSadaf Ebrahimi 
Hacl_Bignum_Fsquare_fsquare_times_inplace(uint64_t * output,uint32_t count1)231*62c56f98SSadaf Ebrahimi inline static void Hacl_Bignum_Fsquare_fsquare_times_inplace(uint64_t *output, uint32_t count1)
232*62c56f98SSadaf Ebrahimi {
233*62c56f98SSadaf Ebrahimi   KRML_CHECK_SIZE(sizeof (uint128_t), (uint32_t)5U);
234*62c56f98SSadaf Ebrahimi   {
235*62c56f98SSadaf Ebrahimi     uint128_t t[5U];
236*62c56f98SSadaf Ebrahimi     {
237*62c56f98SSadaf Ebrahimi       uint32_t _i;
238*62c56f98SSadaf Ebrahimi       for (_i = 0U; _i < (uint32_t)5U; ++_i)
239*62c56f98SSadaf Ebrahimi         t[_i] = (uint128_t)(uint64_t)0U;
240*62c56f98SSadaf Ebrahimi     }
241*62c56f98SSadaf Ebrahimi     Hacl_Bignum_Fsquare_fsquare_times_(output, t, count1);
242*62c56f98SSadaf Ebrahimi   }
243*62c56f98SSadaf Ebrahimi }
244*62c56f98SSadaf Ebrahimi 
/*
 * Raise a field element to the power 2^255 - 21 with a fixed chain of
 * squarings and multiplications.
 *
 * out: receives 5 limbs.
 * z:   5 limbs, read only.
 *
 * 2^255 - 21 is (2^255 - 19) - 2, so for the Curve25519 prime this is the
 * multiplicative inverse of z. The sequence of operations does not depend
 * on the value of z. The running exponent of z is noted beside each step.
 */
inline static void Hacl_Bignum_Crecip_crecip(uint64_t *out, uint64_t *z)
{
  /* Four 5-limb temporaries carved out of one zeroed buffer. */
  uint64_t buf[20U] = { 0U };
  uint64_t *a = buf;
  uint64_t *t0 = buf + (uint32_t)5U;
  uint64_t *b = buf + (uint32_t)10U;
  uint64_t *c = buf + (uint32_t)15U;
  Hacl_Bignum_Fsquare_fsquare_times(a, z, (uint32_t)1U);       /* a  = 2 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, a, (uint32_t)2U);      /* t0 = 8 */
  Hacl_Bignum_Fmul_fmul(b, t0, z);                             /* b  = 9 */
  Hacl_Bignum_Fmul_fmul(a, b, a);                              /* a  = 11 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, a, (uint32_t)1U);      /* t0 = 22 */
  Hacl_Bignum_Fmul_fmul(b, t0, b);                             /* b  = 2^5 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, b, (uint32_t)5U);      /* t0 = 2^10 - 2^5 */
  Hacl_Bignum_Fmul_fmul(b, t0, b);                             /* b  = 2^10 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, b, (uint32_t)10U);     /* t0 = 2^20 - 2^10 */
  Hacl_Bignum_Fmul_fmul(c, t0, b);                             /* c  = 2^20 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, c, (uint32_t)20U);     /* t0 = 2^40 - 2^20 */
  Hacl_Bignum_Fmul_fmul(t0, t0, c);                            /* t0 = 2^40 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times_inplace(t0, (uint32_t)10U);/* t0 = 2^50 - 2^10 */
  Hacl_Bignum_Fmul_fmul(b, t0, b);                             /* b  = 2^50 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, b, (uint32_t)50U);     /* t0 = 2^100 - 2^50 */
  Hacl_Bignum_Fmul_fmul(c, t0, b);                             /* c  = 2^100 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times(t0, c, (uint32_t)100U);    /* t0 = 2^200 - 2^100 */
  Hacl_Bignum_Fmul_fmul(t0, t0, c);                            /* t0 = 2^200 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times_inplace(t0, (uint32_t)50U);/* t0 = 2^250 - 2^50 */
  Hacl_Bignum_Fmul_fmul(t0, t0, b);                            /* t0 = 2^250 - 1 */
  Hacl_Bignum_Fsquare_fsquare_times_inplace(t0, (uint32_t)5U); /* t0 = 2^255 - 32 */
  Hacl_Bignum_Fmul_fmul(out, t0, a);                           /* out = 2^255 - 21 */
}
288*62c56f98SSadaf Ebrahimi 
/*
 * Limb-wise addition: a[i] = a[i] + b[i] for i = 0..4.
 *
 * a: 5 limbs, updated in place.
 * b: 5 limbs, read only.
 *
 * No carry propagation or reduction is performed; each addition wraps
 * modulo 2^64.
 */
inline static void Hacl_Bignum_fsum(uint64_t *a, uint64_t *b)
{
  uint32_t i;
  for (i = (uint32_t)0U; i < (uint32_t)5U; i = i + (uint32_t)1U)
  {
    a[i] = a[i] + b[i];
  }
}
299*62c56f98SSadaf Ebrahimi 
/*
 * Limb-wise biased subtraction: a[i] = (b[i] + bias[i]) - a[i].
 *
 * a: 5 limbs; subtrahend on entry, result on return.
 * b: 5 limbs, read only.
 *
 * Note the operand order: the result is b - a, stored in a.
 *
 * The bias limbs are 0x3fffffffffff68 = 8 * (2^51 - 19) for limb 0 and
 * 0x3ffffffffffff8 = 8 * (2^51 - 1) for limbs 1..4, i.e. limb-wise
 * 8 * (2^255 - 19). Adding it presumably keeps each limb difference from
 * going negative for suitably bounded inputs; the bound is not visible here.
 *
 * The biased copy of b is built in a local buffer before a is written, so
 * the result matches the generated code even if a and b overlap.
 */
inline static void Hacl_Bignum_fdifference(uint64_t *a, uint64_t *b)
{
  uint64_t biased[5U];
  uint32_t i;
  biased[0U] = b[0U] + (uint64_t)0x3fffffffffff68U;
  biased[1U] = b[1U] + (uint64_t)0x3ffffffffffff8U;
  biased[2U] = b[2U] + (uint64_t)0x3ffffffffffff8U;
  biased[3U] = b[3U] + (uint64_t)0x3ffffffffffff8U;
  biased[4U] = b[4U] + (uint64_t)0x3ffffffffffff8U;
  for (i = (uint32_t)0U; i < (uint32_t)5U; i = i + (uint32_t)1U)
  {
    a[i] = biased[i] - a[i];
  }
}
329*62c56f98SSadaf Ebrahimi 
Hacl_Bignum_fscalar(uint64_t * output,uint64_t * b,uint64_t s)330*62c56f98SSadaf Ebrahimi inline static void Hacl_Bignum_fscalar(uint64_t *output, uint64_t *b, uint64_t s)
331*62c56f98SSadaf Ebrahimi {
332*62c56f98SSadaf Ebrahimi   KRML_CHECK_SIZE(sizeof (uint128_t), (uint32_t)5U);
333*62c56f98SSadaf Ebrahimi   {
334*62c56f98SSadaf Ebrahimi     uint128_t tmp[5U];
335*62c56f98SSadaf Ebrahimi     {
336*62c56f98SSadaf Ebrahimi       uint32_t _i;
337*62c56f98SSadaf Ebrahimi       for (_i = 0U; _i < (uint32_t)5U; ++_i)
338*62c56f98SSadaf Ebrahimi         tmp[_i] = (uint128_t)(uint64_t)0U;
339*62c56f98SSadaf Ebrahimi     }
340*62c56f98SSadaf Ebrahimi     {
341*62c56f98SSadaf Ebrahimi       uint128_t b4;
342*62c56f98SSadaf Ebrahimi       uint128_t b0;
343*62c56f98SSadaf Ebrahimi       uint128_t b4_;
344*62c56f98SSadaf Ebrahimi       uint128_t b0_;
345*62c56f98SSadaf Ebrahimi       {
346*62c56f98SSadaf Ebrahimi         uint32_t i;
347*62c56f98SSadaf Ebrahimi         for (i = (uint32_t)0U; i < (uint32_t)5U; i = i + (uint32_t)1U)
348*62c56f98SSadaf Ebrahimi         {
349*62c56f98SSadaf Ebrahimi           uint64_t xi = b[i];
350*62c56f98SSadaf Ebrahimi           tmp[i] = (uint128_t)xi * s;
351*62c56f98SSadaf Ebrahimi         }
352*62c56f98SSadaf Ebrahimi       }
353*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fproduct_carry_wide_(tmp);
354*62c56f98SSadaf Ebrahimi       b4 = tmp[4U];
355*62c56f98SSadaf Ebrahimi       b0 = tmp[0U];
356*62c56f98SSadaf Ebrahimi       b4_ = b4 & (uint128_t)(uint64_t)0x7ffffffffffffU;
357*62c56f98SSadaf Ebrahimi       b0_ = b0 + (uint128_t)(uint64_t)19U * (uint64_t)(b4 >> (uint32_t)51U);
358*62c56f98SSadaf Ebrahimi       tmp[4U] = b4_;
359*62c56f98SSadaf Ebrahimi       tmp[0U] = b0_;
360*62c56f98SSadaf Ebrahimi       Hacl_Bignum_Fproduct_copy_from_wide_(output, tmp);
361*62c56f98SSadaf Ebrahimi     }
362*62c56f98SSadaf Ebrahimi   }
363*62c56f98SSadaf Ebrahimi }
364*62c56f98SSadaf Ebrahimi 
/*
 * Field multiplication entry point: output = a * b.
 *
 * Thin forwarder to Hacl_Bignum_Fmul_fmul with the same three 5-limb
 * arguments.
 */
inline static void Hacl_Bignum_fmul(uint64_t *output, uint64_t *a, uint64_t *b)
{
  Hacl_Bignum_Fmul_fmul(output, a, b);
}
369*62c56f98SSadaf Ebrahimi 
/*
 * Field inversion entry point.
 *
 * Thin forwarder to Hacl_Bignum_Crecip_crecip: output receives 5 limbs
 * computed from the 5 limbs of input.
 */
inline static void Hacl_Bignum_crecip(uint64_t *output, uint64_t *input)
{
  Hacl_Bignum_Crecip_crecip(output, input);
}
374*62c56f98SSadaf Ebrahimi 
/*
 * Masked swap of a single limb pair, a[ctr - 1] and b[ctr - 1].
 *
 * a, b:  limb arrays, updated in place.
 * swap1: mask; all-ones exchanges the two limbs, zero leaves them unchanged.
 *        Other values exchange only the bits set in the mask.
 * ctr:   1-based position of the limb to process; must be non-zero because
 *        the index used is ctr - 1.
 *
 * The swap is done with XOR and AND only, with no branch on swap1.
 */
static void
Hacl_EC_Point_swap_conditional_step(uint64_t *a, uint64_t *b, uint64_t swap1, uint32_t ctr)
{
  uint32_t idx = ctr - (uint32_t)1U;
  uint64_t from_a = a[idx];
  uint64_t from_b = b[idx];
  uint64_t delta = swap1 & (from_a ^ from_b);
  a[idx] = from_a ^ delta;
  b[idx] = from_b ^ delta;
}
387*62c56f98SSadaf Ebrahimi 
/*
 * Masked swap of the first ctr limbs of a and b.
 *
 * a, b:  limb arrays of at least ctr limbs, updated in place.
 * swap1: mask forwarded unchanged to the per-limb step.
 * ctr:   number of limbs to process; 0 does nothing.
 *
 * Limbs are visited from index ctr - 1 down to 0, the same order as the
 * recursive formulation this loop replaces.
 */
static void
Hacl_EC_Point_swap_conditional_(uint64_t *a, uint64_t *b, uint64_t swap1, uint32_t ctr)
{
  uint32_t remaining;
  for (remaining = ctr; remaining != (uint32_t)0U; remaining = remaining - (uint32_t)1U)
  {
    Hacl_EC_Point_swap_conditional_step(a, b, swap1, remaining);
  }
}
399*62c56f98SSadaf Ebrahimi 
/*
 * Conditionally exchange two 10-limb points.
 *
 * a, b:  arrays of 10 limbs each (two 5-limb halves), updated in place.
 * iswap: swap selector. It is turned into a mask with 0 - iswap, so 0 gives
 *        an all-zero mask (no swap) and 1 gives an all-ones mask (full swap).
 *
 * Both 5-limb halves are processed with the same mask.
 */
static void Hacl_EC_Point_swap_conditional(uint64_t *a, uint64_t *b, uint64_t iswap)
{
  uint64_t mask = (uint64_t)0U - iswap;
  Hacl_EC_Point_swap_conditional_(a, b, mask, (uint32_t)5U);
  Hacl_EC_Point_swap_conditional_(a + (uint32_t)5U, b + (uint32_t)5U, mask, (uint32_t)5U);
}
406*62c56f98SSadaf Ebrahimi 
/*
 * Copy a 10-limb point.
 *
 * output: receives 10 limbs.
 * input:  10 limbs, read only.
 *
 * The two adjacent 5-limb halves are copied with a single memcpy; as with
 * any memcpy, the source and destination must not overlap.
 */
static void Hacl_EC_Point_copy(uint64_t *output, uint64_t *input)
{
  memcpy(output, input, (uint32_t)10U * sizeof input[0U]);
}
414*62c56f98SSadaf Ebrahimi 
/*
 * Unpack a byte string into five 51-bit limbs.
 *
 * output: receives 5 limbs, each below 2^51.
 * input:  bytes 0..31 are read (the last load covers bytes 24..31).
 *
 * Five 64-bit words are loaded with load64_le at byte offsets 0, 6, 12, 19
 * and 24, shifted right by 0, 3, 6, 1 and 12 bits and masked to 51 bits.
 * If load64_le is a little-endian load, as its name suggests, limb k holds
 * bits [51k, 51k + 51) of the input and bit 255 is discarded.
 */
static void Hacl_EC_Format_fexpand(uint64_t *output, uint8_t *input)
{
  uint64_t w0 = load64_le(input);
  uint64_t w1 = load64_le(input + (uint32_t)6U);
  uint64_t w2 = load64_le(input + (uint32_t)12U);
  uint64_t w3 = load64_le(input + (uint32_t)19U);
  uint64_t w4 = load64_le(input + (uint32_t)24U);
  output[0U] = w0 & (uint64_t)0x7ffffffffffffU;
  output[1U] = (w1 >> (uint32_t)3U) & (uint64_t)0x7ffffffffffffU;
  output[2U] = (w2 >> (uint32_t)6U) & (uint64_t)0x7ffffffffffffU;
  output[3U] = (w3 >> (uint32_t)1U) & (uint64_t)0x7ffffffffffffU;
  output[4U] = (w4 >> (uint32_t)12U) & (uint64_t)0x7ffffffffffffU;
}
437*62c56f98SSadaf Ebrahimi 
/*
 * One carry sweep from limb 0 up to limb 4.
 *
 * input: 5 limbs, updated in place.
 *
 * For i = 0..3 in order, input[i] >> 51 is added to input[i + 1] and
 * input[i] is reduced to its low 51 bits. Limb 4 receives the last carry
 * but is not masked.
 */
static void Hacl_EC_Format_fcontract_first_carry_pass(uint64_t *input)
{
  uint32_t i;
  for (i = (uint32_t)0U; i < (uint32_t)4U; i = i + (uint32_t)1U)
  {
    uint64_t limb = input[i];
    input[i + (uint32_t)1U] = input[i + (uint32_t)1U] + (limb >> (uint32_t)51U);
    input[i] = limb & (uint64_t)0x7ffffffffffffU;
  }
}
459*62c56f98SSadaf Ebrahimi 
/*
 * First full carry round: a limb 0 -> 4 carry sweep followed by folding the
 * overflow of limb 4 back into limb 0.
 *
 * input: 5 limbs, updated in place.
 */
static void Hacl_EC_Format_fcontract_first_carry_full(uint64_t *input)
{
  Hacl_EC_Format_fcontract_first_carry_pass(input);
  Hacl_Bignum_Modulo_carry_top(input);
}
465*62c56f98SSadaf Ebrahimi 
/*
 * Second carry sweep from limb 0 up to limb 4.
 *
 * input: 5 limbs, updated in place.
 *
 * Performs the same computation as the first carry pass: for i = 0..3 in
 * order, input[i] >> 51 is added to input[i + 1] and input[i] is reduced to
 * its low 51 bits. Limb 4 is not masked.
 */
static void Hacl_EC_Format_fcontract_second_carry_pass(uint64_t *input)
{
  uint32_t i;
  for (i = (uint32_t)0U; i < (uint32_t)4U; i = i + (uint32_t)1U)
  {
    uint64_t limb = input[i];
    input[i + (uint32_t)1U] = input[i + (uint32_t)1U] + (limb >> (uint32_t)51U);
    input[i] = limb & (uint64_t)0x7ffffffffffffU;
  }
}
487*62c56f98SSadaf Ebrahimi 
/*
 * Second full carry round.
 *
 * input: 5 limbs, updated in place.
 *
 * Runs the second carry sweep, folds the overflow of limb 4 into limb 0,
 * and then carries limb 0 into limb 1 once more, because the fold can push
 * limb 0 past 51 bits.
 */
static void Hacl_EC_Format_fcontract_second_carry_full(uint64_t *input)
{
  uint64_t low;
  uint64_t next;
  Hacl_EC_Format_fcontract_second_carry_pass(input);
  Hacl_Bignum_Modulo_carry_top(input);
  low = input[0U];
  next = input[1U];
  input[0U] = low & (uint64_t)0x7ffffffffffffU;
  input[1U] = next + (low >> (uint32_t)51U);
}
503*62c56f98SSadaf Ebrahimi 
/*
 * Masked subtraction of the limb pattern (2^51 - 19, 2^51 - 1 x 4), which
 * is the limb form of 2^255 - 19.
 *
 * input: 5 limbs, updated in place.
 *
 * Five masks are computed: limb 0 against 0x7ffffffffffed with
 * FStar_UInt64_gte_mask, and limbs 1..4 against 0x7ffffffffffff with
 * FStar_UInt64_eq_mask. They are ANDed together and the result selects how
 * much of each constant is subtracted. Presumably the mask functions return
 * all-ones when the comparison holds and zero otherwise, which makes this a
 * branch-free "subtract p if input >= p"; they are defined elsewhere, so
 * confirm against their implementation.
 */
static void Hacl_EC_Format_fcontract_trim(uint64_t *input)
{
  uint64_t a0 = input[0U];
  uint64_t a1 = input[1U];
  uint64_t a2 = input[2U];
  uint64_t a3 = input[3U];
  uint64_t a4 = input[4U];
  uint64_t mask0 = FStar_UInt64_gte_mask(a0, (uint64_t)0x7ffffffffffedU);
  uint64_t mask1 = FStar_UInt64_eq_mask(a1, (uint64_t)0x7ffffffffffffU);
  uint64_t mask2 = FStar_UInt64_eq_mask(a2, (uint64_t)0x7ffffffffffffU);
  uint64_t mask3 = FStar_UInt64_eq_mask(a3, (uint64_t)0x7ffffffffffffU);
  uint64_t mask4 = FStar_UInt64_eq_mask(a4, (uint64_t)0x7ffffffffffffU);
  uint64_t mask = (((mask0 & mask1) & mask2) & mask3) & mask4;
  input[0U] = a0 - ((uint64_t)0x7ffffffffffedU & mask);
  input[1U] = a1 - ((uint64_t)0x7ffffffffffffU & mask);
  input[2U] = a2 - ((uint64_t)0x7ffffffffffffU & mask);
  input[3U] = a3 - ((uint64_t)0x7ffffffffffffU & mask);
  input[4U] = a4 - ((uint64_t)0x7ffffffffffffU & mask);
}
528*62c56f98SSadaf Ebrahimi 
/*
 * Pack the five limbs of `input` (each contributing at a 51-bit stride) into
 * four 64-bit words and write them to `output` with store64_le, at byte
 * offsets 0, 8, 16 and 24 (32 bytes in total).
 */
static void Hacl_EC_Format_fcontract_store(uint8_t *output, uint64_t *input)
{
  uint64_t l0 = input[0U];
  uint64_t l1 = input[1U];
  uint64_t l2 = input[2U];
  uint64_t l3 = input[3U];
  uint64_t l4 = input[4U];
  /* Word k holds the tail of one limb followed by the head of the next. */
  uint64_t w0 = (l1 << 51U) | l0;
  uint64_t w1 = (l2 << 38U) | (l1 >> 13U);
  uint64_t w2 = (l3 << 25U) | (l2 >> 26U);
  uint64_t w3 = (l4 << 12U) | (l3 >> 39U);
  store64_le(output, w0);
  store64_le(output + 8U, w1);
  store64_le(output + 16U, w2);
  store64_le(output + 24U, w3);
}
549*62c56f98SSadaf Ebrahimi 
/*
 * Serialize the field element `input` into the 32 bytes at `output`.
 *
 * Runs, in order: first full carry, second full carry, the conditional
 * trim, and the little-endian store. The first three steps operate on
 * `input` in place, so the caller's limbs are modified.
 */
static void Hacl_EC_Format_fcontract(uint8_t *output, uint64_t *input)
{
  /* Carry rounds and trim; each takes only `input` and updates it. */
  Hacl_EC_Format_fcontract_first_carry_full(input);
  Hacl_EC_Format_fcontract_second_carry_full(input);
  Hacl_EC_Format_fcontract_trim(input);
  /* Byte packing into `output`. */
  Hacl_EC_Format_fcontract_store(output, input);
}
557*62c56f98SSadaf Ebrahimi 
/*
 * Convert a projective point (x in limbs 0..4, z in limbs 5..9 of `point`)
 * into its 32-byte encoding in `scalar`: apply Hacl_Bignum_crecip to z,
 * multiply x by the result, and contract the product.
 * NOTE(review): crecip is presumably the field inverse - confirm.
 */
static void Hacl_EC_Format_scalar_of_point(uint8_t *scalar, uint64_t *point)
{
  uint64_t tmp[10U] = { 0U };
  uint64_t *z_recip = tmp;
  uint64_t *x_over_z = tmp + 5U;
  Hacl_Bignum_crecip(z_recip, point + 5U);
  Hacl_Bignum_fmul(x_over_z, point, z_recip);
  Hacl_EC_Format_fcontract(scalar, x_over_z);
}
569*62c56f98SSadaf Ebrahimi 
/*
 * One combined ladder step on (x, z) points stored as 10 limbs each.
 *
 *   pp    receives the result derived from p alone (x2, z2).
 *   ppq   receives the result derived from p and pq together (x3, z3).
 *   p, pq inputs; both are passed as destinations to fsum/fdifference, so
 *         they are presumably clobbered - callers must not rely on them.
 *   qmqp  only its leading field element (qx) is used, as a multiplier
 *         for z3.
 *
 * Scratch layout (5-limb slots of `tmp`): 0 saved x, 5 saved copy for the
 * in-place sum/difference, 10 zzz, 15 xx, 20 zz, 25/30 cross products,
 * 35 squared cross difference.
 */
static void
Hacl_EC_AddAndDouble_fmonty(
  uint64_t *pp,
  uint64_t *ppq,
  uint64_t *p,
  uint64_t *pq,
  uint64_t *qmqp
)
{
  uint64_t tmp[40U] = { 0U };
  uint64_t *saved_x = tmp;
  uint64_t *saved = tmp + 5U;
  uint64_t *zzz = tmp + 10U;
  uint64_t *xx = tmp + 15U;
  uint64_t *zz = tmp + 20U;
  uint64_t *cross_sum = tmp + 25U;
  uint64_t *cross_diff = tmp + 30U;
  uint64_t *cross_diff_sq = tmp + 35U;
  uint64_t *p_x = p;
  uint64_t *p_z = p + 5U;
  uint64_t *pq_x = pq;
  uint64_t *pq_z = pq + 5U;

  /* Sum/difference of p's coordinates; x is saved before being overwritten. */
  memcpy(saved_x, p_x, 5U * sizeof p_x[0U]);
  Hacl_Bignum_fsum(p_x, p_z);
  Hacl_Bignum_fdifference(p_z, saved_x);

  /* Same treatment for pq. */
  memcpy(saved, pq_x, 5U * sizeof pq_x[0U]);
  Hacl_Bignum_fsum(pq_x, pq_z);
  Hacl_Bignum_fdifference(pq_z, saved);

  /* Cross products, then their sum and difference (slot 5 is reused). */
  Hacl_Bignum_fmul(cross_sum, pq_x, p_z);
  Hacl_Bignum_fmul(cross_diff, p_x, pq_z);
  memcpy(saved, cross_sum, 5U * sizeof cross_sum[0U]);
  Hacl_Bignum_fsum(cross_sum, cross_diff);
  Hacl_Bignum_fdifference(cross_diff, saved);

  /* ppq: x3 is a square, z3 is a square times qx. */
  Hacl_Bignum_Fsquare_fsquare_times(ppq, cross_sum, 1U);
  Hacl_Bignum_Fsquare_fsquare_times(cross_diff_sq, cross_diff, 1U);
  Hacl_Bignum_fmul(ppq + 5U, cross_diff_sq, qmqp);

  /* pp: built from the squares of p's sum and difference. */
  Hacl_Bignum_Fsquare_fsquare_times(xx, p_x, 1U);
  Hacl_Bignum_Fsquare_fsquare_times(zz, p_z, 1U);
  Hacl_Bignum_fmul(pp, xx, zz);
  Hacl_Bignum_fdifference(zz, xx);
  Hacl_Bignum_fscalar(zzz, zz, (uint64_t)121665U);
  Hacl_Bignum_fsum(zzz, xx);
  Hacl_Bignum_fmul(pp + 5U, zzz, zz);
}
635*62c56f98SSadaf Ebrahimi 
/*
 * Process the most significant bit of `byt`: conditionally swap (nq, nqpq)
 * on that bit, run one fmonty step writing into (nq2, nqpq2), then apply
 * the same conditional swap to the outputs.
 */
static void
Hacl_EC_Ladder_SmallLoop_cmult_small_loop_step(
  uint64_t *nq,
  uint64_t *nqpq,
  uint64_t *nq2,
  uint64_t *nqpq2,
  uint64_t *q,
  uint8_t byt
)
{
  /* `byt` is not modified in between, so both swaps see the same bit. */
  uint64_t top_bit = (uint64_t)(byt >> 7U);
  Hacl_EC_Point_swap_conditional(nq, nqpq, top_bit);
  Hacl_EC_AddAndDouble_fmonty(nq2, nqpq2, nq, nqpq, q);
  Hacl_EC_Point_swap_conditional(nq2, nqpq2, top_bit);
}
653*62c56f98SSadaf Ebrahimi 
/*
 * Process the top two bits of `byt`. The first step writes into
 * (nq2, nqpq2); the second uses those as inputs and writes back into
 * (nq, nqpq), so the running state ends up in (nq, nqpq) again.
 */
static void
Hacl_EC_Ladder_SmallLoop_cmult_small_loop_double_step(
  uint64_t *nq,
  uint64_t *nqpq,
  uint64_t *nq2,
  uint64_t *nqpq2,
  uint64_t *q,
  uint8_t byt
)
{
  Hacl_EC_Ladder_SmallLoop_cmult_small_loop_step(nq, nqpq, nq2, nqpq2, q, byt);
  /* Shift left so the next bit becomes the top bit; truncate to 8 bits. */
  Hacl_EC_Ladder_SmallLoop_cmult_small_loop_step(nq2,
    nqpq2,
    nq,
    nqpq,
    q,
    (uint8_t)(byt << 1U));
}
669*62c56f98SSadaf Ebrahimi 
/*
 * Run `i` double steps over `byt`, consuming two bits (most significant
 * first) per iteration. Does nothing when `i` is zero.
 */
static void
Hacl_EC_Ladder_SmallLoop_cmult_small_loop(
  uint64_t *nq,
  uint64_t *nqpq,
  uint64_t *nq2,
  uint64_t *nqpq2,
  uint64_t *q,
  uint8_t byt,
  uint32_t i
)
{
  uint8_t window = byt;
  uint32_t remaining;
  for (remaining = i; remaining != 0U; remaining--)
  {
    Hacl_EC_Ladder_SmallLoop_cmult_small_loop_double_step(nq, nqpq, nq2, nqpq2, q, window);
    /* Drop the two bits just consumed. */
    window = (uint8_t)(window << 2U);
  }
}
690*62c56f98SSadaf Ebrahimi 
/*
 * Walk the scalar bytes n1[i-1] down to n1[0], feeding each byte to the
 * small loop with four double steps (eight bits). Does nothing when `i`
 * is zero.
 */
static void
Hacl_EC_Ladder_BigLoop_cmult_big_loop(
  uint8_t *n1,
  uint64_t *nq,
  uint64_t *nqpq,
  uint64_t *nq2,
  uint64_t *nqpq2,
  uint64_t *q,
  uint32_t i
)
{
  uint32_t idx = i;
  while (idx != 0U)
  {
    idx--;
    Hacl_EC_Ladder_SmallLoop_cmult_small_loop(nq, nqpq, nq2, nqpq2, q, n1[idx], 4U);
  }
}
710*62c56f98SSadaf Ebrahimi 
/*
 * Ladder driver: processes the 32 bytes of scalar `n1` against point `q`
 * and copies the final accumulator into `result`.
 *
 * The 40-limb work area holds four 10-limb points: the accumulator
 * (limb 0 set to 1, the rest zero), a copy of q, and two scratch points
 * used as the outputs of each ladder step.
 */
static void Hacl_EC_Ladder_cmult(uint64_t *result, uint8_t *n1, uint64_t *q)
{
  uint64_t work[40U] = { 0U };
  uint64_t *acc = work;
  uint64_t *acc_q = work + 10U;
  uint64_t *next = work + 20U;
  uint64_t *next_q = work + 30U;
  Hacl_EC_Point_copy(acc_q, q);
  acc[0U] = (uint64_t)1U;
  Hacl_EC_Ladder_BigLoop_cmult_big_loop(n1, acc, acc_q, next, next_q, q, 32U);
  Hacl_EC_Point_copy(result, acc);
}
723*62c56f98SSadaf Ebrahimi 
/*
 * Scalar multiplication entry point.
 *
 *   mypublic   receives the 32-byte encoded result.
 *   secret     32-byte scalar; it is copied and the copy is clamped, the
 *              caller's buffer is left untouched.
 *   basepoint  encoded input u-coordinate, expanded with fexpand.
 *
 * NOTE(review): the clamped copy of the secret lives on the stack and is
 * not wiped before returning - confirm whether callers require that.
 */
void Hacl_Curve25519_crypto_scalarmult(uint8_t *mypublic, uint8_t *secret, uint8_t *basepoint)
{
  uint64_t base[10U] = { 0U };
  uint8_t clamped[32U] = { 0U };
  uint64_t out[15U] = { 0U };

  /* Input point: x from the encoded basepoint, z = 1. */
  Hacl_EC_Format_fexpand(base, basepoint);
  base[5U] = (uint64_t)1U;

  /*
   * Clamp a private copy of the scalar: clear the low three bits of byte 0,
   * clear the top bit of byte 31 and set its bit 6.
   */
  memcpy(clamped, secret, 32U * sizeof secret[0U]);
  clamped[0U] &= (uint8_t)248U;
  clamped[31U] &= (uint8_t)127U;
  clamped[31U] |= (uint8_t)64U;

  out[0U] = (uint64_t)1U;
  Hacl_EC_Ladder_cmult(out, clamped, base);
  Hacl_EC_Format_scalar_of_point(mypublic, out);
}
760*62c56f98SSadaf Ebrahimi 
761