/* Copyright (c) 2014, Google Inc.
 *
 * Permission to use, copy, modify, and/or distribute this software for any
 * purpose with or without fee is hereby granted, provided that the above
 * copyright notice and this permission notice appear in all copies.
 *
 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
 * SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
 * OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
 * CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */
14*8fb009dcSAndroid Build Coastguard Worker
// Adapted from the public-domain eSTREAM code by D. Bernstein.
16*8fb009dcSAndroid Build Coastguard Worker
17*8fb009dcSAndroid Build Coastguard Worker #include <openssl/chacha.h>
18*8fb009dcSAndroid Build Coastguard Worker
19*8fb009dcSAndroid Build Coastguard Worker #include <assert.h>
20*8fb009dcSAndroid Build Coastguard Worker #include <string.h>
21*8fb009dcSAndroid Build Coastguard Worker
22*8fb009dcSAndroid Build Coastguard Worker #include "../internal.h"
23*8fb009dcSAndroid Build Coastguard Worker #include "internal.h"
24*8fb009dcSAndroid Build Coastguard Worker
25*8fb009dcSAndroid Build Coastguard Worker
// sigma holds the ChaCha constants as sixteen raw bytes, laid out below one
// 32-bit state word per row. Read as ASCII they spell "expand 32-byte k".
static const uint8_t sigma[16] = {
    'e', 'x', 'p', 'a',  // state word 0
    'n', 'd', ' ', '3',  // state word 1
    '2', '-', 'b', 'y',  // state word 2
    't', 'e', ' ', 'k',  // state word 3
};
29*8fb009dcSAndroid Build Coastguard Worker
// QUARTERROUND applies one ChaCha "quarter" round in place to the four words
// x[a], x[b], x[c] and x[d] of an array |x| of uint32_t that must be in scope
// at the point of use. Additions wrap modulo 2^32.
//
// The expansion is a single brace-enclosed compound statement, so the whole
// quarter round is controlled as one unit when the macro is the body of an
// unbraced |if| or loop. The do { ... } while (0) idiom is deliberately not
// used: call sites invoke the macro without a trailing semicolon, which a
// braced block permits (and a trailing semicolon, if present, is harmless).
#define QUARTERROUND(a, b, c, d)             \
  {                                          \
    x[a] += x[b];                            \
    x[d] = CRYPTO_rotl_u32(x[d] ^ x[a], 16); \
    x[c] += x[d];                            \
    x[b] = CRYPTO_rotl_u32(x[b] ^ x[c], 12); \
    x[a] += x[b];                            \
    x[d] = CRYPTO_rotl_u32(x[d] ^ x[a], 8);  \
    x[c] += x[d];                            \
    x[b] = CRYPTO_rotl_u32(x[b] ^ x[c], 7);  \
  }
40*8fb009dcSAndroid Build Coastguard Worker
CRYPTO_hchacha20(uint8_t out[32],const uint8_t key[32],const uint8_t nonce[16])41*8fb009dcSAndroid Build Coastguard Worker void CRYPTO_hchacha20(uint8_t out[32], const uint8_t key[32],
42*8fb009dcSAndroid Build Coastguard Worker const uint8_t nonce[16]) {
43*8fb009dcSAndroid Build Coastguard Worker uint32_t x[16];
44*8fb009dcSAndroid Build Coastguard Worker OPENSSL_memcpy(x, sigma, sizeof(sigma));
45*8fb009dcSAndroid Build Coastguard Worker OPENSSL_memcpy(&x[4], key, 32);
46*8fb009dcSAndroid Build Coastguard Worker OPENSSL_memcpy(&x[12], nonce, 16);
47*8fb009dcSAndroid Build Coastguard Worker
48*8fb009dcSAndroid Build Coastguard Worker for (size_t i = 0; i < 20; i += 2) {
49*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(0, 4, 8, 12)
50*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(1, 5, 9, 13)
51*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(2, 6, 10, 14)
52*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(3, 7, 11, 15)
53*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(0, 5, 10, 15)
54*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(1, 6, 11, 12)
55*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(2, 7, 8, 13)
56*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(3, 4, 9, 14)
57*8fb009dcSAndroid Build Coastguard Worker }
58*8fb009dcSAndroid Build Coastguard Worker
59*8fb009dcSAndroid Build Coastguard Worker OPENSSL_memcpy(out, &x[0], sizeof(uint32_t) * 4);
60*8fb009dcSAndroid Build Coastguard Worker OPENSSL_memcpy(&out[16], &x[12], sizeof(uint32_t) * 4);
61*8fb009dcSAndroid Build Coastguard Worker }
62*8fb009dcSAndroid Build Coastguard Worker
63*8fb009dcSAndroid Build Coastguard Worker #if defined(CHACHA20_ASM_NOHW)
// ChaCha20_ctr32 forwards its arguments unchanged to the first compiled-in
// assembly backend whose *_capable() check accepts |in_len|. Backends are
// tried in the order NEON, AVX2, SSSE3 4x, SSSE3. If none takes the call, the
// work goes to ChaCha20_ctr32_nohw, which is only invoked for a non-zero
// |in_len|.
static void ChaCha20_ctr32(uint8_t *out, const uint8_t *in, size_t in_len,
                           const uint32_t key[8], const uint32_t counter[4]) {
#if defined(CHACHA20_ASM_NEON)
  if (ChaCha20_ctr32_neon_capable(in_len)) {
    ChaCha20_ctr32_neon(out, in, in_len, key, counter);
    return;
  }
#endif

#if defined(CHACHA20_ASM_AVX2)
  if (ChaCha20_ctr32_avx2_capable(in_len)) {
    ChaCha20_ctr32_avx2(out, in, in_len, key, counter);
    return;
  }
#endif

#if defined(CHACHA20_ASM_SSSE3_4X)
  if (ChaCha20_ctr32_ssse3_4x_capable(in_len)) {
    ChaCha20_ctr32_ssse3_4x(out, in, in_len, key, counter);
    return;
  }
#endif

#if defined(CHACHA20_ASM_SSSE3)
  if (ChaCha20_ctr32_ssse3_capable(in_len)) {
    ChaCha20_ctr32_ssse3(out, in, in_len, key, counter);
    return;
  }
#endif

  // No specialised backend took the call. The fallback is never handed an
  // empty input.
  if (in_len == 0) {
    return;
  }
  ChaCha20_ctr32_nohw(out, in, in_len, key, counter);
}
94*8fb009dcSAndroid Build Coastguard Worker #endif
95*8fb009dcSAndroid Build Coastguard Worker
96*8fb009dcSAndroid Build Coastguard Worker #if defined(CHACHA20_ASM_NOHW)
97*8fb009dcSAndroid Build Coastguard Worker
// CRYPTO_chacha_20 (assembly-backed build) processes |in_len| bytes from |in|
// into |out| by calling ChaCha20_ctr32 with the 32-byte |key| and a four-word
// block made of |counter| followed by the 12-byte |nonce| read as three
// little-endian words. |in| and |out| must either be the same pointer or not
// overlap at all; this is only checked by an assert.
void CRYPTO_chacha_20(uint8_t *out, const uint8_t *in, size_t in_len,
                      const uint8_t key[32], const uint8_t nonce[12],
                      uint32_t counter) {
  assert(!buffers_alias(out, in_len, in, in_len) || in == out);

  uint32_t ctr_block[4];
  ctr_block[0] = counter;
  for (size_t w = 0; w < 3; w++) {
    ctr_block[1 + w] = CRYPTO_load_u32_le(nonce + 4 * w);
  }

  const uint32_t *key_words = (const uint32_t *)key;
#if !defined(OPENSSL_X86) && !defined(OPENSSL_X86_64)
  // The assembly wants a four-byte-aligned key, so a misaligned key is copied
  // into an aligned local array first.
  uint32_t aligned_key[8];
  if (((uintptr_t)key) % 4 != 0) {
    for (size_t w = 0; w < 8; w++) {
      aligned_key[w] = CRYPTO_load_u32_le(key + 4 * w);
    }
    key_words = aligned_key;
  }
#endif

  while (in_len > 0) {
    // The assembly has no defined behavior when the 32-bit block counter
    // overflows. Overflow is almost always a caller bug, but to behave the
    // same on every platform each call is limited to the bytes that fit
    // before the counter would wrap.
    const uint64_t blocks_before_wrap = (UINT64_C(1) << 32) - ctr_block[0];
    uint64_t span = 64 * blocks_before_wrap;
    if (span > in_len) {
      span = in_len;
    }

    ChaCha20_ctr32(out, in, (size_t)span, key_words, ctr_block);
    in += span;
    out += span;
    in_len -= span;

    // Either everything has been consumed and the loop exits, or this call
    // stopped exactly at the wrap point and the counter restarts from zero.
    ctr_block[0] = 0;
  }
}
147*8fb009dcSAndroid Build Coastguard Worker
148*8fb009dcSAndroid Build Coastguard Worker #else
149*8fb009dcSAndroid Build Coastguard Worker
150*8fb009dcSAndroid Build Coastguard Worker // chacha_core performs 20 rounds of ChaCha on the input words in
151*8fb009dcSAndroid Build Coastguard Worker // |input| and writes the 64 output bytes to |output|.
chacha_core(uint8_t output[64],const uint32_t input[16])152*8fb009dcSAndroid Build Coastguard Worker static void chacha_core(uint8_t output[64], const uint32_t input[16]) {
153*8fb009dcSAndroid Build Coastguard Worker uint32_t x[16];
154*8fb009dcSAndroid Build Coastguard Worker int i;
155*8fb009dcSAndroid Build Coastguard Worker
156*8fb009dcSAndroid Build Coastguard Worker OPENSSL_memcpy(x, input, sizeof(uint32_t) * 16);
157*8fb009dcSAndroid Build Coastguard Worker for (i = 20; i > 0; i -= 2) {
158*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(0, 4, 8, 12)
159*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(1, 5, 9, 13)
160*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(2, 6, 10, 14)
161*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(3, 7, 11, 15)
162*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(0, 5, 10, 15)
163*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(1, 6, 11, 12)
164*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(2, 7, 8, 13)
165*8fb009dcSAndroid Build Coastguard Worker QUARTERROUND(3, 4, 9, 14)
166*8fb009dcSAndroid Build Coastguard Worker }
167*8fb009dcSAndroid Build Coastguard Worker
168*8fb009dcSAndroid Build Coastguard Worker for (i = 0; i < 16; ++i) {
169*8fb009dcSAndroid Build Coastguard Worker x[i] += input[i];
170*8fb009dcSAndroid Build Coastguard Worker }
171*8fb009dcSAndroid Build Coastguard Worker for (i = 0; i < 16; ++i) {
172*8fb009dcSAndroid Build Coastguard Worker CRYPTO_store_u32_le(output + 4 * i, x[i]);
173*8fb009dcSAndroid Build Coastguard Worker }
174*8fb009dcSAndroid Build Coastguard Worker }
175*8fb009dcSAndroid Build Coastguard Worker
CRYPTO_chacha_20(uint8_t * out,const uint8_t * in,size_t in_len,const uint8_t key[32],const uint8_t nonce[12],uint32_t counter)176*8fb009dcSAndroid Build Coastguard Worker void CRYPTO_chacha_20(uint8_t *out, const uint8_t *in, size_t in_len,
177*8fb009dcSAndroid Build Coastguard Worker const uint8_t key[32], const uint8_t nonce[12],
178*8fb009dcSAndroid Build Coastguard Worker uint32_t counter) {
179*8fb009dcSAndroid Build Coastguard Worker assert(!buffers_alias(out, in_len, in, in_len) || in == out);
180*8fb009dcSAndroid Build Coastguard Worker
181*8fb009dcSAndroid Build Coastguard Worker uint32_t input[16];
182*8fb009dcSAndroid Build Coastguard Worker uint8_t buf[64];
183*8fb009dcSAndroid Build Coastguard Worker size_t todo, i;
184*8fb009dcSAndroid Build Coastguard Worker
185*8fb009dcSAndroid Build Coastguard Worker input[0] = CRYPTO_load_u32_le(sigma + 0);
186*8fb009dcSAndroid Build Coastguard Worker input[1] = CRYPTO_load_u32_le(sigma + 4);
187*8fb009dcSAndroid Build Coastguard Worker input[2] = CRYPTO_load_u32_le(sigma + 8);
188*8fb009dcSAndroid Build Coastguard Worker input[3] = CRYPTO_load_u32_le(sigma + 12);
189*8fb009dcSAndroid Build Coastguard Worker
190*8fb009dcSAndroid Build Coastguard Worker input[4] = CRYPTO_load_u32_le(key + 0);
191*8fb009dcSAndroid Build Coastguard Worker input[5] = CRYPTO_load_u32_le(key + 4);
192*8fb009dcSAndroid Build Coastguard Worker input[6] = CRYPTO_load_u32_le(key + 8);
193*8fb009dcSAndroid Build Coastguard Worker input[7] = CRYPTO_load_u32_le(key + 12);
194*8fb009dcSAndroid Build Coastguard Worker
195*8fb009dcSAndroid Build Coastguard Worker input[8] = CRYPTO_load_u32_le(key + 16);
196*8fb009dcSAndroid Build Coastguard Worker input[9] = CRYPTO_load_u32_le(key + 20);
197*8fb009dcSAndroid Build Coastguard Worker input[10] = CRYPTO_load_u32_le(key + 24);
198*8fb009dcSAndroid Build Coastguard Worker input[11] = CRYPTO_load_u32_le(key + 28);
199*8fb009dcSAndroid Build Coastguard Worker
200*8fb009dcSAndroid Build Coastguard Worker input[12] = counter;
201*8fb009dcSAndroid Build Coastguard Worker input[13] = CRYPTO_load_u32_le(nonce + 0);
202*8fb009dcSAndroid Build Coastguard Worker input[14] = CRYPTO_load_u32_le(nonce + 4);
203*8fb009dcSAndroid Build Coastguard Worker input[15] = CRYPTO_load_u32_le(nonce + 8);
204*8fb009dcSAndroid Build Coastguard Worker
205*8fb009dcSAndroid Build Coastguard Worker while (in_len > 0) {
206*8fb009dcSAndroid Build Coastguard Worker todo = sizeof(buf);
207*8fb009dcSAndroid Build Coastguard Worker if (in_len < todo) {
208*8fb009dcSAndroid Build Coastguard Worker todo = in_len;
209*8fb009dcSAndroid Build Coastguard Worker }
210*8fb009dcSAndroid Build Coastguard Worker
211*8fb009dcSAndroid Build Coastguard Worker chacha_core(buf, input);
212*8fb009dcSAndroid Build Coastguard Worker for (i = 0; i < todo; i++) {
213*8fb009dcSAndroid Build Coastguard Worker out[i] = in[i] ^ buf[i];
214*8fb009dcSAndroid Build Coastguard Worker }
215*8fb009dcSAndroid Build Coastguard Worker
216*8fb009dcSAndroid Build Coastguard Worker out += todo;
217*8fb009dcSAndroid Build Coastguard Worker in += todo;
218*8fb009dcSAndroid Build Coastguard Worker in_len -= todo;
219*8fb009dcSAndroid Build Coastguard Worker
220*8fb009dcSAndroid Build Coastguard Worker input[12]++;
221*8fb009dcSAndroid Build Coastguard Worker }
222*8fb009dcSAndroid Build Coastguard Worker }
223*8fb009dcSAndroid Build Coastguard Worker
224*8fb009dcSAndroid Build Coastguard Worker #endif
225