1*f6dc9357SAndroid Build Coastguard Worker /* Aes.c -- AES encryption / decryption
2*f6dc9357SAndroid Build Coastguard Worker 2024-03-01 : Igor Pavlov : Public domain */
3*f6dc9357SAndroid Build Coastguard Worker
4*f6dc9357SAndroid Build Coastguard Worker #include "Precomp.h"
5*f6dc9357SAndroid Build Coastguard Worker
6*f6dc9357SAndroid Build Coastguard Worker #include "CpuArch.h"
7*f6dc9357SAndroid Build Coastguard Worker #include "Aes.h"
8*f6dc9357SAndroid Build Coastguard Worker
9*f6dc9357SAndroid Build Coastguard Worker AES_CODE_FUNC g_AesCbc_Decode;
10*f6dc9357SAndroid Build Coastguard Worker #ifndef Z7_SFX
11*f6dc9357SAndroid Build Coastguard Worker AES_CODE_FUNC g_AesCbc_Encode;
12*f6dc9357SAndroid Build Coastguard Worker AES_CODE_FUNC g_AesCtr_Code;
13*f6dc9357SAndroid Build Coastguard Worker UInt32 g_Aes_SupportedFunctions_Flags;
14*f6dc9357SAndroid Build Coastguard Worker #endif
15*f6dc9357SAndroid Build Coastguard Worker
16*f6dc9357SAndroid Build Coastguard Worker MY_ALIGN(64)
17*f6dc9357SAndroid Build Coastguard Worker static UInt32 T[256 * 4];
18*f6dc9357SAndroid Build Coastguard Worker MY_ALIGN(64)
19*f6dc9357SAndroid Build Coastguard Worker static const Byte Sbox[256] = {
20*f6dc9357SAndroid Build Coastguard Worker 0x63, 0x7c, 0x77, 0x7b, 0xf2, 0x6b, 0x6f, 0xc5, 0x30, 0x01, 0x67, 0x2b, 0xfe, 0xd7, 0xab, 0x76,
21*f6dc9357SAndroid Build Coastguard Worker 0xca, 0x82, 0xc9, 0x7d, 0xfa, 0x59, 0x47, 0xf0, 0xad, 0xd4, 0xa2, 0xaf, 0x9c, 0xa4, 0x72, 0xc0,
22*f6dc9357SAndroid Build Coastguard Worker 0xb7, 0xfd, 0x93, 0x26, 0x36, 0x3f, 0xf7, 0xcc, 0x34, 0xa5, 0xe5, 0xf1, 0x71, 0xd8, 0x31, 0x15,
23*f6dc9357SAndroid Build Coastguard Worker 0x04, 0xc7, 0x23, 0xc3, 0x18, 0x96, 0x05, 0x9a, 0x07, 0x12, 0x80, 0xe2, 0xeb, 0x27, 0xb2, 0x75,
24*f6dc9357SAndroid Build Coastguard Worker 0x09, 0x83, 0x2c, 0x1a, 0x1b, 0x6e, 0x5a, 0xa0, 0x52, 0x3b, 0xd6, 0xb3, 0x29, 0xe3, 0x2f, 0x84,
25*f6dc9357SAndroid Build Coastguard Worker 0x53, 0xd1, 0x00, 0xed, 0x20, 0xfc, 0xb1, 0x5b, 0x6a, 0xcb, 0xbe, 0x39, 0x4a, 0x4c, 0x58, 0xcf,
26*f6dc9357SAndroid Build Coastguard Worker 0xd0, 0xef, 0xaa, 0xfb, 0x43, 0x4d, 0x33, 0x85, 0x45, 0xf9, 0x02, 0x7f, 0x50, 0x3c, 0x9f, 0xa8,
27*f6dc9357SAndroid Build Coastguard Worker 0x51, 0xa3, 0x40, 0x8f, 0x92, 0x9d, 0x38, 0xf5, 0xbc, 0xb6, 0xda, 0x21, 0x10, 0xff, 0xf3, 0xd2,
28*f6dc9357SAndroid Build Coastguard Worker 0xcd, 0x0c, 0x13, 0xec, 0x5f, 0x97, 0x44, 0x17, 0xc4, 0xa7, 0x7e, 0x3d, 0x64, 0x5d, 0x19, 0x73,
29*f6dc9357SAndroid Build Coastguard Worker 0x60, 0x81, 0x4f, 0xdc, 0x22, 0x2a, 0x90, 0x88, 0x46, 0xee, 0xb8, 0x14, 0xde, 0x5e, 0x0b, 0xdb,
30*f6dc9357SAndroid Build Coastguard Worker 0xe0, 0x32, 0x3a, 0x0a, 0x49, 0x06, 0x24, 0x5c, 0xc2, 0xd3, 0xac, 0x62, 0x91, 0x95, 0xe4, 0x79,
31*f6dc9357SAndroid Build Coastguard Worker 0xe7, 0xc8, 0x37, 0x6d, 0x8d, 0xd5, 0x4e, 0xa9, 0x6c, 0x56, 0xf4, 0xea, 0x65, 0x7a, 0xae, 0x08,
32*f6dc9357SAndroid Build Coastguard Worker 0xba, 0x78, 0x25, 0x2e, 0x1c, 0xa6, 0xb4, 0xc6, 0xe8, 0xdd, 0x74, 0x1f, 0x4b, 0xbd, 0x8b, 0x8a,
33*f6dc9357SAndroid Build Coastguard Worker 0x70, 0x3e, 0xb5, 0x66, 0x48, 0x03, 0xf6, 0x0e, 0x61, 0x35, 0x57, 0xb9, 0x86, 0xc1, 0x1d, 0x9e,
34*f6dc9357SAndroid Build Coastguard Worker 0xe1, 0xf8, 0x98, 0x11, 0x69, 0xd9, 0x8e, 0x94, 0x9b, 0x1e, 0x87, 0xe9, 0xce, 0x55, 0x28, 0xdf,
35*f6dc9357SAndroid Build Coastguard Worker 0x8c, 0xa1, 0x89, 0x0d, 0xbf, 0xe6, 0x42, 0x68, 0x41, 0x99, 0x2d, 0x0f, 0xb0, 0x54, 0xbb, 0x16};
36*f6dc9357SAndroid Build Coastguard Worker
37*f6dc9357SAndroid Build Coastguard Worker
38*f6dc9357SAndroid Build Coastguard Worker MY_ALIGN(64)
39*f6dc9357SAndroid Build Coastguard Worker static UInt32 D[256 * 4];
40*f6dc9357SAndroid Build Coastguard Worker MY_ALIGN(64)
41*f6dc9357SAndroid Build Coastguard Worker static Byte InvS[256];
42*f6dc9357SAndroid Build Coastguard Worker
/* xtime(x): double a byte value in GF(2^8); when bit 7 is set the result is
   reduced with the constant 0x1B. The result is masked to 8 bits. */
#define xtime(x) ((((x) << 1) ^ (((x) & 0x80) != 0 ? 0x1B : 0)) & 0xFF)

/* Ui32(a0, a1, a2, a3): pack four byte values into a UInt32,
   a0 in the least significant byte and a3 in the most significant one. */
#define Ui32(a0, a1, a2, a3) ((UInt32)(a0) | ((UInt32)(a1) << 8) | ((UInt32)(a2) << 16) | ((UInt32)(a3) << 24))

/* gbN(x): byte N of a word, byte 0 being the least significant.
   gb3 applies no mask, so it relies on x having no bits above bit 31. */
#define gb0(x) ( (x)          & 0xFF)
#define gb1(x) (((x) >> ( 8)) & 0xFF)
#define gb2(x) (((x) >> (16)) & 0xFF)
#define gb3(x) (((x) >> (24)))

/* gb(n, x): selects gbN by token pasting, so n must be a literal digit 0..3. */
#define gb(n, x) gb ## n(x)

/* TT(x) / DD(x): pointer to the x-th 256-entry sub-table of T / D.
   The argument is parenthesised so that any expression may be passed. */
#define TT(x) (T + ((x) << 8))
#define DD(x) (D + ((x) << 8))
56*f6dc9357SAndroid Build Coastguard Worker
57*f6dc9357SAndroid Build Coastguard Worker
58*f6dc9357SAndroid Build Coastguard Worker // #define Z7_SHOW_AES_STATUS
59*f6dc9357SAndroid Build Coastguard Worker
/*
  Compile-time selection of the hardware code paths:
    USE_HW_AES  - AesGenTables() may reference the *_HW functions.
    USE_HW_VAES - AesGenTables() may additionally reference the *_HW_256
                  functions (only consulted for x86 / x64 builds).
*/
#if defined(MY_CPU_X86_OR_AMD64)

  #if defined(__INTEL_COMPILER)
    #if (__INTEL_COMPILER >= 1110)
      #define USE_HW_AES
      #if (__INTEL_COMPILER >= 1900)
        #define USE_HW_VAES
      #endif
    #endif
  #elif (defined(Z7_CLANG_VERSION) && (Z7_CLANG_VERSION >= 30800)) \
     || (defined(Z7_GCC_VERSION)   && (Z7_GCC_VERSION   >= 40400))
    #define USE_HW_AES
    #if (defined(__clang__) && (__clang_major__ >= 8)) \
     || (defined(__GNUC__)  && (__GNUC__ >= 8))
      #define USE_HW_VAES
    #endif
  #elif defined(_MSC_VER)
    #define USE_HW_AES
    #define USE_HW_VAES
  #endif

#elif defined(MY_CPU_ARM_OR_ARM64) && defined(MY_CPU_LE)

  #if defined(__ARM_FEATURE_AES) || defined(__ARM_FEATURE_CRYPTO)
    /* the compiler already targets the AES extension */
    #define USE_HW_AES
  #else
    /* otherwise three nested gates must all pass:
       architecture, compiler version, then a clang-specific filter */
    #if defined(MY_CPU_ARM64) \
     || (defined(__ARM_ARCH) && (__ARM_ARCH >= 4)) \
     || defined(Z7_MSC_VER_ORIGINAL)
      #if (defined(__ARM_FP) && \
            (   (defined(Z7_CLANG_VERSION) && (Z7_CLANG_VERSION >= 30800)) \
             || (defined(__GNUC__) && (__GNUC__ >= 6)) \
            )) \
       || (defined(Z7_MSC_VER_ORIGINAL) && (_MSC_VER >= 1910))
        /* non-ARM64 clang needs __ARM_NEON, and Z7_CLANG_VERSION values
           170000 and 170001 are excluded */
        #if defined(MY_CPU_ARM64) \
         || !defined(Z7_CLANG_VERSION) \
         || (defined(__ARM_NEON) && \
              (Z7_CLANG_VERSION < 170000 || \
               Z7_CLANG_VERSION > 170001))
          #define USE_HW_AES
        #endif
      #endif
    #endif
  #endif

#endif

/* PRF(x): diagnostic statement wrapper used on the hardware paths;
   expands to x only when Z7_SHOW_AES_STATUS is defined, otherwise to nothing. */
#if defined(USE_HW_AES)
  // #pragma message("=== Aes.c USE_HW_AES === ")
  #if defined(Z7_SHOW_AES_STATUS)
    #include <stdio.h>
    #define PRF(x) x
  #else
    #define PRF(x)
  #endif
#endif
116*f6dc9357SAndroid Build Coastguard Worker
117*f6dc9357SAndroid Build Coastguard Worker
AesGenTables(void)118*f6dc9357SAndroid Build Coastguard Worker void AesGenTables(void)
119*f6dc9357SAndroid Build Coastguard Worker {
120*f6dc9357SAndroid Build Coastguard Worker unsigned i;
121*f6dc9357SAndroid Build Coastguard Worker for (i = 0; i < 256; i++)
122*f6dc9357SAndroid Build Coastguard Worker InvS[Sbox[i]] = (Byte)i;
123*f6dc9357SAndroid Build Coastguard Worker
124*f6dc9357SAndroid Build Coastguard Worker for (i = 0; i < 256; i++)
125*f6dc9357SAndroid Build Coastguard Worker {
126*f6dc9357SAndroid Build Coastguard Worker {
127*f6dc9357SAndroid Build Coastguard Worker const UInt32 a1 = Sbox[i];
128*f6dc9357SAndroid Build Coastguard Worker const UInt32 a2 = xtime(a1);
129*f6dc9357SAndroid Build Coastguard Worker const UInt32 a3 = a2 ^ a1;
130*f6dc9357SAndroid Build Coastguard Worker TT(0)[i] = Ui32(a2, a1, a1, a3);
131*f6dc9357SAndroid Build Coastguard Worker TT(1)[i] = Ui32(a3, a2, a1, a1);
132*f6dc9357SAndroid Build Coastguard Worker TT(2)[i] = Ui32(a1, a3, a2, a1);
133*f6dc9357SAndroid Build Coastguard Worker TT(3)[i] = Ui32(a1, a1, a3, a2);
134*f6dc9357SAndroid Build Coastguard Worker }
135*f6dc9357SAndroid Build Coastguard Worker {
136*f6dc9357SAndroid Build Coastguard Worker const UInt32 a1 = InvS[i];
137*f6dc9357SAndroid Build Coastguard Worker const UInt32 a2 = xtime(a1);
138*f6dc9357SAndroid Build Coastguard Worker const UInt32 a4 = xtime(a2);
139*f6dc9357SAndroid Build Coastguard Worker const UInt32 a8 = xtime(a4);
140*f6dc9357SAndroid Build Coastguard Worker const UInt32 a9 = a8 ^ a1;
141*f6dc9357SAndroid Build Coastguard Worker const UInt32 aB = a8 ^ a2 ^ a1;
142*f6dc9357SAndroid Build Coastguard Worker const UInt32 aD = a8 ^ a4 ^ a1;
143*f6dc9357SAndroid Build Coastguard Worker const UInt32 aE = a8 ^ a4 ^ a2;
144*f6dc9357SAndroid Build Coastguard Worker DD(0)[i] = Ui32(aE, a9, aD, aB);
145*f6dc9357SAndroid Build Coastguard Worker DD(1)[i] = Ui32(aB, aE, a9, aD);
146*f6dc9357SAndroid Build Coastguard Worker DD(2)[i] = Ui32(aD, aB, aE, a9);
147*f6dc9357SAndroid Build Coastguard Worker DD(3)[i] = Ui32(a9, aD, aB, aE);
148*f6dc9357SAndroid Build Coastguard Worker }
149*f6dc9357SAndroid Build Coastguard Worker }
150*f6dc9357SAndroid Build Coastguard Worker
151*f6dc9357SAndroid Build Coastguard Worker {
152*f6dc9357SAndroid Build Coastguard Worker AES_CODE_FUNC d = AesCbc_Decode;
153*f6dc9357SAndroid Build Coastguard Worker #ifndef Z7_SFX
154*f6dc9357SAndroid Build Coastguard Worker AES_CODE_FUNC e = AesCbc_Encode;
155*f6dc9357SAndroid Build Coastguard Worker AES_CODE_FUNC c = AesCtr_Code;
156*f6dc9357SAndroid Build Coastguard Worker UInt32 flags = 0;
157*f6dc9357SAndroid Build Coastguard Worker #endif
158*f6dc9357SAndroid Build Coastguard Worker
159*f6dc9357SAndroid Build Coastguard Worker #ifdef USE_HW_AES
160*f6dc9357SAndroid Build Coastguard Worker if (CPU_IsSupported_AES())
161*f6dc9357SAndroid Build Coastguard Worker {
162*f6dc9357SAndroid Build Coastguard Worker // #pragma message ("AES HW")
163*f6dc9357SAndroid Build Coastguard Worker PRF(printf("\n===AES HW\n"));
164*f6dc9357SAndroid Build Coastguard Worker d = AesCbc_Decode_HW;
165*f6dc9357SAndroid Build Coastguard Worker
166*f6dc9357SAndroid Build Coastguard Worker #ifndef Z7_SFX
167*f6dc9357SAndroid Build Coastguard Worker e = AesCbc_Encode_HW;
168*f6dc9357SAndroid Build Coastguard Worker c = AesCtr_Code_HW;
169*f6dc9357SAndroid Build Coastguard Worker flags = k_Aes_SupportedFunctions_HW;
170*f6dc9357SAndroid Build Coastguard Worker #endif
171*f6dc9357SAndroid Build Coastguard Worker
172*f6dc9357SAndroid Build Coastguard Worker #ifdef MY_CPU_X86_OR_AMD64
173*f6dc9357SAndroid Build Coastguard Worker #ifdef USE_HW_VAES
174*f6dc9357SAndroid Build Coastguard Worker if (CPU_IsSupported_VAES_AVX2())
175*f6dc9357SAndroid Build Coastguard Worker {
176*f6dc9357SAndroid Build Coastguard Worker PRF(printf("\n===vaes avx2\n"));
177*f6dc9357SAndroid Build Coastguard Worker d = AesCbc_Decode_HW_256;
178*f6dc9357SAndroid Build Coastguard Worker #ifndef Z7_SFX
179*f6dc9357SAndroid Build Coastguard Worker c = AesCtr_Code_HW_256;
180*f6dc9357SAndroid Build Coastguard Worker flags |= k_Aes_SupportedFunctions_HW_256;
181*f6dc9357SAndroid Build Coastguard Worker #endif
182*f6dc9357SAndroid Build Coastguard Worker }
183*f6dc9357SAndroid Build Coastguard Worker #endif
184*f6dc9357SAndroid Build Coastguard Worker #endif
185*f6dc9357SAndroid Build Coastguard Worker }
186*f6dc9357SAndroid Build Coastguard Worker #endif
187*f6dc9357SAndroid Build Coastguard Worker
188*f6dc9357SAndroid Build Coastguard Worker g_AesCbc_Decode = d;
189*f6dc9357SAndroid Build Coastguard Worker #ifndef Z7_SFX
190*f6dc9357SAndroid Build Coastguard Worker g_AesCbc_Encode = e;
191*f6dc9357SAndroid Build Coastguard Worker g_AesCtr_Code = c;
192*f6dc9357SAndroid Build Coastguard Worker g_Aes_SupportedFunctions_Flags = flags;
193*f6dc9357SAndroid Build Coastguard Worker #endif
194*f6dc9357SAndroid Build Coastguard Worker }
195*f6dc9357SAndroid Build Coastguard Worker }
196*f6dc9357SAndroid Build Coastguard Worker
197*f6dc9357SAndroid Build Coastguard Worker
/*
  Round macros used by Aes_Encode() / Aes_Decode().
  i (output word) and x (byte lane) must be literal digits 0..3, because x is
  token-pasted by gb(). The macros also capture names from the calling scope:
    w    - current round-key pointer   (HT4, HD4, FT4, FD4)
    m    - state array                 (FT, FD)
    dest - output block                (FT4, FD4)
*/

/* HT: one table lookup of an encryption round:
   byte x of state word (i + x) mod 4 indexes sub-table x of T. */
#define HT(i, x, s) TT(x)[gb(x, s[((i) + (x)) & 3])]

/* HT4: output word i of an encryption round; p is the word offset of the
   round key relative to w. Expands to an expression statement WITHOUT a
   trailing ';' - the user supplies it. */
#define HT4(m, i, s, p) m[i] = \
    HT(i, 0, s) ^ \
    HT(i, 1, s) ^ \
    HT(i, 2, s) ^ \
    HT(i, 3, s) ^ w[(p) + (i)]

/* HT16: full encryption round s -> m. Expands to four complete statements,
   so it is invoked without a trailing ';'. */
#define HT16(m, s, p) \
    HT4(m, 0, s, p); \
    HT4(m, 1, s, p); \
    HT4(m, 2, s, p); \
    HT4(m, 3, s, p);

/* FT / FT4: final encryption round (S-box only, no column mixing).
   FT4 is a complete statement including its ';'. */
#define FT(i, x) Sbox[gb(x, m[((i) + (x)) & 3])]
#define FT4(i) dest[i] = Ui32(FT(i, 0), FT(i, 1), FT(i, 2), FT(i, 3)) ^ w[i];


/* HD: one table lookup of a decryption round:
   byte x of state word (i - x) mod 4 indexes sub-table x of D.
   The index is written as (i + 4 - x) so the operand of '&' is never negative. */
#define HD(i, x, s) DD(x)[gb(x, s[((i) + 4 - (x)) & 3])]

/* HD4: output word i of a decryption round. Like HT4 it carries no trailing
   ';', which keeps HD16 free of empty statements. */
#define HD4(m, i, s, p) m[i] = \
    HD(i, 0, s) ^ \
    HD(i, 1, s) ^ \
    HD(i, 2, s) ^ \
    HD(i, 3, s) ^ w[(p) + (i)]

/* HD16: full decryption round s -> m; invoked without a trailing ';'. */
#define HD16(m, s, p) \
    HD4(m, 0, s, p); \
    HD4(m, 1, s, p); \
    HD4(m, 2, s, p); \
    HD4(m, 3, s, p);

/* FD / FD4: final decryption round (inverse S-box only).
   FD4 is a complete statement including its ';'. */
#define FD(i, x) InvS[gb(x, m[((i) + 4 - (x)) & 3])]
#define FD4(i) dest[i] = Ui32(FD(i, 0), FD(i, 1), FD(i, 2), FD(i, 3)) ^ w[i];
232*f6dc9357SAndroid Build Coastguard Worker
Aes_SetKey_Enc(UInt32 * w,const Byte * key,unsigned keySize)233*f6dc9357SAndroid Build Coastguard Worker void Z7_FASTCALL Aes_SetKey_Enc(UInt32 *w, const Byte *key, unsigned keySize)
234*f6dc9357SAndroid Build Coastguard Worker {
235*f6dc9357SAndroid Build Coastguard Worker unsigned i, m;
236*f6dc9357SAndroid Build Coastguard Worker const UInt32 *wLim;
237*f6dc9357SAndroid Build Coastguard Worker UInt32 t;
238*f6dc9357SAndroid Build Coastguard Worker UInt32 rcon = 1;
239*f6dc9357SAndroid Build Coastguard Worker
240*f6dc9357SAndroid Build Coastguard Worker keySize /= 4;
241*f6dc9357SAndroid Build Coastguard Worker w[0] = ((UInt32)keySize / 2) + 3;
242*f6dc9357SAndroid Build Coastguard Worker w += 4;
243*f6dc9357SAndroid Build Coastguard Worker
244*f6dc9357SAndroid Build Coastguard Worker for (i = 0; i < keySize; i++, key += 4)
245*f6dc9357SAndroid Build Coastguard Worker w[i] = GetUi32(key);
246*f6dc9357SAndroid Build Coastguard Worker
247*f6dc9357SAndroid Build Coastguard Worker t = w[(size_t)keySize - 1];
248*f6dc9357SAndroid Build Coastguard Worker wLim = w + (size_t)keySize * 3 + 28;
249*f6dc9357SAndroid Build Coastguard Worker m = 0;
250*f6dc9357SAndroid Build Coastguard Worker do
251*f6dc9357SAndroid Build Coastguard Worker {
252*f6dc9357SAndroid Build Coastguard Worker if (m == 0)
253*f6dc9357SAndroid Build Coastguard Worker {
254*f6dc9357SAndroid Build Coastguard Worker t = Ui32(Sbox[gb1(t)] ^ rcon, Sbox[gb2(t)], Sbox[gb3(t)], Sbox[gb0(t)]);
255*f6dc9357SAndroid Build Coastguard Worker rcon <<= 1;
256*f6dc9357SAndroid Build Coastguard Worker if (rcon & 0x100)
257*f6dc9357SAndroid Build Coastguard Worker rcon = 0x1b;
258*f6dc9357SAndroid Build Coastguard Worker m = keySize;
259*f6dc9357SAndroid Build Coastguard Worker }
260*f6dc9357SAndroid Build Coastguard Worker else if (m == 4 && keySize > 6)
261*f6dc9357SAndroid Build Coastguard Worker t = Ui32(Sbox[gb0(t)], Sbox[gb1(t)], Sbox[gb2(t)], Sbox[gb3(t)]);
262*f6dc9357SAndroid Build Coastguard Worker m--;
263*f6dc9357SAndroid Build Coastguard Worker t ^= w[0];
264*f6dc9357SAndroid Build Coastguard Worker w[keySize] = t;
265*f6dc9357SAndroid Build Coastguard Worker }
266*f6dc9357SAndroid Build Coastguard Worker while (++w != wLim);
267*f6dc9357SAndroid Build Coastguard Worker }
268*f6dc9357SAndroid Build Coastguard Worker
Aes_SetKey_Dec(UInt32 * w,const Byte * key,unsigned keySize)269*f6dc9357SAndroid Build Coastguard Worker void Z7_FASTCALL Aes_SetKey_Dec(UInt32 *w, const Byte *key, unsigned keySize)
270*f6dc9357SAndroid Build Coastguard Worker {
271*f6dc9357SAndroid Build Coastguard Worker unsigned i, num;
272*f6dc9357SAndroid Build Coastguard Worker Aes_SetKey_Enc(w, key, keySize);
273*f6dc9357SAndroid Build Coastguard Worker num = keySize + 20;
274*f6dc9357SAndroid Build Coastguard Worker w += 8;
275*f6dc9357SAndroid Build Coastguard Worker for (i = 0; i < num; i++)
276*f6dc9357SAndroid Build Coastguard Worker {
277*f6dc9357SAndroid Build Coastguard Worker UInt32 r = w[i];
278*f6dc9357SAndroid Build Coastguard Worker w[i] =
279*f6dc9357SAndroid Build Coastguard Worker DD(0)[Sbox[gb0(r)]] ^
280*f6dc9357SAndroid Build Coastguard Worker DD(1)[Sbox[gb1(r)]] ^
281*f6dc9357SAndroid Build Coastguard Worker DD(2)[Sbox[gb2(r)]] ^
282*f6dc9357SAndroid Build Coastguard Worker DD(3)[Sbox[gb3(r)]];
283*f6dc9357SAndroid Build Coastguard Worker }
284*f6dc9357SAndroid Build Coastguard Worker }
285*f6dc9357SAndroid Build Coastguard Worker
286*f6dc9357SAndroid Build Coastguard Worker /* Aes_Encode and Aes_Decode functions work with little-endian words.
287*f6dc9357SAndroid Build Coastguard Worker src and dest are pointers to 4 UInt32 words.
288*f6dc9357SAndroid Build Coastguard Worker src and dest can point to same block */
289*f6dc9357SAndroid Build Coastguard Worker
290*f6dc9357SAndroid Build Coastguard Worker // Z7_FORCE_INLINE
/*
  Aes_Encode: encrypt one block of four UInt32 words.
    w    - key schedule as laid out by Aes_SetKey_Enc(): w[0] is the
           round-pair counter, round keys start at w[4].
    dest - receives the 4 output words; may be the same block as src,
           because src is fully read before dest is written.
    src  - the 4 input words.
  The names m, w and dest must stay as they are: the HT / FT macros refer
  to them directly.
*/
static void Aes_Encode(const UInt32 *w, UInt32 *dest, const UInt32 *src)
{
  UInt32 state[4];
  UInt32 m[4];
  UInt32 pairsLeft = w[0];
  unsigned k;

  /* initial round-key addition */
  w += 4;
  for (k = 0; k < 4; k++)
    state[k] = src[k] ^ w[k];
  w += 4;

  /* table rounds, alternating state -> m and m -> state;
     every pass of the loop body consumes two round keys */
  HT16(m, state, 0)
  while (--pairsLeft != 0)
  {
    HT16(state, m, 4)
    w += 8;
    HT16(m, state, 0)
  }

  /* final round: S-box lookups on m, then the last round key */
  w += 4;
  FT4(0)
  FT4(1)
  FT4(2)
  FT4(3)
}
316*f6dc9357SAndroid Build Coastguard Worker
317*f6dc9357SAndroid Build Coastguard Worker Z7_FORCE_INLINE
Aes_Decode(const UInt32 * w,UInt32 * dest,const UInt32 * src)318*f6dc9357SAndroid Build Coastguard Worker static void Aes_Decode(const UInt32 *w, UInt32 *dest, const UInt32 *src)
319*f6dc9357SAndroid Build Coastguard Worker {
320*f6dc9357SAndroid Build Coastguard Worker UInt32 s[4];
321*f6dc9357SAndroid Build Coastguard Worker UInt32 m[4];
322*f6dc9357SAndroid Build Coastguard Worker UInt32 numRounds2 = w[0];
323*f6dc9357SAndroid Build Coastguard Worker w += 4 + numRounds2 * 8;
324*f6dc9357SAndroid Build Coastguard Worker s[0] = src[0] ^ w[0];
325*f6dc9357SAndroid Build Coastguard Worker s[1] = src[1] ^ w[1];
326*f6dc9357SAndroid Build Coastguard Worker s[2] = src[2] ^ w[2];
327*f6dc9357SAndroid Build Coastguard Worker s[3] = src[3] ^ w[3];
328*f6dc9357SAndroid Build Coastguard Worker for (;;)
329*f6dc9357SAndroid Build Coastguard Worker {
330*f6dc9357SAndroid Build Coastguard Worker w -= 8;
331*f6dc9357SAndroid Build Coastguard Worker HD16(m, s, 4)
332*f6dc9357SAndroid Build Coastguard Worker if (--numRounds2 == 0)
333*f6dc9357SAndroid Build Coastguard Worker break;
334*f6dc9357SAndroid Build Coastguard Worker HD16(s, m, 0)
335*f6dc9357SAndroid Build Coastguard Worker }
336*f6dc9357SAndroid Build Coastguard Worker FD4(0)
337*f6dc9357SAndroid Build Coastguard Worker FD4(1)
338*f6dc9357SAndroid Build Coastguard Worker FD4(2)
339*f6dc9357SAndroid Build Coastguard Worker FD4(3)
340*f6dc9357SAndroid Build Coastguard Worker }
341*f6dc9357SAndroid Build Coastguard Worker
/*
  AesCbc_Init: load a 16-byte IV into the first four words of the state p.
  Each word is read from iv with GetUi32(); nothing beyond p[3] is touched.
*/
void AesCbc_Init(UInt32 *p, const Byte *iv)
{
  p[0] = GetUi32(iv);
  p[1] = GetUi32(iv + 4);
  p[2] = GetUi32(iv + 8);
  p[3] = GetUi32(iv + 12);
}
348*f6dc9357SAndroid Build Coastguard Worker
AesCbc_Encode(UInt32 * p,Byte * data,size_t numBlocks)349*f6dc9357SAndroid Build Coastguard Worker void Z7_FASTCALL AesCbc_Encode(UInt32 *p, Byte *data, size_t numBlocks)
350*f6dc9357SAndroid Build Coastguard Worker {
351*f6dc9357SAndroid Build Coastguard Worker for (; numBlocks != 0; numBlocks--, data += AES_BLOCK_SIZE)
352*f6dc9357SAndroid Build Coastguard Worker {
353*f6dc9357SAndroid Build Coastguard Worker p[0] ^= GetUi32(data);
354*f6dc9357SAndroid Build Coastguard Worker p[1] ^= GetUi32(data + 4);
355*f6dc9357SAndroid Build Coastguard Worker p[2] ^= GetUi32(data + 8);
356*f6dc9357SAndroid Build Coastguard Worker p[3] ^= GetUi32(data + 12);
357*f6dc9357SAndroid Build Coastguard Worker
358*f6dc9357SAndroid Build Coastguard Worker Aes_Encode(p + 4, p, p);
359*f6dc9357SAndroid Build Coastguard Worker
360*f6dc9357SAndroid Build Coastguard Worker SetUi32(data, p[0])
361*f6dc9357SAndroid Build Coastguard Worker SetUi32(data + 4, p[1])
362*f6dc9357SAndroid Build Coastguard Worker SetUi32(data + 8, p[2])
363*f6dc9357SAndroid Build Coastguard Worker SetUi32(data + 12, p[3])
364*f6dc9357SAndroid Build Coastguard Worker }
365*f6dc9357SAndroid Build Coastguard Worker }
366*f6dc9357SAndroid Build Coastguard Worker
AesCbc_Decode(UInt32 * p,Byte * data,size_t numBlocks)367*f6dc9357SAndroid Build Coastguard Worker void Z7_FASTCALL AesCbc_Decode(UInt32 *p, Byte *data, size_t numBlocks)
368*f6dc9357SAndroid Build Coastguard Worker {
369*f6dc9357SAndroid Build Coastguard Worker UInt32 in[4], out[4];
370*f6dc9357SAndroid Build Coastguard Worker for (; numBlocks != 0; numBlocks--, data += AES_BLOCK_SIZE)
371*f6dc9357SAndroid Build Coastguard Worker {
372*f6dc9357SAndroid Build Coastguard Worker in[0] = GetUi32(data);
373*f6dc9357SAndroid Build Coastguard Worker in[1] = GetUi32(data + 4);
374*f6dc9357SAndroid Build Coastguard Worker in[2] = GetUi32(data + 8);
375*f6dc9357SAndroid Build Coastguard Worker in[3] = GetUi32(data + 12);
376*f6dc9357SAndroid Build Coastguard Worker
377*f6dc9357SAndroid Build Coastguard Worker Aes_Decode(p + 4, out, in);
378*f6dc9357SAndroid Build Coastguard Worker
379*f6dc9357SAndroid Build Coastguard Worker SetUi32(data, p[0] ^ out[0])
380*f6dc9357SAndroid Build Coastguard Worker SetUi32(data + 4, p[1] ^ out[1])
381*f6dc9357SAndroid Build Coastguard Worker SetUi32(data + 8, p[2] ^ out[2])
382*f6dc9357SAndroid Build Coastguard Worker SetUi32(data + 12, p[3] ^ out[3])
383*f6dc9357SAndroid Build Coastguard Worker
384*f6dc9357SAndroid Build Coastguard Worker p[0] = in[0];
385*f6dc9357SAndroid Build Coastguard Worker p[1] = in[1];
386*f6dc9357SAndroid Build Coastguard Worker p[2] = in[2];
387*f6dc9357SAndroid Build Coastguard Worker p[3] = in[3];
388*f6dc9357SAndroid Build Coastguard Worker }
389*f6dc9357SAndroid Build Coastguard Worker }
390*f6dc9357SAndroid Build Coastguard Worker
AesCtr_Code(UInt32 * p,Byte * data,size_t numBlocks)391*f6dc9357SAndroid Build Coastguard Worker void Z7_FASTCALL AesCtr_Code(UInt32 *p, Byte *data, size_t numBlocks)
392*f6dc9357SAndroid Build Coastguard Worker {
393*f6dc9357SAndroid Build Coastguard Worker for (; numBlocks != 0; numBlocks--)
394*f6dc9357SAndroid Build Coastguard Worker {
395*f6dc9357SAndroid Build Coastguard Worker UInt32 temp[4];
396*f6dc9357SAndroid Build Coastguard Worker unsigned i;
397*f6dc9357SAndroid Build Coastguard Worker
398*f6dc9357SAndroid Build Coastguard Worker if (++p[0] == 0)
399*f6dc9357SAndroid Build Coastguard Worker p[1]++;
400*f6dc9357SAndroid Build Coastguard Worker
401*f6dc9357SAndroid Build Coastguard Worker Aes_Encode(p + 4, temp, p);
402*f6dc9357SAndroid Build Coastguard Worker
403*f6dc9357SAndroid Build Coastguard Worker for (i = 0; i < 4; i++, data += 4)
404*f6dc9357SAndroid Build Coastguard Worker {
405*f6dc9357SAndroid Build Coastguard Worker const UInt32 t = temp[i];
406*f6dc9357SAndroid Build Coastguard Worker
407*f6dc9357SAndroid Build Coastguard Worker #ifdef MY_CPU_LE_UNALIGN
408*f6dc9357SAndroid Build Coastguard Worker *((UInt32 *)(void *)data) ^= t;
409*f6dc9357SAndroid Build Coastguard Worker #else
410*f6dc9357SAndroid Build Coastguard Worker data[0] = (Byte)(data[0] ^ (t & 0xFF));
411*f6dc9357SAndroid Build Coastguard Worker data[1] = (Byte)(data[1] ^ ((t >> 8) & 0xFF));
412*f6dc9357SAndroid Build Coastguard Worker data[2] = (Byte)(data[2] ^ ((t >> 16) & 0xFF));
413*f6dc9357SAndroid Build Coastguard Worker data[3] = (Byte)(data[3] ^ ((t >> 24)));
414*f6dc9357SAndroid Build Coastguard Worker #endif
415*f6dc9357SAndroid Build Coastguard Worker }
416*f6dc9357SAndroid Build Coastguard Worker }
417*f6dc9357SAndroid Build Coastguard Worker }
418*f6dc9357SAndroid Build Coastguard Worker
/* Drop every file-local helper macro so that nothing leaks when this file is
   followed by other code in the same translation unit. #undef of a name that
   is not currently defined is harmless. */
#undef xtime
#undef Ui32
#undef gb0
#undef gb1
#undef gb2
#undef gb3
#undef gb
#undef TT
#undef DD
#undef HT
#undef HT4
#undef HT16
#undef FT
#undef FT4
#undef HD
#undef HD4
#undef HD16
#undef FD
#undef FD4
#undef USE_HW_AES
#undef USE_HW_VAES
#undef PRF
430