coverity 1462556 Resource leak
[openssl.git] / crypto / aes / aes_core.c
1 /*
2  * Copyright 2002-2020 The OpenSSL Project Authors. All Rights Reserved.
3  *
4  * Licensed under the Apache License 2.0 (the "License").  You may not use
5  * this file except in compliance with the License.  You can obtain a copy
6  * in the file LICENSE in the source distribution or at
7  * https://www.openssl.org/source/license.html
8  */
9
10 /**
11  * rijndael-alg-fst.c
12  *
13  * @version 3.0 (December 2000)
14  *
15  * Optimised ANSI C code for the Rijndael cipher (now AES)
16  *
17  * @author Vincent Rijmen
18  * @author Antoon Bosselaers
19  * @author Paulo Barreto
20  *
21  * This code is hereby placed in the public domain.
22  *
23  * THIS SOFTWARE IS PROVIDED BY THE AUTHORS ''AS IS'' AND ANY EXPRESS
24  * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
25  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
26  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE
27  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
28  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
29  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
30  * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
31  * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
32  * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
33  * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
34  */
35
36 /* Note: rewritten a little bit to provide error control and an OpenSSL-
37    compatible API */
38
39 /*
40  * AES low level APIs are deprecated for public use, but still ok for internal
41  * use where we're using them to implement the higher level EVP interface, as is
42  * the case here.
43  */
44 #include "internal/deprecated.h"
45
46 #include <assert.h>
47
48 #include <stdlib.h>
49 #include <openssl/crypto.h>
50 #include <openssl/aes.h>
51 #include "aes_local.h"
52
53 #ifndef AES_ASM
54 /*-
55 Te0[x] = S [x].[02, 01, 01, 03];
56 Te1[x] = S [x].[03, 02, 01, 01];
57 Te2[x] = S [x].[01, 03, 02, 01];
58 Te3[x] = S [x].[01, 01, 03, 02];
59
60 Td0[x] = Si[x].[0e, 09, 0d, 0b];
61 Td1[x] = Si[x].[0b, 0e, 09, 0d];
62 Td2[x] = Si[x].[0d, 0b, 0e, 09];
63 Td3[x] = Si[x].[09, 0d, 0b, 0e];
64 Td4[x] = Si[x].[01];
65 */
66
/*
 * Te0: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Te0[x] = S [x].[02, 01, 01, 03].
 * Te1, Te2 and Te3 below hold the same words with the bytes rotated.
 * NOTE(review): presumably the forward (encryption) round table; the code
 * that reads it is outside this view -- confirm against the callers.
 */
67 static const u32 Te0[256] = {
68     0xc66363a5U, 0xf87c7c84U, 0xee777799U, 0xf67b7b8dU,
69     0xfff2f20dU, 0xd66b6bbdU, 0xde6f6fb1U, 0x91c5c554U,
70     0x60303050U, 0x02010103U, 0xce6767a9U, 0x562b2b7dU,
71     0xe7fefe19U, 0xb5d7d762U, 0x4dababe6U, 0xec76769aU,
72     0x8fcaca45U, 0x1f82829dU, 0x89c9c940U, 0xfa7d7d87U,
73     0xeffafa15U, 0xb25959ebU, 0x8e4747c9U, 0xfbf0f00bU,
74     0x41adadecU, 0xb3d4d467U, 0x5fa2a2fdU, 0x45afafeaU,
75     0x239c9cbfU, 0x53a4a4f7U, 0xe4727296U, 0x9bc0c05bU,
76     0x75b7b7c2U, 0xe1fdfd1cU, 0x3d9393aeU, 0x4c26266aU,
77     0x6c36365aU, 0x7e3f3f41U, 0xf5f7f702U, 0x83cccc4fU,
78     0x6834345cU, 0x51a5a5f4U, 0xd1e5e534U, 0xf9f1f108U,
79     0xe2717193U, 0xabd8d873U, 0x62313153U, 0x2a15153fU,
80     0x0804040cU, 0x95c7c752U, 0x46232365U, 0x9dc3c35eU,
81     0x30181828U, 0x379696a1U, 0x0a05050fU, 0x2f9a9ab5U,
82     0x0e070709U, 0x24121236U, 0x1b80809bU, 0xdfe2e23dU,
83     0xcdebeb26U, 0x4e272769U, 0x7fb2b2cdU, 0xea75759fU,
84     0x1209091bU, 0x1d83839eU, 0x582c2c74U, 0x341a1a2eU,
85     0x361b1b2dU, 0xdc6e6eb2U, 0xb45a5aeeU, 0x5ba0a0fbU,
86     0xa45252f6U, 0x763b3b4dU, 0xb7d6d661U, 0x7db3b3ceU,
87     0x5229297bU, 0xdde3e33eU, 0x5e2f2f71U, 0x13848497U,
88     0xa65353f5U, 0xb9d1d168U, 0x00000000U, 0xc1eded2cU,
89     0x40202060U, 0xe3fcfc1fU, 0x79b1b1c8U, 0xb65b5bedU,
90     0xd46a6abeU, 0x8dcbcb46U, 0x67bebed9U, 0x7239394bU,
91     0x944a4adeU, 0x984c4cd4U, 0xb05858e8U, 0x85cfcf4aU,
92     0xbbd0d06bU, 0xc5efef2aU, 0x4faaaae5U, 0xedfbfb16U,
93     0x864343c5U, 0x9a4d4dd7U, 0x66333355U, 0x11858594U,
94     0x8a4545cfU, 0xe9f9f910U, 0x04020206U, 0xfe7f7f81U,
95     0xa05050f0U, 0x783c3c44U, 0x259f9fbaU, 0x4ba8a8e3U,
96     0xa25151f3U, 0x5da3a3feU, 0x804040c0U, 0x058f8f8aU,
97     0x3f9292adU, 0x219d9dbcU, 0x70383848U, 0xf1f5f504U,
98     0x63bcbcdfU, 0x77b6b6c1U, 0xafdada75U, 0x42212163U,
99     0x20101030U, 0xe5ffff1aU, 0xfdf3f30eU, 0xbfd2d26dU,
100     0x81cdcd4cU, 0x180c0c14U, 0x26131335U, 0xc3ecec2fU,
101     0xbe5f5fe1U, 0x359797a2U, 0x884444ccU, 0x2e171739U,
102     0x93c4c457U, 0x55a7a7f2U, 0xfc7e7e82U, 0x7a3d3d47U,
103     0xc86464acU, 0xba5d5de7U, 0x3219192bU, 0xe6737395U,
104     0xc06060a0U, 0x19818198U, 0x9e4f4fd1U, 0xa3dcdc7fU,
105     0x44222266U, 0x542a2a7eU, 0x3b9090abU, 0x0b888883U,
106     0x8c4646caU, 0xc7eeee29U, 0x6bb8b8d3U, 0x2814143cU,
107     0xa7dede79U, 0xbc5e5ee2U, 0x160b0b1dU, 0xaddbdb76U,
108     0xdbe0e03bU, 0x64323256U, 0x743a3a4eU, 0x140a0a1eU,
109     0x924949dbU, 0x0c06060aU, 0x4824246cU, 0xb85c5ce4U,
110     0x9fc2c25dU, 0xbdd3d36eU, 0x43acacefU, 0xc46262a6U,
111     0x399191a8U, 0x319595a4U, 0xd3e4e437U, 0xf279798bU,
112     0xd5e7e732U, 0x8bc8c843U, 0x6e373759U, 0xda6d6db7U,
113     0x018d8d8cU, 0xb1d5d564U, 0x9c4e4ed2U, 0x49a9a9e0U,
114     0xd86c6cb4U, 0xac5656faU, 0xf3f4f407U, 0xcfeaea25U,
115     0xca6565afU, 0xf47a7a8eU, 0x47aeaee9U, 0x10080818U,
116     0x6fbabad5U, 0xf0787888U, 0x4a25256fU, 0x5c2e2e72U,
117     0x381c1c24U, 0x57a6a6f1U, 0x73b4b4c7U, 0x97c6c651U,
118     0xcbe8e823U, 0xa1dddd7cU, 0xe874749cU, 0x3e1f1f21U,
119     0x964b4bddU, 0x61bdbddcU, 0x0d8b8b86U, 0x0f8a8a85U,
120     0xe0707090U, 0x7c3e3e42U, 0x71b5b5c4U, 0xcc6666aaU,
121     0x904848d8U, 0x06030305U, 0xf7f6f601U, 0x1c0e0e12U,
122     0xc26161a3U, 0x6a35355fU, 0xae5757f9U, 0x69b9b9d0U,
123     0x17868691U, 0x99c1c158U, 0x3a1d1d27U, 0x279e9eb9U,
124     0xd9e1e138U, 0xebf8f813U, 0x2b9898b3U, 0x22111133U,
125     0xd26969bbU, 0xa9d9d970U, 0x078e8e89U, 0x339494a7U,
126     0x2d9b9bb6U, 0x3c1e1e22U, 0x15878792U, 0xc9e9e920U,
127     0x87cece49U, 0xaa5555ffU, 0x50282878U, 0xa5dfdf7aU,
128     0x038c8c8fU, 0x59a1a1f8U, 0x09898980U, 0x1a0d0d17U,
129     0x65bfbfdaU, 0xd7e6e631U, 0x844242c6U, 0xd06868b8U,
130     0x824141c3U, 0x299999b0U, 0x5a2d2d77U, 0x1e0f0f11U,
131     0x7bb0b0cbU, 0xa85454fcU, 0x6dbbbbd6U, 0x2c16163aU,
132 };
/*
 * Te1: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Te1[x] = S [x].[03, 02, 01, 01].
 * Each word is the matching Te0 word rotated right by 8 bits
 * (e.g. Te0[0] = 0xc66363a5, Te1[0] = 0xa5c66363).
 */
133 static const u32 Te1[256] = {
134     0xa5c66363U, 0x84f87c7cU, 0x99ee7777U, 0x8df67b7bU,
135     0x0dfff2f2U, 0xbdd66b6bU, 0xb1de6f6fU, 0x5491c5c5U,
136     0x50603030U, 0x03020101U, 0xa9ce6767U, 0x7d562b2bU,
137     0x19e7fefeU, 0x62b5d7d7U, 0xe64dababU, 0x9aec7676U,
138     0x458fcacaU, 0x9d1f8282U, 0x4089c9c9U, 0x87fa7d7dU,
139     0x15effafaU, 0xebb25959U, 0xc98e4747U, 0x0bfbf0f0U,
140     0xec41adadU, 0x67b3d4d4U, 0xfd5fa2a2U, 0xea45afafU,
141     0xbf239c9cU, 0xf753a4a4U, 0x96e47272U, 0x5b9bc0c0U,
142     0xc275b7b7U, 0x1ce1fdfdU, 0xae3d9393U, 0x6a4c2626U,
143     0x5a6c3636U, 0x417e3f3fU, 0x02f5f7f7U, 0x4f83ccccU,
144     0x5c683434U, 0xf451a5a5U, 0x34d1e5e5U, 0x08f9f1f1U,
145     0x93e27171U, 0x73abd8d8U, 0x53623131U, 0x3f2a1515U,
146     0x0c080404U, 0x5295c7c7U, 0x65462323U, 0x5e9dc3c3U,
147     0x28301818U, 0xa1379696U, 0x0f0a0505U, 0xb52f9a9aU,
148     0x090e0707U, 0x36241212U, 0x9b1b8080U, 0x3ddfe2e2U,
149     0x26cdebebU, 0x694e2727U, 0xcd7fb2b2U, 0x9fea7575U,
150     0x1b120909U, 0x9e1d8383U, 0x74582c2cU, 0x2e341a1aU,
151     0x2d361b1bU, 0xb2dc6e6eU, 0xeeb45a5aU, 0xfb5ba0a0U,
152     0xf6a45252U, 0x4d763b3bU, 0x61b7d6d6U, 0xce7db3b3U,
153     0x7b522929U, 0x3edde3e3U, 0x715e2f2fU, 0x97138484U,
154     0xf5a65353U, 0x68b9d1d1U, 0x00000000U, 0x2cc1ededU,
155     0x60402020U, 0x1fe3fcfcU, 0xc879b1b1U, 0xedb65b5bU,
156     0xbed46a6aU, 0x468dcbcbU, 0xd967bebeU, 0x4b723939U,
157     0xde944a4aU, 0xd4984c4cU, 0xe8b05858U, 0x4a85cfcfU,
158     0x6bbbd0d0U, 0x2ac5efefU, 0xe54faaaaU, 0x16edfbfbU,
159     0xc5864343U, 0xd79a4d4dU, 0x55663333U, 0x94118585U,
160     0xcf8a4545U, 0x10e9f9f9U, 0x06040202U, 0x81fe7f7fU,
161     0xf0a05050U, 0x44783c3cU, 0xba259f9fU, 0xe34ba8a8U,
162     0xf3a25151U, 0xfe5da3a3U, 0xc0804040U, 0x8a058f8fU,
163     0xad3f9292U, 0xbc219d9dU, 0x48703838U, 0x04f1f5f5U,
164     0xdf63bcbcU, 0xc177b6b6U, 0x75afdadaU, 0x63422121U,
165     0x30201010U, 0x1ae5ffffU, 0x0efdf3f3U, 0x6dbfd2d2U,
166     0x4c81cdcdU, 0x14180c0cU, 0x35261313U, 0x2fc3ececU,
167     0xe1be5f5fU, 0xa2359797U, 0xcc884444U, 0x392e1717U,
168     0x5793c4c4U, 0xf255a7a7U, 0x82fc7e7eU, 0x477a3d3dU,
169     0xacc86464U, 0xe7ba5d5dU, 0x2b321919U, 0x95e67373U,
170     0xa0c06060U, 0x98198181U, 0xd19e4f4fU, 0x7fa3dcdcU,
171     0x66442222U, 0x7e542a2aU, 0xab3b9090U, 0x830b8888U,
172     0xca8c4646U, 0x29c7eeeeU, 0xd36bb8b8U, 0x3c281414U,
173     0x79a7dedeU, 0xe2bc5e5eU, 0x1d160b0bU, 0x76addbdbU,
174     0x3bdbe0e0U, 0x56643232U, 0x4e743a3aU, 0x1e140a0aU,
175     0xdb924949U, 0x0a0c0606U, 0x6c482424U, 0xe4b85c5cU,
176     0x5d9fc2c2U, 0x6ebdd3d3U, 0xef43acacU, 0xa6c46262U,
177     0xa8399191U, 0xa4319595U, 0x37d3e4e4U, 0x8bf27979U,
178     0x32d5e7e7U, 0x438bc8c8U, 0x596e3737U, 0xb7da6d6dU,
179     0x8c018d8dU, 0x64b1d5d5U, 0xd29c4e4eU, 0xe049a9a9U,
180     0xb4d86c6cU, 0xfaac5656U, 0x07f3f4f4U, 0x25cfeaeaU,
181     0xafca6565U, 0x8ef47a7aU, 0xe947aeaeU, 0x18100808U,
182     0xd56fbabaU, 0x88f07878U, 0x6f4a2525U, 0x725c2e2eU,
183     0x24381c1cU, 0xf157a6a6U, 0xc773b4b4U, 0x5197c6c6U,
184     0x23cbe8e8U, 0x7ca1ddddU, 0x9ce87474U, 0x213e1f1fU,
185     0xdd964b4bU, 0xdc61bdbdU, 0x860d8b8bU, 0x850f8a8aU,
186     0x90e07070U, 0x427c3e3eU, 0xc471b5b5U, 0xaacc6666U,
187     0xd8904848U, 0x05060303U, 0x01f7f6f6U, 0x121c0e0eU,
188     0xa3c26161U, 0x5f6a3535U, 0xf9ae5757U, 0xd069b9b9U,
189     0x91178686U, 0x5899c1c1U, 0x273a1d1dU, 0xb9279e9eU,
190     0x38d9e1e1U, 0x13ebf8f8U, 0xb32b9898U, 0x33221111U,
191     0xbbd26969U, 0x70a9d9d9U, 0x89078e8eU, 0xa7339494U,
192     0xb62d9b9bU, 0x223c1e1eU, 0x92158787U, 0x20c9e9e9U,
193     0x4987ceceU, 0xffaa5555U, 0x78502828U, 0x7aa5dfdfU,
194     0x8f038c8cU, 0xf859a1a1U, 0x80098989U, 0x171a0d0dU,
195     0xda65bfbfU, 0x31d7e6e6U, 0xc6844242U, 0xb8d06868U,
196     0xc3824141U, 0xb0299999U, 0x775a2d2dU, 0x111e0f0fU,
197     0xcb7bb0b0U, 0xfca85454U, 0xd66dbbbbU, 0x3a2c1616U,
198 };
/*
 * Te2: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Te2[x] = S [x].[01, 03, 02, 01].
 * Each word is the matching Te0 word rotated right by 16 bits
 * (e.g. Te0[0] = 0xc66363a5, Te2[0] = 0x63a5c663).
 */
199 static const u32 Te2[256] = {
200     0x63a5c663U, 0x7c84f87cU, 0x7799ee77U, 0x7b8df67bU,
201     0xf20dfff2U, 0x6bbdd66bU, 0x6fb1de6fU, 0xc55491c5U,
202     0x30506030U, 0x01030201U, 0x67a9ce67U, 0x2b7d562bU,
203     0xfe19e7feU, 0xd762b5d7U, 0xabe64dabU, 0x769aec76U,
204     0xca458fcaU, 0x829d1f82U, 0xc94089c9U, 0x7d87fa7dU,
205     0xfa15effaU, 0x59ebb259U, 0x47c98e47U, 0xf00bfbf0U,
206     0xadec41adU, 0xd467b3d4U, 0xa2fd5fa2U, 0xafea45afU,
207     0x9cbf239cU, 0xa4f753a4U, 0x7296e472U, 0xc05b9bc0U,
208     0xb7c275b7U, 0xfd1ce1fdU, 0x93ae3d93U, 0x266a4c26U,
209     0x365a6c36U, 0x3f417e3fU, 0xf702f5f7U, 0xcc4f83ccU,
210     0x345c6834U, 0xa5f451a5U, 0xe534d1e5U, 0xf108f9f1U,
211     0x7193e271U, 0xd873abd8U, 0x31536231U, 0x153f2a15U,
212     0x040c0804U, 0xc75295c7U, 0x23654623U, 0xc35e9dc3U,
213     0x18283018U, 0x96a13796U, 0x050f0a05U, 0x9ab52f9aU,
214     0x07090e07U, 0x12362412U, 0x809b1b80U, 0xe23ddfe2U,
215     0xeb26cdebU, 0x27694e27U, 0xb2cd7fb2U, 0x759fea75U,
216     0x091b1209U, 0x839e1d83U, 0x2c74582cU, 0x1a2e341aU,
217     0x1b2d361bU, 0x6eb2dc6eU, 0x5aeeb45aU, 0xa0fb5ba0U,
218     0x52f6a452U, 0x3b4d763bU, 0xd661b7d6U, 0xb3ce7db3U,
219     0x297b5229U, 0xe33edde3U, 0x2f715e2fU, 0x84971384U,
220     0x53f5a653U, 0xd168b9d1U, 0x00000000U, 0xed2cc1edU,
221     0x20604020U, 0xfc1fe3fcU, 0xb1c879b1U, 0x5bedb65bU,
222     0x6abed46aU, 0xcb468dcbU, 0xbed967beU, 0x394b7239U,
223     0x4ade944aU, 0x4cd4984cU, 0x58e8b058U, 0xcf4a85cfU,
224     0xd06bbbd0U, 0xef2ac5efU, 0xaae54faaU, 0xfb16edfbU,
225     0x43c58643U, 0x4dd79a4dU, 0x33556633U, 0x85941185U,
226     0x45cf8a45U, 0xf910e9f9U, 0x02060402U, 0x7f81fe7fU,
227     0x50f0a050U, 0x3c44783cU, 0x9fba259fU, 0xa8e34ba8U,
228     0x51f3a251U, 0xa3fe5da3U, 0x40c08040U, 0x8f8a058fU,
229     0x92ad3f92U, 0x9dbc219dU, 0x38487038U, 0xf504f1f5U,
230     0xbcdf63bcU, 0xb6c177b6U, 0xda75afdaU, 0x21634221U,
231     0x10302010U, 0xff1ae5ffU, 0xf30efdf3U, 0xd26dbfd2U,
232     0xcd4c81cdU, 0x0c14180cU, 0x13352613U, 0xec2fc3ecU,
233     0x5fe1be5fU, 0x97a23597U, 0x44cc8844U, 0x17392e17U,
234     0xc45793c4U, 0xa7f255a7U, 0x7e82fc7eU, 0x3d477a3dU,
235     0x64acc864U, 0x5de7ba5dU, 0x192b3219U, 0x7395e673U,
236     0x60a0c060U, 0x81981981U, 0x4fd19e4fU, 0xdc7fa3dcU,
237     0x22664422U, 0x2a7e542aU, 0x90ab3b90U, 0x88830b88U,
238     0x46ca8c46U, 0xee29c7eeU, 0xb8d36bb8U, 0x143c2814U,
239     0xde79a7deU, 0x5ee2bc5eU, 0x0b1d160bU, 0xdb76addbU,
240     0xe03bdbe0U, 0x32566432U, 0x3a4e743aU, 0x0a1e140aU,
241     0x49db9249U, 0x060a0c06U, 0x246c4824U, 0x5ce4b85cU,
242     0xc25d9fc2U, 0xd36ebdd3U, 0xacef43acU, 0x62a6c462U,
243     0x91a83991U, 0x95a43195U, 0xe437d3e4U, 0x798bf279U,
244     0xe732d5e7U, 0xc8438bc8U, 0x37596e37U, 0x6db7da6dU,
245     0x8d8c018dU, 0xd564b1d5U, 0x4ed29c4eU, 0xa9e049a9U,
246     0x6cb4d86cU, 0x56faac56U, 0xf407f3f4U, 0xea25cfeaU,
247     0x65afca65U, 0x7a8ef47aU, 0xaee947aeU, 0x08181008U,
248     0xbad56fbaU, 0x7888f078U, 0x256f4a25U, 0x2e725c2eU,
249     0x1c24381cU, 0xa6f157a6U, 0xb4c773b4U, 0xc65197c6U,
250     0xe823cbe8U, 0xdd7ca1ddU, 0x749ce874U, 0x1f213e1fU,
251     0x4bdd964bU, 0xbddc61bdU, 0x8b860d8bU, 0x8a850f8aU,
252     0x7090e070U, 0x3e427c3eU, 0xb5c471b5U, 0x66aacc66U,
253     0x48d89048U, 0x03050603U, 0xf601f7f6U, 0x0e121c0eU,
254     0x61a3c261U, 0x355f6a35U, 0x57f9ae57U, 0xb9d069b9U,
255     0x86911786U, 0xc15899c1U, 0x1d273a1dU, 0x9eb9279eU,
256     0xe138d9e1U, 0xf813ebf8U, 0x98b32b98U, 0x11332211U,
257     0x69bbd269U, 0xd970a9d9U, 0x8e89078eU, 0x94a73394U,
258     0x9bb62d9bU, 0x1e223c1eU, 0x87921587U, 0xe920c9e9U,
259     0xce4987ceU, 0x55ffaa55U, 0x28785028U, 0xdf7aa5dfU,
260     0x8c8f038cU, 0xa1f859a1U, 0x89800989U, 0x0d171a0dU,
261     0xbfda65bfU, 0xe631d7e6U, 0x42c68442U, 0x68b8d068U,
262     0x41c38241U, 0x99b02999U, 0x2d775a2dU, 0x0f111e0fU,
263     0xb0cb7bb0U, 0x54fca854U, 0xbbd66dbbU, 0x163a2c16U,
264 };
/*
 * Te3: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Te3[x] = S [x].[01, 01, 03, 02].
 * Each word is the matching Te0 word rotated right by 24 bits
 * (e.g. Te0[0] = 0xc66363a5, Te3[0] = 0x6363a5c6).
 */
265 static const u32 Te3[256] = {
266     0x6363a5c6U, 0x7c7c84f8U, 0x777799eeU, 0x7b7b8df6U,
267     0xf2f20dffU, 0x6b6bbdd6U, 0x6f6fb1deU, 0xc5c55491U,
268     0x30305060U, 0x01010302U, 0x6767a9ceU, 0x2b2b7d56U,
269     0xfefe19e7U, 0xd7d762b5U, 0xababe64dU, 0x76769aecU,
270     0xcaca458fU, 0x82829d1fU, 0xc9c94089U, 0x7d7d87faU,
271     0xfafa15efU, 0x5959ebb2U, 0x4747c98eU, 0xf0f00bfbU,
272     0xadadec41U, 0xd4d467b3U, 0xa2a2fd5fU, 0xafafea45U,
273     0x9c9cbf23U, 0xa4a4f753U, 0x727296e4U, 0xc0c05b9bU,
274     0xb7b7c275U, 0xfdfd1ce1U, 0x9393ae3dU, 0x26266a4cU,
275     0x36365a6cU, 0x3f3f417eU, 0xf7f702f5U, 0xcccc4f83U,
276     0x34345c68U, 0xa5a5f451U, 0xe5e534d1U, 0xf1f108f9U,
277     0x717193e2U, 0xd8d873abU, 0x31315362U, 0x15153f2aU,
278     0x04040c08U, 0xc7c75295U, 0x23236546U, 0xc3c35e9dU,
279     0x18182830U, 0x9696a137U, 0x05050f0aU, 0x9a9ab52fU,
280     0x0707090eU, 0x12123624U, 0x80809b1bU, 0xe2e23ddfU,
281     0xebeb26cdU, 0x2727694eU, 0xb2b2cd7fU, 0x75759feaU,
282     0x09091b12U, 0x83839e1dU, 0x2c2c7458U, 0x1a1a2e34U,
283     0x1b1b2d36U, 0x6e6eb2dcU, 0x5a5aeeb4U, 0xa0a0fb5bU,
284     0x5252f6a4U, 0x3b3b4d76U, 0xd6d661b7U, 0xb3b3ce7dU,
285     0x29297b52U, 0xe3e33eddU, 0x2f2f715eU, 0x84849713U,
286     0x5353f5a6U, 0xd1d168b9U, 0x00000000U, 0xeded2cc1U,
287     0x20206040U, 0xfcfc1fe3U, 0xb1b1c879U, 0x5b5bedb6U,
288     0x6a6abed4U, 0xcbcb468dU, 0xbebed967U, 0x39394b72U,
289     0x4a4ade94U, 0x4c4cd498U, 0x5858e8b0U, 0xcfcf4a85U,
290     0xd0d06bbbU, 0xefef2ac5U, 0xaaaae54fU, 0xfbfb16edU,
291     0x4343c586U, 0x4d4dd79aU, 0x33335566U, 0x85859411U,
292     0x4545cf8aU, 0xf9f910e9U, 0x02020604U, 0x7f7f81feU,
293     0x5050f0a0U, 0x3c3c4478U, 0x9f9fba25U, 0xa8a8e34bU,
294     0x5151f3a2U, 0xa3a3fe5dU, 0x4040c080U, 0x8f8f8a05U,
295     0x9292ad3fU, 0x9d9dbc21U, 0x38384870U, 0xf5f504f1U,
296     0xbcbcdf63U, 0xb6b6c177U, 0xdada75afU, 0x21216342U,
297     0x10103020U, 0xffff1ae5U, 0xf3f30efdU, 0xd2d26dbfU,
298     0xcdcd4c81U, 0x0c0c1418U, 0x13133526U, 0xecec2fc3U,
299     0x5f5fe1beU, 0x9797a235U, 0x4444cc88U, 0x1717392eU,
300     0xc4c45793U, 0xa7a7f255U, 0x7e7e82fcU, 0x3d3d477aU,
301     0x6464acc8U, 0x5d5de7baU, 0x19192b32U, 0x737395e6U,
302     0x6060a0c0U, 0x81819819U, 0x4f4fd19eU, 0xdcdc7fa3U,
303     0x22226644U, 0x2a2a7e54U, 0x9090ab3bU, 0x8888830bU,
304     0x4646ca8cU, 0xeeee29c7U, 0xb8b8d36bU, 0x14143c28U,
305     0xdede79a7U, 0x5e5ee2bcU, 0x0b0b1d16U, 0xdbdb76adU,
306     0xe0e03bdbU, 0x32325664U, 0x3a3a4e74U, 0x0a0a1e14U,
307     0x4949db92U, 0x06060a0cU, 0x24246c48U, 0x5c5ce4b8U,
308     0xc2c25d9fU, 0xd3d36ebdU, 0xacacef43U, 0x6262a6c4U,
309     0x9191a839U, 0x9595a431U, 0xe4e437d3U, 0x79798bf2U,
310     0xe7e732d5U, 0xc8c8438bU, 0x3737596eU, 0x6d6db7daU,
311     0x8d8d8c01U, 0xd5d564b1U, 0x4e4ed29cU, 0xa9a9e049U,
312     0x6c6cb4d8U, 0x5656faacU, 0xf4f407f3U, 0xeaea25cfU,
313     0x6565afcaU, 0x7a7a8ef4U, 0xaeaee947U, 0x08081810U,
314     0xbabad56fU, 0x787888f0U, 0x25256f4aU, 0x2e2e725cU,
315     0x1c1c2438U, 0xa6a6f157U, 0xb4b4c773U, 0xc6c65197U,
316     0xe8e823cbU, 0xdddd7ca1U, 0x74749ce8U, 0x1f1f213eU,
317     0x4b4bdd96U, 0xbdbddc61U, 0x8b8b860dU, 0x8a8a850fU,
318     0x707090e0U, 0x3e3e427cU, 0xb5b5c471U, 0x6666aaccU,
319     0x4848d890U, 0x03030506U, 0xf6f601f7U, 0x0e0e121cU,
320     0x6161a3c2U, 0x35355f6aU, 0x5757f9aeU, 0xb9b9d069U,
321     0x86869117U, 0xc1c15899U, 0x1d1d273aU, 0x9e9eb927U,
322     0xe1e138d9U, 0xf8f813ebU, 0x9898b32bU, 0x11113322U,
323     0x6969bbd2U, 0xd9d970a9U, 0x8e8e8907U, 0x9494a733U,
324     0x9b9bb62dU, 0x1e1e223cU, 0x87879215U, 0xe9e920c9U,
325     0xcece4987U, 0x5555ffaaU, 0x28287850U, 0xdfdf7aa5U,
326     0x8c8c8f03U, 0xa1a1f859U, 0x89898009U, 0x0d0d171aU,
327     0xbfbfda65U, 0xe6e631d7U, 0x4242c684U, 0x6868b8d0U,
328     0x4141c382U, 0x9999b029U, 0x2d2d775aU, 0x0f0f111eU,
329     0xb0b0cb7bU, 0x5454fca8U, 0xbbbbd66dU, 0x16163a2cU,
330 };
331
/*
 * Td0: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Td0[x] = Si[x].[0e, 09, 0d, 0b].
 * Td1, Td2 and Td3 below hold the same words with the bytes rotated.
 * NOTE(review): presumably the inverse (decryption) round table; the code
 * that reads it is outside this view -- confirm against the callers.
 */
332 static const u32 Td0[256] = {
333     0x51f4a750U, 0x7e416553U, 0x1a17a4c3U, 0x3a275e96U,
334     0x3bab6bcbU, 0x1f9d45f1U, 0xacfa58abU, 0x4be30393U,
335     0x2030fa55U, 0xad766df6U, 0x88cc7691U, 0xf5024c25U,
336     0x4fe5d7fcU, 0xc52acbd7U, 0x26354480U, 0xb562a38fU,
337     0xdeb15a49U, 0x25ba1b67U, 0x45ea0e98U, 0x5dfec0e1U,
338     0xc32f7502U, 0x814cf012U, 0x8d4697a3U, 0x6bd3f9c6U,
339     0x038f5fe7U, 0x15929c95U, 0xbf6d7aebU, 0x955259daU,
340     0xd4be832dU, 0x587421d3U, 0x49e06929U, 0x8ec9c844U,
341     0x75c2896aU, 0xf48e7978U, 0x99583e6bU, 0x27b971ddU,
342     0xbee14fb6U, 0xf088ad17U, 0xc920ac66U, 0x7dce3ab4U,
343     0x63df4a18U, 0xe51a3182U, 0x97513360U, 0x62537f45U,
344     0xb16477e0U, 0xbb6bae84U, 0xfe81a01cU, 0xf9082b94U,
345     0x70486858U, 0x8f45fd19U, 0x94de6c87U, 0x527bf8b7U,
346     0xab73d323U, 0x724b02e2U, 0xe31f8f57U, 0x6655ab2aU,
347     0xb2eb2807U, 0x2fb5c203U, 0x86c57b9aU, 0xd33708a5U,
348     0x302887f2U, 0x23bfa5b2U, 0x02036abaU, 0xed16825cU,
349     0x8acf1c2bU, 0xa779b492U, 0xf307f2f0U, 0x4e69e2a1U,
350     0x65daf4cdU, 0x0605bed5U, 0xd134621fU, 0xc4a6fe8aU,
351     0x342e539dU, 0xa2f355a0U, 0x058ae132U, 0xa4f6eb75U,
352     0x0b83ec39U, 0x4060efaaU, 0x5e719f06U, 0xbd6e1051U,
353     0x3e218af9U, 0x96dd063dU, 0xdd3e05aeU, 0x4de6bd46U,
354     0x91548db5U, 0x71c45d05U, 0x0406d46fU, 0x605015ffU,
355     0x1998fb24U, 0xd6bde997U, 0x894043ccU, 0x67d99e77U,
356     0xb0e842bdU, 0x07898b88U, 0xe7195b38U, 0x79c8eedbU,
357     0xa17c0a47U, 0x7c420fe9U, 0xf8841ec9U, 0x00000000U,
358     0x09808683U, 0x322bed48U, 0x1e1170acU, 0x6c5a724eU,
359     0xfd0efffbU, 0x0f853856U, 0x3daed51eU, 0x362d3927U,
360     0x0a0fd964U, 0x685ca621U, 0x9b5b54d1U, 0x24362e3aU,
361     0x0c0a67b1U, 0x9357e70fU, 0xb4ee96d2U, 0x1b9b919eU,
362     0x80c0c54fU, 0x61dc20a2U, 0x5a774b69U, 0x1c121a16U,
363     0xe293ba0aU, 0xc0a02ae5U, 0x3c22e043U, 0x121b171dU,
364     0x0e090d0bU, 0xf28bc7adU, 0x2db6a8b9U, 0x141ea9c8U,
365     0x57f11985U, 0xaf75074cU, 0xee99ddbbU, 0xa37f60fdU,
366     0xf701269fU, 0x5c72f5bcU, 0x44663bc5U, 0x5bfb7e34U,
367     0x8b432976U, 0xcb23c6dcU, 0xb6edfc68U, 0xb8e4f163U,
368     0xd731dccaU, 0x42638510U, 0x13972240U, 0x84c61120U,
369     0x854a247dU, 0xd2bb3df8U, 0xaef93211U, 0xc729a16dU,
370     0x1d9e2f4bU, 0xdcb230f3U, 0x0d8652ecU, 0x77c1e3d0U,
371     0x2bb3166cU, 0xa970b999U, 0x119448faU, 0x47e96422U,
372     0xa8fc8cc4U, 0xa0f03f1aU, 0x567d2cd8U, 0x223390efU,
373     0x87494ec7U, 0xd938d1c1U, 0x8ccaa2feU, 0x98d40b36U,
374     0xa6f581cfU, 0xa57ade28U, 0xdab78e26U, 0x3fadbfa4U,
375     0x2c3a9de4U, 0x5078920dU, 0x6a5fcc9bU, 0x547e4662U,
376     0xf68d13c2U, 0x90d8b8e8U, 0x2e39f75eU, 0x82c3aff5U,
377     0x9f5d80beU, 0x69d0937cU, 0x6fd52da9U, 0xcf2512b3U,
378     0xc8ac993bU, 0x10187da7U, 0xe89c636eU, 0xdb3bbb7bU,
379     0xcd267809U, 0x6e5918f4U, 0xec9ab701U, 0x834f9aa8U,
380     0xe6956e65U, 0xaaffe67eU, 0x21bccf08U, 0xef15e8e6U,
381     0xbae79bd9U, 0x4a6f36ceU, 0xea9f09d4U, 0x29b07cd6U,
382     0x31a4b2afU, 0x2a3f2331U, 0xc6a59430U, 0x35a266c0U,
383     0x744ebc37U, 0xfc82caa6U, 0xe090d0b0U, 0x33a7d815U,
384     0xf104984aU, 0x41ecdaf7U, 0x7fcd500eU, 0x1791f62fU,
385     0x764dd68dU, 0x43efb04dU, 0xccaa4d54U, 0xe49604dfU,
386     0x9ed1b5e3U, 0x4c6a881bU, 0xc12c1fb8U, 0x4665517fU,
387     0x9d5eea04U, 0x018c355dU, 0xfa877473U, 0xfb0b412eU,
388     0xb3671d5aU, 0x92dbd252U, 0xe9105633U, 0x6dd64713U,
389     0x9ad7618cU, 0x37a10c7aU, 0x59f8148eU, 0xeb133c89U,
390     0xcea927eeU, 0xb761c935U, 0xe11ce5edU, 0x7a47b13cU,
391     0x9cd2df59U, 0x55f2733fU, 0x1814ce79U, 0x73c737bfU,
392     0x53f7cdeaU, 0x5ffdaa5bU, 0xdf3d6f14U, 0x7844db86U,
393     0xcaaff381U, 0xb968c43eU, 0x3824342cU, 0xc2a3405fU,
394     0x161dc372U, 0xbce2250cU, 0x283c498bU, 0xff0d9541U,
395     0x39a80171U, 0x080cb3deU, 0xd8b4e49cU, 0x6456c190U,
396     0x7bcb8461U, 0xd532b670U, 0x486c5c74U, 0xd0b85742U,
397 };
/*
 * Td1: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Td1[x] = Si[x].[0b, 0e, 09, 0d].
 * Each word is the matching Td0 word rotated right by 8 bits
 * (e.g. Td0[0] = 0x51f4a750, Td1[0] = 0x5051f4a7).
 */
398 static const u32 Td1[256] = {
399     0x5051f4a7U, 0x537e4165U, 0xc31a17a4U, 0x963a275eU,
400     0xcb3bab6bU, 0xf11f9d45U, 0xabacfa58U, 0x934be303U,
401     0x552030faU, 0xf6ad766dU, 0x9188cc76U, 0x25f5024cU,
402     0xfc4fe5d7U, 0xd7c52acbU, 0x80263544U, 0x8fb562a3U,
403     0x49deb15aU, 0x6725ba1bU, 0x9845ea0eU, 0xe15dfec0U,
404     0x02c32f75U, 0x12814cf0U, 0xa38d4697U, 0xc66bd3f9U,
405     0xe7038f5fU, 0x9515929cU, 0xebbf6d7aU, 0xda955259U,
406     0x2dd4be83U, 0xd3587421U, 0x2949e069U, 0x448ec9c8U,
407     0x6a75c289U, 0x78f48e79U, 0x6b99583eU, 0xdd27b971U,
408     0xb6bee14fU, 0x17f088adU, 0x66c920acU, 0xb47dce3aU,
409     0x1863df4aU, 0x82e51a31U, 0x60975133U, 0x4562537fU,
410     0xe0b16477U, 0x84bb6baeU, 0x1cfe81a0U, 0x94f9082bU,
411     0x58704868U, 0x198f45fdU, 0x8794de6cU, 0xb7527bf8U,
412     0x23ab73d3U, 0xe2724b02U, 0x57e31f8fU, 0x2a6655abU,
413     0x07b2eb28U, 0x032fb5c2U, 0x9a86c57bU, 0xa5d33708U,
414     0xf2302887U, 0xb223bfa5U, 0xba02036aU, 0x5ced1682U,
415     0x2b8acf1cU, 0x92a779b4U, 0xf0f307f2U, 0xa14e69e2U,
416     0xcd65daf4U, 0xd50605beU, 0x1fd13462U, 0x8ac4a6feU,
417     0x9d342e53U, 0xa0a2f355U, 0x32058ae1U, 0x75a4f6ebU,
418     0x390b83ecU, 0xaa4060efU, 0x065e719fU, 0x51bd6e10U,
419     0xf93e218aU, 0x3d96dd06U, 0xaedd3e05U, 0x464de6bdU,
420     0xb591548dU, 0x0571c45dU, 0x6f0406d4U, 0xff605015U,
421     0x241998fbU, 0x97d6bde9U, 0xcc894043U, 0x7767d99eU,
422     0xbdb0e842U, 0x8807898bU, 0x38e7195bU, 0xdb79c8eeU,
423     0x47a17c0aU, 0xe97c420fU, 0xc9f8841eU, 0x00000000U,
424     0x83098086U, 0x48322bedU, 0xac1e1170U, 0x4e6c5a72U,
425     0xfbfd0effU, 0x560f8538U, 0x1e3daed5U, 0x27362d39U,
426     0x640a0fd9U, 0x21685ca6U, 0xd19b5b54U, 0x3a24362eU,
427     0xb10c0a67U, 0x0f9357e7U, 0xd2b4ee96U, 0x9e1b9b91U,
428     0x4f80c0c5U, 0xa261dc20U, 0x695a774bU, 0x161c121aU,
429     0x0ae293baU, 0xe5c0a02aU, 0x433c22e0U, 0x1d121b17U,
430     0x0b0e090dU, 0xadf28bc7U, 0xb92db6a8U, 0xc8141ea9U,
431     0x8557f119U, 0x4caf7507U, 0xbbee99ddU, 0xfda37f60U,
432     0x9ff70126U, 0xbc5c72f5U, 0xc544663bU, 0x345bfb7eU,
433     0x768b4329U, 0xdccb23c6U, 0x68b6edfcU, 0x63b8e4f1U,
434     0xcad731dcU, 0x10426385U, 0x40139722U, 0x2084c611U,
435     0x7d854a24U, 0xf8d2bb3dU, 0x11aef932U, 0x6dc729a1U,
436     0x4b1d9e2fU, 0xf3dcb230U, 0xec0d8652U, 0xd077c1e3U,
437     0x6c2bb316U, 0x99a970b9U, 0xfa119448U, 0x2247e964U,
438     0xc4a8fc8cU, 0x1aa0f03fU, 0xd8567d2cU, 0xef223390U,
439     0xc787494eU, 0xc1d938d1U, 0xfe8ccaa2U, 0x3698d40bU,
440     0xcfa6f581U, 0x28a57adeU, 0x26dab78eU, 0xa43fadbfU,
441     0xe42c3a9dU, 0x0d507892U, 0x9b6a5fccU, 0x62547e46U,
442     0xc2f68d13U, 0xe890d8b8U, 0x5e2e39f7U, 0xf582c3afU,
443     0xbe9f5d80U, 0x7c69d093U, 0xa96fd52dU, 0xb3cf2512U,
444     0x3bc8ac99U, 0xa710187dU, 0x6ee89c63U, 0x7bdb3bbbU,
445     0x09cd2678U, 0xf46e5918U, 0x01ec9ab7U, 0xa8834f9aU,
446     0x65e6956eU, 0x7eaaffe6U, 0x0821bccfU, 0xe6ef15e8U,
447     0xd9bae79bU, 0xce4a6f36U, 0xd4ea9f09U, 0xd629b07cU,
448     0xaf31a4b2U, 0x312a3f23U, 0x30c6a594U, 0xc035a266U,
449     0x37744ebcU, 0xa6fc82caU, 0xb0e090d0U, 0x1533a7d8U,
450     0x4af10498U, 0xf741ecdaU, 0x0e7fcd50U, 0x2f1791f6U,
451     0x8d764dd6U, 0x4d43efb0U, 0x54ccaa4dU, 0xdfe49604U,
452     0xe39ed1b5U, 0x1b4c6a88U, 0xb8c12c1fU, 0x7f466551U,
453     0x049d5eeaU, 0x5d018c35U, 0x73fa8774U, 0x2efb0b41U,
454     0x5ab3671dU, 0x5292dbd2U, 0x33e91056U, 0x136dd647U,
455     0x8c9ad761U, 0x7a37a10cU, 0x8e59f814U, 0x89eb133cU,
456     0xeecea927U, 0x35b761c9U, 0xede11ce5U, 0x3c7a47b1U,
457     0x599cd2dfU, 0x3f55f273U, 0x791814ceU, 0xbf73c737U,
458     0xea53f7cdU, 0x5b5ffdaaU, 0x14df3d6fU, 0x867844dbU,
459     0x81caaff3U, 0x3eb968c4U, 0x2c382434U, 0x5fc2a340U,
460     0x72161dc3U, 0x0cbce225U, 0x8b283c49U, 0x41ff0d95U,
461     0x7139a801U, 0xde080cb3U, 0x9cd8b4e4U, 0x906456c1U,
462     0x617bcb84U, 0x70d532b6U, 0x74486c5cU, 0x42d0b857U,
463 };
/*
 * Td2: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Td2[x] = Si[x].[0d, 0b, 0e, 09].
 * Each word is the matching Td0 word rotated right by 16 bits
 * (e.g. Td0[0] = 0x51f4a750, Td2[0] = 0xa75051f4).
 */
464 static const u32 Td2[256] = {
465     0xa75051f4U, 0x65537e41U, 0xa4c31a17U, 0x5e963a27U,
466     0x6bcb3babU, 0x45f11f9dU, 0x58abacfaU, 0x03934be3U,
467     0xfa552030U, 0x6df6ad76U, 0x769188ccU, 0x4c25f502U,
468     0xd7fc4fe5U, 0xcbd7c52aU, 0x44802635U, 0xa38fb562U,
469     0x5a49deb1U, 0x1b6725baU, 0x0e9845eaU, 0xc0e15dfeU,
470     0x7502c32fU, 0xf012814cU, 0x97a38d46U, 0xf9c66bd3U,
471     0x5fe7038fU, 0x9c951592U, 0x7aebbf6dU, 0x59da9552U,
472     0x832dd4beU, 0x21d35874U, 0x692949e0U, 0xc8448ec9U,
473     0x896a75c2U, 0x7978f48eU, 0x3e6b9958U, 0x71dd27b9U,
474     0x4fb6bee1U, 0xad17f088U, 0xac66c920U, 0x3ab47dceU,
475     0x4a1863dfU, 0x3182e51aU, 0x33609751U, 0x7f456253U,
476     0x77e0b164U, 0xae84bb6bU, 0xa01cfe81U, 0x2b94f908U,
477     0x68587048U, 0xfd198f45U, 0x6c8794deU, 0xf8b7527bU,
478     0xd323ab73U, 0x02e2724bU, 0x8f57e31fU, 0xab2a6655U,
479     0x2807b2ebU, 0xc2032fb5U, 0x7b9a86c5U, 0x08a5d337U,
480     0x87f23028U, 0xa5b223bfU, 0x6aba0203U, 0x825ced16U,
481     0x1c2b8acfU, 0xb492a779U, 0xf2f0f307U, 0xe2a14e69U,
482     0xf4cd65daU, 0xbed50605U, 0x621fd134U, 0xfe8ac4a6U,
483     0x539d342eU, 0x55a0a2f3U, 0xe132058aU, 0xeb75a4f6U,
484     0xec390b83U, 0xefaa4060U, 0x9f065e71U, 0x1051bd6eU,
485     0x8af93e21U, 0x063d96ddU, 0x05aedd3eU, 0xbd464de6U,
486     0x8db59154U, 0x5d0571c4U, 0xd46f0406U, 0x15ff6050U,
487     0xfb241998U, 0xe997d6bdU, 0x43cc8940U, 0x9e7767d9U,
488     0x42bdb0e8U, 0x8b880789U, 0x5b38e719U, 0xeedb79c8U,
489     0x0a47a17cU, 0x0fe97c42U, 0x1ec9f884U, 0x00000000U,
490     0x86830980U, 0xed48322bU, 0x70ac1e11U, 0x724e6c5aU,
491     0xfffbfd0eU, 0x38560f85U, 0xd51e3daeU, 0x3927362dU,
492     0xd9640a0fU, 0xa621685cU, 0x54d19b5bU, 0x2e3a2436U,
493     0x67b10c0aU, 0xe70f9357U, 0x96d2b4eeU, 0x919e1b9bU,
494     0xc54f80c0U, 0x20a261dcU, 0x4b695a77U, 0x1a161c12U,
495     0xba0ae293U, 0x2ae5c0a0U, 0xe0433c22U, 0x171d121bU,
496     0x0d0b0e09U, 0xc7adf28bU, 0xa8b92db6U, 0xa9c8141eU,
497     0x198557f1U, 0x074caf75U, 0xddbbee99U, 0x60fda37fU,
498     0x269ff701U, 0xf5bc5c72U, 0x3bc54466U, 0x7e345bfbU,
499     0x29768b43U, 0xc6dccb23U, 0xfc68b6edU, 0xf163b8e4U,
500     0xdccad731U, 0x85104263U, 0x22401397U, 0x112084c6U,
501     0x247d854aU, 0x3df8d2bbU, 0x3211aef9U, 0xa16dc729U,
502     0x2f4b1d9eU, 0x30f3dcb2U, 0x52ec0d86U, 0xe3d077c1U,
503     0x166c2bb3U, 0xb999a970U, 0x48fa1194U, 0x642247e9U,
504     0x8cc4a8fcU, 0x3f1aa0f0U, 0x2cd8567dU, 0x90ef2233U,
505     0x4ec78749U, 0xd1c1d938U, 0xa2fe8ccaU, 0x0b3698d4U,
506     0x81cfa6f5U, 0xde28a57aU, 0x8e26dab7U, 0xbfa43fadU,
507     0x9de42c3aU, 0x920d5078U, 0xcc9b6a5fU, 0x4662547eU,
508     0x13c2f68dU, 0xb8e890d8U, 0xf75e2e39U, 0xaff582c3U,
509     0x80be9f5dU, 0x937c69d0U, 0x2da96fd5U, 0x12b3cf25U,
510     0x993bc8acU, 0x7da71018U, 0x636ee89cU, 0xbb7bdb3bU,
511     0x7809cd26U, 0x18f46e59U, 0xb701ec9aU, 0x9aa8834fU,
512     0x6e65e695U, 0xe67eaaffU, 0xcf0821bcU, 0xe8e6ef15U,
513     0x9bd9bae7U, 0x36ce4a6fU, 0x09d4ea9fU, 0x7cd629b0U,
514     0xb2af31a4U, 0x23312a3fU, 0x9430c6a5U, 0x66c035a2U,
515     0xbc37744eU, 0xcaa6fc82U, 0xd0b0e090U, 0xd81533a7U,
516     0x984af104U, 0xdaf741ecU, 0x500e7fcdU, 0xf62f1791U,
517     0xd68d764dU, 0xb04d43efU, 0x4d54ccaaU, 0x04dfe496U,
518     0xb5e39ed1U, 0x881b4c6aU, 0x1fb8c12cU, 0x517f4665U,
519     0xea049d5eU, 0x355d018cU, 0x7473fa87U, 0x412efb0bU,
520     0x1d5ab367U, 0xd25292dbU, 0x5633e910U, 0x47136dd6U,
521     0x618c9ad7U, 0x0c7a37a1U, 0x148e59f8U, 0x3c89eb13U,
522     0x27eecea9U, 0xc935b761U, 0xe5ede11cU, 0xb13c7a47U,
523     0xdf599cd2U, 0x733f55f2U, 0xce791814U, 0x37bf73c7U,
524     0xcdea53f7U, 0xaa5b5ffdU, 0x6f14df3dU, 0xdb867844U,
525     0xf381caafU, 0xc43eb968U, 0x342c3824U, 0x405fc2a3U,
526     0xc372161dU, 0x250cbce2U, 0x498b283cU, 0x9541ff0dU,
527     0x017139a8U, 0xb3de080cU, 0xe49cd8b4U, 0xc1906456U,
528     0x84617bcbU, 0xb670d532U, 0x5c74486cU, 0x5742d0b8U,
529 };
/*
 * Td3: 256-entry table of 32-bit words, indexed by a byte value x.
 * Per the formula list at the top of this #ifndef AES_ASM section,
 * Td3[x] = Si[x].[09, 0d, 0b, 0e].
 * Each word is the matching Td0 word rotated right by 24 bits
 * (e.g. Td0[0] = 0x51f4a750, Td3[0] = 0xf4a75051).
 */
530 static const u32 Td3[256] = {
531     0xf4a75051U, 0x4165537eU, 0x17a4c31aU, 0x275e963aU,
532     0xab6bcb3bU, 0x9d45f11fU, 0xfa58abacU, 0xe303934bU,
533     0x30fa5520U, 0x766df6adU, 0xcc769188U, 0x024c25f5U,
534     0xe5d7fc4fU, 0x2acbd7c5U, 0x35448026U, 0x62a38fb5U,
535     0xb15a49deU, 0xba1b6725U, 0xea0e9845U, 0xfec0e15dU,
536     0x2f7502c3U, 0x4cf01281U, 0x4697a38dU, 0xd3f9c66bU,
537     0x8f5fe703U, 0x929c9515U, 0x6d7aebbfU, 0x5259da95U,
538     0xbe832dd4U, 0x7421d358U, 0xe0692949U, 0xc9c8448eU,
539     0xc2896a75U, 0x8e7978f4U, 0x583e6b99U, 0xb971dd27U,
540     0xe14fb6beU, 0x88ad17f0U, 0x20ac66c9U, 0xce3ab47dU,
541     0xdf4a1863U, 0x1a3182e5U, 0x51336097U, 0x537f4562U,
542     0x6477e0b1U, 0x6bae84bbU, 0x81a01cfeU, 0x082b94f9U,
543     0x48685870U, 0x45fd198fU, 0xde6c8794U, 0x7bf8b752U,
544     0x73d323abU, 0x4b02e272U, 0x1f8f57e3U, 0x55ab2a66U,
545     0xeb2807b2U, 0xb5c2032fU, 0xc57b9a86U, 0x3708a5d3U,
546     0x2887f230U, 0xbfa5b223U, 0x036aba02U, 0x16825cedU,
547     0xcf1c2b8aU, 0x79b492a7U, 0x07f2f0f3U, 0x69e2a14eU,
548     0xdaf4cd65U, 0x05bed506U, 0x34621fd1U, 0xa6fe8ac4U,
549     0x2e539d34U, 0xf355a0a2U, 0x8ae13205U, 0xf6eb75a4U,
550     0x83ec390bU, 0x60efaa40U, 0x719f065eU, 0x6e1051bdU,
551     0x218af93eU, 0xdd063d96U, 0x3e05aeddU, 0xe6bd464dU,
552     0x548db591U, 0xc45d0571U, 0x06d46f04U, 0x5015ff60U,
553     0x98fb2419U, 0xbde997d6U, 0x4043cc89U, 0xd99e7767U,
554     0xe842bdb0U, 0x898b8807U, 0x195b38e7U, 0xc8eedb79U,
555     0x7c0a47a1U, 0x420fe97cU, 0x841ec9f8U, 0x00000000U,
556     0x80868309U, 0x2bed4832U, 0x1170ac1eU, 0x5a724e6cU,
557     0x0efffbfdU, 0x8538560fU, 0xaed51e3dU, 0x2d392736U,
558     0x0fd9640aU, 0x5ca62168U, 0x5b54d19bU, 0x362e3a24U,
559     0x0a67b10cU, 0x57e70f93U, 0xee96d2b4U, 0x9b919e1bU,
560     0xc0c54f80U, 0xdc20a261U, 0x774b695aU, 0x121a161cU,
561     0x93ba0ae2U, 0xa02ae5c0U, 0x22e0433cU, 0x1b171d12U,
562     0x090d0b0eU, 0x8bc7adf2U, 0xb6a8b92dU, 0x1ea9c814U,
563     0xf1198557U, 0x75074cafU, 0x99ddbbeeU, 0x7f60fda3U,
564     0x01269ff7U, 0x72f5bc5cU, 0x663bc544U, 0xfb7e345bU,
565     0x4329768bU, 0x23c6dccbU, 0xedfc68b6U, 0xe4f163b8U,
566     0x31dccad7U, 0x63851042U, 0x97224013U, 0xc6112084U,
567     0x4a247d85U, 0xbb3df8d2U, 0xf93211aeU, 0x29a16dc7U,
568     0x9e2f4b1dU, 0xb230f3dcU, 0x8652ec0dU, 0xc1e3d077U,
569     0xb3166c2bU, 0x70b999a9U, 0x9448fa11U, 0xe9642247U,
570     0xfc8cc4a8U, 0xf03f1aa0U, 0x7d2cd856U, 0x3390ef22U,
571     0x494ec787U, 0x38d1c1d9U, 0xcaa2fe8cU, 0xd40b3698U,
572     0xf581cfa6U, 0x7ade28a5U, 0xb78e26daU, 0xadbfa43fU,
573     0x3a9de42cU, 0x78920d50U, 0x5fcc9b6aU, 0x7e466254U,
574     0x8d13c2f6U, 0xd8b8e890U, 0x39f75e2eU, 0xc3aff582U,
575     0x5d80be9fU, 0xd0937c69U, 0xd52da96fU, 0x2512b3cfU,
576     0xac993bc8U, 0x187da710U, 0x9c636ee8U, 0x3bbb7bdbU,
577     0x267809cdU, 0x5918f46eU, 0x9ab701ecU, 0x4f9aa883U,
578     0x956e65e6U, 0xffe67eaaU, 0xbccf0821U, 0x15e8e6efU,
579     0xe79bd9baU, 0x6f36ce4aU, 0x9f09d4eaU, 0xb07cd629U,
580     0xa4b2af31U, 0x3f23312aU, 0xa59430c6U, 0xa266c035U,
581     0x4ebc3774U, 0x82caa6fcU, 0x90d0b0e0U, 0xa7d81533U,
582     0x04984af1U, 0xecdaf741U, 0xcd500e7fU, 0x91f62f17U,
583     0x4dd68d76U, 0xefb04d43U, 0xaa4d54ccU, 0x9604dfe4U,
584     0xd1b5e39eU, 0x6a881b4cU, 0x2c1fb8c1U, 0x65517f46U,
585     0x5eea049dU, 0x8c355d01U, 0x877473faU, 0x0b412efbU,
586     0x671d5ab3U, 0xdbd25292U, 0x105633e9U, 0xd647136dU,
587     0xd7618c9aU, 0xa10c7a37U, 0xf8148e59U, 0x133c89ebU,
588     0xa927eeceU, 0x61c935b7U, 0x1ce5ede1U, 0x47b13c7aU,
589     0xd2df599cU, 0xf2733f55U, 0x14ce7918U, 0xc737bf73U,
590     0xf7cdea53U, 0xfdaa5b5fU, 0x3d6f14dfU, 0x44db8678U,
591     0xaff381caU, 0x68c43eb9U, 0x24342c38U, 0xa3405fc2U,
592     0x1dc37216U, 0xe2250cbcU, 0x3c498b28U, 0x0d9541ffU,
593     0xa8017139U, 0x0cb3de08U, 0xb4e49cd8U, 0x56c19064U,
594     0xcb84617bU, 0x32b670d5U, 0x6c5c7448U, 0xb85742d0U,
595 };
/*
 * Td4: the AES inverse S-box as a plain 256-entry byte table, indexed by the
 * byte to be substituted.  AES_decrypt() uses it in the last round, where
 * each output word is assembled from four substituted bytes shifted into
 * place.
 */
static const u8 Td4[256] = {
    0x52U, 0x09U, 0x6aU, 0xd5U, 0x30U, 0x36U, 0xa5U, 0x38U,
    0xbfU, 0x40U, 0xa3U, 0x9eU, 0x81U, 0xf3U, 0xd7U, 0xfbU,
    0x7cU, 0xe3U, 0x39U, 0x82U, 0x9bU, 0x2fU, 0xffU, 0x87U,
    0x34U, 0x8eU, 0x43U, 0x44U, 0xc4U, 0xdeU, 0xe9U, 0xcbU,
    0x54U, 0x7bU, 0x94U, 0x32U, 0xa6U, 0xc2U, 0x23U, 0x3dU,
    0xeeU, 0x4cU, 0x95U, 0x0bU, 0x42U, 0xfaU, 0xc3U, 0x4eU,
    0x08U, 0x2eU, 0xa1U, 0x66U, 0x28U, 0xd9U, 0x24U, 0xb2U,
    0x76U, 0x5bU, 0xa2U, 0x49U, 0x6dU, 0x8bU, 0xd1U, 0x25U,
    0x72U, 0xf8U, 0xf6U, 0x64U, 0x86U, 0x68U, 0x98U, 0x16U,
    0xd4U, 0xa4U, 0x5cU, 0xccU, 0x5dU, 0x65U, 0xb6U, 0x92U,
    0x6cU, 0x70U, 0x48U, 0x50U, 0xfdU, 0xedU, 0xb9U, 0xdaU,
    0x5eU, 0x15U, 0x46U, 0x57U, 0xa7U, 0x8dU, 0x9dU, 0x84U,
    0x90U, 0xd8U, 0xabU, 0x00U, 0x8cU, 0xbcU, 0xd3U, 0x0aU,
    0xf7U, 0xe4U, 0x58U, 0x05U, 0xb8U, 0xb3U, 0x45U, 0x06U,
    0xd0U, 0x2cU, 0x1eU, 0x8fU, 0xcaU, 0x3fU, 0x0fU, 0x02U,
    0xc1U, 0xafU, 0xbdU, 0x03U, 0x01U, 0x13U, 0x8aU, 0x6bU,
    0x3aU, 0x91U, 0x11U, 0x41U, 0x4fU, 0x67U, 0xdcU, 0xeaU,
    0x97U, 0xf2U, 0xcfU, 0xceU, 0xf0U, 0xb4U, 0xe6U, 0x73U,
    0x96U, 0xacU, 0x74U, 0x22U, 0xe7U, 0xadU, 0x35U, 0x85U,
    0xe2U, 0xf9U, 0x37U, 0xe8U, 0x1cU, 0x75U, 0xdfU, 0x6eU,
    0x47U, 0xf1U, 0x1aU, 0x71U, 0x1dU, 0x29U, 0xc5U, 0x89U,
    0x6fU, 0xb7U, 0x62U, 0x0eU, 0xaaU, 0x18U, 0xbeU, 0x1bU,
    0xfcU, 0x56U, 0x3eU, 0x4bU, 0xc6U, 0xd2U, 0x79U, 0x20U,
    0x9aU, 0xdbU, 0xc0U, 0xfeU, 0x78U, 0xcdU, 0x5aU, 0xf4U,
    0x1fU, 0xddU, 0xa8U, 0x33U, 0x88U, 0x07U, 0xc7U, 0x31U,
    0xb1U, 0x12U, 0x10U, 0x59U, 0x27U, 0x80U, 0xecU, 0x5fU,
    0x60U, 0x51U, 0x7fU, 0xa9U, 0x19U, 0xb5U, 0x4aU, 0x0dU,
    0x2dU, 0xe5U, 0x7aU, 0x9fU, 0x93U, 0xc9U, 0x9cU, 0xefU,
    0xa0U, 0xe0U, 0x3bU, 0x4dU, 0xaeU, 0x2aU, 0xf5U, 0xb0U,
    0xc8U, 0xebU, 0xbbU, 0x3cU, 0x83U, 0x53U, 0x99U, 0x61U,
    0x17U, 0x2bU, 0x04U, 0x7eU, 0xbaU, 0x77U, 0xd6U, 0x26U,
    0xe1U, 0x69U, 0x14U, 0x63U, 0x55U, 0x21U, 0x0cU, 0x7dU,
};
630 static const u32 rcon[] = {
631     0x01000000, 0x02000000, 0x04000000, 0x08000000,
632     0x10000000, 0x20000000, 0x40000000, 0x80000000,
633     0x1B000000, 0x36000000, /* for 128-bit blocks, Rijndael never uses more than 10 rcon values */
634 };
635
636 /**
637  * Expand the cipher key into the encryption key schedule.
638  */
639 int AES_set_encrypt_key(const unsigned char *userKey, const int bits,
640                         AES_KEY *key)
641 {
642
643     u32 *rk;
644     int i = 0;
645     u32 temp;
646
647     if (!userKey || !key)
648         return -1;
649     if (bits != 128 && bits != 192 && bits != 256)
650         return -2;
651
652     rk = key->rd_key;
653
654     if (bits == 128)
655         key->rounds = 10;
656     else if (bits == 192)
657         key->rounds = 12;
658     else
659         key->rounds = 14;
660
661     rk[0] = GETU32(userKey     );
662     rk[1] = GETU32(userKey +  4);
663     rk[2] = GETU32(userKey +  8);
664     rk[3] = GETU32(userKey + 12);
665     if (bits == 128) {
666         while (1) {
667             temp  = rk[3];
668             rk[4] = rk[0] ^
669                 (Te2[(temp >> 16) & 0xff] & 0xff000000) ^
670                 (Te3[(temp >>  8) & 0xff] & 0x00ff0000) ^
671                 (Te0[(temp      ) & 0xff] & 0x0000ff00) ^
672                 (Te1[(temp >> 24)       ] & 0x000000ff) ^
673                 rcon[i];
674             rk[5] = rk[1] ^ rk[4];
675             rk[6] = rk[2] ^ rk[5];
676             rk[7] = rk[3] ^ rk[6];
677             if (++i == 10) {
678                 return 0;
679             }
680             rk += 4;
681         }
682     }
683     rk[4] = GETU32(userKey + 16);
684     rk[5] = GETU32(userKey + 20);
685     if (bits == 192) {
686         while (1) {
687             temp = rk[ 5];
688             rk[ 6] = rk[ 0] ^
689                 (Te2[(temp >> 16) & 0xff] & 0xff000000) ^
690                 (Te3[(temp >>  8) & 0xff] & 0x00ff0000) ^
691                 (Te0[(temp      ) & 0xff] & 0x0000ff00) ^
692                 (Te1[(temp >> 24)       ] & 0x000000ff) ^
693                 rcon[i];
694             rk[ 7] = rk[ 1] ^ rk[ 6];
695             rk[ 8] = rk[ 2] ^ rk[ 7];
696             rk[ 9] = rk[ 3] ^ rk[ 8];
697             if (++i == 8) {
698                 return 0;
699             }
700             rk[10] = rk[ 4] ^ rk[ 9];
701             rk[11] = rk[ 5] ^ rk[10];
702             rk += 6;
703         }
704     }
705     rk[6] = GETU32(userKey + 24);
706     rk[7] = GETU32(userKey + 28);
707     if (bits == 256) {
708         while (1) {
709             temp = rk[ 7];
710             rk[ 8] = rk[ 0] ^
711                 (Te2[(temp >> 16) & 0xff] & 0xff000000) ^
712                 (Te3[(temp >>  8) & 0xff] & 0x00ff0000) ^
713                 (Te0[(temp      ) & 0xff] & 0x0000ff00) ^
714                 (Te1[(temp >> 24)       ] & 0x000000ff) ^
715                 rcon[i];
716             rk[ 9] = rk[ 1] ^ rk[ 8];
717             rk[10] = rk[ 2] ^ rk[ 9];
718             rk[11] = rk[ 3] ^ rk[10];
719             if (++i == 7) {
720                 return 0;
721             }
722             temp = rk[11];
723             rk[12] = rk[ 4] ^
724                 (Te2[(temp >> 24)       ] & 0xff000000) ^
725                 (Te3[(temp >> 16) & 0xff] & 0x00ff0000) ^
726                 (Te0[(temp >>  8) & 0xff] & 0x0000ff00) ^
727                 (Te1[(temp      ) & 0xff] & 0x000000ff);
728             rk[13] = rk[ 5] ^ rk[12];
729             rk[14] = rk[ 6] ^ rk[13];
730             rk[15] = rk[ 7] ^ rk[14];
731
732             rk += 8;
733             }
734     }
735     return 0;
736 }
737
738 /**
739  * Expand the cipher key into the decryption key schedule.
740  */
741 int AES_set_decrypt_key(const unsigned char *userKey, const int bits,
742                         AES_KEY *key)
743 {
744
745     u32 *rk;
746     int i, j, status;
747     u32 temp;
748
749     /* first, start with an encryption schedule */
750     status = AES_set_encrypt_key(userKey, bits, key);
751     if (status < 0)
752         return status;
753
754     rk = key->rd_key;
755
756     /* invert the order of the round keys: */
757     for (i = 0, j = 4*(key->rounds); i < j; i += 4, j -= 4) {
758         temp = rk[i    ]; rk[i    ] = rk[j    ]; rk[j    ] = temp;
759         temp = rk[i + 1]; rk[i + 1] = rk[j + 1]; rk[j + 1] = temp;
760         temp = rk[i + 2]; rk[i + 2] = rk[j + 2]; rk[j + 2] = temp;
761         temp = rk[i + 3]; rk[i + 3] = rk[j + 3]; rk[j + 3] = temp;
762     }
763     /* apply the inverse MixColumn transform to all round keys but the first and the last: */
764     for (i = 1; i < (key->rounds); i++) {
765         rk += 4;
766         rk[0] =
767             Td0[Te1[(rk[0] >> 24)       ] & 0xff] ^
768             Td1[Te1[(rk[0] >> 16) & 0xff] & 0xff] ^
769             Td2[Te1[(rk[0] >>  8) & 0xff] & 0xff] ^
770             Td3[Te1[(rk[0]      ) & 0xff] & 0xff];
771         rk[1] =
772             Td0[Te1[(rk[1] >> 24)       ] & 0xff] ^
773             Td1[Te1[(rk[1] >> 16) & 0xff] & 0xff] ^
774             Td2[Te1[(rk[1] >>  8) & 0xff] & 0xff] ^
775             Td3[Te1[(rk[1]      ) & 0xff] & 0xff];
776         rk[2] =
777             Td0[Te1[(rk[2] >> 24)       ] & 0xff] ^
778             Td1[Te1[(rk[2] >> 16) & 0xff] & 0xff] ^
779             Td2[Te1[(rk[2] >>  8) & 0xff] & 0xff] ^
780             Td3[Te1[(rk[2]      ) & 0xff] & 0xff];
781         rk[3] =
782             Td0[Te1[(rk[3] >> 24)       ] & 0xff] ^
783             Td1[Te1[(rk[3] >> 16) & 0xff] & 0xff] ^
784             Td2[Te1[(rk[3] >>  8) & 0xff] & 0xff] ^
785             Td3[Te1[(rk[3]      ) & 0xff] & 0xff];
786     }
787     return 0;
788 }
789
790 /*
791  * Encrypt a single block
792  * in and out can overlap
793  */
794 void AES_encrypt(const unsigned char *in, unsigned char *out,
795                  const AES_KEY *key) {
796
797     const u32 *rk;
798     u32 s0, s1, s2, s3, t0, t1, t2, t3;
799 #ifndef FULL_UNROLL
800     int r;
801 #endif /* ?FULL_UNROLL */
802
803     assert(in && out && key);
804     rk = key->rd_key;
805
806     /*
807      * map byte array block to cipher state
808      * and add initial round key:
809      */
810     s0 = GETU32(in     ) ^ rk[0];
811     s1 = GETU32(in +  4) ^ rk[1];
812     s2 = GETU32(in +  8) ^ rk[2];
813     s3 = GETU32(in + 12) ^ rk[3];
814 #ifdef FULL_UNROLL
815     /* round 1: */
816     t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[ 4];
817     t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[ 5];
818     t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[ 6];
819     t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[ 7];
820     /* round 2: */
821     s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[ 8];
822     s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[ 9];
823     s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[10];
824     s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[11];
825     /* round 3: */
826     t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[12];
827     t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[13];
828     t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[14];
829     t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[15];
830     /* round 4: */
831     s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[16];
832     s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[17];
833     s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[18];
834     s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[19];
835     /* round 5: */
836     t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[20];
837     t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[21];
838     t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[22];
839     t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[23];
840     /* round 6: */
841     s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[24];
842     s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[25];
843     s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[26];
844     s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[27];
845     /* round 7: */
846     t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[28];
847     t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[29];
848     t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[30];
849     t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[31];
850     /* round 8: */
851     s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[32];
852     s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[33];
853     s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[34];
854     s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[35];
855     /* round 9: */
856     t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[36];
857     t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[37];
858     t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[38];
859     t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[39];
860     if (key->rounds > 10) {
861         /* round 10: */
862         s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[40];
863         s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[41];
864         s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[42];
865         s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[43];
866         /* round 11: */
867         t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[44];
868         t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[45];
869         t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[46];
870         t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[47];
871         if (key->rounds > 12) {
872             /* round 12: */
873             s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[48];
874             s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[49];
875             s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[50];
876             s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[51];
877             /* round 13: */
878             t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[52];
879             t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[53];
880             t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[54];
881             t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[55];
882         }
883     }
884     rk += key->rounds << 2;
885 #else  /* !FULL_UNROLL */
886     /*
887      * Nr - 1 full rounds:
888      */
889     r = key->rounds >> 1;
890     for (;;) {
891         t0 =
892             Te0[(s0 >> 24)       ] ^
893             Te1[(s1 >> 16) & 0xff] ^
894             Te2[(s2 >>  8) & 0xff] ^
895             Te3[(s3      ) & 0xff] ^
896             rk[4];
897         t1 =
898             Te0[(s1 >> 24)       ] ^
899             Te1[(s2 >> 16) & 0xff] ^
900             Te2[(s3 >>  8) & 0xff] ^
901             Te3[(s0      ) & 0xff] ^
902             rk[5];
903         t2 =
904             Te0[(s2 >> 24)       ] ^
905             Te1[(s3 >> 16) & 0xff] ^
906             Te2[(s0 >>  8) & 0xff] ^
907             Te3[(s1      ) & 0xff] ^
908             rk[6];
909         t3 =
910             Te0[(s3 >> 24)       ] ^
911             Te1[(s0 >> 16) & 0xff] ^
912             Te2[(s1 >>  8) & 0xff] ^
913             Te3[(s2      ) & 0xff] ^
914             rk[7];
915
916         rk += 8;
917         if (--r == 0) {
918             break;
919         }
920
921         s0 =
922             Te0[(t0 >> 24)       ] ^
923             Te1[(t1 >> 16) & 0xff] ^
924             Te2[(t2 >>  8) & 0xff] ^
925             Te3[(t3      ) & 0xff] ^
926             rk[0];
927         s1 =
928             Te0[(t1 >> 24)       ] ^
929             Te1[(t2 >> 16) & 0xff] ^
930             Te2[(t3 >>  8) & 0xff] ^
931             Te3[(t0      ) & 0xff] ^
932             rk[1];
933         s2 =
934             Te0[(t2 >> 24)       ] ^
935             Te1[(t3 >> 16) & 0xff] ^
936             Te2[(t0 >>  8) & 0xff] ^
937             Te3[(t1      ) & 0xff] ^
938             rk[2];
939         s3 =
940             Te0[(t3 >> 24)       ] ^
941             Te1[(t0 >> 16) & 0xff] ^
942             Te2[(t1 >>  8) & 0xff] ^
943             Te3[(t2      ) & 0xff] ^
944             rk[3];
945     }
946 #endif /* ?FULL_UNROLL */
947     /*
948      * apply last round and
949      * map cipher state to byte array block:
950      */
951     s0 =
952         (Te2[(t0 >> 24)       ] & 0xff000000) ^
953         (Te3[(t1 >> 16) & 0xff] & 0x00ff0000) ^
954         (Te0[(t2 >>  8) & 0xff] & 0x0000ff00) ^
955         (Te1[(t3      ) & 0xff] & 0x000000ff) ^
956         rk[0];
957     PUTU32(out     , s0);
958     s1 =
959         (Te2[(t1 >> 24)       ] & 0xff000000) ^
960         (Te3[(t2 >> 16) & 0xff] & 0x00ff0000) ^
961         (Te0[(t3 >>  8) & 0xff] & 0x0000ff00) ^
962         (Te1[(t0      ) & 0xff] & 0x000000ff) ^
963         rk[1];
964     PUTU32(out +  4, s1);
965     s2 =
966         (Te2[(t2 >> 24)       ] & 0xff000000) ^
967         (Te3[(t3 >> 16) & 0xff] & 0x00ff0000) ^
968         (Te0[(t0 >>  8) & 0xff] & 0x0000ff00) ^
969         (Te1[(t1      ) & 0xff] & 0x000000ff) ^
970         rk[2];
971     PUTU32(out +  8, s2);
972     s3 =
973         (Te2[(t3 >> 24)       ] & 0xff000000) ^
974         (Te3[(t0 >> 16) & 0xff] & 0x00ff0000) ^
975         (Te0[(t1 >>  8) & 0xff] & 0x0000ff00) ^
976         (Te1[(t2      ) & 0xff] & 0x000000ff) ^
977         rk[3];
978     PUTU32(out + 12, s3);
979 }
980
981 /*
982  * Decrypt a single block
983  * in and out can overlap
984  */
985 void AES_decrypt(const unsigned char *in, unsigned char *out,
986                  const AES_KEY *key)
987 {
988
989     const u32 *rk;
990     u32 s0, s1, s2, s3, t0, t1, t2, t3;
991 #ifndef FULL_UNROLL
992     int r;
993 #endif /* ?FULL_UNROLL */
994
995     assert(in && out && key);
996     rk = key->rd_key;
997
998     /*
999      * map byte array block to cipher state
1000      * and add initial round key:
1001      */
1002     s0 = GETU32(in     ) ^ rk[0];
1003     s1 = GETU32(in +  4) ^ rk[1];
1004     s2 = GETU32(in +  8) ^ rk[2];
1005     s3 = GETU32(in + 12) ^ rk[3];
1006 #ifdef FULL_UNROLL
1007     /* round 1: */
1008     t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[ 4];
1009     t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[ 5];
1010     t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[ 6];
1011     t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[ 7];
1012     /* round 2: */
1013     s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[ 8];
1014     s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[ 9];
1015     s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[10];
1016     s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[11];
1017     /* round 3: */
1018     t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[12];
1019     t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[13];
1020     t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[14];
1021     t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[15];
1022     /* round 4: */
1023     s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[16];
1024     s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[17];
1025     s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[18];
1026     s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[19];
1027     /* round 5: */
1028     t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[20];
1029     t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[21];
1030     t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[22];
1031     t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[23];
1032     /* round 6: */
1033     s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[24];
1034     s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[25];
1035     s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[26];
1036     s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[27];
1037     /* round 7: */
1038     t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[28];
1039     t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[29];
1040     t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[30];
1041     t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[31];
1042     /* round 8: */
1043     s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[32];
1044     s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[33];
1045     s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[34];
1046     s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[35];
1047     /* round 9: */
1048     t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[36];
1049     t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[37];
1050     t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[38];
1051     t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[39];
1052     if (key->rounds > 10) {
1053         /* round 10: */
1054         s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[40];
1055         s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[41];
1056         s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[42];
1057         s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[43];
1058         /* round 11: */
1059         t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[44];
1060         t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[45];
1061         t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[46];
1062         t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[47];
1063         if (key->rounds > 12) {
1064             /* round 12: */
1065             s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[48];
1066             s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[49];
1067             s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[50];
1068             s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[51];
1069             /* round 13: */
1070             t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[52];
1071             t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[53];
1072             t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[54];
1073             t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[55];
1074         }
1075     }
1076     rk += key->rounds << 2;
1077 #else  /* !FULL_UNROLL */
1078     /*
1079      * Nr - 1 full rounds:
1080      */
1081     r = key->rounds >> 1;
1082     for (;;) {
1083         t0 =
1084             Td0[(s0 >> 24)       ] ^
1085             Td1[(s3 >> 16) & 0xff] ^
1086             Td2[(s2 >>  8) & 0xff] ^
1087             Td3[(s1      ) & 0xff] ^
1088             rk[4];
1089         t1 =
1090             Td0[(s1 >> 24)       ] ^
1091             Td1[(s0 >> 16) & 0xff] ^
1092             Td2[(s3 >>  8) & 0xff] ^
1093             Td3[(s2      ) & 0xff] ^
1094             rk[5];
1095         t2 =
1096             Td0[(s2 >> 24)       ] ^
1097             Td1[(s1 >> 16) & 0xff] ^
1098             Td2[(s0 >>  8) & 0xff] ^
1099             Td3[(s3      ) & 0xff] ^
1100             rk[6];
1101         t3 =
1102             Td0[(s3 >> 24)       ] ^
1103             Td1[(s2 >> 16) & 0xff] ^
1104             Td2[(s1 >>  8) & 0xff] ^
1105             Td3[(s0      ) & 0xff] ^
1106             rk[7];
1107
1108         rk += 8;
1109         if (--r == 0) {
1110             break;
1111         }
1112
1113         s0 =
1114             Td0[(t0 >> 24)       ] ^
1115             Td1[(t3 >> 16) & 0xff] ^
1116             Td2[(t2 >>  8) & 0xff] ^
1117             Td3[(t1      ) & 0xff] ^
1118             rk[0];
1119         s1 =
1120             Td0[(t1 >> 24)       ] ^
1121             Td1[(t0 >> 16) & 0xff] ^
1122             Td2[(t3 >>  8) & 0xff] ^
1123             Td3[(t2      ) & 0xff] ^
1124             rk[1];
1125         s2 =
1126             Td0[(t2 >> 24)       ] ^
1127             Td1[(t1 >> 16) & 0xff] ^
1128             Td2[(t0 >>  8) & 0xff] ^
1129             Td3[(t3      ) & 0xff] ^
1130             rk[2];
1131         s3 =
1132             Td0[(t3 >> 24)       ] ^
1133             Td1[(t2 >> 16) & 0xff] ^
1134             Td2[(t1 >>  8) & 0xff] ^
1135             Td3[(t0      ) & 0xff] ^
1136             rk[3];
1137     }
1138 #endif /* ?FULL_UNROLL */
1139     /*
1140      * apply last round and
1141      * map cipher state to byte array block:
1142      */
1143     s0 =
1144         ((u32)Td4[(t0 >> 24)       ] << 24) ^
1145         ((u32)Td4[(t3 >> 16) & 0xff] << 16) ^
1146         ((u32)Td4[(t2 >>  8) & 0xff] <<  8) ^
1147         ((u32)Td4[(t1      ) & 0xff])       ^
1148         rk[0];
1149     PUTU32(out     , s0);
1150     s1 =
1151         ((u32)Td4[(t1 >> 24)       ] << 24) ^
1152         ((u32)Td4[(t0 >> 16) & 0xff] << 16) ^
1153         ((u32)Td4[(t3 >>  8) & 0xff] <<  8) ^
1154         ((u32)Td4[(t2      ) & 0xff])       ^
1155         rk[1];
1156     PUTU32(out +  4, s1);
1157     s2 =
1158         ((u32)Td4[(t2 >> 24)       ] << 24) ^
1159         ((u32)Td4[(t1 >> 16) & 0xff] << 16) ^
1160         ((u32)Td4[(t0 >>  8) & 0xff] <<  8) ^
1161         ((u32)Td4[(t3      ) & 0xff])       ^
1162         rk[2];
1163     PUTU32(out +  8, s2);
1164     s3 =
1165         ((u32)Td4[(t3 >> 24)       ] << 24) ^
1166         ((u32)Td4[(t2 >> 16) & 0xff] << 16) ^
1167         ((u32)Td4[(t1 >>  8) & 0xff] <<  8) ^
1168         ((u32)Td4[(t0      ) & 0xff])       ^
1169         rk[3];
1170     PUTU32(out + 12, s3);
1171 }
1172
1173 #else /* AES_ASM */
1174
/*
 * Te4: the AES forward S-box as a plain 256-entry byte table, indexed by the
 * byte to be substituted.  In this (AES_ASM) branch the key expansion in
 * AES_set_encrypt_key() uses it for its byte substitutions.
 */
static const u8 Te4[256] = {
    0x63U, 0x7cU, 0x77U, 0x7bU, 0xf2U, 0x6bU, 0x6fU, 0xc5U,
    0x30U, 0x01U, 0x67U, 0x2bU, 0xfeU, 0xd7U, 0xabU, 0x76U,
    0xcaU, 0x82U, 0xc9U, 0x7dU, 0xfaU, 0x59U, 0x47U, 0xf0U,
    0xadU, 0xd4U, 0xa2U, 0xafU, 0x9cU, 0xa4U, 0x72U, 0xc0U,
    0xb7U, 0xfdU, 0x93U, 0x26U, 0x36U, 0x3fU, 0xf7U, 0xccU,
    0x34U, 0xa5U, 0xe5U, 0xf1U, 0x71U, 0xd8U, 0x31U, 0x15U,
    0x04U, 0xc7U, 0x23U, 0xc3U, 0x18U, 0x96U, 0x05U, 0x9aU,
    0x07U, 0x12U, 0x80U, 0xe2U, 0xebU, 0x27U, 0xb2U, 0x75U,
    0x09U, 0x83U, 0x2cU, 0x1aU, 0x1bU, 0x6eU, 0x5aU, 0xa0U,
    0x52U, 0x3bU, 0xd6U, 0xb3U, 0x29U, 0xe3U, 0x2fU, 0x84U,
    0x53U, 0xd1U, 0x00U, 0xedU, 0x20U, 0xfcU, 0xb1U, 0x5bU,
    0x6aU, 0xcbU, 0xbeU, 0x39U, 0x4aU, 0x4cU, 0x58U, 0xcfU,
    0xd0U, 0xefU, 0xaaU, 0xfbU, 0x43U, 0x4dU, 0x33U, 0x85U,
    0x45U, 0xf9U, 0x02U, 0x7fU, 0x50U, 0x3cU, 0x9fU, 0xa8U,
    0x51U, 0xa3U, 0x40U, 0x8fU, 0x92U, 0x9dU, 0x38U, 0xf5U,
    0xbcU, 0xb6U, 0xdaU, 0x21U, 0x10U, 0xffU, 0xf3U, 0xd2U,
    0xcdU, 0x0cU, 0x13U, 0xecU, 0x5fU, 0x97U, 0x44U, 0x17U,
    0xc4U, 0xa7U, 0x7eU, 0x3dU, 0x64U, 0x5dU, 0x19U, 0x73U,
    0x60U, 0x81U, 0x4fU, 0xdcU, 0x22U, 0x2aU, 0x90U, 0x88U,
    0x46U, 0xeeU, 0xb8U, 0x14U, 0xdeU, 0x5eU, 0x0bU, 0xdbU,
    0xe0U, 0x32U, 0x3aU, 0x0aU, 0x49U, 0x06U, 0x24U, 0x5cU,
    0xc2U, 0xd3U, 0xacU, 0x62U, 0x91U, 0x95U, 0xe4U, 0x79U,
    0xe7U, 0xc8U, 0x37U, 0x6dU, 0x8dU, 0xd5U, 0x4eU, 0xa9U,
    0x6cU, 0x56U, 0xf4U, 0xeaU, 0x65U, 0x7aU, 0xaeU, 0x08U,
    0xbaU, 0x78U, 0x25U, 0x2eU, 0x1cU, 0xa6U, 0xb4U, 0xc6U,
    0xe8U, 0xddU, 0x74U, 0x1fU, 0x4bU, 0xbdU, 0x8bU, 0x8aU,
    0x70U, 0x3eU, 0xb5U, 0x66U, 0x48U, 0x03U, 0xf6U, 0x0eU,
    0x61U, 0x35U, 0x57U, 0xb9U, 0x86U, 0xc1U, 0x1dU, 0x9eU,
    0xe1U, 0xf8U, 0x98U, 0x11U, 0x69U, 0xd9U, 0x8eU, 0x94U,
    0x9bU, 0x1eU, 0x87U, 0xe9U, 0xceU, 0x55U, 0x28U, 0xdfU,
    0x8cU, 0xa1U, 0x89U, 0x0dU, 0xbfU, 0xe6U, 0x42U, 0x68U,
    0x41U, 0x99U, 0x2dU, 0x0fU, 0xb0U, 0x54U, 0xbbU, 0x16U
};
1209 static const u32 rcon[] = {
1210     0x01000000, 0x02000000, 0x04000000, 0x08000000,
1211     0x10000000, 0x20000000, 0x40000000, 0x80000000,
1212     0x1B000000, 0x36000000, /* for 128-bit blocks, Rijndael never uses more than 10 rcon values */
1213 };
1214
1215 /**
1216  * Expand the cipher key into the encryption key schedule.
1217  */
1218 int AES_set_encrypt_key(const unsigned char *userKey, const int bits,
1219                         AES_KEY *key)
1220 {
1221     u32 *rk;
1222     int i = 0;
1223     u32 temp;
1224
1225     if (!userKey || !key)
1226         return -1;
1227     if (bits != 128 && bits != 192 && bits != 256)
1228         return -2;
1229
1230     rk = key->rd_key;
1231
1232     if (bits == 128)
1233         key->rounds = 10;
1234     else if (bits == 192)
1235         key->rounds = 12;
1236     else
1237         key->rounds = 14;
1238
1239     rk[0] = GETU32(userKey     );
1240     rk[1] = GETU32(userKey +  4);
1241     rk[2] = GETU32(userKey +  8);
1242     rk[3] = GETU32(userKey + 12);
1243     if (bits == 128) {
1244         while (1) {
1245             temp  = rk[3];
1246             rk[4] = rk[0] ^
1247                 ((u32)Te4[(temp >> 16) & 0xff] << 24) ^
1248                 ((u32)Te4[(temp >>  8) & 0xff] << 16) ^
1249                 ((u32)Te4[(temp      ) & 0xff] << 8) ^
1250                 ((u32)Te4[(temp >> 24)       ]) ^
1251                 rcon[i];
1252             rk[5] = rk[1] ^ rk[4];
1253             rk[6] = rk[2] ^ rk[5];
1254             rk[7] = rk[3] ^ rk[6];
1255             if (++i == 10) {
1256                 return 0;
1257             }
1258             rk += 4;
1259         }
1260     }
1261     rk[4] = GETU32(userKey + 16);
1262     rk[5] = GETU32(userKey + 20);
1263     if (bits == 192) {
1264         while (1) {
1265             temp = rk[ 5];
1266             rk[ 6] = rk[ 0] ^
1267                 ((u32)Te4[(temp >> 16) & 0xff] << 24) ^
1268                 ((u32)Te4[(temp >>  8) & 0xff] << 16) ^
1269                 ((u32)Te4[(temp      ) & 0xff] << 8) ^
1270                 ((u32)Te4[(temp >> 24)       ]) ^
1271                 rcon[i];
1272             rk[ 7] = rk[ 1] ^ rk[ 6];
1273             rk[ 8] = rk[ 2] ^ rk[ 7];
1274             rk[ 9] = rk[ 3] ^ rk[ 8];
1275             if (++i == 8) {
1276                 return 0;
1277             }
1278             rk[10] = rk[ 4] ^ rk[ 9];
1279             rk[11] = rk[ 5] ^ rk[10];
1280             rk += 6;
1281         }
1282     }
1283     rk[6] = GETU32(userKey + 24);
1284     rk[7] = GETU32(userKey + 28);
1285     if (bits == 256) {
1286         while (1) {
1287             temp = rk[ 7];
1288             rk[ 8] = rk[ 0] ^
1289                 ((u32)Te4[(temp >> 16) & 0xff] << 24) ^
1290                 ((u32)Te4[(temp >>  8) & 0xff] << 16) ^
1291                 ((u32)Te4[(temp      ) & 0xff] << 8) ^
1292                 ((u32)Te4[(temp >> 24)       ]) ^
1293                 rcon[i];
1294             rk[ 9] = rk[ 1] ^ rk[ 8];
1295             rk[10] = rk[ 2] ^ rk[ 9];
1296             rk[11] = rk[ 3] ^ rk[10];
1297             if (++i == 7) {
1298                 return 0;
1299             }
1300             temp = rk[11];
1301             rk[12] = rk[ 4] ^
1302                 ((u32)Te4[(temp >> 24)       ] << 24) ^
1303                 ((u32)Te4[(temp >> 16) & 0xff] << 16) ^
1304                 ((u32)Te4[(temp >>  8) & 0xff] << 8) ^
1305                 ((u32)Te4[(temp      ) & 0xff]);
1306             rk[13] = rk[ 5] ^ rk[12];
1307             rk[14] = rk[ 6] ^ rk[13];
1308             rk[15] = rk[ 7] ^ rk[14];
1309
1310             rk += 8;
1311         }
1312     }
1313     return 0;
1314 }
1315
1316 /**
1317  * Expand the cipher key into the decryption key schedule.
1318  */
1319 int AES_set_decrypt_key(const unsigned char *userKey, const int bits,
1320                         AES_KEY *key)
1321 {
1322
1323     u32 *rk;
1324     int i, j, status;
1325     u32 temp;
1326
1327     /* first, start with an encryption schedule */
1328     status = AES_set_encrypt_key(userKey, bits, key);
1329     if (status < 0)
1330         return status;
1331
1332     rk = key->rd_key;
1333
1334     /* invert the order of the round keys: */
1335     for (i = 0, j = 4*(key->rounds); i < j; i += 4, j -= 4) {
1336         temp = rk[i    ]; rk[i    ] = rk[j    ]; rk[j    ] = temp;
1337         temp = rk[i + 1]; rk[i + 1] = rk[j + 1]; rk[j + 1] = temp;
1338         temp = rk[i + 2]; rk[i + 2] = rk[j + 2]; rk[j + 2] = temp;
1339         temp = rk[i + 3]; rk[i + 3] = rk[j + 3]; rk[j + 3] = temp;
1340     }
1341     /* apply the inverse MixColumn transform to all round keys but the first and the last: */
1342     for (i = 1; i < (key->rounds); i++) {
1343         rk += 4;
1344         for (j = 0; j < 4; j++) {
1345             u32 tp1, tp2, tp4, tp8, tp9, tpb, tpd, tpe, m;
1346
1347             tp1 = rk[j];
1348             m = tp1 & 0x80808080;
1349             tp2 = ((tp1 & 0x7f7f7f7f) << 1) ^
1350                 ((m - (m >> 7)) & 0x1b1b1b1b);
1351             m = tp2 & 0x80808080;
1352             tp4 = ((tp2 & 0x7f7f7f7f) << 1) ^
1353                 ((m - (m >> 7)) & 0x1b1b1b1b);
1354             m = tp4 & 0x80808080;
1355             tp8 = ((tp4 & 0x7f7f7f7f) << 1) ^
1356                 ((m - (m >> 7)) & 0x1b1b1b1b);
1357             tp9 = tp8 ^ tp1;
1358             tpb = tp9 ^ tp2;
1359             tpd = tp9 ^ tp4;
1360             tpe = tp8 ^ tp4 ^ tp2;
1361 #if defined(ROTATE)
1362             rk[j] = tpe ^ ROTATE(tpd,16) ^
1363                 ROTATE(tp9,24) ^ ROTATE(tpb,8);
1364 #else
1365             rk[j] = tpe ^ (tpd >> 16) ^ (tpd << 16) ^
1366                 (tp9 >> 8) ^ (tp9 << 24) ^
1367                 (tpb >> 24) ^ (tpb << 8);
1368 #endif
1369         }
1370     }
1371     return 0;
1372 }
1373
1374 #endif /* AES_ASM */