aes_core.c revision 296341
11573Srgrimes/* crypto/aes/aes_core.c -*- mode:C; c-file-style: "eay" -*- */
211681Sbde/**
31573Srgrimes * rijndael-alg-fst.c
41573Srgrimes *
51573Srgrimes * @version 3.0 (December 2000)
61573Srgrimes *
71573Srgrimes * Optimised ANSI C code for the Rijndael cipher (now AES)
81573Srgrimes *
91573Srgrimes * @author Vincent Rijmen <vincent.rijmen@esat.kuleuven.ac.be>
101573Srgrimes * @author Antoon Bosselaers <antoon.bosselaers@esat.kuleuven.ac.be>
111573Srgrimes * @author Paulo Barreto <paulo.barreto@terra.com.br>
121573Srgrimes *
131573Srgrimes * This code is hereby placed in the public domain.
141573Srgrimes *
151573Srgrimes * THIS SOFTWARE IS PROVIDED BY THE AUTHORS ''AS IS'' AND ANY EXPRESS
161573Srgrimes * OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
171573Srgrimes * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
181573Srgrimes * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHORS OR CONTRIBUTORS BE
191573Srgrimes * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
201573Srgrimes * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
211573Srgrimes * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
221573Srgrimes * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
231573Srgrimes * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE
241573Srgrimes * OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE,
251573Srgrimes * EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
261573Srgrimes */
271573Srgrimes
281573Srgrimes/* Note: rewritten a little bit to provide error control and an OpenSSL-
291573Srgrimes   compatible API */
3084225Sdillon
3184225Sdillon#ifndef AES_DEBUG
3284225Sdillon# ifndef NDEBUG
331573Srgrimes#  define NDEBUG
3428179Ssteve# endif
3511681Sbde#endif
3628179Ssteve#include <assert.h>
371573Srgrimes
381573Srgrimes#include <stdlib.h>
391573Srgrimes#include <openssl/aes.h>
4011681Sbde#include "aes_locl.h"
411573Srgrimes
4211681Sbde#ifndef AES_ASM
4311681Sbde/*-
441573SrgrimesTe0[x] = S [x].[02, 01, 01, 03];
4511681SbdeTe1[x] = S [x].[03, 02, 01, 01];
46116344SmarkmTe2[x] = S [x].[01, 03, 02, 01];
4711681SbdeTe3[x] = S [x].[01, 01, 03, 02];
4811681Sbde
491573SrgrimesTd0[x] = Si[x].[0e, 09, 0d, 0b];
50184634SdesTd1[x] = Si[x].[0b, 0e, 09, 0d];
511573SrgrimesTd2[x] = Si[x].[0d, 0b, 0e, 09];
52175352SjhbTd3[x] = Si[x].[09, 0d, 0b, 0e];
53175352SjhbTd4[x] = Si[x].[01];
54154835Scognet*/
55154835Scognet
56174818Sjhbstatic const u32 Te0[256] = {
57154835Scognet    0xc66363a5U, 0xf87c7c84U, 0xee777799U, 0xf67b7b8dU,
58154835Scognet    0xfff2f20dU, 0xd66b6bbdU, 0xde6f6fb1U, 0x91c5c554U,
59183565Sed    0x60303050U, 0x02010103U, 0xce6767a9U, 0x562b2b7dU,
60154835Scognet    0xe7fefe19U, 0xb5d7d762U, 0x4dababe6U, 0xec76769aU,
61154835Scognet    0x8fcaca45U, 0x1f82829dU, 0x89c9c940U, 0xfa7d7d87U,
62154835Scognet    0xeffafa15U, 0xb25959ebU, 0x8e4747c9U, 0xfbf0f00bU,
63183565Sed    0x41adadecU, 0xb3d4d467U, 0x5fa2a2fdU, 0x45afafeaU,
64183565Sed    0x239c9cbfU, 0x53a4a4f7U, 0xe4727296U, 0x9bc0c05bU,
65154835Scognet    0x75b7b7c2U, 0xe1fdfd1cU, 0x3d9393aeU, 0x4c26266aU,
66183565Sed    0x6c36365aU, 0x7e3f3f41U, 0xf5f7f702U, 0x83cccc4fU,
67183565Sed    0x6834345cU, 0x51a5a5f4U, 0xd1e5e534U, 0xf9f1f108U,
68183565Sed    0xe2717193U, 0xabd8d873U, 0x62313153U, 0x2a15153fU,
69174818Sjhb    0x0804040cU, 0x95c7c752U, 0x46232365U, 0x9dc3c35eU,
70183565Sed    0x30181828U, 0x379696a1U, 0x0a05050fU, 0x2f9a9ab5U,
71183565Sed    0x0e070709U, 0x24121236U, 0x1b80809bU, 0xdfe2e23dU,
72174818Sjhb    0xcdebeb26U, 0x4e272769U, 0x7fb2b2cdU, 0xea75759fU,
73174818Sjhb    0x1209091bU, 0x1d83839eU, 0x582c2c74U, 0x341a1a2eU,
74183565Sed    0x361b1b2dU, 0xdc6e6eb2U, 0xb45a5aeeU, 0x5ba0a0fbU,
75183565Sed    0xa45252f6U, 0x763b3b4dU, 0xb7d6d661U, 0x7db3b3ceU,
76154835Scognet    0x5229297bU, 0xdde3e33eU, 0x5e2f2f71U, 0x13848497U,
77154835Scognet    0xa65353f5U, 0xb9d1d168U, 0x00000000U, 0xc1eded2cU,
78154835Scognet    0x40202060U, 0xe3fcfc1fU, 0x79b1b1c8U, 0xb65b5bedU,
79154835Scognet    0xd46a6abeU, 0x8dcbcb46U, 0x67bebed9U, 0x7239394bU,
80154835Scognet    0x944a4adeU, 0x984c4cd4U, 0xb05858e8U, 0x85cfcf4aU,
81175352Sjhb    0xbbd0d06bU, 0xc5efef2aU, 0x4faaaae5U, 0xedfbfb16U,
82154835Scognet    0x864343c5U, 0x9a4d4dd7U, 0x66333355U, 0x11858594U,
83154835Scognet    0x8a4545cfU, 0xe9f9f910U, 0x04020206U, 0xfe7f7f81U,
84154835Scognet    0xa05050f0U, 0x783c3c44U, 0x259f9fbaU, 0x4ba8a8e3U,
85154835Scognet    0xa25151f3U, 0x5da3a3feU, 0x804040c0U, 0x058f8f8aU,
86154835Scognet    0x3f9292adU, 0x219d9dbcU, 0x70383848U, 0xf1f5f504U,
87154835Scognet    0x63bcbcdfU, 0x77b6b6c1U, 0xafdada75U, 0x42212163U,
88183565Sed    0x20101030U, 0xe5ffff1aU, 0xfdf3f30eU, 0xbfd2d26dU,
89183565Sed    0x81cdcd4cU, 0x180c0c14U, 0x26131335U, 0xc3ecec2fU,
90183565Sed    0xbe5f5fe1U, 0x359797a2U, 0x884444ccU, 0x2e171739U,
91154835Scognet    0x93c4c457U, 0x55a7a7f2U, 0xfc7e7e82U, 0x7a3d3d47U,
92154835Scognet    0xc86464acU, 0xba5d5de7U, 0x3219192bU, 0xe6737395U,
9313137Speter    0xc06060a0U, 0x19818198U, 0x9e4f4fd1U, 0xa3dcdc7fU,
94121193Smarkm    0x44222266U, 0x542a2a7eU, 0x3b9090abU, 0x0b888883U,
951573Srgrimes    0x8c4646caU, 0xc7eeee29U, 0x6bb8b8d3U, 0x2814143cU,
961573Srgrimes    0xa7dede79U, 0xbc5e5ee2U, 0x160b0b1dU, 0xaddbdb76U,
971573Srgrimes    0xdbe0e03bU, 0x64323256U, 0x743a3a4eU, 0x140a0a1eU,
981573Srgrimes    0x924949dbU, 0x0c06060aU, 0x4824246cU, 0xb85c5ce4U,
991573Srgrimes    0x9fc2c25dU, 0xbdd3d36eU, 0x43acacefU, 0xc46262a6U,
1001573Srgrimes    0x399191a8U, 0x319595a4U, 0xd3e4e437U, 0xf279798bU,
1011573Srgrimes    0xd5e7e732U, 0x8bc8c843U, 0x6e373759U, 0xda6d6db7U,
1021573Srgrimes    0x018d8d8cU, 0xb1d5d564U, 0x9c4e4ed2U, 0x49a9a9e0U,
1031573Srgrimes    0xd86c6cb4U, 0xac5656faU, 0xf3f4f407U, 0xcfeaea25U,
1048870Srgrimes    0xca6565afU, 0xf47a7a8eU, 0x47aeaee9U, 0x10080818U,
1051573Srgrimes    0x6fbabad5U, 0xf0787888U, 0x4a25256fU, 0x5c2e2e72U,
1061573Srgrimes    0x381c1c24U, 0x57a6a6f1U, 0x73b4b4c7U, 0x97c6c651U,
1071573Srgrimes    0xcbe8e823U, 0xa1dddd7cU, 0xe874749cU, 0x3e1f1f21U,
1081573Srgrimes    0x964b4bddU, 0x61bdbddcU, 0x0d8b8b86U, 0x0f8a8a85U,
1091573Srgrimes    0xe0707090U, 0x7c3e3e42U, 0x71b5b5c4U, 0xcc6666aaU,
1101573Srgrimes    0x904848d8U, 0x06030305U, 0xf7f6f601U, 0x1c0e0e12U,
1111573Srgrimes    0xc26161a3U, 0x6a35355fU, 0xae5757f9U, 0x69b9b9d0U,
1121573Srgrimes    0x17868691U, 0x99c1c158U, 0x3a1d1d27U, 0x279e9eb9U,
1131573Srgrimes    0xd9e1e138U, 0xebf8f813U, 0x2b9898b3U, 0x22111133U,
1141573Srgrimes    0xd26969bbU, 0xa9d9d970U, 0x078e8e89U, 0x339494a7U,
1151573Srgrimes    0x2d9b9bb6U, 0x3c1e1e22U, 0x15878792U, 0xc9e9e920U,
1161573Srgrimes    0x87cece49U, 0xaa5555ffU, 0x50282878U, 0xa5dfdf7aU,
1171573Srgrimes    0x038c8c8fU, 0x59a1a1f8U, 0x09898980U, 0x1a0d0d17U,
118    0x65bfbfdaU, 0xd7e6e631U, 0x844242c6U, 0xd06868b8U,
119    0x824141c3U, 0x299999b0U, 0x5a2d2d77U, 0x1e0f0f11U,
120    0x7bb0b0cbU, 0xa85454fcU, 0x6dbbbbd6U, 0x2c16163aU,
121};
122static const u32 Te1[256] = {
123    0xa5c66363U, 0x84f87c7cU, 0x99ee7777U, 0x8df67b7bU,
124    0x0dfff2f2U, 0xbdd66b6bU, 0xb1de6f6fU, 0x5491c5c5U,
125    0x50603030U, 0x03020101U, 0xa9ce6767U, 0x7d562b2bU,
126    0x19e7fefeU, 0x62b5d7d7U, 0xe64dababU, 0x9aec7676U,
127    0x458fcacaU, 0x9d1f8282U, 0x4089c9c9U, 0x87fa7d7dU,
128    0x15effafaU, 0xebb25959U, 0xc98e4747U, 0x0bfbf0f0U,
129    0xec41adadU, 0x67b3d4d4U, 0xfd5fa2a2U, 0xea45afafU,
130    0xbf239c9cU, 0xf753a4a4U, 0x96e47272U, 0x5b9bc0c0U,
131    0xc275b7b7U, 0x1ce1fdfdU, 0xae3d9393U, 0x6a4c2626U,
132    0x5a6c3636U, 0x417e3f3fU, 0x02f5f7f7U, 0x4f83ccccU,
133    0x5c683434U, 0xf451a5a5U, 0x34d1e5e5U, 0x08f9f1f1U,
134    0x93e27171U, 0x73abd8d8U, 0x53623131U, 0x3f2a1515U,
135    0x0c080404U, 0x5295c7c7U, 0x65462323U, 0x5e9dc3c3U,
136    0x28301818U, 0xa1379696U, 0x0f0a0505U, 0xb52f9a9aU,
137    0x090e0707U, 0x36241212U, 0x9b1b8080U, 0x3ddfe2e2U,
138    0x26cdebebU, 0x694e2727U, 0xcd7fb2b2U, 0x9fea7575U,
139    0x1b120909U, 0x9e1d8383U, 0x74582c2cU, 0x2e341a1aU,
140    0x2d361b1bU, 0xb2dc6e6eU, 0xeeb45a5aU, 0xfb5ba0a0U,
141    0xf6a45252U, 0x4d763b3bU, 0x61b7d6d6U, 0xce7db3b3U,
142    0x7b522929U, 0x3edde3e3U, 0x715e2f2fU, 0x97138484U,
143    0xf5a65353U, 0x68b9d1d1U, 0x00000000U, 0x2cc1ededU,
144    0x60402020U, 0x1fe3fcfcU, 0xc879b1b1U, 0xedb65b5bU,
145    0xbed46a6aU, 0x468dcbcbU, 0xd967bebeU, 0x4b723939U,
146    0xde944a4aU, 0xd4984c4cU, 0xe8b05858U, 0x4a85cfcfU,
147    0x6bbbd0d0U, 0x2ac5efefU, 0xe54faaaaU, 0x16edfbfbU,
148    0xc5864343U, 0xd79a4d4dU, 0x55663333U, 0x94118585U,
149    0xcf8a4545U, 0x10e9f9f9U, 0x06040202U, 0x81fe7f7fU,
150    0xf0a05050U, 0x44783c3cU, 0xba259f9fU, 0xe34ba8a8U,
151    0xf3a25151U, 0xfe5da3a3U, 0xc0804040U, 0x8a058f8fU,
152    0xad3f9292U, 0xbc219d9dU, 0x48703838U, 0x04f1f5f5U,
153    0xdf63bcbcU, 0xc177b6b6U, 0x75afdadaU, 0x63422121U,
154    0x30201010U, 0x1ae5ffffU, 0x0efdf3f3U, 0x6dbfd2d2U,
155    0x4c81cdcdU, 0x14180c0cU, 0x35261313U, 0x2fc3ececU,
156    0xe1be5f5fU, 0xa2359797U, 0xcc884444U, 0x392e1717U,
157    0x5793c4c4U, 0xf255a7a7U, 0x82fc7e7eU, 0x477a3d3dU,
158    0xacc86464U, 0xe7ba5d5dU, 0x2b321919U, 0x95e67373U,
159    0xa0c06060U, 0x98198181U, 0xd19e4f4fU, 0x7fa3dcdcU,
160    0x66442222U, 0x7e542a2aU, 0xab3b9090U, 0x830b8888U,
161    0xca8c4646U, 0x29c7eeeeU, 0xd36bb8b8U, 0x3c281414U,
162    0x79a7dedeU, 0xe2bc5e5eU, 0x1d160b0bU, 0x76addbdbU,
163    0x3bdbe0e0U, 0x56643232U, 0x4e743a3aU, 0x1e140a0aU,
164    0xdb924949U, 0x0a0c0606U, 0x6c482424U, 0xe4b85c5cU,
165    0x5d9fc2c2U, 0x6ebdd3d3U, 0xef43acacU, 0xa6c46262U,
166    0xa8399191U, 0xa4319595U, 0x37d3e4e4U, 0x8bf27979U,
167    0x32d5e7e7U, 0x438bc8c8U, 0x596e3737U, 0xb7da6d6dU,
168    0x8c018d8dU, 0x64b1d5d5U, 0xd29c4e4eU, 0xe049a9a9U,
169    0xb4d86c6cU, 0xfaac5656U, 0x07f3f4f4U, 0x25cfeaeaU,
170    0xafca6565U, 0x8ef47a7aU, 0xe947aeaeU, 0x18100808U,
171    0xd56fbabaU, 0x88f07878U, 0x6f4a2525U, 0x725c2e2eU,
172    0x24381c1cU, 0xf157a6a6U, 0xc773b4b4U, 0x5197c6c6U,
173    0x23cbe8e8U, 0x7ca1ddddU, 0x9ce87474U, 0x213e1f1fU,
174    0xdd964b4bU, 0xdc61bdbdU, 0x860d8b8bU, 0x850f8a8aU,
175    0x90e07070U, 0x427c3e3eU, 0xc471b5b5U, 0xaacc6666U,
176    0xd8904848U, 0x05060303U, 0x01f7f6f6U, 0x121c0e0eU,
177    0xa3c26161U, 0x5f6a3535U, 0xf9ae5757U, 0xd069b9b9U,
178    0x91178686U, 0x5899c1c1U, 0x273a1d1dU, 0xb9279e9eU,
179    0x38d9e1e1U, 0x13ebf8f8U, 0xb32b9898U, 0x33221111U,
180    0xbbd26969U, 0x70a9d9d9U, 0x89078e8eU, 0xa7339494U,
181    0xb62d9b9bU, 0x223c1e1eU, 0x92158787U, 0x20c9e9e9U,
182    0x4987ceceU, 0xffaa5555U, 0x78502828U, 0x7aa5dfdfU,
183    0x8f038c8cU, 0xf859a1a1U, 0x80098989U, 0x171a0d0dU,
184    0xda65bfbfU, 0x31d7e6e6U, 0xc6844242U, 0xb8d06868U,
185    0xc3824141U, 0xb0299999U, 0x775a2d2dU, 0x111e0f0fU,
186    0xcb7bb0b0U, 0xfca85454U, 0xd66dbbbbU, 0x3a2c1616U,
187};
188static const u32 Te2[256] = {
189    0x63a5c663U, 0x7c84f87cU, 0x7799ee77U, 0x7b8df67bU,
190    0xf20dfff2U, 0x6bbdd66bU, 0x6fb1de6fU, 0xc55491c5U,
191    0x30506030U, 0x01030201U, 0x67a9ce67U, 0x2b7d562bU,
192    0xfe19e7feU, 0xd762b5d7U, 0xabe64dabU, 0x769aec76U,
193    0xca458fcaU, 0x829d1f82U, 0xc94089c9U, 0x7d87fa7dU,
194    0xfa15effaU, 0x59ebb259U, 0x47c98e47U, 0xf00bfbf0U,
195    0xadec41adU, 0xd467b3d4U, 0xa2fd5fa2U, 0xafea45afU,
196    0x9cbf239cU, 0xa4f753a4U, 0x7296e472U, 0xc05b9bc0U,
197    0xb7c275b7U, 0xfd1ce1fdU, 0x93ae3d93U, 0x266a4c26U,
198    0x365a6c36U, 0x3f417e3fU, 0xf702f5f7U, 0xcc4f83ccU,
199    0x345c6834U, 0xa5f451a5U, 0xe534d1e5U, 0xf108f9f1U,
200    0x7193e271U, 0xd873abd8U, 0x31536231U, 0x153f2a15U,
201    0x040c0804U, 0xc75295c7U, 0x23654623U, 0xc35e9dc3U,
202    0x18283018U, 0x96a13796U, 0x050f0a05U, 0x9ab52f9aU,
203    0x07090e07U, 0x12362412U, 0x809b1b80U, 0xe23ddfe2U,
204    0xeb26cdebU, 0x27694e27U, 0xb2cd7fb2U, 0x759fea75U,
205    0x091b1209U, 0x839e1d83U, 0x2c74582cU, 0x1a2e341aU,
206    0x1b2d361bU, 0x6eb2dc6eU, 0x5aeeb45aU, 0xa0fb5ba0U,
207    0x52f6a452U, 0x3b4d763bU, 0xd661b7d6U, 0xb3ce7db3U,
208    0x297b5229U, 0xe33edde3U, 0x2f715e2fU, 0x84971384U,
209    0x53f5a653U, 0xd168b9d1U, 0x00000000U, 0xed2cc1edU,
210    0x20604020U, 0xfc1fe3fcU, 0xb1c879b1U, 0x5bedb65bU,
211    0x6abed46aU, 0xcb468dcbU, 0xbed967beU, 0x394b7239U,
212    0x4ade944aU, 0x4cd4984cU, 0x58e8b058U, 0xcf4a85cfU,
213    0xd06bbbd0U, 0xef2ac5efU, 0xaae54faaU, 0xfb16edfbU,
214    0x43c58643U, 0x4dd79a4dU, 0x33556633U, 0x85941185U,
215    0x45cf8a45U, 0xf910e9f9U, 0x02060402U, 0x7f81fe7fU,
216    0x50f0a050U, 0x3c44783cU, 0x9fba259fU, 0xa8e34ba8U,
217    0x51f3a251U, 0xa3fe5da3U, 0x40c08040U, 0x8f8a058fU,
218    0x92ad3f92U, 0x9dbc219dU, 0x38487038U, 0xf504f1f5U,
219    0xbcdf63bcU, 0xb6c177b6U, 0xda75afdaU, 0x21634221U,
220    0x10302010U, 0xff1ae5ffU, 0xf30efdf3U, 0xd26dbfd2U,
221    0xcd4c81cdU, 0x0c14180cU, 0x13352613U, 0xec2fc3ecU,
222    0x5fe1be5fU, 0x97a23597U, 0x44cc8844U, 0x17392e17U,
223    0xc45793c4U, 0xa7f255a7U, 0x7e82fc7eU, 0x3d477a3dU,
224    0x64acc864U, 0x5de7ba5dU, 0x192b3219U, 0x7395e673U,
225    0x60a0c060U, 0x81981981U, 0x4fd19e4fU, 0xdc7fa3dcU,
226    0x22664422U, 0x2a7e542aU, 0x90ab3b90U, 0x88830b88U,
227    0x46ca8c46U, 0xee29c7eeU, 0xb8d36bb8U, 0x143c2814U,
228    0xde79a7deU, 0x5ee2bc5eU, 0x0b1d160bU, 0xdb76addbU,
229    0xe03bdbe0U, 0x32566432U, 0x3a4e743aU, 0x0a1e140aU,
230    0x49db9249U, 0x060a0c06U, 0x246c4824U, 0x5ce4b85cU,
231    0xc25d9fc2U, 0xd36ebdd3U, 0xacef43acU, 0x62a6c462U,
232    0x91a83991U, 0x95a43195U, 0xe437d3e4U, 0x798bf279U,
233    0xe732d5e7U, 0xc8438bc8U, 0x37596e37U, 0x6db7da6dU,
234    0x8d8c018dU, 0xd564b1d5U, 0x4ed29c4eU, 0xa9e049a9U,
235    0x6cb4d86cU, 0x56faac56U, 0xf407f3f4U, 0xea25cfeaU,
236    0x65afca65U, 0x7a8ef47aU, 0xaee947aeU, 0x08181008U,
237    0xbad56fbaU, 0x7888f078U, 0x256f4a25U, 0x2e725c2eU,
238    0x1c24381cU, 0xa6f157a6U, 0xb4c773b4U, 0xc65197c6U,
239    0xe823cbe8U, 0xdd7ca1ddU, 0x749ce874U, 0x1f213e1fU,
240    0x4bdd964bU, 0xbddc61bdU, 0x8b860d8bU, 0x8a850f8aU,
241    0x7090e070U, 0x3e427c3eU, 0xb5c471b5U, 0x66aacc66U,
242    0x48d89048U, 0x03050603U, 0xf601f7f6U, 0x0e121c0eU,
243    0x61a3c261U, 0x355f6a35U, 0x57f9ae57U, 0xb9d069b9U,
244    0x86911786U, 0xc15899c1U, 0x1d273a1dU, 0x9eb9279eU,
245    0xe138d9e1U, 0xf813ebf8U, 0x98b32b98U, 0x11332211U,
246    0x69bbd269U, 0xd970a9d9U, 0x8e89078eU, 0x94a73394U,
247    0x9bb62d9bU, 0x1e223c1eU, 0x87921587U, 0xe920c9e9U,
248    0xce4987ceU, 0x55ffaa55U, 0x28785028U, 0xdf7aa5dfU,
249    0x8c8f038cU, 0xa1f859a1U, 0x89800989U, 0x0d171a0dU,
250    0xbfda65bfU, 0xe631d7e6U, 0x42c68442U, 0x68b8d068U,
251    0x41c38241U, 0x99b02999U, 0x2d775a2dU, 0x0f111e0fU,
252    0xb0cb7bb0U, 0x54fca854U, 0xbbd66dbbU, 0x163a2c16U,
253};
254static const u32 Te3[256] = {
255    0x6363a5c6U, 0x7c7c84f8U, 0x777799eeU, 0x7b7b8df6U,
256    0xf2f20dffU, 0x6b6bbdd6U, 0x6f6fb1deU, 0xc5c55491U,
257    0x30305060U, 0x01010302U, 0x6767a9ceU, 0x2b2b7d56U,
258    0xfefe19e7U, 0xd7d762b5U, 0xababe64dU, 0x76769aecU,
259    0xcaca458fU, 0x82829d1fU, 0xc9c94089U, 0x7d7d87faU,
260    0xfafa15efU, 0x5959ebb2U, 0x4747c98eU, 0xf0f00bfbU,
261    0xadadec41U, 0xd4d467b3U, 0xa2a2fd5fU, 0xafafea45U,
262    0x9c9cbf23U, 0xa4a4f753U, 0x727296e4U, 0xc0c05b9bU,
263    0xb7b7c275U, 0xfdfd1ce1U, 0x9393ae3dU, 0x26266a4cU,
264    0x36365a6cU, 0x3f3f417eU, 0xf7f702f5U, 0xcccc4f83U,
265    0x34345c68U, 0xa5a5f451U, 0xe5e534d1U, 0xf1f108f9U,
266    0x717193e2U, 0xd8d873abU, 0x31315362U, 0x15153f2aU,
267    0x04040c08U, 0xc7c75295U, 0x23236546U, 0xc3c35e9dU,
268    0x18182830U, 0x9696a137U, 0x05050f0aU, 0x9a9ab52fU,
269    0x0707090eU, 0x12123624U, 0x80809b1bU, 0xe2e23ddfU,
270    0xebeb26cdU, 0x2727694eU, 0xb2b2cd7fU, 0x75759feaU,
271    0x09091b12U, 0x83839e1dU, 0x2c2c7458U, 0x1a1a2e34U,
272    0x1b1b2d36U, 0x6e6eb2dcU, 0x5a5aeeb4U, 0xa0a0fb5bU,
273    0x5252f6a4U, 0x3b3b4d76U, 0xd6d661b7U, 0xb3b3ce7dU,
274    0x29297b52U, 0xe3e33eddU, 0x2f2f715eU, 0x84849713U,
275    0x5353f5a6U, 0xd1d168b9U, 0x00000000U, 0xeded2cc1U,
276    0x20206040U, 0xfcfc1fe3U, 0xb1b1c879U, 0x5b5bedb6U,
277    0x6a6abed4U, 0xcbcb468dU, 0xbebed967U, 0x39394b72U,
278    0x4a4ade94U, 0x4c4cd498U, 0x5858e8b0U, 0xcfcf4a85U,
279    0xd0d06bbbU, 0xefef2ac5U, 0xaaaae54fU, 0xfbfb16edU,
280    0x4343c586U, 0x4d4dd79aU, 0x33335566U, 0x85859411U,
281    0x4545cf8aU, 0xf9f910e9U, 0x02020604U, 0x7f7f81feU,
282    0x5050f0a0U, 0x3c3c4478U, 0x9f9fba25U, 0xa8a8e34bU,
283    0x5151f3a2U, 0xa3a3fe5dU, 0x4040c080U, 0x8f8f8a05U,
284    0x9292ad3fU, 0x9d9dbc21U, 0x38384870U, 0xf5f504f1U,
285    0xbcbcdf63U, 0xb6b6c177U, 0xdada75afU, 0x21216342U,
286    0x10103020U, 0xffff1ae5U, 0xf3f30efdU, 0xd2d26dbfU,
287    0xcdcd4c81U, 0x0c0c1418U, 0x13133526U, 0xecec2fc3U,
288    0x5f5fe1beU, 0x9797a235U, 0x4444cc88U, 0x1717392eU,
289    0xc4c45793U, 0xa7a7f255U, 0x7e7e82fcU, 0x3d3d477aU,
290    0x6464acc8U, 0x5d5de7baU, 0x19192b32U, 0x737395e6U,
291    0x6060a0c0U, 0x81819819U, 0x4f4fd19eU, 0xdcdc7fa3U,
292    0x22226644U, 0x2a2a7e54U, 0x9090ab3bU, 0x8888830bU,
293    0x4646ca8cU, 0xeeee29c7U, 0xb8b8d36bU, 0x14143c28U,
294    0xdede79a7U, 0x5e5ee2bcU, 0x0b0b1d16U, 0xdbdb76adU,
295    0xe0e03bdbU, 0x32325664U, 0x3a3a4e74U, 0x0a0a1e14U,
296    0x4949db92U, 0x06060a0cU, 0x24246c48U, 0x5c5ce4b8U,
297    0xc2c25d9fU, 0xd3d36ebdU, 0xacacef43U, 0x6262a6c4U,
298    0x9191a839U, 0x9595a431U, 0xe4e437d3U, 0x79798bf2U,
299    0xe7e732d5U, 0xc8c8438bU, 0x3737596eU, 0x6d6db7daU,
300    0x8d8d8c01U, 0xd5d564b1U, 0x4e4ed29cU, 0xa9a9e049U,
301    0x6c6cb4d8U, 0x5656faacU, 0xf4f407f3U, 0xeaea25cfU,
302    0x6565afcaU, 0x7a7a8ef4U, 0xaeaee947U, 0x08081810U,
303    0xbabad56fU, 0x787888f0U, 0x25256f4aU, 0x2e2e725cU,
304    0x1c1c2438U, 0xa6a6f157U, 0xb4b4c773U, 0xc6c65197U,
305    0xe8e823cbU, 0xdddd7ca1U, 0x74749ce8U, 0x1f1f213eU,
306    0x4b4bdd96U, 0xbdbddc61U, 0x8b8b860dU, 0x8a8a850fU,
307    0x707090e0U, 0x3e3e427cU, 0xb5b5c471U, 0x6666aaccU,
308    0x4848d890U, 0x03030506U, 0xf6f601f7U, 0x0e0e121cU,
309    0x6161a3c2U, 0x35355f6aU, 0x5757f9aeU, 0xb9b9d069U,
310    0x86869117U, 0xc1c15899U, 0x1d1d273aU, 0x9e9eb927U,
311    0xe1e138d9U, 0xf8f813ebU, 0x9898b32bU, 0x11113322U,
312    0x6969bbd2U, 0xd9d970a9U, 0x8e8e8907U, 0x9494a733U,
313    0x9b9bb62dU, 0x1e1e223cU, 0x87879215U, 0xe9e920c9U,
314    0xcece4987U, 0x5555ffaaU, 0x28287850U, 0xdfdf7aa5U,
315    0x8c8c8f03U, 0xa1a1f859U, 0x89898009U, 0x0d0d171aU,
316    0xbfbfda65U, 0xe6e631d7U, 0x4242c684U, 0x6868b8d0U,
317    0x4141c382U, 0x9999b029U, 0x2d2d775aU, 0x0f0f111eU,
318    0xb0b0cb7bU, 0x5454fca8U, 0xbbbbd66dU, 0x16163a2cU,
319};
320
321static const u32 Td0[256] = {
322    0x51f4a750U, 0x7e416553U, 0x1a17a4c3U, 0x3a275e96U,
323    0x3bab6bcbU, 0x1f9d45f1U, 0xacfa58abU, 0x4be30393U,
324    0x2030fa55U, 0xad766df6U, 0x88cc7691U, 0xf5024c25U,
325    0x4fe5d7fcU, 0xc52acbd7U, 0x26354480U, 0xb562a38fU,
326    0xdeb15a49U, 0x25ba1b67U, 0x45ea0e98U, 0x5dfec0e1U,
327    0xc32f7502U, 0x814cf012U, 0x8d4697a3U, 0x6bd3f9c6U,
328    0x038f5fe7U, 0x15929c95U, 0xbf6d7aebU, 0x955259daU,
329    0xd4be832dU, 0x587421d3U, 0x49e06929U, 0x8ec9c844U,
330    0x75c2896aU, 0xf48e7978U, 0x99583e6bU, 0x27b971ddU,
331    0xbee14fb6U, 0xf088ad17U, 0xc920ac66U, 0x7dce3ab4U,
332    0x63df4a18U, 0xe51a3182U, 0x97513360U, 0x62537f45U,
333    0xb16477e0U, 0xbb6bae84U, 0xfe81a01cU, 0xf9082b94U,
334    0x70486858U, 0x8f45fd19U, 0x94de6c87U, 0x527bf8b7U,
335    0xab73d323U, 0x724b02e2U, 0xe31f8f57U, 0x6655ab2aU,
336    0xb2eb2807U, 0x2fb5c203U, 0x86c57b9aU, 0xd33708a5U,
337    0x302887f2U, 0x23bfa5b2U, 0x02036abaU, 0xed16825cU,
338    0x8acf1c2bU, 0xa779b492U, 0xf307f2f0U, 0x4e69e2a1U,
339    0x65daf4cdU, 0x0605bed5U, 0xd134621fU, 0xc4a6fe8aU,
340    0x342e539dU, 0xa2f355a0U, 0x058ae132U, 0xa4f6eb75U,
341    0x0b83ec39U, 0x4060efaaU, 0x5e719f06U, 0xbd6e1051U,
342    0x3e218af9U, 0x96dd063dU, 0xdd3e05aeU, 0x4de6bd46U,
343    0x91548db5U, 0x71c45d05U, 0x0406d46fU, 0x605015ffU,
344    0x1998fb24U, 0xd6bde997U, 0x894043ccU, 0x67d99e77U,
345    0xb0e842bdU, 0x07898b88U, 0xe7195b38U, 0x79c8eedbU,
346    0xa17c0a47U, 0x7c420fe9U, 0xf8841ec9U, 0x00000000U,
347    0x09808683U, 0x322bed48U, 0x1e1170acU, 0x6c5a724eU,
348    0xfd0efffbU, 0x0f853856U, 0x3daed51eU, 0x362d3927U,
349    0x0a0fd964U, 0x685ca621U, 0x9b5b54d1U, 0x24362e3aU,
350    0x0c0a67b1U, 0x9357e70fU, 0xb4ee96d2U, 0x1b9b919eU,
351    0x80c0c54fU, 0x61dc20a2U, 0x5a774b69U, 0x1c121a16U,
352    0xe293ba0aU, 0xc0a02ae5U, 0x3c22e043U, 0x121b171dU,
353    0x0e090d0bU, 0xf28bc7adU, 0x2db6a8b9U, 0x141ea9c8U,
354    0x57f11985U, 0xaf75074cU, 0xee99ddbbU, 0xa37f60fdU,
355    0xf701269fU, 0x5c72f5bcU, 0x44663bc5U, 0x5bfb7e34U,
356    0x8b432976U, 0xcb23c6dcU, 0xb6edfc68U, 0xb8e4f163U,
357    0xd731dccaU, 0x42638510U, 0x13972240U, 0x84c61120U,
358    0x854a247dU, 0xd2bb3df8U, 0xaef93211U, 0xc729a16dU,
359    0x1d9e2f4bU, 0xdcb230f3U, 0x0d8652ecU, 0x77c1e3d0U,
360    0x2bb3166cU, 0xa970b999U, 0x119448faU, 0x47e96422U,
361    0xa8fc8cc4U, 0xa0f03f1aU, 0x567d2cd8U, 0x223390efU,
362    0x87494ec7U, 0xd938d1c1U, 0x8ccaa2feU, 0x98d40b36U,
363    0xa6f581cfU, 0xa57ade28U, 0xdab78e26U, 0x3fadbfa4U,
364    0x2c3a9de4U, 0x5078920dU, 0x6a5fcc9bU, 0x547e4662U,
365    0xf68d13c2U, 0x90d8b8e8U, 0x2e39f75eU, 0x82c3aff5U,
366    0x9f5d80beU, 0x69d0937cU, 0x6fd52da9U, 0xcf2512b3U,
367    0xc8ac993bU, 0x10187da7U, 0xe89c636eU, 0xdb3bbb7bU,
368    0xcd267809U, 0x6e5918f4U, 0xec9ab701U, 0x834f9aa8U,
369    0xe6956e65U, 0xaaffe67eU, 0x21bccf08U, 0xef15e8e6U,
370    0xbae79bd9U, 0x4a6f36ceU, 0xea9f09d4U, 0x29b07cd6U,
371    0x31a4b2afU, 0x2a3f2331U, 0xc6a59430U, 0x35a266c0U,
372    0x744ebc37U, 0xfc82caa6U, 0xe090d0b0U, 0x33a7d815U,
373    0xf104984aU, 0x41ecdaf7U, 0x7fcd500eU, 0x1791f62fU,
374    0x764dd68dU, 0x43efb04dU, 0xccaa4d54U, 0xe49604dfU,
375    0x9ed1b5e3U, 0x4c6a881bU, 0xc12c1fb8U, 0x4665517fU,
376    0x9d5eea04U, 0x018c355dU, 0xfa877473U, 0xfb0b412eU,
377    0xb3671d5aU, 0x92dbd252U, 0xe9105633U, 0x6dd64713U,
378    0x9ad7618cU, 0x37a10c7aU, 0x59f8148eU, 0xeb133c89U,
379    0xcea927eeU, 0xb761c935U, 0xe11ce5edU, 0x7a47b13cU,
380    0x9cd2df59U, 0x55f2733fU, 0x1814ce79U, 0x73c737bfU,
381    0x53f7cdeaU, 0x5ffdaa5bU, 0xdf3d6f14U, 0x7844db86U,
382    0xcaaff381U, 0xb968c43eU, 0x3824342cU, 0xc2a3405fU,
383    0x161dc372U, 0xbce2250cU, 0x283c498bU, 0xff0d9541U,
384    0x39a80171U, 0x080cb3deU, 0xd8b4e49cU, 0x6456c190U,
385    0x7bcb8461U, 0xd532b670U, 0x486c5c74U, 0xd0b85742U,
386};
387static const u32 Td1[256] = {
388    0x5051f4a7U, 0x537e4165U, 0xc31a17a4U, 0x963a275eU,
389    0xcb3bab6bU, 0xf11f9d45U, 0xabacfa58U, 0x934be303U,
390    0x552030faU, 0xf6ad766dU, 0x9188cc76U, 0x25f5024cU,
391    0xfc4fe5d7U, 0xd7c52acbU, 0x80263544U, 0x8fb562a3U,
392    0x49deb15aU, 0x6725ba1bU, 0x9845ea0eU, 0xe15dfec0U,
393    0x02c32f75U, 0x12814cf0U, 0xa38d4697U, 0xc66bd3f9U,
394    0xe7038f5fU, 0x9515929cU, 0xebbf6d7aU, 0xda955259U,
395    0x2dd4be83U, 0xd3587421U, 0x2949e069U, 0x448ec9c8U,
396    0x6a75c289U, 0x78f48e79U, 0x6b99583eU, 0xdd27b971U,
397    0xb6bee14fU, 0x17f088adU, 0x66c920acU, 0xb47dce3aU,
398    0x1863df4aU, 0x82e51a31U, 0x60975133U, 0x4562537fU,
399    0xe0b16477U, 0x84bb6baeU, 0x1cfe81a0U, 0x94f9082bU,
400    0x58704868U, 0x198f45fdU, 0x8794de6cU, 0xb7527bf8U,
401    0x23ab73d3U, 0xe2724b02U, 0x57e31f8fU, 0x2a6655abU,
402    0x07b2eb28U, 0x032fb5c2U, 0x9a86c57bU, 0xa5d33708U,
403    0xf2302887U, 0xb223bfa5U, 0xba02036aU, 0x5ced1682U,
404    0x2b8acf1cU, 0x92a779b4U, 0xf0f307f2U, 0xa14e69e2U,
405    0xcd65daf4U, 0xd50605beU, 0x1fd13462U, 0x8ac4a6feU,
406    0x9d342e53U, 0xa0a2f355U, 0x32058ae1U, 0x75a4f6ebU,
407    0x390b83ecU, 0xaa4060efU, 0x065e719fU, 0x51bd6e10U,
408    0xf93e218aU, 0x3d96dd06U, 0xaedd3e05U, 0x464de6bdU,
409    0xb591548dU, 0x0571c45dU, 0x6f0406d4U, 0xff605015U,
410    0x241998fbU, 0x97d6bde9U, 0xcc894043U, 0x7767d99eU,
411    0xbdb0e842U, 0x8807898bU, 0x38e7195bU, 0xdb79c8eeU,
412    0x47a17c0aU, 0xe97c420fU, 0xc9f8841eU, 0x00000000U,
413    0x83098086U, 0x48322bedU, 0xac1e1170U, 0x4e6c5a72U,
414    0xfbfd0effU, 0x560f8538U, 0x1e3daed5U, 0x27362d39U,
415    0x640a0fd9U, 0x21685ca6U, 0xd19b5b54U, 0x3a24362eU,
416    0xb10c0a67U, 0x0f9357e7U, 0xd2b4ee96U, 0x9e1b9b91U,
417    0x4f80c0c5U, 0xa261dc20U, 0x695a774bU, 0x161c121aU,
418    0x0ae293baU, 0xe5c0a02aU, 0x433c22e0U, 0x1d121b17U,
419    0x0b0e090dU, 0xadf28bc7U, 0xb92db6a8U, 0xc8141ea9U,
420    0x8557f119U, 0x4caf7507U, 0xbbee99ddU, 0xfda37f60U,
421    0x9ff70126U, 0xbc5c72f5U, 0xc544663bU, 0x345bfb7eU,
422    0x768b4329U, 0xdccb23c6U, 0x68b6edfcU, 0x63b8e4f1U,
423    0xcad731dcU, 0x10426385U, 0x40139722U, 0x2084c611U,
424    0x7d854a24U, 0xf8d2bb3dU, 0x11aef932U, 0x6dc729a1U,
425    0x4b1d9e2fU, 0xf3dcb230U, 0xec0d8652U, 0xd077c1e3U,
426    0x6c2bb316U, 0x99a970b9U, 0xfa119448U, 0x2247e964U,
427    0xc4a8fc8cU, 0x1aa0f03fU, 0xd8567d2cU, 0xef223390U,
428    0xc787494eU, 0xc1d938d1U, 0xfe8ccaa2U, 0x3698d40bU,
429    0xcfa6f581U, 0x28a57adeU, 0x26dab78eU, 0xa43fadbfU,
430    0xe42c3a9dU, 0x0d507892U, 0x9b6a5fccU, 0x62547e46U,
431    0xc2f68d13U, 0xe890d8b8U, 0x5e2e39f7U, 0xf582c3afU,
432    0xbe9f5d80U, 0x7c69d093U, 0xa96fd52dU, 0xb3cf2512U,
433    0x3bc8ac99U, 0xa710187dU, 0x6ee89c63U, 0x7bdb3bbbU,
434    0x09cd2678U, 0xf46e5918U, 0x01ec9ab7U, 0xa8834f9aU,
435    0x65e6956eU, 0x7eaaffe6U, 0x0821bccfU, 0xe6ef15e8U,
436    0xd9bae79bU, 0xce4a6f36U, 0xd4ea9f09U, 0xd629b07cU,
437    0xaf31a4b2U, 0x312a3f23U, 0x30c6a594U, 0xc035a266U,
438    0x37744ebcU, 0xa6fc82caU, 0xb0e090d0U, 0x1533a7d8U,
439    0x4af10498U, 0xf741ecdaU, 0x0e7fcd50U, 0x2f1791f6U,
440    0x8d764dd6U, 0x4d43efb0U, 0x54ccaa4dU, 0xdfe49604U,
441    0xe39ed1b5U, 0x1b4c6a88U, 0xb8c12c1fU, 0x7f466551U,
442    0x049d5eeaU, 0x5d018c35U, 0x73fa8774U, 0x2efb0b41U,
443    0x5ab3671dU, 0x5292dbd2U, 0x33e91056U, 0x136dd647U,
444    0x8c9ad761U, 0x7a37a10cU, 0x8e59f814U, 0x89eb133cU,
445    0xeecea927U, 0x35b761c9U, 0xede11ce5U, 0x3c7a47b1U,
446    0x599cd2dfU, 0x3f55f273U, 0x791814ceU, 0xbf73c737U,
447    0xea53f7cdU, 0x5b5ffdaaU, 0x14df3d6fU, 0x867844dbU,
448    0x81caaff3U, 0x3eb968c4U, 0x2c382434U, 0x5fc2a340U,
449    0x72161dc3U, 0x0cbce225U, 0x8b283c49U, 0x41ff0d95U,
450    0x7139a801U, 0xde080cb3U, 0x9cd8b4e4U, 0x906456c1U,
451    0x617bcb84U, 0x70d532b6U, 0x74486c5cU, 0x42d0b857U,
452};
453static const u32 Td2[256] = {
454    0xa75051f4U, 0x65537e41U, 0xa4c31a17U, 0x5e963a27U,
455    0x6bcb3babU, 0x45f11f9dU, 0x58abacfaU, 0x03934be3U,
456    0xfa552030U, 0x6df6ad76U, 0x769188ccU, 0x4c25f502U,
457    0xd7fc4fe5U, 0xcbd7c52aU, 0x44802635U, 0xa38fb562U,
458    0x5a49deb1U, 0x1b6725baU, 0x0e9845eaU, 0xc0e15dfeU,
459    0x7502c32fU, 0xf012814cU, 0x97a38d46U, 0xf9c66bd3U,
460    0x5fe7038fU, 0x9c951592U, 0x7aebbf6dU, 0x59da9552U,
461    0x832dd4beU, 0x21d35874U, 0x692949e0U, 0xc8448ec9U,
462    0x896a75c2U, 0x7978f48eU, 0x3e6b9958U, 0x71dd27b9U,
463    0x4fb6bee1U, 0xad17f088U, 0xac66c920U, 0x3ab47dceU,
464    0x4a1863dfU, 0x3182e51aU, 0x33609751U, 0x7f456253U,
465    0x77e0b164U, 0xae84bb6bU, 0xa01cfe81U, 0x2b94f908U,
466    0x68587048U, 0xfd198f45U, 0x6c8794deU, 0xf8b7527bU,
467    0xd323ab73U, 0x02e2724bU, 0x8f57e31fU, 0xab2a6655U,
468    0x2807b2ebU, 0xc2032fb5U, 0x7b9a86c5U, 0x08a5d337U,
469    0x87f23028U, 0xa5b223bfU, 0x6aba0203U, 0x825ced16U,
470    0x1c2b8acfU, 0xb492a779U, 0xf2f0f307U, 0xe2a14e69U,
471    0xf4cd65daU, 0xbed50605U, 0x621fd134U, 0xfe8ac4a6U,
472    0x539d342eU, 0x55a0a2f3U, 0xe132058aU, 0xeb75a4f6U,
473    0xec390b83U, 0xefaa4060U, 0x9f065e71U, 0x1051bd6eU,
474    0x8af93e21U, 0x063d96ddU, 0x05aedd3eU, 0xbd464de6U,
475    0x8db59154U, 0x5d0571c4U, 0xd46f0406U, 0x15ff6050U,
476    0xfb241998U, 0xe997d6bdU, 0x43cc8940U, 0x9e7767d9U,
477    0x42bdb0e8U, 0x8b880789U, 0x5b38e719U, 0xeedb79c8U,
478    0x0a47a17cU, 0x0fe97c42U, 0x1ec9f884U, 0x00000000U,
479    0x86830980U, 0xed48322bU, 0x70ac1e11U, 0x724e6c5aU,
480    0xfffbfd0eU, 0x38560f85U, 0xd51e3daeU, 0x3927362dU,
481    0xd9640a0fU, 0xa621685cU, 0x54d19b5bU, 0x2e3a2436U,
482    0x67b10c0aU, 0xe70f9357U, 0x96d2b4eeU, 0x919e1b9bU,
483    0xc54f80c0U, 0x20a261dcU, 0x4b695a77U, 0x1a161c12U,
484    0xba0ae293U, 0x2ae5c0a0U, 0xe0433c22U, 0x171d121bU,
485    0x0d0b0e09U, 0xc7adf28bU, 0xa8b92db6U, 0xa9c8141eU,
486    0x198557f1U, 0x074caf75U, 0xddbbee99U, 0x60fda37fU,
487    0x269ff701U, 0xf5bc5c72U, 0x3bc54466U, 0x7e345bfbU,
488    0x29768b43U, 0xc6dccb23U, 0xfc68b6edU, 0xf163b8e4U,
489    0xdccad731U, 0x85104263U, 0x22401397U, 0x112084c6U,
490    0x247d854aU, 0x3df8d2bbU, 0x3211aef9U, 0xa16dc729U,
491    0x2f4b1d9eU, 0x30f3dcb2U, 0x52ec0d86U, 0xe3d077c1U,
492    0x166c2bb3U, 0xb999a970U, 0x48fa1194U, 0x642247e9U,
493    0x8cc4a8fcU, 0x3f1aa0f0U, 0x2cd8567dU, 0x90ef2233U,
494    0x4ec78749U, 0xd1c1d938U, 0xa2fe8ccaU, 0x0b3698d4U,
495    0x81cfa6f5U, 0xde28a57aU, 0x8e26dab7U, 0xbfa43fadU,
496    0x9de42c3aU, 0x920d5078U, 0xcc9b6a5fU, 0x4662547eU,
497    0x13c2f68dU, 0xb8e890d8U, 0xf75e2e39U, 0xaff582c3U,
498    0x80be9f5dU, 0x937c69d0U, 0x2da96fd5U, 0x12b3cf25U,
499    0x993bc8acU, 0x7da71018U, 0x636ee89cU, 0xbb7bdb3bU,
500    0x7809cd26U, 0x18f46e59U, 0xb701ec9aU, 0x9aa8834fU,
501    0x6e65e695U, 0xe67eaaffU, 0xcf0821bcU, 0xe8e6ef15U,
502    0x9bd9bae7U, 0x36ce4a6fU, 0x09d4ea9fU, 0x7cd629b0U,
503    0xb2af31a4U, 0x23312a3fU, 0x9430c6a5U, 0x66c035a2U,
504    0xbc37744eU, 0xcaa6fc82U, 0xd0b0e090U, 0xd81533a7U,
505    0x984af104U, 0xdaf741ecU, 0x500e7fcdU, 0xf62f1791U,
506    0xd68d764dU, 0xb04d43efU, 0x4d54ccaaU, 0x04dfe496U,
507    0xb5e39ed1U, 0x881b4c6aU, 0x1fb8c12cU, 0x517f4665U,
508    0xea049d5eU, 0x355d018cU, 0x7473fa87U, 0x412efb0bU,
509    0x1d5ab367U, 0xd25292dbU, 0x5633e910U, 0x47136dd6U,
510    0x618c9ad7U, 0x0c7a37a1U, 0x148e59f8U, 0x3c89eb13U,
511    0x27eecea9U, 0xc935b761U, 0xe5ede11cU, 0xb13c7a47U,
512    0xdf599cd2U, 0x733f55f2U, 0xce791814U, 0x37bf73c7U,
513    0xcdea53f7U, 0xaa5b5ffdU, 0x6f14df3dU, 0xdb867844U,
514    0xf381caafU, 0xc43eb968U, 0x342c3824U, 0x405fc2a3U,
515    0xc372161dU, 0x250cbce2U, 0x498b283cU, 0x9541ff0dU,
516    0x017139a8U, 0xb3de080cU, 0xe49cd8b4U, 0xc1906456U,
517    0x84617bcbU, 0xb670d532U, 0x5c74486cU, 0x5742d0b8U,
518};
519static const u32 Td3[256] = {
520    0xf4a75051U, 0x4165537eU, 0x17a4c31aU, 0x275e963aU,
521    0xab6bcb3bU, 0x9d45f11fU, 0xfa58abacU, 0xe303934bU,
522    0x30fa5520U, 0x766df6adU, 0xcc769188U, 0x024c25f5U,
523    0xe5d7fc4fU, 0x2acbd7c5U, 0x35448026U, 0x62a38fb5U,
524    0xb15a49deU, 0xba1b6725U, 0xea0e9845U, 0xfec0e15dU,
525    0x2f7502c3U, 0x4cf01281U, 0x4697a38dU, 0xd3f9c66bU,
526    0x8f5fe703U, 0x929c9515U, 0x6d7aebbfU, 0x5259da95U,
527    0xbe832dd4U, 0x7421d358U, 0xe0692949U, 0xc9c8448eU,
528    0xc2896a75U, 0x8e7978f4U, 0x583e6b99U, 0xb971dd27U,
529    0xe14fb6beU, 0x88ad17f0U, 0x20ac66c9U, 0xce3ab47dU,
530    0xdf4a1863U, 0x1a3182e5U, 0x51336097U, 0x537f4562U,
531    0x6477e0b1U, 0x6bae84bbU, 0x81a01cfeU, 0x082b94f9U,
532    0x48685870U, 0x45fd198fU, 0xde6c8794U, 0x7bf8b752U,
533    0x73d323abU, 0x4b02e272U, 0x1f8f57e3U, 0x55ab2a66U,
534    0xeb2807b2U, 0xb5c2032fU, 0xc57b9a86U, 0x3708a5d3U,
535    0x2887f230U, 0xbfa5b223U, 0x036aba02U, 0x16825cedU,
536    0xcf1c2b8aU, 0x79b492a7U, 0x07f2f0f3U, 0x69e2a14eU,
537    0xdaf4cd65U, 0x05bed506U, 0x34621fd1U, 0xa6fe8ac4U,
538    0x2e539d34U, 0xf355a0a2U, 0x8ae13205U, 0xf6eb75a4U,
539    0x83ec390bU, 0x60efaa40U, 0x719f065eU, 0x6e1051bdU,
540    0x218af93eU, 0xdd063d96U, 0x3e05aeddU, 0xe6bd464dU,
541    0x548db591U, 0xc45d0571U, 0x06d46f04U, 0x5015ff60U,
542    0x98fb2419U, 0xbde997d6U, 0x4043cc89U, 0xd99e7767U,
543    0xe842bdb0U, 0x898b8807U, 0x195b38e7U, 0xc8eedb79U,
544    0x7c0a47a1U, 0x420fe97cU, 0x841ec9f8U, 0x00000000U,
545    0x80868309U, 0x2bed4832U, 0x1170ac1eU, 0x5a724e6cU,
546    0x0efffbfdU, 0x8538560fU, 0xaed51e3dU, 0x2d392736U,
547    0x0fd9640aU, 0x5ca62168U, 0x5b54d19bU, 0x362e3a24U,
548    0x0a67b10cU, 0x57e70f93U, 0xee96d2b4U, 0x9b919e1bU,
549    0xc0c54f80U, 0xdc20a261U, 0x774b695aU, 0x121a161cU,
550    0x93ba0ae2U, 0xa02ae5c0U, 0x22e0433cU, 0x1b171d12U,
551    0x090d0b0eU, 0x8bc7adf2U, 0xb6a8b92dU, 0x1ea9c814U,
552    0xf1198557U, 0x75074cafU, 0x99ddbbeeU, 0x7f60fda3U,
553    0x01269ff7U, 0x72f5bc5cU, 0x663bc544U, 0xfb7e345bU,
554    0x4329768bU, 0x23c6dccbU, 0xedfc68b6U, 0xe4f163b8U,
555    0x31dccad7U, 0x63851042U, 0x97224013U, 0xc6112084U,
556    0x4a247d85U, 0xbb3df8d2U, 0xf93211aeU, 0x29a16dc7U,
557    0x9e2f4b1dU, 0xb230f3dcU, 0x8652ec0dU, 0xc1e3d077U,
558    0xb3166c2bU, 0x70b999a9U, 0x9448fa11U, 0xe9642247U,
559    0xfc8cc4a8U, 0xf03f1aa0U, 0x7d2cd856U, 0x3390ef22U,
560    0x494ec787U, 0x38d1c1d9U, 0xcaa2fe8cU, 0xd40b3698U,
561    0xf581cfa6U, 0x7ade28a5U, 0xb78e26daU, 0xadbfa43fU,
562    0x3a9de42cU, 0x78920d50U, 0x5fcc9b6aU, 0x7e466254U,
563    0x8d13c2f6U, 0xd8b8e890U, 0x39f75e2eU, 0xc3aff582U,
564    0x5d80be9fU, 0xd0937c69U, 0xd52da96fU, 0x2512b3cfU,
565    0xac993bc8U, 0x187da710U, 0x9c636ee8U, 0x3bbb7bdbU,
566    0x267809cdU, 0x5918f46eU, 0x9ab701ecU, 0x4f9aa883U,
567    0x956e65e6U, 0xffe67eaaU, 0xbccf0821U, 0x15e8e6efU,
568    0xe79bd9baU, 0x6f36ce4aU, 0x9f09d4eaU, 0xb07cd629U,
569    0xa4b2af31U, 0x3f23312aU, 0xa59430c6U, 0xa266c035U,
570    0x4ebc3774U, 0x82caa6fcU, 0x90d0b0e0U, 0xa7d81533U,
571    0x04984af1U, 0xecdaf741U, 0xcd500e7fU, 0x91f62f17U,
572    0x4dd68d76U, 0xefb04d43U, 0xaa4d54ccU, 0x9604dfe4U,
573    0xd1b5e39eU, 0x6a881b4cU, 0x2c1fb8c1U, 0x65517f46U,
574    0x5eea049dU, 0x8c355d01U, 0x877473faU, 0x0b412efbU,
575    0x671d5ab3U, 0xdbd25292U, 0x105633e9U, 0xd647136dU,
576    0xd7618c9aU, 0xa10c7a37U, 0xf8148e59U, 0x133c89ebU,
577    0xa927eeceU, 0x61c935b7U, 0x1ce5ede1U, 0x47b13c7aU,
578    0xd2df599cU, 0xf2733f55U, 0x14ce7918U, 0xc737bf73U,
579    0xf7cdea53U, 0xfdaa5b5fU, 0x3d6f14dfU, 0x44db8678U,
580    0xaff381caU, 0x68c43eb9U, 0x24342c38U, 0xa3405fc2U,
581    0x1dc37216U, 0xe2250cbcU, 0x3c498b28U, 0x0d9541ffU,
582    0xa8017139U, 0x0cb3de08U, 0xb4e49cd8U, 0x56c19064U,
583    0xcb84617bU, 0x32b670d5U, 0x6c5c7448U, 0xb85742d0U,
584};
585static const u8 Td4[256] = {
586    0x52U, 0x09U, 0x6aU, 0xd5U, 0x30U, 0x36U, 0xa5U, 0x38U,
587    0xbfU, 0x40U, 0xa3U, 0x9eU, 0x81U, 0xf3U, 0xd7U, 0xfbU,
588    0x7cU, 0xe3U, 0x39U, 0x82U, 0x9bU, 0x2fU, 0xffU, 0x87U,
589    0x34U, 0x8eU, 0x43U, 0x44U, 0xc4U, 0xdeU, 0xe9U, 0xcbU,
590    0x54U, 0x7bU, 0x94U, 0x32U, 0xa6U, 0xc2U, 0x23U, 0x3dU,
591    0xeeU, 0x4cU, 0x95U, 0x0bU, 0x42U, 0xfaU, 0xc3U, 0x4eU,
592    0x08U, 0x2eU, 0xa1U, 0x66U, 0x28U, 0xd9U, 0x24U, 0xb2U,
593    0x76U, 0x5bU, 0xa2U, 0x49U, 0x6dU, 0x8bU, 0xd1U, 0x25U,
594    0x72U, 0xf8U, 0xf6U, 0x64U, 0x86U, 0x68U, 0x98U, 0x16U,
595    0xd4U, 0xa4U, 0x5cU, 0xccU, 0x5dU, 0x65U, 0xb6U, 0x92U,
596    0x6cU, 0x70U, 0x48U, 0x50U, 0xfdU, 0xedU, 0xb9U, 0xdaU,
597    0x5eU, 0x15U, 0x46U, 0x57U, 0xa7U, 0x8dU, 0x9dU, 0x84U,
598    0x90U, 0xd8U, 0xabU, 0x00U, 0x8cU, 0xbcU, 0xd3U, 0x0aU,
599    0xf7U, 0xe4U, 0x58U, 0x05U, 0xb8U, 0xb3U, 0x45U, 0x06U,
600    0xd0U, 0x2cU, 0x1eU, 0x8fU, 0xcaU, 0x3fU, 0x0fU, 0x02U,
601    0xc1U, 0xafU, 0xbdU, 0x03U, 0x01U, 0x13U, 0x8aU, 0x6bU,
602    0x3aU, 0x91U, 0x11U, 0x41U, 0x4fU, 0x67U, 0xdcU, 0xeaU,
603    0x97U, 0xf2U, 0xcfU, 0xceU, 0xf0U, 0xb4U, 0xe6U, 0x73U,
604    0x96U, 0xacU, 0x74U, 0x22U, 0xe7U, 0xadU, 0x35U, 0x85U,
605    0xe2U, 0xf9U, 0x37U, 0xe8U, 0x1cU, 0x75U, 0xdfU, 0x6eU,
606    0x47U, 0xf1U, 0x1aU, 0x71U, 0x1dU, 0x29U, 0xc5U, 0x89U,
607    0x6fU, 0xb7U, 0x62U, 0x0eU, 0xaaU, 0x18U, 0xbeU, 0x1bU,
608    0xfcU, 0x56U, 0x3eU, 0x4bU, 0xc6U, 0xd2U, 0x79U, 0x20U,
609    0x9aU, 0xdbU, 0xc0U, 0xfeU, 0x78U, 0xcdU, 0x5aU, 0xf4U,
610    0x1fU, 0xddU, 0xa8U, 0x33U, 0x88U, 0x07U, 0xc7U, 0x31U,
611    0xb1U, 0x12U, 0x10U, 0x59U, 0x27U, 0x80U, 0xecU, 0x5fU,
612    0x60U, 0x51U, 0x7fU, 0xa9U, 0x19U, 0xb5U, 0x4aU, 0x0dU,
613    0x2dU, 0xe5U, 0x7aU, 0x9fU, 0x93U, 0xc9U, 0x9cU, 0xefU,
614    0xa0U, 0xe0U, 0x3bU, 0x4dU, 0xaeU, 0x2aU, 0xf5U, 0xb0U,
615    0xc8U, 0xebU, 0xbbU, 0x3cU, 0x83U, 0x53U, 0x99U, 0x61U,
616    0x17U, 0x2bU, 0x04U, 0x7eU, 0xbaU, 0x77U, 0xd6U, 0x26U,
617    0xe1U, 0x69U, 0x14U, 0x63U, 0x55U, 0x21U, 0x0cU, 0x7dU,
618};
619static const u32 rcon[] = {
620    0x01000000, 0x02000000, 0x04000000, 0x08000000,
621    0x10000000, 0x20000000, 0x40000000, 0x80000000,
622    0x1B000000, 0x36000000, /* for 128-bit blocks, Rijndael never uses more than 10 rcon values */
623};
624
625/**
626 * Expand the cipher key into the encryption key schedule.
627 */
628int private_AES_set_encrypt_key(const unsigned char *userKey, const int bits,
629                                AES_KEY *key)
630{
631
632    u32 *rk;
633    int i = 0;
634    u32 temp;
635
636    if (!userKey || !key)
637        return -1;
638    if (bits != 128 && bits != 192 && bits != 256)
639        return -2;
640
641    rk = key->rd_key;
642
643    if (bits==128)
644        key->rounds = 10;
645    else if (bits==192)
646        key->rounds = 12;
647    else
648        key->rounds = 14;
649
650    rk[0] = GETU32(userKey     );
651    rk[1] = GETU32(userKey +  4);
652    rk[2] = GETU32(userKey +  8);
653    rk[3] = GETU32(userKey + 12);
654    if (bits == 128) {
655        while (1) {
656            temp  = rk[3];
657            rk[4] = rk[0] ^
658                (Te2[(temp >> 16) & 0xff] & 0xff000000) ^
659                (Te3[(temp >>  8) & 0xff] & 0x00ff0000) ^
660                (Te0[(temp      ) & 0xff] & 0x0000ff00) ^
661                (Te1[(temp >> 24)       ] & 0x000000ff) ^
662                rcon[i];
663            rk[5] = rk[1] ^ rk[4];
664            rk[6] = rk[2] ^ rk[5];
665            rk[7] = rk[3] ^ rk[6];
666            if (++i == 10) {
667                return 0;
668            }
669            rk += 4;
670        }
671    }
672    rk[4] = GETU32(userKey + 16);
673    rk[5] = GETU32(userKey + 20);
674    if (bits == 192) {
675        while (1) {
676            temp = rk[ 5];
677            rk[ 6] = rk[ 0] ^
678                (Te2[(temp >> 16) & 0xff] & 0xff000000) ^
679                (Te3[(temp >>  8) & 0xff] & 0x00ff0000) ^
680                (Te0[(temp      ) & 0xff] & 0x0000ff00) ^
681                (Te1[(temp >> 24)       ] & 0x000000ff) ^
682                rcon[i];
683            rk[ 7] = rk[ 1] ^ rk[ 6];
684            rk[ 8] = rk[ 2] ^ rk[ 7];
685            rk[ 9] = rk[ 3] ^ rk[ 8];
686            if (++i == 8) {
687                return 0;
688            }
689            rk[10] = rk[ 4] ^ rk[ 9];
690            rk[11] = rk[ 5] ^ rk[10];
691            rk += 6;
692        }
693    }
694    rk[6] = GETU32(userKey + 24);
695    rk[7] = GETU32(userKey + 28);
696    if (bits == 256) {
697        while (1) {
698            temp = rk[ 7];
699            rk[ 8] = rk[ 0] ^
700                (Te2[(temp >> 16) & 0xff] & 0xff000000) ^
701                (Te3[(temp >>  8) & 0xff] & 0x00ff0000) ^
702                (Te0[(temp      ) & 0xff] & 0x0000ff00) ^
703                (Te1[(temp >> 24)       ] & 0x000000ff) ^
704                rcon[i];
705            rk[ 9] = rk[ 1] ^ rk[ 8];
706            rk[10] = rk[ 2] ^ rk[ 9];
707            rk[11] = rk[ 3] ^ rk[10];
708            if (++i == 7) {
709                return 0;
710            }
711            temp = rk[11];
712            rk[12] = rk[ 4] ^
713                (Te2[(temp >> 24)       ] & 0xff000000) ^
714                (Te3[(temp >> 16) & 0xff] & 0x00ff0000) ^
715                (Te0[(temp >>  8) & 0xff] & 0x0000ff00) ^
716                (Te1[(temp      ) & 0xff] & 0x000000ff);
717            rk[13] = rk[ 5] ^ rk[12];
718            rk[14] = rk[ 6] ^ rk[13];
719            rk[15] = rk[ 7] ^ rk[14];
720
721            rk += 8;
722            }
723    }
724    return 0;
725}
726
727/**
728 * Expand the cipher key into the decryption key schedule.
729 */
730int private_AES_set_decrypt_key(const unsigned char *userKey, const int bits,
731                                AES_KEY *key)
732{
733
734    u32 *rk;
735    int i, j, status;
736    u32 temp;
737
738    /* first, start with an encryption schedule */
739    status = private_AES_set_encrypt_key(userKey, bits, key);
740    if (status < 0)
741        return status;
742
743    rk = key->rd_key;
744
745    /* invert the order of the round keys: */
746    for (i = 0, j = 4*(key->rounds); i < j; i += 4, j -= 4) {
747        temp = rk[i    ]; rk[i    ] = rk[j    ]; rk[j    ] = temp;
748        temp = rk[i + 1]; rk[i + 1] = rk[j + 1]; rk[j + 1] = temp;
749        temp = rk[i + 2]; rk[i + 2] = rk[j + 2]; rk[j + 2] = temp;
750        temp = rk[i + 3]; rk[i + 3] = rk[j + 3]; rk[j + 3] = temp;
751    }
752    /* apply the inverse MixColumn transform to all round keys but the first and the last: */
753    for (i = 1; i < (key->rounds); i++) {
754        rk += 4;
755        rk[0] =
756            Td0[Te1[(rk[0] >> 24)       ] & 0xff] ^
757            Td1[Te1[(rk[0] >> 16) & 0xff] & 0xff] ^
758            Td2[Te1[(rk[0] >>  8) & 0xff] & 0xff] ^
759            Td3[Te1[(rk[0]      ) & 0xff] & 0xff];
760        rk[1] =
761            Td0[Te1[(rk[1] >> 24)       ] & 0xff] ^
762            Td1[Te1[(rk[1] >> 16) & 0xff] & 0xff] ^
763            Td2[Te1[(rk[1] >>  8) & 0xff] & 0xff] ^
764            Td3[Te1[(rk[1]      ) & 0xff] & 0xff];
765        rk[2] =
766            Td0[Te1[(rk[2] >> 24)       ] & 0xff] ^
767            Td1[Te1[(rk[2] >> 16) & 0xff] & 0xff] ^
768            Td2[Te1[(rk[2] >>  8) & 0xff] & 0xff] ^
769            Td3[Te1[(rk[2]      ) & 0xff] & 0xff];
770        rk[3] =
771            Td0[Te1[(rk[3] >> 24)       ] & 0xff] ^
772            Td1[Te1[(rk[3] >> 16) & 0xff] & 0xff] ^
773            Td2[Te1[(rk[3] >>  8) & 0xff] & 0xff] ^
774            Td3[Te1[(rk[3]      ) & 0xff] & 0xff];
775    }
776    return 0;
777}
778
779/*
780 * Encrypt a single block
781 * in and out can overlap
782 */
783void AES_encrypt(const unsigned char *in, unsigned char *out,
784                 const AES_KEY *key) {
785
786    const u32 *rk;
787    u32 s0, s1, s2, s3, t0, t1, t2, t3;
788#ifndef FULL_UNROLL
789    int r;
790#endif /* ?FULL_UNROLL */
791
792    assert(in && out && key);
793    rk = key->rd_key;
794
795    /*
796     * map byte array block to cipher state
797     * and add initial round key:
798     */
799    s0 = GETU32(in     ) ^ rk[0];
800    s1 = GETU32(in +  4) ^ rk[1];
801    s2 = GETU32(in +  8) ^ rk[2];
802    s3 = GETU32(in + 12) ^ rk[3];
803#ifdef FULL_UNROLL
804    /* round 1: */
805    t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[ 4];
806    t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[ 5];
807    t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[ 6];
808    t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[ 7];
809    /* round 2: */
810    s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[ 8];
811    s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[ 9];
812    s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[10];
813    s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[11];
814    /* round 3: */
815    t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[12];
816    t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[13];
817    t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[14];
818    t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[15];
819    /* round 4: */
820    s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[16];
821    s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[17];
822    s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[18];
823    s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[19];
824    /* round 5: */
825    t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[20];
826    t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[21];
827    t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[22];
828    t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[23];
829    /* round 6: */
830    s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[24];
831    s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[25];
832    s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[26];
833    s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[27];
834    /* round 7: */
835    t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[28];
836    t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[29];
837    t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[30];
838    t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[31];
839    /* round 8: */
840    s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[32];
841    s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[33];
842    s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[34];
843    s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[35];
844    /* round 9: */
845    t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[36];
846    t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[37];
847    t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[38];
848    t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[39];
849    if (key->rounds > 10) {
850        /* round 10: */
851        s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[40];
852        s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[41];
853        s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[42];
854        s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[43];
855        /* round 11: */
856        t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[44];
857        t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[45];
858        t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[46];
859        t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[47];
860        if (key->rounds > 12) {
861            /* round 12: */
862            s0 = Te0[t0 >> 24] ^ Te1[(t1 >> 16) & 0xff] ^ Te2[(t2 >>  8) & 0xff] ^ Te3[t3 & 0xff] ^ rk[48];
863            s1 = Te0[t1 >> 24] ^ Te1[(t2 >> 16) & 0xff] ^ Te2[(t3 >>  8) & 0xff] ^ Te3[t0 & 0xff] ^ rk[49];
864            s2 = Te0[t2 >> 24] ^ Te1[(t3 >> 16) & 0xff] ^ Te2[(t0 >>  8) & 0xff] ^ Te3[t1 & 0xff] ^ rk[50];
865            s3 = Te0[t3 >> 24] ^ Te1[(t0 >> 16) & 0xff] ^ Te2[(t1 >>  8) & 0xff] ^ Te3[t2 & 0xff] ^ rk[51];
866            /* round 13: */
867            t0 = Te0[s0 >> 24] ^ Te1[(s1 >> 16) & 0xff] ^ Te2[(s2 >>  8) & 0xff] ^ Te3[s3 & 0xff] ^ rk[52];
868            t1 = Te0[s1 >> 24] ^ Te1[(s2 >> 16) & 0xff] ^ Te2[(s3 >>  8) & 0xff] ^ Te3[s0 & 0xff] ^ rk[53];
869            t2 = Te0[s2 >> 24] ^ Te1[(s3 >> 16) & 0xff] ^ Te2[(s0 >>  8) & 0xff] ^ Te3[s1 & 0xff] ^ rk[54];
870            t3 = Te0[s3 >> 24] ^ Te1[(s0 >> 16) & 0xff] ^ Te2[(s1 >>  8) & 0xff] ^ Te3[s2 & 0xff] ^ rk[55];
871        }
872    }
873    rk += key->rounds << 2;
874#else  /* !FULL_UNROLL */
875    /*
876     * Nr - 1 full rounds:
877     */
878    r = key->rounds >> 1;
879    for (;;) {
880        t0 =
881            Te0[(s0 >> 24)       ] ^
882            Te1[(s1 >> 16) & 0xff] ^
883            Te2[(s2 >>  8) & 0xff] ^
884            Te3[(s3      ) & 0xff] ^
885            rk[4];
886        t1 =
887            Te0[(s1 >> 24)       ] ^
888            Te1[(s2 >> 16) & 0xff] ^
889            Te2[(s3 >>  8) & 0xff] ^
890            Te3[(s0      ) & 0xff] ^
891            rk[5];
892        t2 =
893            Te0[(s2 >> 24)       ] ^
894            Te1[(s3 >> 16) & 0xff] ^
895            Te2[(s0 >>  8) & 0xff] ^
896            Te3[(s1      ) & 0xff] ^
897            rk[6];
898        t3 =
899            Te0[(s3 >> 24)       ] ^
900            Te1[(s0 >> 16) & 0xff] ^
901            Te2[(s1 >>  8) & 0xff] ^
902            Te3[(s2      ) & 0xff] ^
903            rk[7];
904
905        rk += 8;
906        if (--r == 0) {
907            break;
908        }
909
910        s0 =
911            Te0[(t0 >> 24)       ] ^
912            Te1[(t1 >> 16) & 0xff] ^
913            Te2[(t2 >>  8) & 0xff] ^
914            Te3[(t3      ) & 0xff] ^
915            rk[0];
916        s1 =
917            Te0[(t1 >> 24)       ] ^
918            Te1[(t2 >> 16) & 0xff] ^
919            Te2[(t3 >>  8) & 0xff] ^
920            Te3[(t0      ) & 0xff] ^
921            rk[1];
922        s2 =
923            Te0[(t2 >> 24)       ] ^
924            Te1[(t3 >> 16) & 0xff] ^
925            Te2[(t0 >>  8) & 0xff] ^
926            Te3[(t1      ) & 0xff] ^
927            rk[2];
928        s3 =
929            Te0[(t3 >> 24)       ] ^
930            Te1[(t0 >> 16) & 0xff] ^
931            Te2[(t1 >>  8) & 0xff] ^
932            Te3[(t2      ) & 0xff] ^
933            rk[3];
934    }
935#endif /* ?FULL_UNROLL */
936    /*
937     * apply last round and
938     * map cipher state to byte array block:
939     */
940    s0 =
941        (Te2[(t0 >> 24)       ] & 0xff000000) ^
942        (Te3[(t1 >> 16) & 0xff] & 0x00ff0000) ^
943        (Te0[(t2 >>  8) & 0xff] & 0x0000ff00) ^
944        (Te1[(t3      ) & 0xff] & 0x000000ff) ^
945        rk[0];
946    PUTU32(out     , s0);
947    s1 =
948        (Te2[(t1 >> 24)       ] & 0xff000000) ^
949        (Te3[(t2 >> 16) & 0xff] & 0x00ff0000) ^
950        (Te0[(t3 >>  8) & 0xff] & 0x0000ff00) ^
951        (Te1[(t0      ) & 0xff] & 0x000000ff) ^
952        rk[1];
953    PUTU32(out +  4, s1);
954    s2 =
955        (Te2[(t2 >> 24)       ] & 0xff000000) ^
956        (Te3[(t3 >> 16) & 0xff] & 0x00ff0000) ^
957        (Te0[(t0 >>  8) & 0xff] & 0x0000ff00) ^
958        (Te1[(t1      ) & 0xff] & 0x000000ff) ^
959        rk[2];
960    PUTU32(out +  8, s2);
961    s3 =
962        (Te2[(t3 >> 24)       ] & 0xff000000) ^
963        (Te3[(t0 >> 16) & 0xff] & 0x00ff0000) ^
964        (Te0[(t1 >>  8) & 0xff] & 0x0000ff00) ^
965        (Te1[(t2      ) & 0xff] & 0x000000ff) ^
966        rk[3];
967    PUTU32(out + 12, s3);
968}
969
970/*
971 * Decrypt a single block
972 * in and out can overlap
973 */
974void AES_decrypt(const unsigned char *in, unsigned char *out,
975                 const AES_KEY *key)
976{
977
978    const u32 *rk;
979    u32 s0, s1, s2, s3, t0, t1, t2, t3;
980#ifndef FULL_UNROLL
981    int r;
982#endif /* ?FULL_UNROLL */
983
984    assert(in && out && key);
985    rk = key->rd_key;
986
987    /*
988     * map byte array block to cipher state
989     * and add initial round key:
990     */
991    s0 = GETU32(in     ) ^ rk[0];
992    s1 = GETU32(in +  4) ^ rk[1];
993    s2 = GETU32(in +  8) ^ rk[2];
994    s3 = GETU32(in + 12) ^ rk[3];
995#ifdef FULL_UNROLL
996    /* round 1: */
997    t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[ 4];
998    t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[ 5];
999    t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[ 6];
1000    t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[ 7];
1001    /* round 2: */
1002    s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[ 8];
1003    s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[ 9];
1004    s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[10];
1005    s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[11];
1006    /* round 3: */
1007    t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[12];
1008    t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[13];
1009    t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[14];
1010    t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[15];
1011    /* round 4: */
1012    s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[16];
1013    s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[17];
1014    s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[18];
1015    s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[19];
1016    /* round 5: */
1017    t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[20];
1018    t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[21];
1019    t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[22];
1020    t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[23];
1021    /* round 6: */
1022    s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[24];
1023    s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[25];
1024    s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[26];
1025    s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[27];
1026    /* round 7: */
1027    t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[28];
1028    t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[29];
1029    t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[30];
1030    t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[31];
1031    /* round 8: */
1032    s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[32];
1033    s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[33];
1034    s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[34];
1035    s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[35];
1036    /* round 9: */
1037    t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[36];
1038    t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[37];
1039    t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[38];
1040    t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[39];
1041    if (key->rounds > 10) {
1042        /* round 10: */
1043        s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[40];
1044        s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[41];
1045        s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[42];
1046        s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[43];
1047        /* round 11: */
1048        t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[44];
1049        t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[45];
1050        t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[46];
1051        t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[47];
1052        if (key->rounds > 12) {
1053            /* round 12: */
1054            s0 = Td0[t0 >> 24] ^ Td1[(t3 >> 16) & 0xff] ^ Td2[(t2 >>  8) & 0xff] ^ Td3[t1 & 0xff] ^ rk[48];
1055            s1 = Td0[t1 >> 24] ^ Td1[(t0 >> 16) & 0xff] ^ Td2[(t3 >>  8) & 0xff] ^ Td3[t2 & 0xff] ^ rk[49];
1056            s2 = Td0[t2 >> 24] ^ Td1[(t1 >> 16) & 0xff] ^ Td2[(t0 >>  8) & 0xff] ^ Td3[t3 & 0xff] ^ rk[50];
1057            s3 = Td0[t3 >> 24] ^ Td1[(t2 >> 16) & 0xff] ^ Td2[(t1 >>  8) & 0xff] ^ Td3[t0 & 0xff] ^ rk[51];
1058            /* round 13: */
1059            t0 = Td0[s0 >> 24] ^ Td1[(s3 >> 16) & 0xff] ^ Td2[(s2 >>  8) & 0xff] ^ Td3[s1 & 0xff] ^ rk[52];
1060            t1 = Td0[s1 >> 24] ^ Td1[(s0 >> 16) & 0xff] ^ Td2[(s3 >>  8) & 0xff] ^ Td3[s2 & 0xff] ^ rk[53];
1061            t2 = Td0[s2 >> 24] ^ Td1[(s1 >> 16) & 0xff] ^ Td2[(s0 >>  8) & 0xff] ^ Td3[s3 & 0xff] ^ rk[54];
1062            t3 = Td0[s3 >> 24] ^ Td1[(s2 >> 16) & 0xff] ^ Td2[(s1 >>  8) & 0xff] ^ Td3[s0 & 0xff] ^ rk[55];
1063        }
1064    }
1065    rk += key->rounds << 2;
1066#else  /* !FULL_UNROLL */
1067    /*
1068     * Nr - 1 full rounds:
1069     */
1070    r = key->rounds >> 1;
1071    for (;;) {
1072        t0 =
1073            Td0[(s0 >> 24)       ] ^
1074            Td1[(s3 >> 16) & 0xff] ^
1075            Td2[(s2 >>  8) & 0xff] ^
1076            Td3[(s1      ) & 0xff] ^
1077            rk[4];
1078        t1 =
1079            Td0[(s1 >> 24)       ] ^
1080            Td1[(s0 >> 16) & 0xff] ^
1081            Td2[(s3 >>  8) & 0xff] ^
1082            Td3[(s2      ) & 0xff] ^
1083            rk[5];
1084        t2 =
1085            Td0[(s2 >> 24)       ] ^
1086            Td1[(s1 >> 16) & 0xff] ^
1087            Td2[(s0 >>  8) & 0xff] ^
1088            Td3[(s3      ) & 0xff] ^
1089            rk[6];
1090        t3 =
1091            Td0[(s3 >> 24)       ] ^
1092            Td1[(s2 >> 16) & 0xff] ^
1093            Td2[(s1 >>  8) & 0xff] ^
1094            Td3[(s0      ) & 0xff] ^
1095            rk[7];
1096
1097        rk += 8;
1098        if (--r == 0) {
1099            break;
1100        }
1101
1102        s0 =
1103            Td0[(t0 >> 24)       ] ^
1104            Td1[(t3 >> 16) & 0xff] ^
1105            Td2[(t2 >>  8) & 0xff] ^
1106            Td3[(t1      ) & 0xff] ^
1107            rk[0];
1108        s1 =
1109            Td0[(t1 >> 24)       ] ^
1110            Td1[(t0 >> 16) & 0xff] ^
1111            Td2[(t3 >>  8) & 0xff] ^
1112            Td3[(t2      ) & 0xff] ^
1113            rk[1];
1114        s2 =
1115            Td0[(t2 >> 24)       ] ^
1116            Td1[(t1 >> 16) & 0xff] ^
1117            Td2[(t0 >>  8) & 0xff] ^
1118            Td3[(t3      ) & 0xff] ^
1119            rk[2];
1120        s3 =
1121            Td0[(t3 >> 24)       ] ^
1122            Td1[(t2 >> 16) & 0xff] ^
1123            Td2[(t1 >>  8) & 0xff] ^
1124            Td3[(t0      ) & 0xff] ^
1125            rk[3];
1126    }
1127#endif /* ?FULL_UNROLL */
1128    /*
1129     * apply last round and
1130     * map cipher state to byte array block:
1131     */
1132    s0 =
1133        ((u32)Td4[(t0 >> 24)       ] << 24) ^
1134        ((u32)Td4[(t3 >> 16) & 0xff] << 16) ^
1135        ((u32)Td4[(t2 >>  8) & 0xff] <<  8) ^
1136        ((u32)Td4[(t1      ) & 0xff])       ^
1137        rk[0];
1138    PUTU32(out     , s0);
1139    s1 =
1140        ((u32)Td4[(t1 >> 24)       ] << 24) ^
1141        ((u32)Td4[(t0 >> 16) & 0xff] << 16) ^
1142        ((u32)Td4[(t3 >>  8) & 0xff] <<  8) ^
1143        ((u32)Td4[(t2      ) & 0xff])       ^
1144        rk[1];
1145    PUTU32(out +  4, s1);
1146    s2 =
1147        ((u32)Td4[(t2 >> 24)       ] << 24) ^
1148        ((u32)Td4[(t1 >> 16) & 0xff] << 16) ^
1149        ((u32)Td4[(t0 >>  8) & 0xff] <<  8) ^
1150        ((u32)Td4[(t3      ) & 0xff])       ^
1151        rk[2];
1152    PUTU32(out +  8, s2);
1153    s3 =
1154        ((u32)Td4[(t3 >> 24)       ] << 24) ^
1155        ((u32)Td4[(t2 >> 16) & 0xff] << 16) ^
1156        ((u32)Td4[(t1 >>  8) & 0xff] <<  8) ^
1157        ((u32)Td4[(t0      ) & 0xff])       ^
1158        rk[3];
1159    PUTU32(out + 12, s3);
1160}
1161
1162#else /* AES_ASM */
1163
1164static const u8 Te4[256] = {
1165    0x63U, 0x7cU, 0x77U, 0x7bU, 0xf2U, 0x6bU, 0x6fU, 0xc5U,
1166    0x30U, 0x01U, 0x67U, 0x2bU, 0xfeU, 0xd7U, 0xabU, 0x76U,
1167    0xcaU, 0x82U, 0xc9U, 0x7dU, 0xfaU, 0x59U, 0x47U, 0xf0U,
1168    0xadU, 0xd4U, 0xa2U, 0xafU, 0x9cU, 0xa4U, 0x72U, 0xc0U,
1169    0xb7U, 0xfdU, 0x93U, 0x26U, 0x36U, 0x3fU, 0xf7U, 0xccU,
1170    0x34U, 0xa5U, 0xe5U, 0xf1U, 0x71U, 0xd8U, 0x31U, 0x15U,
1171    0x04U, 0xc7U, 0x23U, 0xc3U, 0x18U, 0x96U, 0x05U, 0x9aU,
1172    0x07U, 0x12U, 0x80U, 0xe2U, 0xebU, 0x27U, 0xb2U, 0x75U,
1173    0x09U, 0x83U, 0x2cU, 0x1aU, 0x1bU, 0x6eU, 0x5aU, 0xa0U,
1174    0x52U, 0x3bU, 0xd6U, 0xb3U, 0x29U, 0xe3U, 0x2fU, 0x84U,
1175    0x53U, 0xd1U, 0x00U, 0xedU, 0x20U, 0xfcU, 0xb1U, 0x5bU,
1176    0x6aU, 0xcbU, 0xbeU, 0x39U, 0x4aU, 0x4cU, 0x58U, 0xcfU,
1177    0xd0U, 0xefU, 0xaaU, 0xfbU, 0x43U, 0x4dU, 0x33U, 0x85U,
1178    0x45U, 0xf9U, 0x02U, 0x7fU, 0x50U, 0x3cU, 0x9fU, 0xa8U,
1179    0x51U, 0xa3U, 0x40U, 0x8fU, 0x92U, 0x9dU, 0x38U, 0xf5U,
1180    0xbcU, 0xb6U, 0xdaU, 0x21U, 0x10U, 0xffU, 0xf3U, 0xd2U,
1181    0xcdU, 0x0cU, 0x13U, 0xecU, 0x5fU, 0x97U, 0x44U, 0x17U,
1182    0xc4U, 0xa7U, 0x7eU, 0x3dU, 0x64U, 0x5dU, 0x19U, 0x73U,
1183    0x60U, 0x81U, 0x4fU, 0xdcU, 0x22U, 0x2aU, 0x90U, 0x88U,
1184    0x46U, 0xeeU, 0xb8U, 0x14U, 0xdeU, 0x5eU, 0x0bU, 0xdbU,
1185    0xe0U, 0x32U, 0x3aU, 0x0aU, 0x49U, 0x06U, 0x24U, 0x5cU,
1186    0xc2U, 0xd3U, 0xacU, 0x62U, 0x91U, 0x95U, 0xe4U, 0x79U,
1187    0xe7U, 0xc8U, 0x37U, 0x6dU, 0x8dU, 0xd5U, 0x4eU, 0xa9U,
1188    0x6cU, 0x56U, 0xf4U, 0xeaU, 0x65U, 0x7aU, 0xaeU, 0x08U,
1189    0xbaU, 0x78U, 0x25U, 0x2eU, 0x1cU, 0xa6U, 0xb4U, 0xc6U,
1190    0xe8U, 0xddU, 0x74U, 0x1fU, 0x4bU, 0xbdU, 0x8bU, 0x8aU,
1191    0x70U, 0x3eU, 0xb5U, 0x66U, 0x48U, 0x03U, 0xf6U, 0x0eU,
1192    0x61U, 0x35U, 0x57U, 0xb9U, 0x86U, 0xc1U, 0x1dU, 0x9eU,
1193    0xe1U, 0xf8U, 0x98U, 0x11U, 0x69U, 0xd9U, 0x8eU, 0x94U,
1194    0x9bU, 0x1eU, 0x87U, 0xe9U, 0xceU, 0x55U, 0x28U, 0xdfU,
1195    0x8cU, 0xa1U, 0x89U, 0x0dU, 0xbfU, 0xe6U, 0x42U, 0x68U,
1196    0x41U, 0x99U, 0x2dU, 0x0fU, 0xb0U, 0x54U, 0xbbU, 0x16U
1197};
1198static const u32 rcon[] = {
1199    0x01000000, 0x02000000, 0x04000000, 0x08000000,
1200    0x10000000, 0x20000000, 0x40000000, 0x80000000,
1201    0x1B000000, 0x36000000, /* for 128-bit blocks, Rijndael never uses more than 10 rcon values */
1202};
1203
1204/**
1205 * Expand the cipher key into the encryption key schedule.
1206 */
1207int private_AES_set_encrypt_key(const unsigned char *userKey, const int bits,
1208                                AES_KEY *key)
1209{
1210    u32 *rk;
1211   	int i = 0;
1212    u32 temp;
1213
1214    if (!userKey || !key)
1215        return -1;
1216    if (bits != 128 && bits != 192 && bits != 256)
1217        return -2;
1218
1219    rk = key->rd_key;
1220
1221    if (bits==128)
1222        key->rounds = 10;
1223    else if (bits==192)
1224        key->rounds = 12;
1225    else
1226        key->rounds = 14;
1227
1228    rk[0] = GETU32(userKey     );
1229    rk[1] = GETU32(userKey +  4);
1230    rk[2] = GETU32(userKey +  8);
1231    rk[3] = GETU32(userKey + 12);
1232    if (bits == 128) {
1233        while (1) {
1234            temp  = rk[3];
1235            rk[4] = rk[0] ^
1236                ((u32)Te4[(temp >> 16) & 0xff] << 24) ^
1237                ((u32)Te4[(temp >>  8) & 0xff] << 16) ^
1238                ((u32)Te4[(temp      ) & 0xff] << 8) ^
1239                ((u32)Te4[(temp >> 24)       ]) ^
1240                rcon[i];
1241            rk[5] = rk[1] ^ rk[4];
1242            rk[6] = rk[2] ^ rk[5];
1243            rk[7] = rk[3] ^ rk[6];
1244            if (++i == 10) {
1245                return 0;
1246            }
1247            rk += 4;
1248        }
1249    }
1250    rk[4] = GETU32(userKey + 16);
1251    rk[5] = GETU32(userKey + 20);
1252    if (bits == 192) {
1253        while (1) {
1254            temp = rk[ 5];
1255            rk[ 6] = rk[ 0] ^
1256                ((u32)Te4[(temp >> 16) & 0xff] << 24) ^
1257                ((u32)Te4[(temp >>  8) & 0xff] << 16) ^
1258                ((u32)Te4[(temp      ) & 0xff] << 8) ^
1259                ((u32)Te4[(temp >> 24)       ]) ^
1260                rcon[i];
1261            rk[ 7] = rk[ 1] ^ rk[ 6];
1262            rk[ 8] = rk[ 2] ^ rk[ 7];
1263            rk[ 9] = rk[ 3] ^ rk[ 8];
1264            if (++i == 8) {
1265                return 0;
1266            }
1267            rk[10] = rk[ 4] ^ rk[ 9];
1268            rk[11] = rk[ 5] ^ rk[10];
1269            rk += 6;
1270        }
1271    }
1272    rk[6] = GETU32(userKey + 24);
1273    rk[7] = GETU32(userKey + 28);
1274    if (bits == 256) {
1275        while (1) {
1276            temp = rk[ 7];
1277            rk[ 8] = rk[ 0] ^
1278                ((u32)Te4[(temp >> 16) & 0xff] << 24) ^
1279                ((u32)Te4[(temp >>  8) & 0xff] << 16) ^
1280                ((u32)Te4[(temp      ) & 0xff] << 8) ^
1281                ((u32)Te4[(temp >> 24)       ]) ^
1282                rcon[i];
1283            rk[ 9] = rk[ 1] ^ rk[ 8];
1284            rk[10] = rk[ 2] ^ rk[ 9];
1285            rk[11] = rk[ 3] ^ rk[10];
1286            if (++i == 7) {
1287                return 0;
1288            }
1289            temp = rk[11];
1290            rk[12] = rk[ 4] ^
1291                ((u32)Te4[(temp >> 24)       ] << 24) ^
1292                ((u32)Te4[(temp >> 16) & 0xff] << 16) ^
1293                ((u32)Te4[(temp >>  8) & 0xff] << 8) ^
1294                ((u32)Te4[(temp      ) & 0xff]);
1295            rk[13] = rk[ 5] ^ rk[12];
1296            rk[14] = rk[ 6] ^ rk[13];
1297            rk[15] = rk[ 7] ^ rk[14];
1298
1299            rk += 8;
1300        }
1301    }
1302    return 0;
1303}
1304
1305/**
1306 * Expand the cipher key into the decryption key schedule.
1307 */
1308int private_AES_set_decrypt_key(const unsigned char *userKey, const int bits,
1309                                AES_KEY *key)
1310{
1311
1312    u32 *rk;
1313    int i, j, status;
1314    u32 temp;
1315
1316    /* first, start with an encryption schedule */
1317    status = private_AES_set_encrypt_key(userKey, bits, key);
1318    if (status < 0)
1319        return status;
1320
1321    rk = key->rd_key;
1322
1323    /* invert the order of the round keys: */
1324    for (i = 0, j = 4*(key->rounds); i < j; i += 4, j -= 4) {
1325        temp = rk[i    ]; rk[i    ] = rk[j    ]; rk[j    ] = temp;
1326        temp = rk[i + 1]; rk[i + 1] = rk[j + 1]; rk[j + 1] = temp;
1327        temp = rk[i + 2]; rk[i + 2] = rk[j + 2]; rk[j + 2] = temp;
1328        temp = rk[i + 3]; rk[i + 3] = rk[j + 3]; rk[j + 3] = temp;
1329    }
1330    /* apply the inverse MixColumn transform to all round keys but the first and the last: */
1331    for (i = 1; i < (key->rounds); i++) {
1332        rk += 4;
1333        for (j = 0; j < 4; j++) {
1334            u32 tp1, tp2, tp4, tp8, tp9, tpb, tpd, tpe, m;
1335
1336            tp1 = rk[j];
1337            m = tp1 & 0x80808080;
1338            tp2 = ((tp1 & 0x7f7f7f7f) << 1) ^
1339                ((m - (m >> 7)) & 0x1b1b1b1b);
1340            m = tp2 & 0x80808080;
1341            tp4 = ((tp2 & 0x7f7f7f7f) << 1) ^
1342                ((m - (m >> 7)) & 0x1b1b1b1b);
1343            m = tp4 & 0x80808080;
1344            tp8 = ((tp4 & 0x7f7f7f7f) << 1) ^
1345                ((m - (m >> 7)) & 0x1b1b1b1b);
1346            tp9 = tp8 ^ tp1;
1347            tpb = tp9 ^ tp2;
1348            tpd = tp9 ^ tp4;
1349            tpe = tp8 ^ tp4 ^ tp2;
1350#if defined(ROTATE)
1351            rk[j] = tpe ^ ROTATE(tpd,16) ^
1352                ROTATE(tp9,24) ^ ROTATE(tpb,8);
1353#else
1354            rk[j] = tpe ^ (tpd >> 16) ^ (tpd << 16) ^
1355                (tp9 >> 8) ^ (tp9 << 24) ^
1356                (tpb >> 24) ^ (tpb << 8);
1357#endif
1358        }
1359    }
1360    return 0;
1361}
1362
1363#endif /* AES_ASM */
1364