/*
 * Table of ten single-byte constants.  The key-expansion loop visible later
 * in this file XORs rcon[rconpointer++] into tk[0][0] on each pass.
 * NOTE(review): the end of this initializer is not visible in this excerpt.
 */
44 static const uint8_t
rcon[10] = {
45 0x01, 0x02, 0x04, 0x08, 0x10, 0x20, 0x40, 0x80, 0x1b, 0x36
/*
 * ROT(x, s), first variant: shifts x right by s and ORs in x shifted left by
 * (32 - s), i.e. a rotation if x is a 32-bit unsigned value.
 * NOTE(review): x and s are not parenthesized in the expansion, and s has to
 * stay within 1..31 so neither shift count reaches 32; the uses visible in
 * this file pass 8, 16 and 24.
 */
59 # define ROT(x, s) ((x >> s) | (x << (32-s)))
/*
 * ROT(x, s), second variant: same construction with the shift directions
 * swapped.
 * NOTE(review): the preprocessor conditional that presumably selects between
 * the two definitions is not visible in this excerpt - confirm.
 */
61 # define ROT(x, s) ((x << s) | (x >> (32-s)))
/*
 * dst = src XOR round_key, performed on the two 64-bit members u64[0] and
 * u64[1].  The enclosing function header is not visible in this excerpt.
 */
67 dst->
u64[0] = src->
u64[0] ^ round_key->
u64[0];
68 dst->
u64[1] = src->
u64[1] ^ round_key->
u64[1];
/*
 * Every statement below reads one byte from element [1], maps it through
 * box[], and stores the result into a byte of element [0].
 * NOTE(review): the declarations of s0, s1, s3 and box are not visible in
 * this excerpt; how s1 and s3 relate to s0 must be confirmed there.
 */
/* Via s0: byte indices 0, 4, 8, 12 are substituted and keep their index. */
90 s0[0].
u8[ 0] = box[s0[1].
u8[ 0]];
91 s0[0].
u8[ 4] = box[s0[1].
u8[ 4]];
92 s0[0].
u8[ 8] = box[s0[1].
u8[ 8]];
93 s0[0].
u8[12] = box[s0[1].
u8[12]];
/* Via s1: destination 3 <- 7, 7 <- 11, 11 <- 15, 15 <- 3 (a 4-cycle). */
94 s1[0].
u8[ 3] = box[s1[1].
u8[ 7]];
95 s1[0].
u8[ 7] = box[s1[1].
u8[11]];
96 s1[0].
u8[11] = box[s1[1].
u8[15]];
97 s1[0].
u8[15] = box[s1[1].
u8[ 3]];
/* Via s0: indices 2 and 10 are exchanged, as are 6 and 14. */
98 s0[0].
u8[ 2] = box[s0[1].
u8[10]];
99 s0[0].
u8[10] = box[s0[1].
u8[ 2]];
100 s0[0].
u8[ 6] = box[s0[1].
u8[14]];
101 s0[0].
u8[14] = box[s0[1].
u8[ 6]];
/* Via s3: destination 1 <- 13, 13 <- 9, 9 <- 5, 5 <- 1 (a 4-cycle). */
102 s3[0].
u8[ 1] = box[s3[1].
u8[13]];
103 s3[0].
u8[13] = box[s3[1].
u8[ 9]];
104 s3[0].
u8[ 9] = box[s3[1].
u8[ 5]];
105 s3[0].
u8[ 5] = box[s3[1].
u8[ 1]];
/*
 * mix_core: XOR together four 32-bit table lookups indexed by a, b, c and d.
 *
 * Two alternative return statements are visible below:
 *  - one reads only multbl[0] and rotates the b, c and d lookups by 8, 16
 *    and 24 bits with ROT;
 *  - the other reads multbl[0], multbl[1], multbl[2] and multbl[3] directly.
 * NOTE(review): the conditional that selects between them and the closing
 * brace are not visible in this excerpt.  Also note that the declared return
 * type is int while the table entries are uint32_t.
 */
108 static inline int mix_core(uint32_t multbl[][256],
int a,
int b,
int c,
int d){
110 return multbl[0][a] ^
ROT(multbl[0][b], 8) ^
ROT(multbl[0][c], 16) ^
ROT(multbl[0][d], 24);
112 return multbl[0][a] ^ multbl[1][
b] ^ multbl[2][c] ^ multbl[3][d];
/*
 * src views state[1] as rows of four bytes (its u8x4 member).  Each of the
 * four 32-bit words of state[0] is produced by mix_core from four src bytes:
 * byte position 0..3 is fixed per argument, while the row for positions 1
 * and 3 is chosen through s1 and s3 (or s1-1 / s3-1).
 * NOTE(review): the enclosing function header, and therefore the meaning of
 * s1 and s3, is not visible in this excerpt.
 */
117 uint8_t (*src)[4] = state[1].
u8x4;
118 state[0].
u32[0] =
mix_core(multbl, src[0][0], src[s1 ][1], src[2][2], src[s3 ][3]);
119 state[0].
u32[1] =
mix_core(multbl, src[1][0], src[s3-1][1], src[3][2], src[s1-1][3]);
120 state[0].
u32[2] =
mix_core(multbl, src[2][0], src[s3 ][1], src[0][2], src[s1 ][3]);
121 state[0].
u32[3] =
mix_core(multbl, src[3][0], src[s1-1][1], src[1][2], src[s3-1][3]);
125 uint32_t multbl[][256])
129 for (r = a->
rounds - 1; r > 0; r--) {
130 mix(a->
state, multbl, 3 - s, 1 + s);
138 int count, uint8_t *iv,
int decrypt)
/*
 * Fragments of a table-building routine; its name, remaining parameters and
 * the definitions of x and c are not visible in this excerpt.
 */
163 const uint8_t *log8,
const uint8_t *alog8,
/* One pass per possible byte value. */
168 for (i = 0; i < 256; i++) {
/*
 * k, l, m, n: look up alog8 at the sum of x and log8[c[n]].
 * NOTE(review): presumably a multiplication done through log/antilog tables;
 * confirm against the lines that set x.
 */
173 k = alog8[x + log8[c[0]]];
174 l = alog8[x + log8[c[1]]];
175 m = alog8[x + log8[c[2]]];
176 n = alog8[x + log8[c[3]]];
/* tbl[1..3] hold tbl[0][i] rotated by 8, 16 and 24 bits respectively. */
179 tbl[1][i] =
ROT(tbl[0][i], 8);
180 tbl[2][i] =
ROT(tbl[0][i], 16);
181 tbl[3][i] =
ROT(tbl[0][i], 24);
/*
 * Fragments of a key-setup routine; its name, parameter list and several
 * intermediate lines are not visible in this excerpt.
 */
190 int i, j,
t, rconpointer = 0;
/* KC = key_bits / 32. */
192 int KC = key_bits >> 5;
/* Each value j is stored twice in alog8, 255 entries apart. */
199 for (i = 0; i < 255; i++) {
200 alog8[i] = alog8[i + 255] = j;
/*
 * For every byte value i: start from alog8[255 - log8[i]] (0 when i is 0),
 * XOR in four left-shifted copies, then fold bits above 8 back down, XOR
 * with 99 and keep the low 8 bits.
 */
206 for (i = 0; i < 256; i++) {
207 j = i ? alog8[255 - log8[i]] : 0;
208 j ^= (j << 1) ^ (j << 2) ^ (j << 3) ^ (j << 4);
209 j = (j ^ (j >> 8) ^ 99) & 255;
/* Only 128, 192 and 256 pass this test; the action taken otherwise is not visible here. */
219 if (key_bits != 128 && key_bits != 192 && key_bits != 256)
/* Copy the first KC * 4 bytes of key into tk. */
224 memcpy(tk, key, KC * 4);
/* Expansion loop: t advances by KC * 4 until (rounds + 1) * 16 is reached. */
227 for (t = KC * 4; t < (rounds + 1) * 16; t += KC * 4) {
/* XOR tk[0] with the sbox image of the last word, read one byte position ahead (wrapping). */
228 for (i = 0; i < 4; i++)
229 tk[0][i] ^=
sbox[tk[KC - 1][(i + 1) & 3]];
/* Consume the next rcon entry. */
230 tk[0][0] ^=
rcon[rconpointer++];
/*
 * Remaining words: XOR each with its predecessor, except when KC is 8 and
 * j is KC / 2.
 * NOTE(review): the sbox variant below is presumably the else branch of that
 * test; the connecting line is not visible.
 */
232 for (j = 1; j < KC; j++) {
233 if (KC != 8 || j != KC >> 1)
234 for (i = 0; i < 4; i++)
235 tk[j][i] ^= tk[j - 1][i];
237 for (i = 0; i < 4; i++)
238 tk[j][i] ^=
sbox[tk[j - 1][i]];
/* Loop over indices 1 .. rounds - 1; body not visible in this excerpt. */
245 for (i = 1; i < rounds; i++) {
/* Loop over the first (rounds + 1) / 2 indices; body not visible in this excerpt. */
253 for (i = 0; i < (rounds + 1) >> 1; i++) {
/*
 * Fragments of main(): fixed 16-byte arrays and loops that compare them with
 * temp.  Several initializer rows and most statements are not visible in
 * this excerpt.
 */
266 int main(
int argc,
char **argv)
/* rkey: two 16-byte rows; only the second row's values are visible here. */
270 uint8_t rkey[2][16] = {
272 { 0x10, 0xa5, 0x88, 0x69, 0xd7, 0x4b, 0xe5, 0xa3,
273 0x74, 0xcf, 0x86, 0x7c, 0xfb, 0x47, 0x38, 0x59 }
/* pt is a 16-byte buffer; rpt holds two 16-byte rows (first row visible). */
275 uint8_t
pt[16], rpt[2][16]= {
276 { 0x6a, 0x84, 0x86, 0x7c, 0xd7, 0x7e, 0x12, 0xad,
277 0x07, 0xea, 0x1b, 0xe8, 0x95, 0xc5, 0x3f, 0xa3 },
/* rct: two 16-byte rows. */
280 uint8_t rct[2][16]= {
281 { 0x73, 0x22, 0x81, 0xc0, 0xa0, 0xaa, 0xb8, 0xf7,
282 0xa5, 0x4a, 0x0c, 0x67, 0xa0, 0xc4, 0x5e, 0xcf },
283 { 0x6d, 0x25, 0x1e, 0x69, 0x44, 0xb0, 0x51, 0xe0,
284 0x4e, 0xaa, 0x6f, 0xb4, 0xdb, 0xf7, 0x84, 0x65 }
/* For each of the two rows, compare rpt[i] with temp byte by byte. */
291 for (i = 0; i < 2; i++) {
294 for (j = 0; j < 16; j++) {
295 if (rpt[i][j] != temp[j]) {
297 j, rpt[i][j], temp[j]);
/* Branch taken only when the first command-line argument is exactly "-t". */
303 if (argc > 1 && !strcmp(argv[1],
"-t")) {
/* 10000 iterations, each with per-byte loops over 16 bytes. */
311 for (i = 0; i < 10000; i++) {
312 for (j = 0; j < 16; j++) {
320 temp[0], temp[5], temp[10], temp[15]);
/* Compare pt with temp byte by byte. */
324 for (j = 0; j < 16; j++) {
325 if (pt[j] != temp[j]) {
327 i, j, pt[j], temp[j]);