Kyle Swenson | 8d8f654 | 2021-03-15 11:02:55 -0600 | [diff] [blame^] | 1 | /* |
| 2 | * Cryptographic API. |
| 3 | * |
| 4 | * Serpent Cipher Algorithm. |
| 5 | * |
| 6 | * Copyright (C) 2002 Dag Arne Osvik <osvik@ii.uib.no> |
| 7 | * 2003 Herbert Valerio Riedel <hvr@gnu.org> |
| 8 | * |
| 9 | * Added tnepres support: |
| 10 | * Ruben Jesus Garcia Hernandez <ruben@ugr.es>, 18.10.2004 |
| 11 | * Based on code by hvr |
| 12 | * |
| 13 | * This program is free software; you can redistribute it and/or modify |
| 14 | * it under the terms of the GNU General Public License as published by |
| 15 | * the Free Software Foundation; either version 2 of the License, or |
| 16 | * (at your option) any later version. |
| 17 | */ |
| 18 | |
| 19 | #include <linux/init.h> |
| 20 | #include <linux/module.h> |
| 21 | #include <linux/errno.h> |
| 22 | #include <asm/byteorder.h> |
| 23 | #include <linux/crypto.h> |
| 24 | #include <linux/types.h> |
| 25 | #include <crypto/serpent.h> |
| 26 | |
| 27 | /* Key is padded to the maximum of 256 bits before round key generation. |
| 28 | * Any key length <= 256 bits (32 bytes) is allowed by the algorithm. |
| 29 | */ |
| 30 | |
| 31 | #define PHI 0x9e3779b9UL |
| 32 | |
| 33 | #define keyiter(a, b, c, d, i, j) \ |
| 34 | ({ b ^= d; b ^= c; b ^= a; b ^= PHI ^ i; b = rol32(b, 11); k[j] = b; }) |
| 35 | |
| 36 | #define loadkeys(x0, x1, x2, x3, i) \ |
| 37 | ({ x0 = k[i]; x1 = k[i+1]; x2 = k[i+2]; x3 = k[i+3]; }) |
| 38 | |
| 39 | #define storekeys(x0, x1, x2, x3, i) \ |
| 40 | ({ k[i] = x0; k[i+1] = x1; k[i+2] = x2; k[i+3] = x3; }) |
| 41 | |
| 42 | #define store_and_load_keys(x0, x1, x2, x3, s, l) \ |
| 43 | ({ storekeys(x0, x1, x2, x3, s); loadkeys(x0, x1, x2, x3, l); }) |
| 44 | |
| 45 | #define K(x0, x1, x2, x3, i) ({ \ |
| 46 | x3 ^= k[4*(i)+3]; x2 ^= k[4*(i)+2]; \ |
| 47 | x1 ^= k[4*(i)+1]; x0 ^= k[4*(i)+0]; \ |
| 48 | }) |
| 49 | |
| 50 | #define LK(x0, x1, x2, x3, x4, i) ({ \ |
| 51 | x0 = rol32(x0, 13);\ |
| 52 | x2 = rol32(x2, 3); x1 ^= x0; x4 = x0 << 3; \ |
| 53 | x3 ^= x2; x1 ^= x2; \ |
| 54 | x1 = rol32(x1, 1); x3 ^= x4; \ |
| 55 | x3 = rol32(x3, 7); x4 = x1; \ |
| 56 | x0 ^= x1; x4 <<= 7; x2 ^= x3; \ |
| 57 | x0 ^= x3; x2 ^= x4; x3 ^= k[4*i+3]; \ |
| 58 | x1 ^= k[4*i+1]; x0 = rol32(x0, 5); x2 = rol32(x2, 22);\ |
| 59 | x0 ^= k[4*i+0]; x2 ^= k[4*i+2]; \ |
| 60 | }) |
| 61 | |
| 62 | #define KL(x0, x1, x2, x3, x4, i) ({ \ |
| 63 | x0 ^= k[4*i+0]; x1 ^= k[4*i+1]; x2 ^= k[4*i+2]; \ |
| 64 | x3 ^= k[4*i+3]; x0 = ror32(x0, 5); x2 = ror32(x2, 22);\ |
| 65 | x4 = x1; x2 ^= x3; x0 ^= x3; \ |
| 66 | x4 <<= 7; x0 ^= x1; x1 = ror32(x1, 1); \ |
| 67 | x2 ^= x4; x3 = ror32(x3, 7); x4 = x0 << 3; \ |
| 68 | x1 ^= x0; x3 ^= x4; x0 = ror32(x0, 13);\ |
| 69 | x1 ^= x2; x3 ^= x2; x2 = ror32(x2, 3); \ |
| 70 | }) |
| 71 | |
| 72 | #define S0(x0, x1, x2, x3, x4) ({ \ |
| 73 | x4 = x3; \ |
| 74 | x3 |= x0; x0 ^= x4; x4 ^= x2; \ |
| 75 | x4 = ~x4; x3 ^= x1; x1 &= x0; \ |
| 76 | x1 ^= x4; x2 ^= x0; x0 ^= x3; \ |
| 77 | x4 |= x0; x0 ^= x2; x2 &= x1; \ |
| 78 | x3 ^= x2; x1 = ~x1; x2 ^= x4; \ |
| 79 | x1 ^= x2; \ |
| 80 | }) |
| 81 | |
| 82 | #define S1(x0, x1, x2, x3, x4) ({ \ |
| 83 | x4 = x1; \ |
| 84 | x1 ^= x0; x0 ^= x3; x3 = ~x3; \ |
| 85 | x4 &= x1; x0 |= x1; x3 ^= x2; \ |
| 86 | x0 ^= x3; x1 ^= x3; x3 ^= x4; \ |
| 87 | x1 |= x4; x4 ^= x2; x2 &= x0; \ |
| 88 | x2 ^= x1; x1 |= x0; x0 = ~x0; \ |
| 89 | x0 ^= x2; x4 ^= x1; \ |
| 90 | }) |
| 91 | |
| 92 | #define S2(x0, x1, x2, x3, x4) ({ \ |
| 93 | x3 = ~x3; \ |
| 94 | x1 ^= x0; x4 = x0; x0 &= x2; \ |
| 95 | x0 ^= x3; x3 |= x4; x2 ^= x1; \ |
| 96 | x3 ^= x1; x1 &= x0; x0 ^= x2; \ |
| 97 | x2 &= x3; x3 |= x1; x0 = ~x0; \ |
| 98 | x3 ^= x0; x4 ^= x0; x0 ^= x2; \ |
| 99 | x1 |= x2; \ |
| 100 | }) |
| 101 | |
| 102 | #define S3(x0, x1, x2, x3, x4) ({ \ |
| 103 | x4 = x1; \ |
| 104 | x1 ^= x3; x3 |= x0; x4 &= x0; \ |
| 105 | x0 ^= x2; x2 ^= x1; x1 &= x3; \ |
| 106 | x2 ^= x3; x0 |= x4; x4 ^= x3; \ |
| 107 | x1 ^= x0; x0 &= x3; x3 &= x4; \ |
| 108 | x3 ^= x2; x4 |= x1; x2 &= x1; \ |
| 109 | x4 ^= x3; x0 ^= x3; x3 ^= x2; \ |
| 110 | }) |
| 111 | |
| 112 | #define S4(x0, x1, x2, x3, x4) ({ \ |
| 113 | x4 = x3; \ |
| 114 | x3 &= x0; x0 ^= x4; \ |
| 115 | x3 ^= x2; x2 |= x4; x0 ^= x1; \ |
| 116 | x4 ^= x3; x2 |= x0; \ |
| 117 | x2 ^= x1; x1 &= x0; \ |
| 118 | x1 ^= x4; x4 &= x2; x2 ^= x3; \ |
| 119 | x4 ^= x0; x3 |= x1; x1 = ~x1; \ |
| 120 | x3 ^= x0; \ |
| 121 | }) |
| 122 | |
| 123 | #define S5(x0, x1, x2, x3, x4) ({ \ |
| 124 | x4 = x1; x1 |= x0; \ |
| 125 | x2 ^= x1; x3 = ~x3; x4 ^= x0; \ |
| 126 | x0 ^= x2; x1 &= x4; x4 |= x3; \ |
| 127 | x4 ^= x0; x0 &= x3; x1 ^= x3; \ |
| 128 | x3 ^= x2; x0 ^= x1; x2 &= x4; \ |
| 129 | x1 ^= x2; x2 &= x0; \ |
| 130 | x3 ^= x2; \ |
| 131 | }) |
| 132 | |
| 133 | #define S6(x0, x1, x2, x3, x4) ({ \ |
| 134 | x4 = x1; \ |
| 135 | x3 ^= x0; x1 ^= x2; x2 ^= x0; \ |
| 136 | x0 &= x3; x1 |= x3; x4 = ~x4; \ |
| 137 | x0 ^= x1; x1 ^= x2; \ |
| 138 | x3 ^= x4; x4 ^= x0; x2 &= x0; \ |
| 139 | x4 ^= x1; x2 ^= x3; x3 &= x1; \ |
| 140 | x3 ^= x0; x1 ^= x2; \ |
| 141 | }) |
| 142 | |
| 143 | #define S7(x0, x1, x2, x3, x4) ({ \ |
| 144 | x1 = ~x1; \ |
| 145 | x4 = x1; x0 = ~x0; x1 &= x2; \ |
| 146 | x1 ^= x3; x3 |= x4; x4 ^= x2; \ |
| 147 | x2 ^= x3; x3 ^= x0; x0 |= x1; \ |
| 148 | x2 &= x0; x0 ^= x4; x4 ^= x3; \ |
| 149 | x3 &= x0; x4 ^= x1; \ |
| 150 | x2 ^= x4; x3 ^= x1; x4 |= x0; \ |
| 151 | x4 ^= x1; \ |
| 152 | }) |
| 153 | |
| 154 | #define SI0(x0, x1, x2, x3, x4) ({ \ |
| 155 | x4 = x3; x1 ^= x0; \ |
| 156 | x3 |= x1; x4 ^= x1; x0 = ~x0; \ |
| 157 | x2 ^= x3; x3 ^= x0; x0 &= x1; \ |
| 158 | x0 ^= x2; x2 &= x3; x3 ^= x4; \ |
| 159 | x2 ^= x3; x1 ^= x3; x3 &= x0; \ |
| 160 | x1 ^= x0; x0 ^= x2; x4 ^= x3; \ |
| 161 | }) |
| 162 | |
| 163 | #define SI1(x0, x1, x2, x3, x4) ({ \ |
| 164 | x1 ^= x3; x4 = x0; \ |
| 165 | x0 ^= x2; x2 = ~x2; x4 |= x1; \ |
| 166 | x4 ^= x3; x3 &= x1; x1 ^= x2; \ |
| 167 | x2 &= x4; x4 ^= x1; x1 |= x3; \ |
| 168 | x3 ^= x0; x2 ^= x0; x0 |= x4; \ |
| 169 | x2 ^= x4; x1 ^= x0; \ |
| 170 | x4 ^= x1; \ |
| 171 | }) |
| 172 | |
| 173 | #define SI2(x0, x1, x2, x3, x4) ({ \ |
| 174 | x2 ^= x1; x4 = x3; x3 = ~x3; \ |
| 175 | x3 |= x2; x2 ^= x4; x4 ^= x0; \ |
| 176 | x3 ^= x1; x1 |= x2; x2 ^= x0; \ |
| 177 | x1 ^= x4; x4 |= x3; x2 ^= x3; \ |
| 178 | x4 ^= x2; x2 &= x1; \ |
| 179 | x2 ^= x3; x3 ^= x4; x4 ^= x0; \ |
| 180 | }) |
| 181 | |
| 182 | #define SI3(x0, x1, x2, x3, x4) ({ \ |
| 183 | x2 ^= x1; \ |
| 184 | x4 = x1; x1 &= x2; \ |
| 185 | x1 ^= x0; x0 |= x4; x4 ^= x3; \ |
| 186 | x0 ^= x3; x3 |= x1; x1 ^= x2; \ |
| 187 | x1 ^= x3; x0 ^= x2; x2 ^= x3; \ |
| 188 | x3 &= x1; x1 ^= x0; x0 &= x2; \ |
| 189 | x4 ^= x3; x3 ^= x0; x0 ^= x1; \ |
| 190 | }) |
| 191 | |
| 192 | #define SI4(x0, x1, x2, x3, x4) ({ \ |
| 193 | x2 ^= x3; x4 = x0; x0 &= x1; \ |
| 194 | x0 ^= x2; x2 |= x3; x4 = ~x4; \ |
| 195 | x1 ^= x0; x0 ^= x2; x2 &= x4; \ |
| 196 | x2 ^= x0; x0 |= x4; \ |
| 197 | x0 ^= x3; x3 &= x2; \ |
| 198 | x4 ^= x3; x3 ^= x1; x1 &= x0; \ |
| 199 | x4 ^= x1; x0 ^= x3; \ |
| 200 | }) |
| 201 | |
| 202 | #define SI5(x0, x1, x2, x3, x4) ({ \ |
| 203 | x4 = x1; x1 |= x2; \ |
| 204 | x2 ^= x4; x1 ^= x3; x3 &= x4; \ |
| 205 | x2 ^= x3; x3 |= x0; x0 = ~x0; \ |
| 206 | x3 ^= x2; x2 |= x0; x4 ^= x1; \ |
| 207 | x2 ^= x4; x4 &= x0; x0 ^= x1; \ |
| 208 | x1 ^= x3; x0 &= x2; x2 ^= x3; \ |
| 209 | x0 ^= x2; x2 ^= x4; x4 ^= x3; \ |
| 210 | }) |
| 211 | |
| 212 | #define SI6(x0, x1, x2, x3, x4) ({ \ |
| 213 | x0 ^= x2; \ |
| 214 | x4 = x0; x0 &= x3; x2 ^= x3; \ |
| 215 | x0 ^= x2; x3 ^= x1; x2 |= x4; \ |
| 216 | x2 ^= x3; x3 &= x0; x0 = ~x0; \ |
| 217 | x3 ^= x1; x1 &= x2; x4 ^= x0; \ |
| 218 | x3 ^= x4; x4 ^= x2; x0 ^= x1; \ |
| 219 | x2 ^= x0; \ |
| 220 | }) |
| 221 | |
| 222 | #define SI7(x0, x1, x2, x3, x4) ({ \ |
| 223 | x4 = x3; x3 &= x0; x0 ^= x2; \ |
| 224 | x2 |= x4; x4 ^= x1; x0 = ~x0; \ |
| 225 | x1 |= x3; x4 ^= x0; x0 &= x2; \ |
| 226 | x0 ^= x1; x1 &= x2; x3 ^= x2; \ |
| 227 | x4 ^= x3; x2 &= x3; x3 |= x0; \ |
| 228 | x1 ^= x4; x3 ^= x4; x4 &= x0; \ |
| 229 | x4 ^= x2; \ |
| 230 | }) |
| 231 | |
| 232 | int __serpent_setkey(struct serpent_ctx *ctx, const u8 *key, |
| 233 | unsigned int keylen) |
| 234 | { |
| 235 | u32 *k = ctx->expkey; |
| 236 | u8 *k8 = (u8 *)k; |
| 237 | u32 r0, r1, r2, r3, r4; |
| 238 | int i; |
| 239 | |
| 240 | /* Copy key, add padding */ |
| 241 | |
| 242 | for (i = 0; i < keylen; ++i) |
| 243 | k8[i] = key[i]; |
| 244 | if (i < SERPENT_MAX_KEY_SIZE) |
| 245 | k8[i++] = 1; |
| 246 | while (i < SERPENT_MAX_KEY_SIZE) |
| 247 | k8[i++] = 0; |
| 248 | |
| 249 | /* Expand key using polynomial */ |
| 250 | |
| 251 | r0 = le32_to_cpu(k[3]); |
| 252 | r1 = le32_to_cpu(k[4]); |
| 253 | r2 = le32_to_cpu(k[5]); |
| 254 | r3 = le32_to_cpu(k[6]); |
| 255 | r4 = le32_to_cpu(k[7]); |
| 256 | |
| 257 | keyiter(le32_to_cpu(k[0]), r0, r4, r2, 0, 0); |
| 258 | keyiter(le32_to_cpu(k[1]), r1, r0, r3, 1, 1); |
| 259 | keyiter(le32_to_cpu(k[2]), r2, r1, r4, 2, 2); |
| 260 | keyiter(le32_to_cpu(k[3]), r3, r2, r0, 3, 3); |
| 261 | keyiter(le32_to_cpu(k[4]), r4, r3, r1, 4, 4); |
| 262 | keyiter(le32_to_cpu(k[5]), r0, r4, r2, 5, 5); |
| 263 | keyiter(le32_to_cpu(k[6]), r1, r0, r3, 6, 6); |
| 264 | keyiter(le32_to_cpu(k[7]), r2, r1, r4, 7, 7); |
| 265 | |
| 266 | keyiter(k[0], r3, r2, r0, 8, 8); |
| 267 | keyiter(k[1], r4, r3, r1, 9, 9); |
| 268 | keyiter(k[2], r0, r4, r2, 10, 10); |
| 269 | keyiter(k[3], r1, r0, r3, 11, 11); |
| 270 | keyiter(k[4], r2, r1, r4, 12, 12); |
| 271 | keyiter(k[5], r3, r2, r0, 13, 13); |
| 272 | keyiter(k[6], r4, r3, r1, 14, 14); |
| 273 | keyiter(k[7], r0, r4, r2, 15, 15); |
| 274 | keyiter(k[8], r1, r0, r3, 16, 16); |
| 275 | keyiter(k[9], r2, r1, r4, 17, 17); |
| 276 | keyiter(k[10], r3, r2, r0, 18, 18); |
| 277 | keyiter(k[11], r4, r3, r1, 19, 19); |
| 278 | keyiter(k[12], r0, r4, r2, 20, 20); |
| 279 | keyiter(k[13], r1, r0, r3, 21, 21); |
| 280 | keyiter(k[14], r2, r1, r4, 22, 22); |
| 281 | keyiter(k[15], r3, r2, r0, 23, 23); |
| 282 | keyiter(k[16], r4, r3, r1, 24, 24); |
| 283 | keyiter(k[17], r0, r4, r2, 25, 25); |
| 284 | keyiter(k[18], r1, r0, r3, 26, 26); |
| 285 | keyiter(k[19], r2, r1, r4, 27, 27); |
| 286 | keyiter(k[20], r3, r2, r0, 28, 28); |
| 287 | keyiter(k[21], r4, r3, r1, 29, 29); |
| 288 | keyiter(k[22], r0, r4, r2, 30, 30); |
| 289 | keyiter(k[23], r1, r0, r3, 31, 31); |
| 290 | |
| 291 | k += 50; |
| 292 | |
| 293 | keyiter(k[-26], r2, r1, r4, 32, -18); |
| 294 | keyiter(k[-25], r3, r2, r0, 33, -17); |
| 295 | keyiter(k[-24], r4, r3, r1, 34, -16); |
| 296 | keyiter(k[-23], r0, r4, r2, 35, -15); |
| 297 | keyiter(k[-22], r1, r0, r3, 36, -14); |
| 298 | keyiter(k[-21], r2, r1, r4, 37, -13); |
| 299 | keyiter(k[-20], r3, r2, r0, 38, -12); |
| 300 | keyiter(k[-19], r4, r3, r1, 39, -11); |
| 301 | keyiter(k[-18], r0, r4, r2, 40, -10); |
| 302 | keyiter(k[-17], r1, r0, r3, 41, -9); |
| 303 | keyiter(k[-16], r2, r1, r4, 42, -8); |
| 304 | keyiter(k[-15], r3, r2, r0, 43, -7); |
| 305 | keyiter(k[-14], r4, r3, r1, 44, -6); |
| 306 | keyiter(k[-13], r0, r4, r2, 45, -5); |
| 307 | keyiter(k[-12], r1, r0, r3, 46, -4); |
| 308 | keyiter(k[-11], r2, r1, r4, 47, -3); |
| 309 | keyiter(k[-10], r3, r2, r0, 48, -2); |
| 310 | keyiter(k[-9], r4, r3, r1, 49, -1); |
| 311 | keyiter(k[-8], r0, r4, r2, 50, 0); |
| 312 | keyiter(k[-7], r1, r0, r3, 51, 1); |
| 313 | keyiter(k[-6], r2, r1, r4, 52, 2); |
| 314 | keyiter(k[-5], r3, r2, r0, 53, 3); |
| 315 | keyiter(k[-4], r4, r3, r1, 54, 4); |
| 316 | keyiter(k[-3], r0, r4, r2, 55, 5); |
| 317 | keyiter(k[-2], r1, r0, r3, 56, 6); |
| 318 | keyiter(k[-1], r2, r1, r4, 57, 7); |
| 319 | keyiter(k[0], r3, r2, r0, 58, 8); |
| 320 | keyiter(k[1], r4, r3, r1, 59, 9); |
| 321 | keyiter(k[2], r0, r4, r2, 60, 10); |
| 322 | keyiter(k[3], r1, r0, r3, 61, 11); |
| 323 | keyiter(k[4], r2, r1, r4, 62, 12); |
| 324 | keyiter(k[5], r3, r2, r0, 63, 13); |
| 325 | keyiter(k[6], r4, r3, r1, 64, 14); |
| 326 | keyiter(k[7], r0, r4, r2, 65, 15); |
| 327 | keyiter(k[8], r1, r0, r3, 66, 16); |
| 328 | keyiter(k[9], r2, r1, r4, 67, 17); |
| 329 | keyiter(k[10], r3, r2, r0, 68, 18); |
| 330 | keyiter(k[11], r4, r3, r1, 69, 19); |
| 331 | keyiter(k[12], r0, r4, r2, 70, 20); |
| 332 | keyiter(k[13], r1, r0, r3, 71, 21); |
| 333 | keyiter(k[14], r2, r1, r4, 72, 22); |
| 334 | keyiter(k[15], r3, r2, r0, 73, 23); |
| 335 | keyiter(k[16], r4, r3, r1, 74, 24); |
| 336 | keyiter(k[17], r0, r4, r2, 75, 25); |
| 337 | keyiter(k[18], r1, r0, r3, 76, 26); |
| 338 | keyiter(k[19], r2, r1, r4, 77, 27); |
| 339 | keyiter(k[20], r3, r2, r0, 78, 28); |
| 340 | keyiter(k[21], r4, r3, r1, 79, 29); |
| 341 | keyiter(k[22], r0, r4, r2, 80, 30); |
| 342 | keyiter(k[23], r1, r0, r3, 81, 31); |
| 343 | |
| 344 | k += 50; |
| 345 | |
| 346 | keyiter(k[-26], r2, r1, r4, 82, -18); |
| 347 | keyiter(k[-25], r3, r2, r0, 83, -17); |
| 348 | keyiter(k[-24], r4, r3, r1, 84, -16); |
| 349 | keyiter(k[-23], r0, r4, r2, 85, -15); |
| 350 | keyiter(k[-22], r1, r0, r3, 86, -14); |
| 351 | keyiter(k[-21], r2, r1, r4, 87, -13); |
| 352 | keyiter(k[-20], r3, r2, r0, 88, -12); |
| 353 | keyiter(k[-19], r4, r3, r1, 89, -11); |
| 354 | keyiter(k[-18], r0, r4, r2, 90, -10); |
| 355 | keyiter(k[-17], r1, r0, r3, 91, -9); |
| 356 | keyiter(k[-16], r2, r1, r4, 92, -8); |
| 357 | keyiter(k[-15], r3, r2, r0, 93, -7); |
| 358 | keyiter(k[-14], r4, r3, r1, 94, -6); |
| 359 | keyiter(k[-13], r0, r4, r2, 95, -5); |
| 360 | keyiter(k[-12], r1, r0, r3, 96, -4); |
| 361 | keyiter(k[-11], r2, r1, r4, 97, -3); |
| 362 | keyiter(k[-10], r3, r2, r0, 98, -2); |
| 363 | keyiter(k[-9], r4, r3, r1, 99, -1); |
| 364 | keyiter(k[-8], r0, r4, r2, 100, 0); |
| 365 | keyiter(k[-7], r1, r0, r3, 101, 1); |
| 366 | keyiter(k[-6], r2, r1, r4, 102, 2); |
| 367 | keyiter(k[-5], r3, r2, r0, 103, 3); |
| 368 | keyiter(k[-4], r4, r3, r1, 104, 4); |
| 369 | keyiter(k[-3], r0, r4, r2, 105, 5); |
| 370 | keyiter(k[-2], r1, r0, r3, 106, 6); |
| 371 | keyiter(k[-1], r2, r1, r4, 107, 7); |
| 372 | keyiter(k[0], r3, r2, r0, 108, 8); |
| 373 | keyiter(k[1], r4, r3, r1, 109, 9); |
| 374 | keyiter(k[2], r0, r4, r2, 110, 10); |
| 375 | keyiter(k[3], r1, r0, r3, 111, 11); |
| 376 | keyiter(k[4], r2, r1, r4, 112, 12); |
| 377 | keyiter(k[5], r3, r2, r0, 113, 13); |
| 378 | keyiter(k[6], r4, r3, r1, 114, 14); |
| 379 | keyiter(k[7], r0, r4, r2, 115, 15); |
| 380 | keyiter(k[8], r1, r0, r3, 116, 16); |
| 381 | keyiter(k[9], r2, r1, r4, 117, 17); |
| 382 | keyiter(k[10], r3, r2, r0, 118, 18); |
| 383 | keyiter(k[11], r4, r3, r1, 119, 19); |
| 384 | keyiter(k[12], r0, r4, r2, 120, 20); |
| 385 | keyiter(k[13], r1, r0, r3, 121, 21); |
| 386 | keyiter(k[14], r2, r1, r4, 122, 22); |
| 387 | keyiter(k[15], r3, r2, r0, 123, 23); |
| 388 | keyiter(k[16], r4, r3, r1, 124, 24); |
| 389 | keyiter(k[17], r0, r4, r2, 125, 25); |
| 390 | keyiter(k[18], r1, r0, r3, 126, 26); |
| 391 | keyiter(k[19], r2, r1, r4, 127, 27); |
| 392 | keyiter(k[20], r3, r2, r0, 128, 28); |
| 393 | keyiter(k[21], r4, r3, r1, 129, 29); |
| 394 | keyiter(k[22], r0, r4, r2, 130, 30); |
| 395 | keyiter(k[23], r1, r0, r3, 131, 31); |
| 396 | |
| 397 | /* Apply S-boxes */ |
| 398 | |
| 399 | S3(r3, r4, r0, r1, r2); store_and_load_keys(r1, r2, r4, r3, 28, 24); |
| 400 | S4(r1, r2, r4, r3, r0); store_and_load_keys(r2, r4, r3, r0, 24, 20); |
| 401 | S5(r2, r4, r3, r0, r1); store_and_load_keys(r1, r2, r4, r0, 20, 16); |
| 402 | S6(r1, r2, r4, r0, r3); store_and_load_keys(r4, r3, r2, r0, 16, 12); |
| 403 | S7(r4, r3, r2, r0, r1); store_and_load_keys(r1, r2, r0, r4, 12, 8); |
| 404 | S0(r1, r2, r0, r4, r3); store_and_load_keys(r0, r2, r4, r1, 8, 4); |
| 405 | S1(r0, r2, r4, r1, r3); store_and_load_keys(r3, r4, r1, r0, 4, 0); |
| 406 | S2(r3, r4, r1, r0, r2); store_and_load_keys(r2, r4, r3, r0, 0, -4); |
| 407 | S3(r2, r4, r3, r0, r1); store_and_load_keys(r0, r1, r4, r2, -4, -8); |
| 408 | S4(r0, r1, r4, r2, r3); store_and_load_keys(r1, r4, r2, r3, -8, -12); |
| 409 | S5(r1, r4, r2, r3, r0); store_and_load_keys(r0, r1, r4, r3, -12, -16); |
| 410 | S6(r0, r1, r4, r3, r2); store_and_load_keys(r4, r2, r1, r3, -16, -20); |
| 411 | S7(r4, r2, r1, r3, r0); store_and_load_keys(r0, r1, r3, r4, -20, -24); |
| 412 | S0(r0, r1, r3, r4, r2); store_and_load_keys(r3, r1, r4, r0, -24, -28); |
| 413 | k -= 50; |
| 414 | S1(r3, r1, r4, r0, r2); store_and_load_keys(r2, r4, r0, r3, 22, 18); |
| 415 | S2(r2, r4, r0, r3, r1); store_and_load_keys(r1, r4, r2, r3, 18, 14); |
| 416 | S3(r1, r4, r2, r3, r0); store_and_load_keys(r3, r0, r4, r1, 14, 10); |
| 417 | S4(r3, r0, r4, r1, r2); store_and_load_keys(r0, r4, r1, r2, 10, 6); |
| 418 | S5(r0, r4, r1, r2, r3); store_and_load_keys(r3, r0, r4, r2, 6, 2); |
| 419 | S6(r3, r0, r4, r2, r1); store_and_load_keys(r4, r1, r0, r2, 2, -2); |
| 420 | S7(r4, r1, r0, r2, r3); store_and_load_keys(r3, r0, r2, r4, -2, -6); |
| 421 | S0(r3, r0, r2, r4, r1); store_and_load_keys(r2, r0, r4, r3, -6, -10); |
| 422 | S1(r2, r0, r4, r3, r1); store_and_load_keys(r1, r4, r3, r2, -10, -14); |
| 423 | S2(r1, r4, r3, r2, r0); store_and_load_keys(r0, r4, r1, r2, -14, -18); |
| 424 | S3(r0, r4, r1, r2, r3); store_and_load_keys(r2, r3, r4, r0, -18, -22); |
| 425 | k -= 50; |
| 426 | S4(r2, r3, r4, r0, r1); store_and_load_keys(r3, r4, r0, r1, 28, 24); |
| 427 | S5(r3, r4, r0, r1, r2); store_and_load_keys(r2, r3, r4, r1, 24, 20); |
| 428 | S6(r2, r3, r4, r1, r0); store_and_load_keys(r4, r0, r3, r1, 20, 16); |
| 429 | S7(r4, r0, r3, r1, r2); store_and_load_keys(r2, r3, r1, r4, 16, 12); |
| 430 | S0(r2, r3, r1, r4, r0); store_and_load_keys(r1, r3, r4, r2, 12, 8); |
| 431 | S1(r1, r3, r4, r2, r0); store_and_load_keys(r0, r4, r2, r1, 8, 4); |
| 432 | S2(r0, r4, r2, r1, r3); store_and_load_keys(r3, r4, r0, r1, 4, 0); |
| 433 | S3(r3, r4, r0, r1, r2); storekeys(r1, r2, r4, r3, 0); |
| 434 | |
| 435 | return 0; |
| 436 | } |
| 437 | EXPORT_SYMBOL_GPL(__serpent_setkey); |
| 438 | |
| 439 | int serpent_setkey(struct crypto_tfm *tfm, const u8 *key, unsigned int keylen) |
| 440 | { |
| 441 | return __serpent_setkey(crypto_tfm_ctx(tfm), key, keylen); |
| 442 | } |
| 443 | EXPORT_SYMBOL_GPL(serpent_setkey); |
| 444 | |
| 445 | void __serpent_encrypt(struct serpent_ctx *ctx, u8 *dst, const u8 *src) |
| 446 | { |
| 447 | const u32 *k = ctx->expkey; |
| 448 | const __le32 *s = (const __le32 *)src; |
| 449 | __le32 *d = (__le32 *)dst; |
| 450 | u32 r0, r1, r2, r3, r4; |
| 451 | |
| 452 | /* |
| 453 | * Note: The conversions between u8* and u32* might cause trouble |
| 454 | * on architectures with stricter alignment rules than x86 |
| 455 | */ |
| 456 | |
| 457 | r0 = le32_to_cpu(s[0]); |
| 458 | r1 = le32_to_cpu(s[1]); |
| 459 | r2 = le32_to_cpu(s[2]); |
| 460 | r3 = le32_to_cpu(s[3]); |
| 461 | |
| 462 | K(r0, r1, r2, r3, 0); |
| 463 | S0(r0, r1, r2, r3, r4); LK(r2, r1, r3, r0, r4, 1); |
| 464 | S1(r2, r1, r3, r0, r4); LK(r4, r3, r0, r2, r1, 2); |
| 465 | S2(r4, r3, r0, r2, r1); LK(r1, r3, r4, r2, r0, 3); |
| 466 | S3(r1, r3, r4, r2, r0); LK(r2, r0, r3, r1, r4, 4); |
| 467 | S4(r2, r0, r3, r1, r4); LK(r0, r3, r1, r4, r2, 5); |
| 468 | S5(r0, r3, r1, r4, r2); LK(r2, r0, r3, r4, r1, 6); |
| 469 | S6(r2, r0, r3, r4, r1); LK(r3, r1, r0, r4, r2, 7); |
| 470 | S7(r3, r1, r0, r4, r2); LK(r2, r0, r4, r3, r1, 8); |
| 471 | S0(r2, r0, r4, r3, r1); LK(r4, r0, r3, r2, r1, 9); |
| 472 | S1(r4, r0, r3, r2, r1); LK(r1, r3, r2, r4, r0, 10); |
| 473 | S2(r1, r3, r2, r4, r0); LK(r0, r3, r1, r4, r2, 11); |
| 474 | S3(r0, r3, r1, r4, r2); LK(r4, r2, r3, r0, r1, 12); |
| 475 | S4(r4, r2, r3, r0, r1); LK(r2, r3, r0, r1, r4, 13); |
| 476 | S5(r2, r3, r0, r1, r4); LK(r4, r2, r3, r1, r0, 14); |
| 477 | S6(r4, r2, r3, r1, r0); LK(r3, r0, r2, r1, r4, 15); |
| 478 | S7(r3, r0, r2, r1, r4); LK(r4, r2, r1, r3, r0, 16); |
| 479 | S0(r4, r2, r1, r3, r0); LK(r1, r2, r3, r4, r0, 17); |
| 480 | S1(r1, r2, r3, r4, r0); LK(r0, r3, r4, r1, r2, 18); |
| 481 | S2(r0, r3, r4, r1, r2); LK(r2, r3, r0, r1, r4, 19); |
| 482 | S3(r2, r3, r0, r1, r4); LK(r1, r4, r3, r2, r0, 20); |
| 483 | S4(r1, r4, r3, r2, r0); LK(r4, r3, r2, r0, r1, 21); |
| 484 | S5(r4, r3, r2, r0, r1); LK(r1, r4, r3, r0, r2, 22); |
| 485 | S6(r1, r4, r3, r0, r2); LK(r3, r2, r4, r0, r1, 23); |
| 486 | S7(r3, r2, r4, r0, r1); LK(r1, r4, r0, r3, r2, 24); |
| 487 | S0(r1, r4, r0, r3, r2); LK(r0, r4, r3, r1, r2, 25); |
| 488 | S1(r0, r4, r3, r1, r2); LK(r2, r3, r1, r0, r4, 26); |
| 489 | S2(r2, r3, r1, r0, r4); LK(r4, r3, r2, r0, r1, 27); |
| 490 | S3(r4, r3, r2, r0, r1); LK(r0, r1, r3, r4, r2, 28); |
| 491 | S4(r0, r1, r3, r4, r2); LK(r1, r3, r4, r2, r0, 29); |
| 492 | S5(r1, r3, r4, r2, r0); LK(r0, r1, r3, r2, r4, 30); |
| 493 | S6(r0, r1, r3, r2, r4); LK(r3, r4, r1, r2, r0, 31); |
| 494 | S7(r3, r4, r1, r2, r0); K(r0, r1, r2, r3, 32); |
| 495 | |
| 496 | d[0] = cpu_to_le32(r0); |
| 497 | d[1] = cpu_to_le32(r1); |
| 498 | d[2] = cpu_to_le32(r2); |
| 499 | d[3] = cpu_to_le32(r3); |
| 500 | } |
| 501 | EXPORT_SYMBOL_GPL(__serpent_encrypt); |
| 502 | |
| 503 | static void serpent_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src) |
| 504 | { |
| 505 | struct serpent_ctx *ctx = crypto_tfm_ctx(tfm); |
| 506 | |
| 507 | __serpent_encrypt(ctx, dst, src); |
| 508 | } |
| 509 | |
| 510 | void __serpent_decrypt(struct serpent_ctx *ctx, u8 *dst, const u8 *src) |
| 511 | { |
| 512 | const u32 *k = ctx->expkey; |
| 513 | const __le32 *s = (const __le32 *)src; |
| 514 | __le32 *d = (__le32 *)dst; |
| 515 | u32 r0, r1, r2, r3, r4; |
| 516 | |
| 517 | r0 = le32_to_cpu(s[0]); |
| 518 | r1 = le32_to_cpu(s[1]); |
| 519 | r2 = le32_to_cpu(s[2]); |
| 520 | r3 = le32_to_cpu(s[3]); |
| 521 | |
| 522 | K(r0, r1, r2, r3, 32); |
| 523 | SI7(r0, r1, r2, r3, r4); KL(r1, r3, r0, r4, r2, 31); |
| 524 | SI6(r1, r3, r0, r4, r2); KL(r0, r2, r4, r1, r3, 30); |
| 525 | SI5(r0, r2, r4, r1, r3); KL(r2, r3, r0, r4, r1, 29); |
| 526 | SI4(r2, r3, r0, r4, r1); KL(r2, r0, r1, r4, r3, 28); |
| 527 | SI3(r2, r0, r1, r4, r3); KL(r1, r2, r3, r4, r0, 27); |
| 528 | SI2(r1, r2, r3, r4, r0); KL(r2, r0, r4, r3, r1, 26); |
| 529 | SI1(r2, r0, r4, r3, r1); KL(r1, r0, r4, r3, r2, 25); |
| 530 | SI0(r1, r0, r4, r3, r2); KL(r4, r2, r0, r1, r3, 24); |
| 531 | SI7(r4, r2, r0, r1, r3); KL(r2, r1, r4, r3, r0, 23); |
| 532 | SI6(r2, r1, r4, r3, r0); KL(r4, r0, r3, r2, r1, 22); |
| 533 | SI5(r4, r0, r3, r2, r1); KL(r0, r1, r4, r3, r2, 21); |
| 534 | SI4(r0, r1, r4, r3, r2); KL(r0, r4, r2, r3, r1, 20); |
| 535 | SI3(r0, r4, r2, r3, r1); KL(r2, r0, r1, r3, r4, 19); |
| 536 | SI2(r2, r0, r1, r3, r4); KL(r0, r4, r3, r1, r2, 18); |
| 537 | SI1(r0, r4, r3, r1, r2); KL(r2, r4, r3, r1, r0, 17); |
| 538 | SI0(r2, r4, r3, r1, r0); KL(r3, r0, r4, r2, r1, 16); |
| 539 | SI7(r3, r0, r4, r2, r1); KL(r0, r2, r3, r1, r4, 15); |
| 540 | SI6(r0, r2, r3, r1, r4); KL(r3, r4, r1, r0, r2, 14); |
| 541 | SI5(r3, r4, r1, r0, r2); KL(r4, r2, r3, r1, r0, 13); |
| 542 | SI4(r4, r2, r3, r1, r0); KL(r4, r3, r0, r1, r2, 12); |
| 543 | SI3(r4, r3, r0, r1, r2); KL(r0, r4, r2, r1, r3, 11); |
| 544 | SI2(r0, r4, r2, r1, r3); KL(r4, r3, r1, r2, r0, 10); |
| 545 | SI1(r4, r3, r1, r2, r0); KL(r0, r3, r1, r2, r4, 9); |
| 546 | SI0(r0, r3, r1, r2, r4); KL(r1, r4, r3, r0, r2, 8); |
| 547 | SI7(r1, r4, r3, r0, r2); KL(r4, r0, r1, r2, r3, 7); |
| 548 | SI6(r4, r0, r1, r2, r3); KL(r1, r3, r2, r4, r0, 6); |
| 549 | SI5(r1, r3, r2, r4, r0); KL(r3, r0, r1, r2, r4, 5); |
| 550 | SI4(r3, r0, r1, r2, r4); KL(r3, r1, r4, r2, r0, 4); |
| 551 | SI3(r3, r1, r4, r2, r0); KL(r4, r3, r0, r2, r1, 3); |
| 552 | SI2(r4, r3, r0, r2, r1); KL(r3, r1, r2, r0, r4, 2); |
| 553 | SI1(r3, r1, r2, r0, r4); KL(r4, r1, r2, r0, r3, 1); |
| 554 | SI0(r4, r1, r2, r0, r3); K(r2, r3, r1, r4, 0); |
| 555 | |
| 556 | d[0] = cpu_to_le32(r2); |
| 557 | d[1] = cpu_to_le32(r3); |
| 558 | d[2] = cpu_to_le32(r1); |
| 559 | d[3] = cpu_to_le32(r4); |
| 560 | } |
| 561 | EXPORT_SYMBOL_GPL(__serpent_decrypt); |
| 562 | |
| 563 | static void serpent_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src) |
| 564 | { |
| 565 | struct serpent_ctx *ctx = crypto_tfm_ctx(tfm); |
| 566 | |
| 567 | __serpent_decrypt(ctx, dst, src); |
| 568 | } |
| 569 | |
| 570 | static int tnepres_setkey(struct crypto_tfm *tfm, const u8 *key, |
| 571 | unsigned int keylen) |
| 572 | { |
| 573 | u8 rev_key[SERPENT_MAX_KEY_SIZE]; |
| 574 | int i; |
| 575 | |
| 576 | for (i = 0; i < keylen; ++i) |
| 577 | rev_key[keylen - i - 1] = key[i]; |
| 578 | |
| 579 | return serpent_setkey(tfm, rev_key, keylen); |
| 580 | } |
| 581 | |
| 582 | static void tnepres_encrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src) |
| 583 | { |
| 584 | const u32 * const s = (const u32 * const)src; |
| 585 | u32 * const d = (u32 * const)dst; |
| 586 | |
| 587 | u32 rs[4], rd[4]; |
| 588 | |
| 589 | rs[0] = swab32(s[3]); |
| 590 | rs[1] = swab32(s[2]); |
| 591 | rs[2] = swab32(s[1]); |
| 592 | rs[3] = swab32(s[0]); |
| 593 | |
| 594 | serpent_encrypt(tfm, (u8 *)rd, (u8 *)rs); |
| 595 | |
| 596 | d[0] = swab32(rd[3]); |
| 597 | d[1] = swab32(rd[2]); |
| 598 | d[2] = swab32(rd[1]); |
| 599 | d[3] = swab32(rd[0]); |
| 600 | } |
| 601 | |
| 602 | static void tnepres_decrypt(struct crypto_tfm *tfm, u8 *dst, const u8 *src) |
| 603 | { |
| 604 | const u32 * const s = (const u32 * const)src; |
| 605 | u32 * const d = (u32 * const)dst; |
| 606 | |
| 607 | u32 rs[4], rd[4]; |
| 608 | |
| 609 | rs[0] = swab32(s[3]); |
| 610 | rs[1] = swab32(s[2]); |
| 611 | rs[2] = swab32(s[1]); |
| 612 | rs[3] = swab32(s[0]); |
| 613 | |
| 614 | serpent_decrypt(tfm, (u8 *)rd, (u8 *)rs); |
| 615 | |
| 616 | d[0] = swab32(rd[3]); |
| 617 | d[1] = swab32(rd[2]); |
| 618 | d[2] = swab32(rd[1]); |
| 619 | d[3] = swab32(rd[0]); |
| 620 | } |
| 621 | |
| 622 | static struct crypto_alg srp_algs[2] = { { |
| 623 | .cra_name = "serpent", |
| 624 | .cra_driver_name = "serpent-generic", |
| 625 | .cra_priority = 100, |
| 626 | .cra_flags = CRYPTO_ALG_TYPE_CIPHER, |
| 627 | .cra_blocksize = SERPENT_BLOCK_SIZE, |
| 628 | .cra_ctxsize = sizeof(struct serpent_ctx), |
| 629 | .cra_alignmask = 3, |
| 630 | .cra_module = THIS_MODULE, |
| 631 | .cra_u = { .cipher = { |
| 632 | .cia_min_keysize = SERPENT_MIN_KEY_SIZE, |
| 633 | .cia_max_keysize = SERPENT_MAX_KEY_SIZE, |
| 634 | .cia_setkey = serpent_setkey, |
| 635 | .cia_encrypt = serpent_encrypt, |
| 636 | .cia_decrypt = serpent_decrypt } } |
| 637 | }, { |
| 638 | .cra_name = "tnepres", |
| 639 | .cra_flags = CRYPTO_ALG_TYPE_CIPHER, |
| 640 | .cra_blocksize = SERPENT_BLOCK_SIZE, |
| 641 | .cra_ctxsize = sizeof(struct serpent_ctx), |
| 642 | .cra_alignmask = 3, |
| 643 | .cra_module = THIS_MODULE, |
| 644 | .cra_u = { .cipher = { |
| 645 | .cia_min_keysize = SERPENT_MIN_KEY_SIZE, |
| 646 | .cia_max_keysize = SERPENT_MAX_KEY_SIZE, |
| 647 | .cia_setkey = tnepres_setkey, |
| 648 | .cia_encrypt = tnepres_encrypt, |
| 649 | .cia_decrypt = tnepres_decrypt } } |
| 650 | } }; |
| 651 | |
| 652 | static int __init serpent_mod_init(void) |
| 653 | { |
| 654 | return crypto_register_algs(srp_algs, ARRAY_SIZE(srp_algs)); |
| 655 | } |
| 656 | |
| 657 | static void __exit serpent_mod_fini(void) |
| 658 | { |
| 659 | crypto_unregister_algs(srp_algs, ARRAY_SIZE(srp_algs)); |
| 660 | } |
| 661 | |
| 662 | module_init(serpent_mod_init); |
| 663 | module_exit(serpent_mod_fini); |
| 664 | |
| 665 | MODULE_LICENSE("GPL"); |
| 666 | MODULE_DESCRIPTION("Serpent and tnepres (kerneli compatible serpent reversed) Cipher Algorithm"); |
| 667 | MODULE_AUTHOR("Dag Arne Osvik <osvik@ii.uib.no>"); |
| 668 | MODULE_ALIAS_CRYPTO("tnepres"); |
| 669 | MODULE_ALIAS_CRYPTO("serpent"); |
| 670 | MODULE_ALIAS_CRYPTO("serpent-generic"); |