/openswan-2.6.38/lib/libcrypto/libserpent/serpent.c

# · C · 995 lines · 749 code · 154 blank · 92 comment · 10 complexity · 3f3b22b51603c861a1c8f30e8b31de2d MD5 · raw file

  1. /* Optimized implementation of the Serpent AES candidate algorithm
  2. * Designed by Anderson, Biham and Knudsen and Implemented by
  3. * Gisle S?lensminde 2000.
  4. *
  5. * The implementation is based on the pentium optimised sboxes of
  6. * Dag Arne Osvik. Even these sboxes are designed to be optimal for x86
  7. * processors they are efficient on other processors as well, but the speedup
  8. * isn't so impressive compared to other implementations.
  9. *
  10. * This program is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU Library General Public License
  12. * as published by the Free Software Foundation; either version 2 of
  13. * the License, or (at your option) any later version.
  14. */
  15. #ifdef __KERNEL__
  16. #include <linux/init.h>
  17. #include <linux/types.h>
  18. #include <endian.h>
  19. #else
  20. #include <sys/types.h>
  21. #include "oswendian.h"
  22. #endif
  23. #include "serpent.h"
  24. #define rotl(reg, val) ((reg << val) | (reg >> (32 - val)))
  25. #define rotr(reg, val) ((reg >> val) | (reg << (32 - val)))
  26. #ifdef __cpu_to_be32
  27. #define BLOCK_SWAP
  28. #define io_swap(x) __cpu_to_be32(x)
  29. #else
  30. #undef BLOCK_SWAP
  31. #endif
  32. /* The sbox functions. The first four parameters is the input bits, and
  33. * the last is a tempoary. These parameters are also used for output, but
  34. * the bit order is permuted. The output bit order from S0 is
  35. * (1 4 2 0 3), where 3 is the (now useless) tempoary.
  36. */
  37. #define S0(r0,r1,r2,r3,r4) \
  38. r3 = r3 ^ r0; \
  39. r4 = r1; \
  40. r1 = r1 & r3; \
  41. r4 = r4 ^ r2; \
  42. r1 = r1 ^ r0; \
  43. r0 = r0 | r3; \
  44. r0 = r0 ^ r4; \
  45. r4 = r4 ^ r3; \
  46. r3 = r3 ^ r2; \
  47. r2 = r2 | r1; \
  48. r2 = r2 ^ r4; \
  49. r4 = -1 ^ r4; \
  50. r4 = r4 | r1; \
  51. r1 = r1 ^ r3; \
  52. r1 = r1 ^ r4; \
  53. r3 = r3 | r0; \
  54. r1 = r1 ^ r3; \
  55. r4 = r4 ^ r3;
  56. #define S1(r0,r1,r2,r3,r4) \
  57. r1 = -1 ^ r1; \
  58. r4 = r0; \
  59. r0 = r0 ^ r1; \
  60. r4 = r4 | r1; \
  61. r4 = r4 ^ r3; \
  62. r3 = r3 & r0; \
  63. r2 = r2 ^ r4; \
  64. r3 = r3 ^ r1; \
  65. r3 = r3 | r2; \
  66. r0 = r0 ^ r4; \
  67. r3 = r3 ^ r0; \
  68. r1 = r1 & r2; \
  69. r0 = r0 | r1; \
  70. r1 = r1 ^ r4; \
  71. r0 = r0 ^ r2; \
  72. r4 = r4 | r3; \
  73. r0 = r0 ^ r4; \
  74. r4 = -1 ^ r4; \
  75. r1 = r1 ^ r3; \
  76. r4 = r4 & r2; \
  77. r1 = -1 ^ r1; \
  78. r4 = r4 ^ r0; \
  79. r1 = r1 ^ r4;
  80. #define S2(r0,r1,r2,r3,r4) \
  81. r4 = r0; \
  82. r0 = r0 & r2; \
  83. r0 = r0 ^ r3; \
  84. r2 = r2 ^ r1; \
  85. r2 = r2 ^ r0; \
  86. r3 = r3 | r4; \
  87. r3 = r3 ^ r1; \
  88. r4 = r4 ^ r2; \
  89. r1 = r3; \
  90. r3 = r3 | r4; \
  91. r3 = r3 ^ r0; \
  92. r0 = r0 & r1; \
  93. r4 = r4 ^ r0; \
  94. r1 = r1 ^ r3; \
  95. r1 = r1 ^ r4; \
  96. r4 = -1 ^ r4;
  97. #define S3(r0,r1,r2,r3,r4) \
  98. r4 = r0 ; \
  99. r0 = r0 | r3; \
  100. r3 = r3 ^ r1; \
  101. r1 = r1 & r4; \
  102. r4 = r4 ^ r2; \
  103. r2 = r2 ^ r3; \
  104. r3 = r3 & r0; \
  105. r4 = r4 | r1; \
  106. r3 = r3 ^ r4; \
  107. r0 = r0 ^ r1; \
  108. r4 = r4 & r0; \
  109. r1 = r1 ^ r3; \
  110. r4 = r4 ^ r2; \
  111. r1 = r1 | r0; \
  112. r1 = r1 ^ r2; \
  113. r0 = r0 ^ r3; \
  114. r2 = r1; \
  115. r1 = r1 | r3; \
  116. r1 = r1 ^ r0;
  117. #define S4(r0,r1,r2,r3,r4) \
  118. r1 = r1 ^ r3; \
  119. r3 = -1 ^ r3; \
  120. r2 = r2 ^ r3; \
  121. r3 = r3 ^ r0; \
  122. r4 = r1; \
  123. r1 = r1 & r3; \
  124. r1 = r1 ^ r2; \
  125. r4 = r4 ^ r3; \
  126. r0 = r0 ^ r4; \
  127. r2 = r2 & r4; \
  128. r2 = r2 ^ r0; \
  129. r0 = r0 & r1; \
  130. r3 = r3 ^ r0; \
  131. r4 = r4 | r1; \
  132. r4 = r4 ^ r0; \
  133. r0 = r0 | r3; \
  134. r0 = r0 ^ r2; \
  135. r2 = r2 & r3; \
  136. r0 = -1 ^ r0; \
  137. r4 = r4 ^ r2;
  138. #define S5(r0,r1,r2,r3,r4) \
  139. r0 = r0 ^ r1; \
  140. r1 = r1 ^ r3; \
  141. r3 = -1 ^ r3; \
  142. r4 = r1; \
  143. r1 = r1 & r0; \
  144. r2 = r2 ^ r3; \
  145. r1 = r1 ^ r2; \
  146. r2 = r2 | r4; \
  147. r4 = r4 ^ r3; \
  148. r3 = r3 & r1; \
  149. r3 = r3 ^ r0; \
  150. r4 = r4 ^ r1; \
  151. r4 = r4 ^ r2; \
  152. r2 = r2 ^ r0; \
  153. r0 = r0 & r3; \
  154. r2 = -1 ^ r2; \
  155. r0 = r0 ^ r4; \
  156. r4 = r4 | r3; \
  157. r2 = r2 ^ r4;
  158. #define S6(r0,r1,r2,r3,r4) \
  159. r2 = -1 ^ r2; \
  160. r4 = r3; \
  161. r3 = r3 & r0; \
  162. r0 = r0 ^ r4; \
  163. r3 = r3 ^ r2; \
  164. r2 = r2 | r4; \
  165. r1 = r1 ^ r3; \
  166. r2 = r2 ^ r0; \
  167. r0 = r0 | r1; \
  168. r2 = r2 ^ r1; \
  169. r4 = r4 ^ r0; \
  170. r0 = r0 | r3; \
  171. r0 = r0 ^ r2; \
  172. r4 = r4 ^ r3; \
  173. r4 = r4 ^ r0; \
  174. r3 = -1 ^ r3; \
  175. r2 = r2 & r4; \
  176. r2 = r2 ^ r3;
  177. #define S7(r0,r1,r2,r3,r4) \
  178. r4 = r2; \
  179. r2 = r2 & r1; \
  180. r2 = r2 ^ r3; \
  181. r3 = r3 & r1; \
  182. r4 = r4 ^ r2; \
  183. r2 = r2 ^ r1; \
  184. r1 = r1 ^ r0; \
  185. r0 = r0 | r4; \
  186. r0 = r0 ^ r2; \
  187. r3 = r3 ^ r1; \
  188. r2 = r2 ^ r3; \
  189. r3 = r3 & r0; \
  190. r3 = r3 ^ r4; \
  191. r4 = r4 ^ r2; \
  192. r2 = r2 & r0; \
  193. r4 = -1 ^ r4; \
  194. r2 = r2 ^ r4; \
  195. r4 = r4 & r0; \
  196. r1 = r1 ^ r3; \
  197. r4 = r4 ^ r1;
  198. /* The inverse sboxes */
  199. #define I0(r0,r1,r2,r3,r4) \
  200. r2 = r2 ^ -1; \
  201. r4 = r1; \
  202. r1 = r1 | r0; \
  203. r4 = r4 ^ -1; \
  204. r1 = r1 ^ r2; \
  205. r2 = r2 | r4; \
  206. r1 = r1 ^ r3; \
  207. r0 = r0 ^ r4; \
  208. r2 = r2 ^ r0; \
  209. r0 = r0 & r3; \
  210. r4 = r4 ^ r0; \
  211. r0 = r0 | r1; \
  212. r0 = r0 ^ r2; \
  213. r3 = r3 ^ r4; \
  214. r2 = r2 ^ r1; \
  215. r3 = r3 ^ r0; \
  216. r3 = r3 ^ r1; \
  217. r2 = r2 & r3; \
  218. r4 = r4 ^ r2;
  219. #define I1(r0,r1,r2,r3,r4) \
  220. r4 = r1; \
  221. r1 = r1 ^ r3; \
  222. r3 = r3 & r1; \
  223. r4 = r4 ^ r2; \
  224. r3 = r3 ^ r0; \
  225. r0 = r0 | r1; \
  226. r2 = r2 ^ r3; \
  227. r0 = r0 ^ r4; \
  228. r0 = r0 | r2; \
  229. r1 = r1 ^ r3; \
  230. r0 = r0 ^ r1; \
  231. r1 = r1 | r3; \
  232. r1 = r1 ^ r0; \
  233. r4 = r4 ^ -1; \
  234. r4 = r4 ^ r1; \
  235. r1 = r1 | r0; \
  236. r1 = r1 ^ r0; \
  237. r1 = r1 | r4; \
  238. r3 = r3 ^ r1;
  239. #define I2(r0,r1,r2,r3,r4) \
  240. r2 = r2 ^ r3; \
  241. r3 = r3 ^ r0; \
  242. r4 = r3; \
  243. r3 = r3 & r2; \
  244. r3 = r3 ^ r1; \
  245. r1 = r1 | r2; \
  246. r1 = r1 ^ r4; \
  247. r4 = r4 & r3; \
  248. r2 = r2 ^ r3; \
  249. r4 = r4 & r0; \
  250. r4 = r4 ^ r2; \
  251. r2 = r2 & r1; \
  252. r2 = r2 | r0; \
  253. r3 = r3 ^ -1; \
  254. r2 = r2 ^ r3; \
  255. r0 = r0 ^ r3; \
  256. r0 = r0 & r1; \
  257. r3 = r3 ^ r4; \
  258. r3 = r3 ^ r0;
  259. #define I3(r0,r1,r2,r3,r4) \
  260. r4 = r2; \
  261. r2 = r2 ^ r1; \
  262. r0 = r0 ^ r2; \
  263. r4 = r4 & r2; \
  264. r4 = r4 ^ r0; \
  265. r0 = r0 & r1; \
  266. r1 = r1 ^ r3; \
  267. r3 = r3 | r4; \
  268. r2 = r2 ^ r3; \
  269. r0 = r0 ^ r3; \
  270. r1 = r1 ^ r4; \
  271. r3 = r3 & r2; \
  272. r3 = r3 ^ r1; \
  273. r1 = r1 ^ r0; \
  274. r1 = r1 | r2; \
  275. r0 = r0 ^ r3; \
  276. r1 = r1 ^ r4; \
  277. r0 = r0 ^ r1;
  278. #define I4(r0,r1,r2,r3,r4) \
  279. r4 = r2; \
  280. r2 = r2 & r3; \
  281. r2 = r2 ^ r1; \
  282. r1 = r1 | r3; \
  283. r1 = r1 & r0; \
  284. r4 = r4 ^ r2; \
  285. r4 = r4 ^ r1; \
  286. r1 = r1 & r2; \
  287. r0 = r0 ^ -1; \
  288. r3 = r3 ^ r4; \
  289. r1 = r1 ^ r3; \
  290. r3 = r3 & r0; \
  291. r3 = r3 ^ r2; \
  292. r0 = r0 ^ r1; \
  293. r2 = r2 & r0; \
  294. r3 = r3 ^ r0; \
  295. r2 = r2 ^ r4; \
  296. r2 = r2 | r3; \
  297. r3 = r3 ^ r0; \
  298. r2 = r2 ^ r1;
  299. #define I5(r0,r1,r2,r3,r4) \
  300. r1 = r1 ^ -1; \
  301. r4 = r3; \
  302. r2 = r2 ^ r1; \
  303. r3 = r3 | r0; \
  304. r3 = r3 ^ r2; \
  305. r2 = r2 | r1; \
  306. r2 = r2 & r0; \
  307. r4 = r4 ^ r3; \
  308. r2 = r2 ^ r4; \
  309. r4 = r4 | r0; \
  310. r4 = r4 ^ r1; \
  311. r1 = r1 & r2; \
  312. r1 = r1 ^ r3; \
  313. r4 = r4 ^ r2; \
  314. r3 = r3 & r4; \
  315. r4 = r4 ^ r1; \
  316. r3 = r3 ^ r0; \
  317. r3 = r3 ^ r4; \
  318. r4 = r4 ^ -1;
  319. #define I6(r0,r1,r2,r3,r4) \
  320. r0 = r0 ^ r2; \
  321. r4 = r2; \
  322. r2 = r2 & r0; \
  323. r4 = r4 ^ r3; \
  324. r2 = r2 ^ -1; \
  325. r3 = r3 ^ r1; \
  326. r2 = r2 ^ r3; \
  327. r4 = r4 | r0; \
  328. r0 = r0 ^ r2; \
  329. r3 = r3 ^ r4; \
  330. r4 = r4 ^ r1; \
  331. r1 = r1 & r3; \
  332. r1 = r1 ^ r0; \
  333. r0 = r0 ^ r3; \
  334. r0 = r0 | r2; \
  335. r3 = r3 ^ r1; \
  336. r4 = r4 ^ r0;
  337. #define I7(r0,r1,r2,r3,r4) \
  338. r4 = r2; \
  339. r2 = r2 ^ r0; \
  340. r0 = r0 & r3; \
  341. r4 = r4 | r3; \
  342. r2 = r2 ^ -1; \
  343. r3 = r3 ^ r1; \
  344. r1 = r1 | r0; \
  345. r0 = r0 ^ r2; \
  346. r2 = r2 & r4; \
  347. r3 = r3 & r4; \
  348. r1 = r1 ^ r2; \
  349. r2 = r2 ^ r0; \
  350. r0 = r0 | r2; \
  351. r4 = r4 ^ r1; \
  352. r0 = r0 ^ r3; \
  353. r3 = r3 ^ r4; \
  354. r4 = r4 | r0; \
  355. r3 = r3 ^ r2; \
  356. r4 = r4 ^ r2;
  357. /* forward and inverse linear transformations */
  358. #define LINTRANS(r0,r1,r2,r3,r4) \
  359. r0 = rotl(r0, 13); \
  360. r2 = rotl(r2, 3); \
  361. r3 = r3 ^ r2; \
  362. r4 = r0 << 3; \
  363. r1 = r1 ^ r0; \
  364. r3 = r3 ^ r4; \
  365. r1 = r1 ^ r2; \
  366. r3 = rotl(r3, 7); \
  367. r1 = rotl(r1, 1); \
  368. r2 = r2 ^ r3; \
  369. r4 = r1 << 7; \
  370. r0 = r0 ^ r1; \
  371. r2 = r2 ^ r4; \
  372. r0 = r0 ^ r3; \
  373. r2 = rotl(r2, 22); \
  374. r0 = rotl(r0, 5);
  375. #define ILINTRANS(r0,r1,r2,r3,r4) \
  376. r2 = rotr(r2, 22); \
  377. r0 = rotr(r0, 5); \
  378. r2 = r2 ^ r3; \
  379. r4 = r1 << 7; \
  380. r0 = r0 ^ r1; \
  381. r2 = r2 ^ r4; \
  382. r0 = r0 ^ r3; \
  383. r3 = rotr(r3, 7); \
  384. r1 = rotr(r1, 1); \
  385. r3 = r3 ^ r2; \
  386. r4 = r0 << 3; \
  387. r1 = r1 ^ r0; \
  388. r3 = r3 ^ r4; \
  389. r1 = r1 ^ r2; \
  390. r2 = rotr(r2, 3); \
  391. r0 = rotr(r0, 13);
  392. #define KEYMIX(r0,r1,r2,r3,r4,IN) \
  393. r0 = r0 ^ l_key[IN+8]; \
  394. r1 = r1 ^ l_key[IN+9]; \
  395. r2 = r2 ^ l_key[IN+10]; \
  396. r3 = r3 ^ l_key[IN+11];
  397. #define GETKEY(r0, r1, r2, r3, IN) \
  398. r0 = l_key[IN+8]; \
  399. r1 = l_key[IN+9]; \
  400. r2 = l_key[IN+10]; \
  401. r3 = l_key[IN+11];
  402. #define SETKEY(r0, r1, r2, r3, IN) \
  403. l_key[IN+8] = r0; \
  404. l_key[IN+9] = r1; \
  405. l_key[IN+10] = r2; \
  406. l_key[IN+11] = r3;
  407. /* initialise the key schedule from the user supplied key */
  408. int serpent_set_key(serpent_context *cx, const unsigned char *key, int key_len)
  409. { const u32 *in_key = (const u32 *)key;
  410. /* l_key - storage for the key schedule */
  411. u32 *l_key = cx->keyinfo;
  412. u32 i,lk,r0,r1,r2,r3,r4;
  413. if (key_len != 16 && key_len != 24 && key_len != 32)
  414. return -1; /* unsupported key length */
  415. key_len *= 8;
  416. i = 0; lk = (key_len + 31) / 32;
  417. while(i < lk)
  418. {
  419. #ifdef BLOCK_SWAP
  420. l_key[i] = io_swap(in_key[lk - i - 1]);
  421. #else
  422. l_key[i] = in_key[i];
  423. #endif
  424. i++;
  425. }
  426. if (key_len < 256)
  427. {
  428. while(i < 8)
  429. l_key[i++] = 0;
  430. i = key_len / 32; lk = 1 << key_len % 32;
  431. l_key[i] &= lk - 1;
  432. l_key[i] |= lk;
  433. }
  434. for(i = 0; i < 132; ++i)
  435. {
  436. lk = l_key[i] ^ l_key[i + 3] ^ l_key[i + 5]
  437. ^ l_key[i + 7] ^ 0x9e3779b9 ^ i;
  438. l_key[i + 8] = (lk << 11) | (lk >> 21);
  439. }
  440. GETKEY(r0, r1, r2, r3, 0);
  441. S3(r0,r1,r2,r3,r4);
  442. SETKEY(r1, r2, r3, r4, 0)
  443. GETKEY(r0, r1, r2, r3, 4);
  444. S2(r0,r1,r2,r3,r4);
  445. SETKEY(r2, r3, r1, r4, 4)
  446. GETKEY(r0, r1, r2, r3, 8);
  447. S1(r0,r1,r2,r3,r4);
  448. SETKEY(r3, r1, r2, r0, 8)
  449. GETKEY(r0, r1, r2, r3, 12);
  450. S0(r0,r1,r2,r3,r4);
  451. SETKEY(r1, r4, r2, r0, 12)
  452. GETKEY(r0, r1, r2, r3, 16);
  453. S7(r0,r1,r2,r3,r4);
  454. SETKEY(r2, r4, r3, r0, 16)
  455. GETKEY(r0, r1, r2, r3, 20);
  456. S6(r0,r1,r2,r3,r4)
  457. SETKEY(r0, r1, r4, r2, 20)
  458. GETKEY(r0, r1, r2, r3, 24);
  459. S5(r0,r1,r2,r3,r4);
  460. SETKEY(r1, r3, r0, r2, 24)
  461. GETKEY(r0, r1, r2, r3, 28);
  462. S4(r0,r1,r2,r3,r4)
  463. SETKEY(r1, r4, r0, r3, 28)
  464. GETKEY(r0, r1, r2, r3, 32);
  465. S3(r0,r1,r2,r3,r4);
  466. SETKEY(r1, r2, r3, r4, 32)
  467. GETKEY(r0, r1, r2, r3, 36);
  468. S2(r0,r1,r2,r3,r4);
  469. SETKEY(r2, r3, r1, r4, 36)
  470. GETKEY(r0, r1, r2, r3, 40);
  471. S1(r0,r1,r2,r3,r4);
  472. SETKEY(r3, r1, r2, r0, 40)
  473. GETKEY(r0, r1, r2, r3, 44);
  474. S0(r0,r1,r2,r3,r4);
  475. SETKEY(r1, r4, r2, r0, 44)
  476. GETKEY(r0, r1, r2, r3, 48);
  477. S7(r0,r1,r2,r3,r4);
  478. SETKEY(r2, r4, r3, r0, 48)
  479. GETKEY(r0, r1, r2, r3, 52);
  480. S6(r0,r1,r2,r3,r4)
  481. SETKEY(r0, r1, r4, r2, 52)
  482. GETKEY(r0, r1, r2, r3, 56);
  483. S5(r0,r1,r2,r3,r4);
  484. SETKEY(r1, r3, r0, r2, 56)
  485. GETKEY(r0, r1, r2, r3, 60);
  486. S4(r0,r1,r2,r3,r4)
  487. SETKEY(r1, r4, r0, r3, 60)
  488. GETKEY(r0, r1, r2, r3, 64);
  489. S3(r0,r1,r2,r3,r4);
  490. SETKEY(r1, r2, r3, r4, 64)
  491. GETKEY(r0, r1, r2, r3, 68);
  492. S2(r0,r1,r2,r3,r4);
  493. SETKEY(r2, r3, r1, r4, 68)
  494. GETKEY(r0, r1, r2, r3, 72);
  495. S1(r0,r1,r2,r3,r4);
  496. SETKEY(r3, r1, r2, r0, 72)
  497. GETKEY(r0, r1, r2, r3, 76);
  498. S0(r0,r1,r2,r3,r4);
  499. SETKEY(r1, r4, r2, r0, 76)
  500. GETKEY(r0, r1, r2, r3, 80);
  501. S7(r0,r1,r2,r3,r4);
  502. SETKEY(r2, r4, r3, r0, 80)
  503. GETKEY(r0, r1, r2, r3, 84);
  504. S6(r0,r1,r2,r3,r4)
  505. SETKEY(r0, r1, r4, r2, 84)
  506. GETKEY(r0, r1, r2, r3, 88);
  507. S5(r0,r1,r2,r3,r4);
  508. SETKEY(r1, r3, r0, r2, 88)
  509. GETKEY(r0, r1, r2, r3, 92);
  510. S4(r0,r1,r2,r3,r4)
  511. SETKEY(r1, r4, r0, r3, 92)
  512. GETKEY(r0, r1, r2, r3, 96);
  513. S3(r0,r1,r2,r3,r4);
  514. SETKEY(r1, r2, r3, r4, 96)
  515. GETKEY(r0, r1, r2, r3, 100);
  516. S2(r0,r1,r2,r3,r4);
  517. SETKEY(r2, r3, r1, r4, 100)
  518. GETKEY(r0, r1, r2, r3, 104);
  519. S1(r0,r1,r2,r3,r4);
  520. SETKEY(r3, r1, r2, r0, 104)
  521. GETKEY(r0, r1, r2, r3, 108);
  522. S0(r0,r1,r2,r3,r4);
  523. SETKEY(r1, r4, r2, r0, 108)
  524. GETKEY(r0, r1, r2, r3, 112);
  525. S7(r0,r1,r2,r3,r4);
  526. SETKEY(r2, r4, r3, r0, 112)
  527. GETKEY(r0, r1, r2, r3, 116);
  528. S6(r0,r1,r2,r3,r4)
  529. SETKEY(r0, r1, r4, r2, 116)
  530. GETKEY(r0, r1, r2, r3, 120);
  531. S5(r0,r1,r2,r3,r4);
  532. SETKEY(r1, r3, r0, r2, 120)
  533. GETKEY(r0, r1, r2, r3, 124);
  534. S4(r0,r1,r2,r3,r4)
  535. SETKEY(r1, r4, r0, r3, 124)
  536. GETKEY(r0, r1, r2, r3, 128);
  537. S3(r0,r1,r2,r3,r4);
  538. SETKEY(r1, r2, r3, r4, 128)
  539. return 0;
  540. };
  541. /* Encryption and decryption functions. The rounds are fully inlined.
  542. * The sboxes alters the bit order of the output, and the altered
  543. * bit ordrer is used progressivly. */
  544. /* encrypt a block of text */
  545. int serpent_encrypt(serpent_context *cx, const u8 *in,
  546. u8 *out)
  547. { u32 *l_key = cx->keyinfo;
  548. const u32 *in_blk = (const u32 *) in;
  549. u32 *out_blk = (u32 *) out;
  550. u32 r0,r1,r2,r3,r4;
  551. #ifdef BLOCK_SWAP
  552. r0 = io_swap(in_blk[3]); r1 = io_swap(in_blk[2]);
  553. r2 = io_swap(in_blk[1]); r3 = io_swap(in_blk[0]);
  554. #else
  555. r0 = in_blk[0]; r1 = in_blk[1]; r2 = in_blk[2]; r3 = in_blk[3];
  556. #endif
  557. /* round 1 */
  558. KEYMIX(r0,r1,r2,r3,r4,0);
  559. S0(r0,r1,r2,r3,r4);
  560. LINTRANS(r1,r4,r2,r0,r3);
  561. /* round 2 */
  562. KEYMIX(r1,r4,r2,r0,r3,4);
  563. S1(r1,r4,r2,r0,r3);
  564. LINTRANS(r0,r4,r2,r1,r3);
  565. /* round 3 */
  566. KEYMIX(r0,r4,r2,r1,r3,8);
  567. S2(r0,r4,r2,r1,r3);
  568. LINTRANS(r2,r1,r4,r3,r0);
  569. /* round 4 */
  570. KEYMIX(r2,r1,r4,r3,r0,12);
  571. S3(r2,r1,r4,r3,r0);
  572. LINTRANS(r1,r4,r3,r0,r2);
  573. /* round 5 */
  574. KEYMIX(r1,r4,r3,r0,r2,16);
  575. S4(r1,r4,r3,r0,r2)
  576. LINTRANS(r4,r2,r1,r0,r3);
  577. /* round 6 */
  578. KEYMIX(r4,r2,r1,r0,r3,20);
  579. S5(r4,r2,r1,r0,r3);
  580. LINTRANS(r2,r0,r4,r1,r3);
  581. /* round 7 */
  582. KEYMIX(r2,r0,r4,r1,r3,24);
  583. S6(r2,r0,r4,r1,r3)
  584. LINTRANS(r2,r0,r3,r4,r1);
  585. /* round 8 */
  586. KEYMIX(r2,r0,r3,r4,r1,28);
  587. S7(r2,r0,r3,r4,r1);
  588. LINTRANS(r3,r1,r4,r2,r0);
  589. /* round 9 */
  590. KEYMIX(r3,r1,r4,r2,r0,32);
  591. S0(r3,r1,r4,r2,r0);
  592. LINTRANS(r1,r0,r4,r3,r2);
  593. /* round 10 */
  594. KEYMIX(r1,r0,r4,r3,r2,36);
  595. S1(r1,r0,r4,r3,r2);
  596. LINTRANS(r3,r0,r4,r1,r2);
  597. /* round 11 */
  598. KEYMIX(r3,r0,r4,r1,r2,40);
  599. S2(r3,r0,r4,r1,r2);
  600. LINTRANS(r4,r1,r0,r2,r3);
  601. /* round 12 */
  602. KEYMIX(r4,r1,r0,r2,r3,44);
  603. S3(r4,r1,r0,r2,r3);
  604. LINTRANS(r1,r0,r2,r3,r4);
  605. /* round 13 */
  606. KEYMIX(r1,r0,r2,r3,r4,48);
  607. S4(r1,r0,r2,r3,r4)
  608. LINTRANS(r0,r4,r1,r3,r2);
  609. /* round 14 */
  610. KEYMIX(r0,r4,r1,r3,r2,52);
  611. S5(r0,r4,r1,r3,r2);
  612. LINTRANS(r4,r3,r0,r1,r2);
  613. /* round 15 */
  614. KEYMIX(r4,r3,r0,r1,r2,56);
  615. S6(r4,r3,r0,r1,r2)
  616. LINTRANS(r4,r3,r2,r0,r1);
  617. /* round 16 */
  618. KEYMIX(r4,r3,r2,r0,r1,60);
  619. S7(r4,r3,r2,r0,r1);
  620. LINTRANS(r2,r1,r0,r4,r3);
  621. /* round 17 */
  622. KEYMIX(r2,r1,r0,r4,r3,64);
  623. S0(r2,r1,r0,r4,r3);
  624. LINTRANS(r1,r3,r0,r2,r4);
  625. /* round 18 */
  626. KEYMIX(r1,r3,r0,r2,r4,68);
  627. S1(r1,r3,r0,r2,r4);
  628. LINTRANS(r2,r3,r0,r1,r4);
  629. /* round 19 */
  630. KEYMIX(r2,r3,r0,r1,r4,72);
  631. S2(r2,r3,r0,r1,r4);
  632. LINTRANS(r0,r1,r3,r4,r2);
  633. /* round 20 */
  634. KEYMIX(r0,r1,r3,r4,r2,76);
  635. S3(r0,r1,r3,r4,r2);
  636. LINTRANS(r1,r3,r4,r2,r0);
  637. /* round 21 */
  638. KEYMIX(r1,r3,r4,r2,r0,80);
  639. S4(r1,r3,r4,r2,r0)
  640. LINTRANS(r3,r0,r1,r2,r4);
  641. /* round 22 */
  642. KEYMIX(r3,r0,r1,r2,r4,84);
  643. S5(r3,r0,r1,r2,r4);
  644. LINTRANS(r0,r2,r3,r1,r4);
  645. /* round 23 */
  646. KEYMIX(r0,r2,r3,r1,r4,88);
  647. S6(r0,r2,r3,r1,r4)
  648. LINTRANS(r0,r2,r4,r3,r1);
  649. /* round 24 */
  650. KEYMIX(r0,r2,r4,r3,r1,92);
  651. S7(r0,r2,r4,r3,r1);
  652. LINTRANS(r4,r1,r3,r0,r2);
  653. /* round 25 */
  654. KEYMIX(r4,r1,r3,r0,r2,96);
  655. S0(r4,r1,r3,r0,r2);
  656. LINTRANS(r1,r2,r3,r4,r0);
  657. /* round 26 */
  658. KEYMIX(r1,r2,r3,r4,r0,100);
  659. S1(r1,r2,r3,r4,r0);
  660. LINTRANS(r4,r2,r3,r1,r0);
  661. /* round 27 */
  662. KEYMIX(r4,r2,r3,r1,r0,104);
  663. S2(r4,r2,r3,r1,r0);
  664. LINTRANS(r3,r1,r2,r0,r4);
  665. /* round 28 */
  666. KEYMIX(r3,r1,r2,r0,r4,108);
  667. S3(r3,r1,r2,r0,r4);
  668. LINTRANS(r1,r2,r0,r4,r3);
  669. /* round 29 */
  670. KEYMIX(r1,r2,r0,r4,r3,112);
  671. S4(r1,r2,r0,r4,r3)
  672. LINTRANS(r2,r3,r1,r4,r0);
  673. /* round 30 */
  674. KEYMIX(r2,r3,r1,r4,r0,116);
  675. S5(r2,r3,r1,r4,r0);
  676. LINTRANS(r3,r4,r2,r1,r0);
  677. /* round 31 */
  678. KEYMIX(r3,r4,r2,r1,r0,120);
  679. S6(r3,r4,r2,r1,r0)
  680. LINTRANS(r3,r4,r0,r2,r1);
  681. /* round 32 */
  682. KEYMIX(r3,r4,r0,r2,r1,124);
  683. S7(r3,r4,r0,r2,r1);
  684. KEYMIX(r0,r1,r2,r3,r4,128);
  685. #ifdef BLOCK_SWAP
  686. out_blk[3] = io_swap(r0); out_blk[2] = io_swap(r1);
  687. out_blk[1] = io_swap(r2); out_blk[0] = io_swap(r3);
  688. #else
  689. out_blk[0] = r0; out_blk[1] = r1; out_blk[2] = r2; out_blk[3] = r3;
  690. #endif
  691. return 0;
  692. };
  693. /* decrypt a block of text */
  694. int serpent_decrypt(serpent_context *cx, const u8 *in,
  695. u8 *out)
  696. { u32 *l_key = cx->keyinfo;
  697. const u32 *in_blk = (const u32 *)in;
  698. u32 *out_blk = (u32 *)out;
  699. u32 r0,r1,r2,r3,r4;
  700. #ifdef BLOCK_SWAP
  701. r0 = io_swap(in_blk[3]); r1 = io_swap(in_blk[2]);
  702. r2 = io_swap(in_blk[1]); r3 = io_swap(in_blk[0]);
  703. #else
  704. r0 = in_blk[0]; r1 = in_blk[1]; r2 = in_blk[2]; r3 = in_blk[3];
  705. #endif
  706. /* round 1 */
  707. KEYMIX(r0,r1,r2,r3,r4,128);
  708. I7(r0,r1,r2,r3,r4);
  709. KEYMIX(r3,r0,r1,r4,r2,124);
  710. /* round 2 */
  711. ILINTRANS(r3,r0,r1,r4,r2);
  712. I6(r3,r0,r1,r4,r2);
  713. KEYMIX(r0,r1,r2,r4,r3,120);
  714. /* round 3 */
  715. ILINTRANS(r0,r1,r2,r4,r3);
  716. I5(r0,r1,r2,r4,r3);
  717. KEYMIX(r1,r3,r4,r2,r0,116);
  718. /* round 4 */
  719. ILINTRANS(r1,r3,r4,r2,r0);
  720. I4(r1,r3,r4,r2,r0);
  721. KEYMIX(r1,r2,r4,r0,r3,112);
  722. /* round 5 */
  723. ILINTRANS(r1,r2,r4,r0,r3);
  724. I3(r1,r2,r4,r0,r3);
  725. KEYMIX(r4,r2,r0,r1,r3,108);
  726. /* round 6 */
  727. ILINTRANS(r4,r2,r0,r1,r3);
  728. I2(r4,r2,r0,r1,r3);
  729. KEYMIX(r2,r3,r0,r1,r4,104);
  730. /* round 7 */
  731. ILINTRANS(r2,r3,r0,r1,r4);
  732. I1(r2,r3,r0,r1,r4);
  733. KEYMIX(r4,r2,r1,r0,r3,100);
  734. /* round 8 */
  735. ILINTRANS(r4,r2,r1,r0,r3);
  736. I0(r4,r2,r1,r0,r3);
  737. KEYMIX(r4,r3,r2,r0,r1,96);
  738. /* round 9 */
  739. ILINTRANS(r4,r3,r2,r0,r1);
  740. I7(r4,r3,r2,r0,r1);
  741. KEYMIX(r0,r4,r3,r1,r2,92);
  742. /* round 10 */
  743. ILINTRANS(r0,r4,r3,r1,r2);
  744. I6(r0,r4,r3,r1,r2);
  745. KEYMIX(r4,r3,r2,r1,r0,88);
  746. /* round 11 */
  747. ILINTRANS(r4,r3,r2,r1,r0);
  748. I5(r4,r3,r2,r1,r0);
  749. KEYMIX(r3,r0,r1,r2,r4,84);
  750. /* round 12 */
  751. ILINTRANS(r3,r0,r1,r2,r4);
  752. I4(r3,r0,r1,r2,r4);
  753. KEYMIX(r3,r2,r1,r4,r0,80);
  754. /* round 13 */
  755. ILINTRANS(r3,r2,r1,r4,r0);
  756. I3(r3,r2,r1,r4,r0);
  757. KEYMIX(r1,r2,r4,r3,r0,76);
  758. /* round 14 */
  759. ILINTRANS(r1,r2,r4,r3,r0);
  760. I2(r1,r2,r4,r3,r0);
  761. KEYMIX(r2,r0,r4,r3,r1,72);
  762. /* round 15 */
  763. ILINTRANS(r2,r0,r4,r3,r1);
  764. I1(r2,r0,r4,r3,r1);
  765. KEYMIX(r1,r2,r3,r4,r0,68);
  766. /* round 16 */
  767. ILINTRANS(r1,r2,r3,r4,r0);
  768. I0(r1,r2,r3,r4,r0);
  769. KEYMIX(r1,r0,r2,r4,r3,64);
  770. /* round 17 */
  771. ILINTRANS(r1,r0,r2,r4,r3);
  772. I7(r1,r0,r2,r4,r3);
  773. KEYMIX(r4,r1,r0,r3,r2,60);
  774. /* round 18 */
  775. ILINTRANS(r4,r1,r0,r3,r2);
  776. I6(r4,r1,r0,r3,r2);
  777. KEYMIX(r1,r0,r2,r3,r4,56);
  778. /* round 19 */
  779. ILINTRANS(r1,r0,r2,r3,r4);
  780. I5(r1,r0,r2,r3,r4);
  781. KEYMIX(r0,r4,r3,r2,r1,52);
  782. /* round 20 */
  783. ILINTRANS(r0,r4,r3,r2,r1);
  784. I4(r0,r4,r3,r2,r1);
  785. KEYMIX(r0,r2,r3,r1,r4,48);
  786. /* round 21 */
  787. ILINTRANS(r0,r2,r3,r1,r4);
  788. I3(r0,r2,r3,r1,r4);
  789. KEYMIX(r3,r2,r1,r0,r4,44);
  790. /* round 22 */
  791. ILINTRANS(r3,r2,r1,r0,r4);
  792. I2(r3,r2,r1,r0,r4);
  793. KEYMIX(r2,r4,r1,r0,r3,40);
  794. /* round 23 */
  795. ILINTRANS(r2,r4,r1,r0,r3);
  796. I1(r2,r4,r1,r0,r3);
  797. KEYMIX(r3,r2,r0,r1,r4,36);
  798. /* round 24 */
  799. ILINTRANS(r3,r2,r0,r1,r4);
  800. I0(r3,r2,r0,r1,r4);
  801. KEYMIX(r3,r4,r2,r1,r0,32);
  802. /* round 25 */
  803. ILINTRANS(r3,r4,r2,r1,r0);
  804. I7(r3,r4,r2,r1,r0);
  805. KEYMIX(r1,r3,r4,r0,r2,28);
  806. /* round 26 */
  807. ILINTRANS(r1,r3,r4,r0,r2);
  808. I6(r1,r3,r4,r0,r2);
  809. KEYMIX(r3,r4,r2,r0,r1,24);
  810. /* round 27 */
  811. ILINTRANS(r3,r4,r2,r0,r1);
  812. I5(r3,r4,r2,r0,r1);
  813. KEYMIX(r4,r1,r0,r2,r3,20);
  814. /* round 28 */
  815. ILINTRANS(r4,r1,r0,r2,r3);
  816. I4(r4,r1,r0,r2,r3);
  817. KEYMIX(r4,r2,r0,r3,r1,16);
  818. /* round 29 */
  819. ILINTRANS(r4,r2,r0,r3,r1);
  820. I3(r4,r2,r0,r3,r1);
  821. KEYMIX(r0,r2,r3,r4,r1,12);
  822. /* round 30 */
  823. ILINTRANS(r0,r2,r3,r4,r1);
  824. I2(r0,r2,r3,r4,r1);
  825. KEYMIX(r2,r1,r3,r4,r0,8);
  826. /* round 31 */
  827. ILINTRANS(r2,r1,r3,r4,r0);
  828. I1(r2,r1,r3,r4,r0);
  829. KEYMIX(r0,r2,r4,r3,r1,4);
  830. /* round 32 */
  831. ILINTRANS(r0,r2,r4,r3,r1);
  832. I0(r0,r2,r4,r3,r1);
  833. KEYMIX(r0,r1,r2,r3,r4,0);
  834. #ifdef BLOCK_SWAP
  835. out_blk[3] = io_swap(r0); out_blk[2] = io_swap(r1);
  836. out_blk[1] = io_swap(r2); out_blk[0] = io_swap(r3);
  837. #else
  838. out_blk[0] = r0; out_blk[1] = r1; out_blk[2] = r2; out_blk[3] = r3;
  839. #endif
  840. return 0;
  841. };