p54: fix queue stall due to underrun
[linux-2.6/linux-acpi-2.6/ibm-acpi-2.6.git] / crypto / sha256_generic.c
blob6349d8339d379cc6862dba1fadf54bc2cdfe3eb3
1 /*
2 * Cryptographic API.
4 * SHA-256, as specified in
5 * http://csrc.nist.gov/groups/STM/cavp/documents/shs/sha256-384-512.pdf
7 * SHA-256 code by Jean-Luc Cooke <jlcooke@certainkey.com>.
9 * Copyright (c) Jean-Luc Cooke <jlcooke@certainkey.com>
10 * Copyright (c) Andrew McDonald <andrew@mcdonald.org.uk>
11 * Copyright (c) 2002 James Morris <jmorris@intercode.com.au>
12 * SHA224 Support Copyright 2007 Intel Corporation <jonathan.lynch@intel.com>
14 * This program is free software; you can redistribute it and/or modify it
15 * under the terms of the GNU General Public License as published by the Free
16 * Software Foundation; either version 2 of the License, or (at your option)
17 * any later version.
20 #include <crypto/internal/hash.h>
21 #include <linux/init.h>
22 #include <linux/module.h>
23 #include <linux/mm.h>
24 #include <linux/types.h>
25 #include <crypto/sha.h>
26 #include <asm/byteorder.h>
28 struct sha256_ctx {
29 u32 count[2];
30 u32 state[8];
31 u8 buf[128];
34 static inline u32 Ch(u32 x, u32 y, u32 z)
36 return z ^ (x & (y ^ z));
39 static inline u32 Maj(u32 x, u32 y, u32 z)
41 return (x & y) | (z & (x | y));
44 #define e0(x) (ror32(x, 2) ^ ror32(x,13) ^ ror32(x,22))
45 #define e1(x) (ror32(x, 6) ^ ror32(x,11) ^ ror32(x,25))
46 #define s0(x) (ror32(x, 7) ^ ror32(x,18) ^ (x >> 3))
47 #define s1(x) (ror32(x,17) ^ ror32(x,19) ^ (x >> 10))
49 static inline void LOAD_OP(int I, u32 *W, const u8 *input)
51 W[I] = __be32_to_cpu( ((__be32*)(input))[I] );
54 static inline void BLEND_OP(int I, u32 *W)
56 W[I] = s1(W[I-2]) + W[I-7] + s0(W[I-15]) + W[I-16];
59 static void sha256_transform(u32 *state, const u8 *input)
61 u32 a, b, c, d, e, f, g, h, t1, t2;
62 u32 W[64];
63 int i;
65 /* load the input */
66 for (i = 0; i < 16; i++)
67 LOAD_OP(i, W, input);
69 /* now blend */
70 for (i = 16; i < 64; i++)
71 BLEND_OP(i, W);
73 /* load the state into our registers */
74 a=state[0]; b=state[1]; c=state[2]; d=state[3];
75 e=state[4]; f=state[5]; g=state[6]; h=state[7];
77 /* now iterate */
78 t1 = h + e1(e) + Ch(e,f,g) + 0x428a2f98 + W[ 0];
79 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
80 t1 = g + e1(d) + Ch(d,e,f) + 0x71374491 + W[ 1];
81 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
82 t1 = f + e1(c) + Ch(c,d,e) + 0xb5c0fbcf + W[ 2];
83 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
84 t1 = e + e1(b) + Ch(b,c,d) + 0xe9b5dba5 + W[ 3];
85 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
86 t1 = d + e1(a) + Ch(a,b,c) + 0x3956c25b + W[ 4];
87 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
88 t1 = c + e1(h) + Ch(h,a,b) + 0x59f111f1 + W[ 5];
89 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
90 t1 = b + e1(g) + Ch(g,h,a) + 0x923f82a4 + W[ 6];
91 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
92 t1 = a + e1(f) + Ch(f,g,h) + 0xab1c5ed5 + W[ 7];
93 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
95 t1 = h + e1(e) + Ch(e,f,g) + 0xd807aa98 + W[ 8];
96 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
97 t1 = g + e1(d) + Ch(d,e,f) + 0x12835b01 + W[ 9];
98 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
99 t1 = f + e1(c) + Ch(c,d,e) + 0x243185be + W[10];
100 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
101 t1 = e + e1(b) + Ch(b,c,d) + 0x550c7dc3 + W[11];
102 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
103 t1 = d + e1(a) + Ch(a,b,c) + 0x72be5d74 + W[12];
104 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
105 t1 = c + e1(h) + Ch(h,a,b) + 0x80deb1fe + W[13];
106 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
107 t1 = b + e1(g) + Ch(g,h,a) + 0x9bdc06a7 + W[14];
108 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
109 t1 = a + e1(f) + Ch(f,g,h) + 0xc19bf174 + W[15];
110 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
112 t1 = h + e1(e) + Ch(e,f,g) + 0xe49b69c1 + W[16];
113 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
114 t1 = g + e1(d) + Ch(d,e,f) + 0xefbe4786 + W[17];
115 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
116 t1 = f + e1(c) + Ch(c,d,e) + 0x0fc19dc6 + W[18];
117 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
118 t1 = e + e1(b) + Ch(b,c,d) + 0x240ca1cc + W[19];
119 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
120 t1 = d + e1(a) + Ch(a,b,c) + 0x2de92c6f + W[20];
121 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
122 t1 = c + e1(h) + Ch(h,a,b) + 0x4a7484aa + W[21];
123 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
124 t1 = b + e1(g) + Ch(g,h,a) + 0x5cb0a9dc + W[22];
125 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
126 t1 = a + e1(f) + Ch(f,g,h) + 0x76f988da + W[23];
127 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
129 t1 = h + e1(e) + Ch(e,f,g) + 0x983e5152 + W[24];
130 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
131 t1 = g + e1(d) + Ch(d,e,f) + 0xa831c66d + W[25];
132 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
133 t1 = f + e1(c) + Ch(c,d,e) + 0xb00327c8 + W[26];
134 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
135 t1 = e + e1(b) + Ch(b,c,d) + 0xbf597fc7 + W[27];
136 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
137 t1 = d + e1(a) + Ch(a,b,c) + 0xc6e00bf3 + W[28];
138 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
139 t1 = c + e1(h) + Ch(h,a,b) + 0xd5a79147 + W[29];
140 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
141 t1 = b + e1(g) + Ch(g,h,a) + 0x06ca6351 + W[30];
142 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
143 t1 = a + e1(f) + Ch(f,g,h) + 0x14292967 + W[31];
144 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
146 t1 = h + e1(e) + Ch(e,f,g) + 0x27b70a85 + W[32];
147 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
148 t1 = g + e1(d) + Ch(d,e,f) + 0x2e1b2138 + W[33];
149 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
150 t1 = f + e1(c) + Ch(c,d,e) + 0x4d2c6dfc + W[34];
151 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
152 t1 = e + e1(b) + Ch(b,c,d) + 0x53380d13 + W[35];
153 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
154 t1 = d + e1(a) + Ch(a,b,c) + 0x650a7354 + W[36];
155 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
156 t1 = c + e1(h) + Ch(h,a,b) + 0x766a0abb + W[37];
157 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
158 t1 = b + e1(g) + Ch(g,h,a) + 0x81c2c92e + W[38];
159 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
160 t1 = a + e1(f) + Ch(f,g,h) + 0x92722c85 + W[39];
161 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
163 t1 = h + e1(e) + Ch(e,f,g) + 0xa2bfe8a1 + W[40];
164 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
165 t1 = g + e1(d) + Ch(d,e,f) + 0xa81a664b + W[41];
166 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
167 t1 = f + e1(c) + Ch(c,d,e) + 0xc24b8b70 + W[42];
168 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
169 t1 = e + e1(b) + Ch(b,c,d) + 0xc76c51a3 + W[43];
170 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
171 t1 = d + e1(a) + Ch(a,b,c) + 0xd192e819 + W[44];
172 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
173 t1 = c + e1(h) + Ch(h,a,b) + 0xd6990624 + W[45];
174 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
175 t1 = b + e1(g) + Ch(g,h,a) + 0xf40e3585 + W[46];
176 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
177 t1 = a + e1(f) + Ch(f,g,h) + 0x106aa070 + W[47];
178 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
180 t1 = h + e1(e) + Ch(e,f,g) + 0x19a4c116 + W[48];
181 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
182 t1 = g + e1(d) + Ch(d,e,f) + 0x1e376c08 + W[49];
183 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
184 t1 = f + e1(c) + Ch(c,d,e) + 0x2748774c + W[50];
185 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
186 t1 = e + e1(b) + Ch(b,c,d) + 0x34b0bcb5 + W[51];
187 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
188 t1 = d + e1(a) + Ch(a,b,c) + 0x391c0cb3 + W[52];
189 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
190 t1 = c + e1(h) + Ch(h,a,b) + 0x4ed8aa4a + W[53];
191 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
192 t1 = b + e1(g) + Ch(g,h,a) + 0x5b9cca4f + W[54];
193 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
194 t1 = a + e1(f) + Ch(f,g,h) + 0x682e6ff3 + W[55];
195 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
197 t1 = h + e1(e) + Ch(e,f,g) + 0x748f82ee + W[56];
198 t2 = e0(a) + Maj(a,b,c); d+=t1; h=t1+t2;
199 t1 = g + e1(d) + Ch(d,e,f) + 0x78a5636f + W[57];
200 t2 = e0(h) + Maj(h,a,b); c+=t1; g=t1+t2;
201 t1 = f + e1(c) + Ch(c,d,e) + 0x84c87814 + W[58];
202 t2 = e0(g) + Maj(g,h,a); b+=t1; f=t1+t2;
203 t1 = e + e1(b) + Ch(b,c,d) + 0x8cc70208 + W[59];
204 t2 = e0(f) + Maj(f,g,h); a+=t1; e=t1+t2;
205 t1 = d + e1(a) + Ch(a,b,c) + 0x90befffa + W[60];
206 t2 = e0(e) + Maj(e,f,g); h+=t1; d=t1+t2;
207 t1 = c + e1(h) + Ch(h,a,b) + 0xa4506ceb + W[61];
208 t2 = e0(d) + Maj(d,e,f); g+=t1; c=t1+t2;
209 t1 = b + e1(g) + Ch(g,h,a) + 0xbef9a3f7 + W[62];
210 t2 = e0(c) + Maj(c,d,e); f+=t1; b=t1+t2;
211 t1 = a + e1(f) + Ch(f,g,h) + 0xc67178f2 + W[63];
212 t2 = e0(b) + Maj(b,c,d); e+=t1; a=t1+t2;
214 state[0] += a; state[1] += b; state[2] += c; state[3] += d;
215 state[4] += e; state[5] += f; state[6] += g; state[7] += h;
217 /* clear any sensitive info... */
218 a = b = c = d = e = f = g = h = t1 = t2 = 0;
219 memset(W, 0, 64 * sizeof(u32));
223 static int sha224_init(struct shash_desc *desc)
225 struct sha256_ctx *sctx = shash_desc_ctx(desc);
226 sctx->state[0] = SHA224_H0;
227 sctx->state[1] = SHA224_H1;
228 sctx->state[2] = SHA224_H2;
229 sctx->state[3] = SHA224_H3;
230 sctx->state[4] = SHA224_H4;
231 sctx->state[5] = SHA224_H5;
232 sctx->state[6] = SHA224_H6;
233 sctx->state[7] = SHA224_H7;
234 sctx->count[0] = 0;
235 sctx->count[1] = 0;
237 return 0;
240 static int sha256_init(struct shash_desc *desc)
242 struct sha256_ctx *sctx = shash_desc_ctx(desc);
243 sctx->state[0] = SHA256_H0;
244 sctx->state[1] = SHA256_H1;
245 sctx->state[2] = SHA256_H2;
246 sctx->state[3] = SHA256_H3;
247 sctx->state[4] = SHA256_H4;
248 sctx->state[5] = SHA256_H5;
249 sctx->state[6] = SHA256_H6;
250 sctx->state[7] = SHA256_H7;
251 sctx->count[0] = sctx->count[1] = 0;
253 return 0;
256 static int sha256_update(struct shash_desc *desc, const u8 *data,
257 unsigned int len)
259 struct sha256_ctx *sctx = shash_desc_ctx(desc);
260 unsigned int i, index, part_len;
262 /* Compute number of bytes mod 128 */
263 index = (unsigned int)((sctx->count[0] >> 3) & 0x3f);
265 /* Update number of bits */
266 if ((sctx->count[0] += (len << 3)) < (len << 3)) {
267 sctx->count[1]++;
268 sctx->count[1] += (len >> 29);
271 part_len = 64 - index;
273 /* Transform as many times as possible. */
274 if (len >= part_len) {
275 memcpy(&sctx->buf[index], data, part_len);
276 sha256_transform(sctx->state, sctx->buf);
278 for (i = part_len; i + 63 < len; i += 64)
279 sha256_transform(sctx->state, &data[i]);
280 index = 0;
281 } else {
282 i = 0;
285 /* Buffer remaining input */
286 memcpy(&sctx->buf[index], &data[i], len-i);
288 return 0;
291 static int sha256_final(struct shash_desc *desc, u8 *out)
293 struct sha256_ctx *sctx = shash_desc_ctx(desc);
294 __be32 *dst = (__be32 *)out;
295 __be32 bits[2];
296 unsigned int index, pad_len;
297 int i;
298 static const u8 padding[64] = { 0x80, };
300 /* Save number of bits */
301 bits[1] = cpu_to_be32(sctx->count[0]);
302 bits[0] = cpu_to_be32(sctx->count[1]);
304 /* Pad out to 56 mod 64. */
305 index = (sctx->count[0] >> 3) & 0x3f;
306 pad_len = (index < 56) ? (56 - index) : ((64+56) - index);
307 sha256_update(desc, padding, pad_len);
309 /* Append length (before padding) */
310 sha256_update(desc, (const u8 *)bits, sizeof(bits));
312 /* Store state in digest */
313 for (i = 0; i < 8; i++)
314 dst[i] = cpu_to_be32(sctx->state[i]);
316 /* Zeroize sensitive information. */
317 memset(sctx, 0, sizeof(*sctx));
319 return 0;
322 static int sha224_final(struct shash_desc *desc, u8 *hash)
324 u8 D[SHA256_DIGEST_SIZE];
326 sha256_final(desc, D);
328 memcpy(hash, D, SHA224_DIGEST_SIZE);
329 memset(D, 0, SHA256_DIGEST_SIZE);
331 return 0;
334 static struct shash_alg sha256 = {
335 .digestsize = SHA256_DIGEST_SIZE,
336 .init = sha256_init,
337 .update = sha256_update,
338 .final = sha256_final,
339 .descsize = sizeof(struct sha256_ctx),
340 .base = {
341 .cra_name = "sha256",
342 .cra_driver_name= "sha256-generic",
343 .cra_flags = CRYPTO_ALG_TYPE_SHASH,
344 .cra_blocksize = SHA256_BLOCK_SIZE,
345 .cra_module = THIS_MODULE,
349 static struct shash_alg sha224 = {
350 .digestsize = SHA224_DIGEST_SIZE,
351 .init = sha224_init,
352 .update = sha256_update,
353 .final = sha224_final,
354 .descsize = sizeof(struct sha256_ctx),
355 .base = {
356 .cra_name = "sha224",
357 .cra_driver_name= "sha224-generic",
358 .cra_flags = CRYPTO_ALG_TYPE_SHASH,
359 .cra_blocksize = SHA224_BLOCK_SIZE,
360 .cra_module = THIS_MODULE,
364 static int __init sha256_generic_mod_init(void)
366 int ret = 0;
368 ret = crypto_register_shash(&sha224);
370 if (ret < 0)
371 return ret;
373 ret = crypto_register_shash(&sha256);
375 if (ret < 0)
376 crypto_unregister_shash(&sha224);
378 return ret;
381 static void __exit sha256_generic_mod_fini(void)
383 crypto_unregister_shash(&sha224);
384 crypto_unregister_shash(&sha256);
387 module_init(sha256_generic_mod_init);
388 module_exit(sha256_generic_mod_fini);
390 MODULE_LICENSE("GPL");
391 MODULE_DESCRIPTION("SHA-224 and SHA-256 Secure Hash Algorithm");
393 MODULE_ALIAS("sha224");
394 MODULE_ALIAS("sha256");