Mercurial > libavutil.hg
annotate sha1.c @ 302:901256787a89 libavutil
factorize VARIANT2 (smaller and slower)
author | michael |
---|---|
date | Tue, 13 Mar 2007 01:13:38 +0000 |
parents | b1c6f2421786 |
children | 5b46b6b71fe2 |
rev | line source |
---|---|
288 | 1 // SHA-1 code Copyright 2007 Michael Niedermayer <michaelni@gmx.at> |
2 // license LGPL | |
3 // based on public domain SHA-1 code by Steve Reid <steve@edmweb.com> | |
4 | |
5 #include "common.h" | |
6 #include "sha1.h" | |
7 | |
/* Hashing context shared by av_sha1_init(), av_sha1_update() and av_sha1_final(). */
8 typedef struct AVSHA1 { | |
/* five 32-bit words of running hash state, seeded by av_sha1_init() */
9 uint32_t state[5]; | |
/* total number of bytes passed to av_sha1_update() so far */
10 uint64_t count; | |
/* input bytes that do not yet make up a full 64-byte block */
11 uint8_t buffer[64]; | |
12 } AVSHA1; | |
13 | |
/* Rotate value left by bits; written for 32-bit unsigned operands and 0 < bits < 32. */
#define rol(value, bits) (((value) << (bits)) | ((value) >> (32 - (bits))))

/*
 * Round expressions for the code path that expands the whole message schedule
 * into block[] up front. Each one yields the new working word; none of them
 * modifies its arguments. They are pure expressions (no trailing semicolon),
 * so they can be used on the right-hand side of an assignment.
 * A uint32_t array named block must be in scope where they are used.
 */
#define R0b(v,w,x,y,z,i) ((z)+(((w)&((x)^(y)))^(y))            +block[i]+0x5A827999+rol(v,5))
#define R2b(v,w,x,y,z,i) ((z)+( (w)^(x)       ^(y))            +block[i]+0x6ED9EBA1+rol(v,5))
#define R3b(v,w,x,y,z,i) ((z)+((((w)|(x))&(y))|((w)&(x)))      +block[i]+0x8F1BBCDC+rol(v,5))
#define R4b(v,w,x,y,z,i) ((z)+( (w)^(x)       ^(y))            +block[i]+0xCA62C1D6+rol(v,5))

/* blk0: convert input word i from big-endian to host order in place and yield it. */
#define blk0(i) (block[i] = be2me_32(block[i]))
/* blk: compute schedule word i (i >= 16) from earlier words, store it in block[] and yield it. */
#define blk(i)  (block[i] = rol(block[(i)-3]^block[(i)-8]^block[(i)-14]^block[(i)-16],1))

/*
 * Round statements for the unrolled code path: add the round function, the
 * schedule word, the round constant and rol(v,5) to z, then rotate w by 30.
 * R0 reads raw input words (blk0); R1 uses the same round function as R0 but
 * takes its word from the schedule recurrence (blk), as do R2..R4.
 * Each macro is wrapped in do { } while (0) so that "R0(...);" is exactly one
 * statement, also inside an unbraced if/else.
 */
#define R0(v,w,x,y,z,i) do { (z)+=(((w)&((x)^(y)))^(y))       +blk0(i)+0x5A827999+rol(v,5); (w)=rol(w,30); } while (0)
#define R1(v,w,x,y,z,i) do { (z)+=(((w)&((x)^(y)))^(y))       +blk (i)+0x5A827999+rol(v,5); (w)=rol(w,30); } while (0)
#define R2(v,w,x,y,z,i) do { (z)+=( (w)^(x)       ^(y))       +blk (i)+0x6ED9EBA1+rol(v,5); (w)=rol(w,30); } while (0)
#define R3(v,w,x,y,z,i) do { (z)+=((((w)|(x))&(y))|((w)&(x))) +blk (i)+0x8F1BBCDC+rol(v,5); (w)=rol(w,30); } while (0)
#define R4(v,w,x,y,z,i) do { (z)+=( (w)^(x)       ^(y))       +blk (i)+0xCA62C1D6+rol(v,5); (w)=rol(w,30); } while (0)
288 | 30 |
31 /* Hash a single 512-bit block. This is the core of the algorithm. */ | |
32 | |
299 | 33 //#define VARIANT1 |
34 //#define VARIANT2 | |
35 | |
/**
 * Hash one 64-byte block into the running SHA-1 state.
 *
 * Three implementations are selectable at compile time:
 *  - VARIANT1: schedule expanded up front, working words kept in the sliding
 *              window array s[] (round n reads s[n..n+4], writes s[n+5]);
 *  - VARIANT2: schedule expanded up front, one generic loop over all 80 rounds;
 *  - default:  rounds unrolled five at a time through the R0..R4 macros, which
 *              byte-swap / expand the schedule words as they are consumed.
 *
 * @param state  five 32-bit chaining words, updated in place
 * @param buffer 64 input bytes; no particular alignment is required
 */
static void transform(uint32_t state[5], uint8_t buffer[64]){
    uint32_t block[80];
    unsigned int i;
#ifdef VARIANT1
    uint32_t s[85];
#else
    uint32_t a, b, c, d, e;
#endif

    /* Copy instead of casting buffer to uint32_t*: callers may pass unaligned data. */
    memcpy(block, buffer, 64);
#if defined (VARIANT1) || defined (VARIANT2)
    for(i=0; i<16; i++)
        block[i]= be2me_32(block[i]);
    for(;i<80; i++)
        block[i]= rol(block[i-3]^block[i-8]^block[i-14]^block[i-16],1);
#endif

#ifdef VARIANT1
    /* the window is stored in reverse order: s[i+4] plays the role of "a" */
    s[0]= state[4];
    s[1]= state[3];
    s[2]= state[2];
    s[3]= state[1];
    s[4]= state[0];
    for(i=0; i<20; i++){
        s[5+i]= R0b(s[4+i], s[3+i], s[2+i], s[1+i], s[i], i);
        s[3+i]= rol(s[3+i],30);
    }
    for(; i<40; i++){
        s[5+i]= R2b(s[4+i], s[3+i], s[2+i], s[1+i], s[i], i);
        s[3+i]= rol(s[3+i],30);
    }
    for(; i<60; i++){
        s[5+i]= R3b(s[4+i], s[3+i], s[2+i], s[1+i], s[i], i);
        s[3+i]= rol(s[3+i],30);
    }
    for(; i<80; i++){
        s[5+i]= R4b(s[4+i], s[3+i], s[2+i], s[1+i], s[i], i);
        s[3+i]= rol(s[3+i],30);
    }
    state[0] += s[84];
    state[1] += s[83];
    state[2] += s[82];
    state[3] += s[81];
    state[4] += s[80];
#else
    a = state[0];
    b = state[1];
    c = state[2];
    d = state[3];
    e = state[4];
#ifdef VARIANT2
    for(i=0; i<80; i++){
        /* unsigned so that the sum wraps modulo 2^32 */
        uint32_t t= e+block[i]+rol(a,5);
        if(i<40){
            if(i<20) t+= ((b&(c^d))^d)    +0x5A827999;
            else     t+= ( b^c     ^d)    +0x6ED9EBA1;
        }else{
            if(i<60) t+= (((b|c)&d)|(b&c))+0x8F1BBCDC;
            else     t+= ( b^c     ^d)    +0xCA62C1D6;
        }
        e= d;
        d= c;
        c= rol(b,30);
        b= a;
        a= t;
    }
#else
    /* rounds 0..15 consume raw input words (R0), 16..19 the first expanded ones (R1) */
    for(i=0; i<15; i+=5){
        R0(a,b,c,d,e,0+i); R0(e,a,b,c,d,1+i); R0(d,e,a,b,c,2+i); R0(c,d,e,a,b,3+i); R0(b,c,d,e,a,4+i);
    }
    R0(a,b,c,d,e,15); R1(e,a,b,c,d,16); R1(d,e,a,b,c,17); R1(c,d,e,a,b,18); R1(b,c,d,e,a,19);
    for(i=20; i<40; i+=5){
        R2(a,b,c,d,e,0+i); R2(e,a,b,c,d,1+i); R2(d,e,a,b,c,2+i); R2(c,d,e,a,b,3+i); R2(b,c,d,e,a,4+i);
    }
    for(; i<60; i+=5){
        R3(a,b,c,d,e,0+i); R3(e,a,b,c,d,1+i); R3(d,e,a,b,c,2+i); R3(c,d,e,a,b,3+i); R3(b,c,d,e,a,4+i);
    }
    for(; i<80; i+=5){
        R4(a,b,c,d,e,0+i); R4(e,a,b,c,d,1+i); R4(d,e,a,b,c,2+i); R4(c,d,e,a,b,3+i); R4(b,c,d,e,a,4+i);
    }
#endif
    state[0] += a;
    state[1] += b;
    state[2] += c;
    state[3] += d;
    state[4] += e;
#endif
}
126 | |
127 void av_sha1_init(AVSHA1* context){ | |
128 context->state[0] = 0x67452301; | |
129 context->state[1] = 0xEFCDAB89; | |
130 context->state[2] = 0x98BADCFE; | |
131 context->state[3] = 0x10325476; | |
132 context->state[4] = 0xC3D2E1F0; | |
133 context->count = 0; | |
134 } | |
135 | |
136 void av_sha1_update(AVSHA1* context, uint8_t* data, unsigned int len){ | |
137 unsigned int i, j; | |
138 | |
294
97f5321b12ad
make count count bytes not bits (this is simpler and leads to a very slightly smaller object file)
michael
parents:
293
diff
changeset
|
139 j = context->count & 63; |
97f5321b12ad
make count count bytes not bits (this is simpler and leads to a very slightly smaller object file)
michael
parents:
293
diff
changeset
|
140 context->count += len; |
288 | 141 if ((j + len) > 63) { |
142 memcpy(&context->buffer[j], data, (i = 64-j)); | |
143 transform(context->state, context->buffer); | |
144 for ( ; i + 63 < len; i += 64) { | |
145 transform(context->state, &data[i]); | |
146 } | |
147 } | |
148 else i = 0; | |
149 memcpy(&context->buffer[j], &data[i], len - i); | |
150 } | |
151 | |
152 void av_sha1_final(AVSHA1* context, uint8_t digest[20]){ | |
153 int i; | |
294
97f5321b12ad
make count count bytes not bits (this is simpler and leads to a very slightly smaller object file)
michael
parents:
293
diff
changeset
|
154 uint64_t finalcount= be2me_64(context->count<<3); |
288 | 155 |
156 av_sha1_update(context, "\200", 1); | |
294
97f5321b12ad
make count count bytes not bits (this is simpler and leads to a very slightly smaller object file)
michael
parents:
293
diff
changeset
|
157 while ((context->count & 63) != 56) { |
300 | 158 av_sha1_update(context, "", 1); |
288 | 159 } |
160 av_sha1_update(context, &finalcount, 8); /* Should cause a transform() */ | |
295 | 161 for(i=0; i<5; i++) |
162 ((uint32_t*)digest)[i]= be2me_32(context->state[i]); | |
288 | 163 } |
164 | |
289 | 165 // use the following to test |
292 | 166 // gcc -DTEST -DHAVE_AV_CONFIG_H -I.. sha1.c -O2 -W -Wall -o sha1 && time ./sha1 |
288 | 167 #ifdef TEST |
168 #include <stdio.h> | |
169 #undef printf | |
170 | |
171 int main(){ | |
172 int i, k; | |
173 AVSHA1 context; | |
174 unsigned char digest[20]; | |
175 | |
176 for(k=0; k<3; k++){ | |
177 av_sha1_init(&context); | |
178 if(k==0) | |
179 av_sha1_update(&context, "abc", 3); | |
180 else if(k==1) | |
181 av_sha1_update(&context, "abcdbcdecdefdefgefghfghighijhijkijkljklmklmnlmnomnopnopq", 56); | |
182 else | |
183 for(i=0; i<1000*1000; i++) | |
184 av_sha1_update(&context, "a", 1); | |
185 av_sha1_final(&context, digest); | |
186 for (i = 0; i < 20; i++) | |
187 printf("%02X", digest[i]); | |
188 putchar('\n'); | |
189 } | |
190 //Test Vectors (from FIPS PUB 180-1) | |
191 printf("A9993E36 4706816A BA3E2571 7850C26C 9CD0D89D\n" | |
192 "84983E44 1C3BD26E BAAE4AA1 F95129E5 E54670F1\n" | |
193 "34AA973C D4C4DAA4 F61EEB2B DBAD2731 6534016F\n"); | |
194 | |
195 return 0; | |
196 } | |
197 #endif |