2 * Author......: Jens Steube <jens.steube@gmail.com>
6 #if defined _MD4_ || defined _DCC2_ || defined _NETNTLMV2_ || defined _KRB5PA_ || defined _MS_DRSR_
11 #if __CUDA_ARCH__ >= 500
/*
 * MD4 round functions: three-input bitwise primitives.
 * Two alternative definition sets follow; the preprocessor lines that choose
 * between them are only partly visible in this view.
 *
 * LUT-based set: each function forwards to a lut3_XX helper defined
 * elsewhere. NOTE(review): the hex suffix presumably is the 8-bit truth table
 * of the operation (x = 0xf0, y = 0xcc, z = 0xaa gives 0xca for select,
 * 0xe8 for majority, 0x96 for xor, matching the generic set below) - confirm
 * against the helper definitions.
 */
12 #define MD4_F(x,y,z) lut3_ca ((x), (y), (z))
13 #define MD4_G(x,y,z) lut3_e8 ((x), (y), (z))
14 #define MD4_H(x,y,z) lut3_96 ((x), (y), (z))
15 #define MD4_H1(x,y,z) lut3_96 ((x), (y), (z))
16 #define MD4_H2(x,y,z) lut3_96 ((x), (y), (z))
/*
 * Generic set, plain bitwise operators:
 *   MD4_F  - per-bit select: y where x is set, z where x is clear
 *   MD4_G  - per-bit majority of x, y and z
 *   MD4_H  - x ^ y ^ z
 *   MD4_H1 - same value as MD4_H, and additionally stores (x ^ y) in a
 *            variable named tmp2 that must exist at the expansion site
 *   MD4_H2 - x ^ tmp2; reads tmp2 and ignores its y and z arguments
 * NOTE(review): MD4_H2 looks intended to follow an MD4_H1 whose stored
 * (x ^ y) equals this call's (y ^ z) - confirm against the step ordering.
 * MD4_F and MD4_G expand their arguments more than once, so arguments should
 * be free of side effects.
 */
18 #define MD4_F(x,y,z) (((x) & (y)) | ((~(x)) & (z)))
19 #define MD4_G(x,y,z) (((x) & (y)) | ((x) & (z)) | ((y) & (z)))
20 #define MD4_H(x,y,z) ((x) ^ (y) ^ (z))
21 #define MD4_H1(x,y,z) ((tmp2 = (x) ^ (y)) ^ (z))
22 #define MD4_H2(x,y,z) ((x) ^ tmp2)
/*
 * "o" variants of MD4_F / MD4_G, two alternative definition pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), MD4_Fo is the per-bit select
 * x ? y : z and MD4_Go is the majority (y where x and z differ, x where they
 * agree) - confirm against the bitselect actually in scope.
 */
26 #define MD4_Fo(x,y,z) (bitselect ((z), (y), (x)))
27 #define MD4_Go(x,y,z) (bitselect ((x), (y), ((x) ^ (z))))
/* Fallback pair: forwards unchanged to MD4_F / MD4_G. */
29 #define MD4_Fo(x,y,z) (MD4_F((x), (y), (z)))
30 #define MD4_Go(x,y,z) (MD4_G((x), (y), (z)))
33 #define MD4_STEP(f,a,b,c,d,x,K,s) \
41 #define MD4_STEP0(f,a,b,c,d,K,s) \
50 #if defined _MD5_ || defined _MD5H_ || defined _SAPB_ || defined _OLDOFFICE01_ || defined _WPA_ || defined _MD5_SHA1_ || defined _SHA1_MD5_ || defined _NETNTLMV2_ || defined _KRB5PA_ || defined _PBKDF2_MD5_
55 #if __CUDA_ARCH__ >= 500
/*
 * MD5 round functions F, G and H (plus the H1/H2 pair).
 * Two alternative definition sets follow; the preprocessor lines that choose
 * between them are only partly visible in this view.
 *
 * LUT-based set: forwards to lut3_XX helpers defined elsewhere.
 * NOTE(review): the suffixes match the truth tables of the generic set below
 * with x = 0xf0, y = 0xcc, z = 0xaa (0xca, 0xe4, 0x96) - confirm that this is
 * how the helpers interpret them.
 */
56 #define MD5_F(x,y,z) lut3_ca ((x), (y), (z))
57 #define MD5_G(x,y,z) lut3_e4 ((x), (y), (z))
58 #define MD5_H(x,y,z) lut3_96 ((x), (y), (z))
59 #define MD5_H1(x,y,z) lut3_96 ((x), (y), (z))
60 #define MD5_H2(x,y,z) lut3_96 ((x), (y), (z))
/*
 * Generic set:
 *   MD5_F  - per-bit select x ? y : z, written as z ^ (x & (y ^ z))
 *   MD5_G  - per-bit select z ? x : y, written as y ^ (z & (x ^ y))
 *   MD5_H  - x ^ y ^ z
 *   MD5_H1 - same value as MD5_H, and additionally stores (x ^ y) in a
 *            variable named tmp2 that must exist at the expansion site
 *   MD5_H2 - x ^ tmp2; reads tmp2 and ignores its y and z arguments
 * MD5_F and MD5_G expand one argument twice, so arguments should be free of
 * side effects.
 */
62 #define MD5_F(x,y,z) ((z) ^ ((x) & ((y) ^ (z))))
63 #define MD5_G(x,y,z) ((y) ^ ((z) & ((x) ^ (y))))
64 #define MD5_H(x,y,z) ((x) ^ (y) ^ (z))
65 #define MD5_H1(x,y,z) ((tmp2 = (x) ^ (y)) ^ (z))
66 #define MD5_H2(x,y,z) ((x) ^ tmp2)
/*
 * MD5 round function I, three alternative definitions (the directives that
 * select between them are only partly visible in this view).
 *
 * bitselect form. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), this is (x | ~z) ^ y, the same
 * value as the generic form below - confirm.
 */
70 #define MD5_I(x,y,z) (bitselect (0xffffffffU, (x), (z)) ^ (y))
72 #if __CUDA_ARCH__ >= 500
/*
 * LUT form; lut3_39 is defined elsewhere. NOTE(review): 0x39 is the truth
 * table of y ^ (x | ~z) with x = 0xf0, y = 0xcc, z = 0xaa - confirm that the
 * helper uses this convention.
 */
73 #define MD5_I(x,y,z) lut3_39 ((x), (y), (z))
/* Generic form: y ^ (x | ~z). */
75 #define MD5_I(x,y,z) ((y) ^ ((x) | ~(z)))
/*
 * "o" variants of MD5_F / MD5_G, two alternative definition pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), MD5_Fo is x ? y : z and MD5_Go is
 * z ? x : y, i.e. the same values as the generic MD5_F / MD5_G - confirm.
 */
80 #define MD5_Fo(x,y,z) (bitselect ((z), (y), (x)))
81 #define MD5_Go(x,y,z) (bitselect ((y), (x), (z)))
/* Fallback pair: forwards unchanged to MD5_F / MD5_G. */
83 #define MD5_Fo(x,y,z) (MD5_F((x), (y), (z)))
84 #define MD5_Go(x,y,z) (MD5_G((x), (y), (z)))
87 #define MD5_STEP(f,a,b,c,d,x,K,s) \
96 #define MD5_STEP0(f,a,b,c,d,K,s) \
105 #if defined _SHA1_ || defined _SAPG_ || defined _OFFICE2007_ || defined _OFFICE2010_ || defined _OLDOFFICE34_ || defined _ANDROIDFDE_ || defined _DCC2_ || defined _WPA_ || defined _MD5_SHA1_ || defined _SHA1_MD5_ || defined _PSAFE2_ || defined _LOTUS8_ || defined _PBKDF2_SHA1_ || defined _RAR3_ || defined _SHA256_SHA1_
111 #if __CUDA_ARCH__ >= 500
/*
 * SHA-1 round functions, two alternative definition sets (the directives
 * that select between them are only partly visible in this view).
 *
 * LUT-based set: forwards to lut3_XX helpers defined elsewhere.
 * NOTE(review): suffixes 0xca / 0x96 / 0xe8 match the truth tables of the
 * generic set below with x = 0xf0, y = 0xcc, z = 0xaa - confirm that this is
 * the helpers' convention.
 */
112 #define SHA1_F0(x,y,z) lut3_ca ((x), (y), (z))
113 #define SHA1_F1(x,y,z) lut3_96 ((x), (y), (z))
114 #define SHA1_F2(x,y,z) lut3_e8 ((x), (y), (z))
/*
 * Generic set:
 *   SHA1_F0 - per-bit select x ? y : z, written as z ^ (x & (y ^ z))
 *   SHA1_F1 - x ^ y ^ z
 *   SHA1_F2 - per-bit majority, written as (x & y) | (z & (x ^ y))
 * Arguments are expanded more than once; keep them free of side effects.
 */
116 #define SHA1_F0(x,y,z) ((z) ^ ((x) & ((y) ^ (z))))
117 #define SHA1_F1(x,y,z) ((x) ^ (y) ^ (z))
118 #define SHA1_F2(x,y,z) (((x) & (y)) | ((z) & ((x) ^ (y))))
/*
 * "o" variants of SHA1_F0 / SHA1_F2, two alternative definition pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), SHA1_F0o is x ? y : z and
 * SHA1_F2o is the majority of x, y, z - confirm.
 */
122 #define SHA1_F0o(x,y,z) (bitselect ((z), (y), (x)))
123 #define SHA1_F2o(x,y,z) (bitselect ((x), (y), ((x) ^ (z))))
/* Fallback pair: forwards unchanged to SHA1_F0 / SHA1_F2. */
125 #define SHA1_F0o(x,y,z) (SHA1_F0 ((x), (y), (z)))
126 #define SHA1_F2o(x,y,z) (SHA1_F2 ((x), (y), (z)))
129 #define SHA1_STEP(f,a,b,c,d,e,x) \
134 e += rotl32 (a, 5u); \
135 b = rotl32 (b, 30u); \
138 #define SHA1_STEP0(f,a,b,c,d,e,x) \
142 e += rotl32 (a, 5u); \
143 b = rotl32 (b, 30u); \
146 #define SHA1_STEPX(f,a,b,c,d,e,x) \
150 e += rotl32 (a, 5u); \
151 b = rotl32 (b, 30u); \
154 #define SHA1_STEP_PE(f,a,b,c,d,e,x) \
158 e += rotl32 (a, 5u); \
161 #define SHA1_STEP_PB(f,a,b,c,d,e,x) \
164 b = rotl32 (b, 30u); \
168 #if defined _SHA256_ || defined _PDF17L8_ || defined _SEVEN_ZIP_ || defined _ANDROIDFDE_ || defined _CLOUDKEY_ || defined _SCRYPT_ || defined _PBKDF2_SHA256_ || defined _SHA256_SHA1_ || defined _MS_DRSR_
/* Plain right shift of x by n positions using the >> operator. */
173 #define SHIFT_RIGHT_32(x,n) ((x) >> (n))
/*
 * SHA256_S0 .. SHA256_S3: XOR of three rotated/shifted copies of x.
 * rotl32 is defined elsewhere. NOTE(review): if rotl32 (v, n) is a 32-bit
 * left rotate (so rotl by n equals rotr by 32 - n), these correspond to the
 * FIPS 180-4 functions
 *   S0 = sigma0 (rotr 7, rotr 18, shr 3)
 *   S1 = sigma1 (rotr 17, rotr 19, shr 10)
 *   S2 = Sigma0 (rotr 2, rotr 13, rotr 22)
 *   S3 = Sigma1 (rotr 6, rotr 11, rotr 25)
 * - confirm against the rotl32 definition.
 * x is expanded three times; keep it free of side effects.
 */
175 #define SHA256_S0(x) (rotl32 ((x), 25u) ^ rotl32 ((x), 14u) ^ SHIFT_RIGHT_32 ((x), 3u))
176 #define SHA256_S1(x) (rotl32 ((x), 15u) ^ rotl32 ((x), 13u) ^ SHIFT_RIGHT_32 ((x), 10u))
177 #define SHA256_S2(x) (rotl32 ((x), 30u) ^ rotl32 ((x), 19u) ^ rotl32 ((x), 10u))
178 #define SHA256_S3(x) (rotl32 ((x), 26u) ^ rotl32 ((x), 21u) ^ rotl32 ((x), 7u))
180 #if __CUDA_ARCH__ >= 500
/*
 * SHA-256 three-input functions, two alternative definition sets (the
 * directives that select between them are only partly visible in this view).
 *
 * LUT-based set: forwards to lut3_XX helpers defined elsewhere.
 * NOTE(review): 0xe8 / 0xca match the truth tables of the generic set below
 * with x = 0xf0, y = 0xcc, z = 0xaa - confirm the helpers' convention.
 */
181 #define SHA256_F0(x,y,z) lut3_e8 ((x), (y), (z))
182 #define SHA256_F1(x,y,z) lut3_ca ((x), (y), (z))
/*
 * Generic set:
 *   SHA256_F0 - per-bit majority, written as (x & y) | (z & (x ^ y))
 *   SHA256_F1 - per-bit select x ? y : z, written as z ^ (x & (y ^ z))
 * Note that here F0 is the majority and F1 the select; the SHA384/SHA512
 * sections of this file use the opposite numbering.
 */
184 #define SHA256_F0(x,y,z) (((x) & (y)) | ((z) & ((x) ^ (y))))
185 #define SHA256_F1(x,y,z) ((z) ^ ((x) & ((y) ^ (z))))
/*
 * "o" variants of SHA256_F0 / SHA256_F1, two alternative definition pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), SHA256_F0o is the majority and
 * SHA256_F1o is x ? y : z - confirm.
 */
189 #define SHA256_F0o(x,y,z) (bitselect ((x), (y), ((x) ^ (z))))
190 #define SHA256_F1o(x,y,z) (bitselect ((z), (y), (x)))
/* Fallback pair: forwards unchanged to SHA256_F0 / SHA256_F1. */
192 #define SHA256_F0o(x,y,z) (SHA256_F0 ((x), (y), (z)))
193 #define SHA256_F1o(x,y,z) (SHA256_F1 ((x), (y), (z)))
196 #define SHA256_STEP(F0,F1,a,b,c,d,e,f,g,h,x,K) \
200 h += SHA256_S3 (e); \
203 h += SHA256_S2 (a); \
/*
 * Combines four words as SHA256_S1 (x) + y + SHA256_S0 (z) + w.
 * NOTE(review): this looks like the SHA-256 message-schedule recurrence -
 * confirm at the call sites.
 *
 * y and w are parenthesised so that an argument containing an operator of
 * lower precedence than '+' (shift, &, ^, |, ?:) is still added as one unit.
 * x and z are already parenthesised inside SHA256_S1 / SHA256_S0.
 */
#define SHA256_EXPAND(x,y,z,w) (SHA256_S1 (x) + (y) + SHA256_S0 (z) + (w))
211 #if defined _SHA384_ || defined _PDF17L8_
/* Plain right shift of x by n positions using the >> operator. */
216 #define SHIFT_RIGHT_64(x,n) ((x) >> (n))
/*
 * SHA384_S0 .. SHA384_S3: XOR of three rotated/shifted copies of x.
 * rotr64 is defined elsewhere. NOTE(review): if rotr64 (v, n) is a 64-bit
 * right rotate, these correspond to the FIPS 180-4 functions
 *   S0 = Sigma0 (28, 34, 39)      S1 = Sigma1 (14, 18, 41)
 *   S2 = sigma0 (1, 8, shr 7)     S3 = sigma1 (19, 61, shr 6)
 * - confirm against the rotr64 definition.
 * x is expanded three times; keep it free of side effects.
 */
218 #define SHA384_S0(x) (rotr64 ((x), 28) ^ rotr64 ((x), 34) ^ rotr64 ((x), 39))
219 #define SHA384_S1(x) (rotr64 ((x), 14) ^ rotr64 ((x), 18) ^ rotr64 ((x), 41))
220 #define SHA384_S2(x) (rotr64 ((x), 1) ^ rotr64 ((x), 8) ^ SHIFT_RIGHT_64 ((x), 7))
221 #define SHA384_S3(x) (rotr64 ((x), 19) ^ rotr64 ((x), 61) ^ SHIFT_RIGHT_64 ((x), 6))
/*
 *   SHA384_F0 - per-bit select x ? y : z, written as z ^ (x & (y ^ z))
 *   SHA384_F1 - per-bit majority, written as (x & y) | (z & (x ^ y))
 * The numbering is the opposite of SHA256_F0 / SHA256_F1 in this file.
 */
223 #define SHA384_F0(x,y,z) ((z) ^ ((x) & ((y) ^ (z))))
224 #define SHA384_F1(x,y,z) (((x) & (y)) | ((z) & ((x) ^ (y))))
/*
 * "o" variants of SHA384_F0 / SHA384_F1, two alternative definition pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), SHA384_F0o is x ? y : z and
 * SHA384_F1o is the majority - confirm.
 */
227 #define SHA384_F0o(x,y,z) (bitselect ((z), (y), (x)))
228 #define SHA384_F1o(x,y,z) (bitselect ((x), (y), ((x) ^ (z))))
/* Fallback pair: forwards unchanged to SHA384_F0 / SHA384_F1. */
230 #define SHA384_F0o(x,y,z) (SHA384_F0 ((x), (y), (z)))
231 #define SHA384_F1o(x,y,z) (SHA384_F1 ((x), (y), (z)))
234 #define SHA384_STEP(F0,F1,a,b,c,d,e,f,g,h,x,K) \
240 temp0 += SHA384_S1 (e); \
241 temp0 += F0 (e, f, g); \
/*
 * Combines four words as SHA384_S3 (x) + y + SHA384_S2 (z) + w.
 * NOTE(review): this looks like the SHA-384 message-schedule recurrence -
 * confirm at the call sites.
 *
 * y and w are parenthesised so that an argument containing an operator of
 * lower precedence than '+' (shift, &, ^, |, ?:) is still added as one unit.
 * x and z are already parenthesised inside SHA384_S3 / SHA384_S2.
 */
#define SHA384_EXPAND(x,y,z,w) (SHA384_S3 (x) + (y) + SHA384_S2 (z) + (w))
251 #if defined _SHA512_ || defined _CLOUDKEY_ || defined _OFFICE2013_ || defined _PDF17L8_ || defined _PBKDF2_SHA512_
/*
 * Plain right shift of x by n positions using the >> operator.
 * Token-for-token the same replacement as the SHIFT_RIGHT_64 in the SHA384
 * section of this file.
 */
256 #define SHIFT_RIGHT_64(x,n) ((x) >> (n))
/*
 * SHA512_S0 .. SHA512_S3: XOR of three rotated/shifted copies of x, using
 * the same constants as SHA384_S0 .. SHA384_S3.
 * rotr64 is defined elsewhere. NOTE(review): if rotr64 (v, n) is a 64-bit
 * right rotate, these correspond to the FIPS 180-4 functions
 *   S0 = Sigma0 (28, 34, 39)      S1 = Sigma1 (14, 18, 41)
 *   S2 = sigma0 (1, 8, shr 7)     S3 = sigma1 (19, 61, shr 6)
 * - confirm against the rotr64 definition.
 * x is expanded three times; keep it free of side effects.
 */
258 #define SHA512_S0(x) (rotr64 ((x), 28) ^ rotr64 ((x), 34) ^ rotr64 ((x), 39))
259 #define SHA512_S1(x) (rotr64 ((x), 14) ^ rotr64 ((x), 18) ^ rotr64 ((x), 41))
260 #define SHA512_S2(x) (rotr64 ((x), 1) ^ rotr64 ((x), 8) ^ SHIFT_RIGHT_64 ((x), 7))
261 #define SHA512_S3(x) (rotr64 ((x), 19) ^ rotr64 ((x), 61) ^ SHIFT_RIGHT_64 ((x), 6))
/*
 *   SHA512_F0 - per-bit select x ? y : z, written as z ^ (x & (y ^ z))
 *   SHA512_F1 - per-bit majority, written as (x & y) | (z & (x ^ y))
 * The numbering is the opposite of SHA256_F0 / SHA256_F1 in this file.
 */
263 #define SHA512_F0(x,y,z) ((z) ^ ((x) & ((y) ^ (z))))
264 #define SHA512_F1(x,y,z) (((x) & (y)) | ((z) & ((x) ^ (y))))
/*
 * "o" variants of SHA512_F0 / SHA512_F1, two alternative definition pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), SHA512_F0o is x ? y : z and
 * SHA512_F1o is the majority - confirm.
 */
267 #define SHA512_F0o(x,y,z) (bitselect ((z), (y), (x)))
268 #define SHA512_F1o(x,y,z) (bitselect ((x), (y), ((x) ^ (z))))
/* Fallback pair: forwards unchanged to SHA512_F0 / SHA512_F1. */
270 #define SHA512_F0o(x,y,z) (SHA512_F0 ((x), (y), (z)))
271 #define SHA512_F1o(x,y,z) (SHA512_F1 ((x), (y), (z)))
274 #define SHA512_STEP(F0,F1,a,b,c,d,e,f,g,h,x,K) \
280 temp0 += SHA512_S1 (e); \
281 temp0 += F0 (e, f, g); \
/*
 * Combines four words as SHA512_S3 (x) + y + SHA512_S2 (z) + w.
 * NOTE(review): this looks like the SHA-512 message-schedule recurrence -
 * confirm at the call sites.
 *
 * y and w are parenthesised so that an argument containing an operator of
 * lower precedence than '+' (shift, &, ^, |, ?:) is still added as one unit.
 * x and z are already parenthesised inside SHA512_S3 / SHA512_S2.
 */
#define SHA512_EXPAND(x,y,z,w) (SHA512_S3 (x) + (y) + SHA512_S2 (z) + (w))
/*
 * "_WO" variants of SHA512_S2 / SHA512_S3: same shift constants (7 and 6),
 * but built on rotate () with a count of 64 - n instead of rotr64 () with n.
 * rotate is defined elsewhere. NOTE(review): presumably a 64-bit left
 * rotate, which would make these equal in value to SHA512_S2 / SHA512_S3;
 * the meaning of the "_WO" suffix is not stated here - confirm both.
 * x is expanded three times; keep it free of side effects.
 */
290 #define SHA512_S2_WO(x) (rotate ((x), 64- 1ull) ^ rotate ((x), 64- 8ull) ^ SHIFT_RIGHT_64 ((x), 7))
291 #define SHA512_S3_WO(x) (rotate ((x), 64-19ull) ^ rotate ((x), 64-61ull) ^ SHIFT_RIGHT_64 ((x), 6))
/*
 * Combines four words as SHA512_S3_WO (x) + y + SHA512_S2_WO (z) + w; the
 * same shape as SHA512_EXPAND, using the "_WO" helper variants.
 *
 * y and w are parenthesised so that an argument containing an operator of
 * lower precedence than '+' (shift, &, ^, |, ?:) is still added as one unit.
 * x and z are already parenthesised inside SHA512_S3_WO / SHA512_S2_WO.
 */
#define SHA512_EXPAND_WO(x,y,z,w) (SHA512_S3_WO (x) + (y) + SHA512_S2_WO (z) + (w))
298 * RIPEMD160 Functions
301 #if __CUDA_ARCH__ >= 500
/*
 * RIPEMD-160 round functions F, G, H, I, J; two alternative definition sets
 * (the directives that select between them are only partly visible in this
 * view).
 *
 * LUT-based set: forwards to lut3_XX helpers defined elsewhere.
 * NOTE(review): the suffixes 0x96 / 0xca / 0x59 / 0xe4 / 0x2d match the truth
 * tables of the generic set below with x = 0xf0, y = 0xcc, z = 0xaa - confirm
 * that this is the helpers' convention.
 */
302 #define RIPEMD160_F(x,y,z) lut3_96 ((x), (y), (z))
303 #define RIPEMD160_G(x,y,z) lut3_ca ((x), (y), (z))
304 #define RIPEMD160_H(x,y,z) lut3_59 ((x), (y), (z))
305 #define RIPEMD160_I(x,y,z) lut3_e4 ((x), (y), (z))
306 #define RIPEMD160_J(x,y,z) lut3_2d ((x), (y), (z))
/*
 * Generic set:
 *   RIPEMD160_F - x ^ y ^ z
 *   RIPEMD160_G - per-bit select x ? y : z
 *   RIPEMD160_H - (x | ~y) ^ z
 *   RIPEMD160_I - per-bit select z ? x : y
 *   RIPEMD160_J - x ^ (y | ~z)
 * G and I expand one argument twice; keep arguments free of side effects.
 */
308 #define RIPEMD160_F(x,y,z) ((x) ^ (y) ^ (z))
309 #define RIPEMD160_G(x,y,z) ((z) ^ ((x) & ((y) ^ (z)))) /* x ? y : z */
310 #define RIPEMD160_H(x,y,z) (((x) | ~(y)) ^ (z))
311 #define RIPEMD160_I(x,y,z) ((y) ^ ((z) & ((x) ^ (y)))) /* z ? x : y */
312 #define RIPEMD160_J(x,y,z) ((x) ^ ((y) | ~(z)))
/*
 * "o" variants of RIPEMD160_G / RIPEMD160_I, two alternative definition
 * pairs.
 *
 * bitselect-based pair. NOTE(review): assuming OpenCL-style
 * bitselect (a, b, c) = (a & ~c) | (b & c), RIPEMD160_Go is x ? y : z and
 * RIPEMD160_Io is z ? x : y - confirm.
 */
316 #define RIPEMD160_Go(x,y,z) (bitselect ((z), (y), (x)))
317 #define RIPEMD160_Io(x,y,z) (bitselect ((y), (x), (z)))
/* Fallback pair: forwards unchanged to RIPEMD160_G / RIPEMD160_I. */
319 #define RIPEMD160_Go(x,y,z) (RIPEMD160_G ((x), (y), (z)))
320 #define RIPEMD160_Io(x,y,z) (RIPEMD160_I ((x), (y), (z)))
323 #define RIPEMD160_STEP(f,a,b,c,d,e,x,K,s) \
330 c = rotl32 (c, 10u); \
/*
 * Rotate-left built from two shifts: (a << n) | (a >> (32 - n)).
 * The constant 32 assumes 32-bit operands; n should be in 1..31, because
 * n == 0 would shift right by the full width.
 * NOTE(review): the bug this works around is not identified here.
 *
 * Both parameters are parenthesised at every use so that expression
 * arguments keep their meaning: without this, n = 3 + 1 expands to
 * a >> (32 - 3 + 1), and a = p | q shifts only q.
 * a and n are each expanded twice; keep them free of side effects.
 */
#define ROTATE_LEFT_WORKAROUND_BUG(a,n) (((a) << (n)) | ((a) >> (32 - (n))))
335 #define RIPEMD160_STEP_WORKAROUND_BUG(f,a,b,c,d,e,x,K,s) \
340 a = ROTATE_LEFT_WORKAROUND_BUG (a, s); \
342 c = rotl32 (c, 10u); \