2 * Authors.....: Jens Steube <jens.steube@gmail.com>
3 * Gabriele Gristina <matrix@hashcat.net>
10 #include "include/constants.h"
11 #include "include/kernel_vendor.h"
18 #include "include/kernel_functions.c"
19 #include "OpenCL/types_ocl.c"
20 #include "OpenCL/common.c"
21 #include "OpenCL/simd.c"
// RC4 state helper working on entries i and j of rc4_key->S (the state is reached through a __local pointer).
// NOTE(review): only the S[i] = S[j] assignment is visible in this excerpt; the rest of the
// exchange implied by the name is presumably on lines not shown.
31 static void swap (__local RC4_KEY *rc4_key, const u8 i, const u8 j)
36 rc4_key->S[i] = rc4_key->S[j];
// RC4 state setup driven by the four u32 words passed in data[].
// NOTE(review): the declarations of j, idx and v, the loads into v, and the body of the first
// loop are not visible in this excerpt.
40 static void rc4_init_16 (__local RC4_KEY *rc4_key, const u32 data[4])
// u32 view of S so the state can be accessed one 32-bit word at a time
45 __local u32 *ptr = (__local u32 *) rc4_key->S;
// 64 passes; presumably writes the initial contents of S through ptr (loop body not shown)
48 for (u32 i = 0; i < 64; i++)
// 16 passes; the steps below come in four groups of four, each group consuming one value of v
55 for (u32 i = 0; i < 16; i++)
// each step: add S[idx] and v shifted right by 0/8/16/24 bits into j, swap S[idx] with S[j], advance idx
63 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
64 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
65 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
66 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
// second group (v is presumably reloaded on a line not shown)
70 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
71 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
72 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
73 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
// third group
77 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
78 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
79 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
80 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
// fourth group
84 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
85 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
86 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
87 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
// Draws values from the RC4 state and XORs them onto in[0..3], storing the result in out[0..3].
// i and j are the RC4 indices to continue from. Returns u8; callers in this file pass the
// returned value back in as j on the following call, so it is presumably the updated j
// (the return statement is not visible in this excerpt).
91 static u8 rc4_next_16 (__local RC4_KEY *rc4_key, u8 i, u8 j, const u32 in[4], u32 out[4])
// one output word per pass
94 for (u32 k = 0; k < 4; k++)
// four rounds per word: swap S[i] and S[j], look up S at index S[i] + S[j], and OR that value
// into xor4 at bit 0, 8, 16 and 24 in turn
// NOTE(review): the updates of i and j before each swap and the reset of xor4 are not visible here
103 swap (rc4_key, i, j);
105 idx = rc4_key->S[i] + rc4_key->S[j];
107 xor4 |= rc4_key->S[idx] << 0;
112 swap (rc4_key, i, j);
114 idx = rc4_key->S[i] + rc4_key->S[j];
116 xor4 |= rc4_key->S[idx] << 8;
121 swap (rc4_key, i, j);
123 idx = rc4_key->S[i] + rc4_key->S[j];
125 xor4 |= rc4_key->S[idx] << 16;
130 swap (rc4_key, i, j);
132 idx = rc4_key->S[i] + rc4_key->S[j];
134 xor4 |= rc4_key->S[idx] << 24;
// combine the assembled word with the matching input word
136 out[k] = in[k] ^ xor4;
// Runs the 64 MD5 steps over one message block supplied as four 4-word arrays (w0..w3).
// digest[4] is the state argument; m09700m/m09700s pre-load it with MD5M_A..MD5M_D before their first call.
// NOTE(review): the setup of a/b/c/d and w0_t..wf_t and the write-back into digest are on
// lines not visible in this excerpt.
142 static void md5_transform (const u32 w0[4], const u32 w1[4], const u32 w2[4], const u32 w3[4], u32 digest[4])
// steps 0-15: MD5_Fo, message words in natural order w0..wf, shifts cycling MD5S00..MD5S03
166 MD5_STEP (MD5_Fo, a, b, c, d, w0_t, MD5C00, MD5S00);
167 MD5_STEP (MD5_Fo, d, a, b, c, w1_t, MD5C01, MD5S01);
168 MD5_STEP (MD5_Fo, c, d, a, b, w2_t, MD5C02, MD5S02);
169 MD5_STEP (MD5_Fo, b, c, d, a, w3_t, MD5C03, MD5S03);
170 MD5_STEP (MD5_Fo, a, b, c, d, w4_t, MD5C04, MD5S00);
171 MD5_STEP (MD5_Fo, d, a, b, c, w5_t, MD5C05, MD5S01);
172 MD5_STEP (MD5_Fo, c, d, a, b, w6_t, MD5C06, MD5S02);
173 MD5_STEP (MD5_Fo, b, c, d, a, w7_t, MD5C07, MD5S03);
174 MD5_STEP (MD5_Fo, a, b, c, d, w8_t, MD5C08, MD5S00);
175 MD5_STEP (MD5_Fo, d, a, b, c, w9_t, MD5C09, MD5S01);
176 MD5_STEP (MD5_Fo, c, d, a, b, wa_t, MD5C0a, MD5S02);
177 MD5_STEP (MD5_Fo, b, c, d, a, wb_t, MD5C0b, MD5S03);
178 MD5_STEP (MD5_Fo, a, b, c, d, wc_t, MD5C0c, MD5S00);
179 MD5_STEP (MD5_Fo, d, a, b, c, wd_t, MD5C0d, MD5S01);
180 MD5_STEP (MD5_Fo, c, d, a, b, we_t, MD5C0e, MD5S02);
181 MD5_STEP (MD5_Fo, b, c, d, a, wf_t, MD5C0f, MD5S03);
// steps 16-31: MD5_Go, message words w1, w6, wb, w0, ... (index advances by 5 mod 16), shifts MD5S10..MD5S13
183 MD5_STEP (MD5_Go, a, b, c, d, w1_t, MD5C10, MD5S10);
184 MD5_STEP (MD5_Go, d, a, b, c, w6_t, MD5C11, MD5S11);
185 MD5_STEP (MD5_Go, c, d, a, b, wb_t, MD5C12, MD5S12);
186 MD5_STEP (MD5_Go, b, c, d, a, w0_t, MD5C13, MD5S13);
187 MD5_STEP (MD5_Go, a, b, c, d, w5_t, MD5C14, MD5S10);
188 MD5_STEP (MD5_Go, d, a, b, c, wa_t, MD5C15, MD5S11);
189 MD5_STEP (MD5_Go, c, d, a, b, wf_t, MD5C16, MD5S12);
190 MD5_STEP (MD5_Go, b, c, d, a, w4_t, MD5C17, MD5S13);
191 MD5_STEP (MD5_Go, a, b, c, d, w9_t, MD5C18, MD5S10);
192 MD5_STEP (MD5_Go, d, a, b, c, we_t, MD5C19, MD5S11);
193 MD5_STEP (MD5_Go, c, d, a, b, w3_t, MD5C1a, MD5S12);
194 MD5_STEP (MD5_Go, b, c, d, a, w8_t, MD5C1b, MD5S13);
195 MD5_STEP (MD5_Go, a, b, c, d, wd_t, MD5C1c, MD5S10);
196 MD5_STEP (MD5_Go, d, a, b, c, w2_t, MD5C1d, MD5S11);
197 MD5_STEP (MD5_Go, c, d, a, b, w7_t, MD5C1e, MD5S12);
198 MD5_STEP (MD5_Go, b, c, d, a, wc_t, MD5C1f, MD5S13);
// steps 32-47: MD5_H, message words w5, w8, wb, we, ... (index advances by 3 mod 16), shifts MD5S20..MD5S23
200 MD5_STEP (MD5_H , a, b, c, d, w5_t, MD5C20, MD5S20);
201 MD5_STEP (MD5_H , d, a, b, c, w8_t, MD5C21, MD5S21);
202 MD5_STEP (MD5_H , c, d, a, b, wb_t, MD5C22, MD5S22);
203 MD5_STEP (MD5_H , b, c, d, a, we_t, MD5C23, MD5S23);
204 MD5_STEP (MD5_H , a, b, c, d, w1_t, MD5C24, MD5S20);
205 MD5_STEP (MD5_H , d, a, b, c, w4_t, MD5C25, MD5S21);
206 MD5_STEP (MD5_H , c, d, a, b, w7_t, MD5C26, MD5S22);
207 MD5_STEP (MD5_H , b, c, d, a, wa_t, MD5C27, MD5S23);
208 MD5_STEP (MD5_H , a, b, c, d, wd_t, MD5C28, MD5S20);
209 MD5_STEP (MD5_H , d, a, b, c, w0_t, MD5C29, MD5S21);
210 MD5_STEP (MD5_H , c, d, a, b, w3_t, MD5C2a, MD5S22);
211 MD5_STEP (MD5_H , b, c, d, a, w6_t, MD5C2b, MD5S23);
212 MD5_STEP (MD5_H , a, b, c, d, w9_t, MD5C2c, MD5S20);
213 MD5_STEP (MD5_H , d, a, b, c, wc_t, MD5C2d, MD5S21);
214 MD5_STEP (MD5_H , c, d, a, b, wf_t, MD5C2e, MD5S22);
215 MD5_STEP (MD5_H , b, c, d, a, w2_t, MD5C2f, MD5S23);
// steps 48-63: MD5_I, message words w0, w7, we, w5, ... (index advances by 7 mod 16), shifts MD5S30..MD5S33
217 MD5_STEP (MD5_I , a, b, c, d, w0_t, MD5C30, MD5S30);
218 MD5_STEP (MD5_I , d, a, b, c, w7_t, MD5C31, MD5S31);
219 MD5_STEP (MD5_I , c, d, a, b, we_t, MD5C32, MD5S32);
220 MD5_STEP (MD5_I , b, c, d, a, w5_t, MD5C33, MD5S33);
221 MD5_STEP (MD5_I , a, b, c, d, wc_t, MD5C34, MD5S30);
222 MD5_STEP (MD5_I , d, a, b, c, w3_t, MD5C35, MD5S31);
223 MD5_STEP (MD5_I , c, d, a, b, wa_t, MD5C36, MD5S32);
224 MD5_STEP (MD5_I , b, c, d, a, w1_t, MD5C37, MD5S33);
225 MD5_STEP (MD5_I , a, b, c, d, w8_t, MD5C38, MD5S30);
226 MD5_STEP (MD5_I , d, a, b, c, wf_t, MD5C39, MD5S31);
227 MD5_STEP (MD5_I , c, d, a, b, w6_t, MD5C3a, MD5S32);
228 MD5_STEP (MD5_I , b, c, d, a, wd_t, MD5C3b, MD5S33);
229 MD5_STEP (MD5_I , a, b, c, d, w4_t, MD5C3c, MD5S30);
230 MD5_STEP (MD5_I , d, a, b, c, wb_t, MD5C3d, MD5S31);
231 MD5_STEP (MD5_I , c, d, a, b, w2_t, MD5C3e, MD5S32);
232 MD5_STEP (MD5_I , b, c, d, a, w9_t, MD5C3f, MD5S33);
// Worker called by the m09700_m04/m08/m16 kernels. For each candidate it hashes the password
// block with MD5, builds a buffer from the 5-byte truncated digest and the 16-byte salt, hashes
// that buffer, sets up RC4 from a derived key, and passes the final four words to COMPARE_M_SIMD.
// NOTE(review): this excerpt omits many lines (declarations, padding words, key setup, loop
// braces); the comments below describe only what the visible statements show.
240 static void m09700m (__local RC4_KEY *rc4_keys, u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 pw_len, __global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset)
246 const u32 gid = get_global_id (0);
247 const u32 lid = get_local_id (0);
// each work-item uses the RC4 state slot selected by its local id
249 __local RC4_KEY *rc4_key = &rc4_keys[lid];
// the four salt words as stored for this salt_pos
260 salt_buf_t0[0] = salt_bufs[salt_pos].salt_buf[0];
261 salt_buf_t0[1] = salt_bufs[salt_pos].salt_buf[1];
262 salt_buf_t0[2] = salt_bufs[salt_pos].salt_buf[2];
263 salt_buf_t0[3] = salt_bufs[salt_pos].salt_buf[3];
// copy of the salt shifted up by 8 bits, spilling into a fifth word
265 salt_buf_t1[0] = salt_buf_t0[0] << 8;
266 salt_buf_t1[1] = salt_buf_t0[0] >> 24 | salt_buf_t0[1] << 8;
267 salt_buf_t1[2] = salt_buf_t0[1] >> 24 | salt_buf_t0[2] << 8;
268 salt_buf_t1[3] = salt_buf_t0[2] >> 24 | salt_buf_t0[3] << 8;
269 salt_buf_t1[4] = salt_buf_t0[3] >> 24;
// copy shifted up by 16 bits
271 salt_buf_t2[0] = salt_buf_t0[0] << 16;
272 salt_buf_t2[1] = salt_buf_t0[0] >> 16 | salt_buf_t0[1] << 16;
273 salt_buf_t2[2] = salt_buf_t0[1] >> 16 | salt_buf_t0[2] << 16;
274 salt_buf_t2[3] = salt_buf_t0[2] >> 16 | salt_buf_t0[3] << 16;
275 salt_buf_t2[4] = salt_buf_t0[3] >> 16;
// copy shifted up by 24 bits
277 salt_buf_t3[0] = salt_buf_t0[0] << 24;
278 salt_buf_t3[1] = salt_buf_t0[0] >> 8 | salt_buf_t0[1] << 24;
279 salt_buf_t3[2] = salt_buf_t0[1] >> 8 | salt_buf_t0[2] << 24;
280 salt_buf_t3[3] = salt_buf_t0[2] >> 8 | salt_buf_t0[3] << 24;
281 salt_buf_t3[4] = salt_buf_t0[3] >> 8;
// salt length in bytes (four u32 words)
283 const u32 salt_len = 16;
// per-salt data from the oldoffice01_t entry: version and the four encryptedVerifier words
289 const u32 version = oldoffice01_bufs[salt_pos].version;
291 u32 encryptedVerifier[4];
293 encryptedVerifier[0] = oldoffice01_bufs[salt_pos].encryptedVerifier[0];
294 encryptedVerifier[1] = oldoffice01_bufs[salt_pos].encryptedVerifier[1];
295 encryptedVerifier[2] = oldoffice01_bufs[salt_pos].encryptedVerifier[2];
296 encryptedVerifier[3] = oldoffice01_bufs[salt_pos].encryptedVerifier[3];
// walk the inner-loop candidates, VECT_SIZE at a time
304 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
// per-candidate part of word 0 from bfs_buf, OR-ed with w0l (w0l is set on a line not shown)
306 const u32 w0r = ix_create_bft (bfs_buf, il_pos);
308 const u32 w0lr = w0l | w0r;
// password length in bits; presumably MD5's length slot (word 14 of the block)
329 w3_t[2] = pw_len * 8;
333 u32 digest_t1[2]; // only the first 5 bytes are needed
// start from the MD5M_A..MD5M_D initial state and hash the password block
337 digest_t0[0] = MD5M_A;
338 digest_t0[1] = MD5M_B;
339 digest_t0[2] = MD5M_C;
340 digest_t0[3] = MD5M_D;
342 md5_transform (w0_t, w1_t, w2_t, w3_t, digest_t0);
344 // prepare 16 * 21 buffer stuff
// keep only the low 40 bits (5 bytes) of the digest
355 digest_t0[0] &= 0xffffffff;
356 digest_t0[1] &= 0x000000ff;
357 digest_t0[2] &= 0x00000000;
358 digest_t0[3] &= 0x00000000;
// copies of the 5-byte digest shifted up by 8, 16 and 24 bits, for placement at offsets
// that are not word-aligned
360 digest_t1[0] = digest_t0[0] << 8;
361 digest_t1[1] = digest_t0[0] >> 24 | digest_t0[1] << 8;
363 digest_t2[0] = digest_t0[0] << 16;
364 digest_t2[1] = digest_t0[0] >> 16 | digest_t0[1] << 16;
366 digest_t3[0] = digest_t0[0] << 24;
367 digest_t3[1] = digest_t0[0] >> 8 | digest_t0[1] << 24;
369 // generate the 16 * 21 buffer
// The buffer is 16 repetitions of (5 digest bytes + 16 salt bytes) = 336 bytes: five full
// 64-byte blocks plus a 16-byte tail. Each block is assembled by OR-ing the pre-shifted
// digest and salt copies into place, then hashed.
// block 1 of 5
389 w0_t[0] = digest_t0[0];
390 w0_t[1] = digest_t0[1];
393 w0_t[1] |= salt_buf_t1[0];
394 w0_t[2] = salt_buf_t1[1];
395 w0_t[3] = salt_buf_t1[2];
396 w1_t[0] = salt_buf_t1[3];
397 w1_t[1] = salt_buf_t1[4];
400 w1_t[1] |= digest_t1[0];
401 w1_t[2] = digest_t1[1];
404 w1_t[2] |= salt_buf_t2[0];
405 w1_t[3] = salt_buf_t2[1];
406 w2_t[0] = salt_buf_t2[2];
407 w2_t[1] = salt_buf_t2[3];
408 w2_t[2] = salt_buf_t2[4];
411 w2_t[2] |= digest_t2[0];
412 w2_t[3] = digest_t2[1];
415 w2_t[3] |= salt_buf_t3[0];
416 w3_t[0] = salt_buf_t3[1];
417 w3_t[1] = salt_buf_t3[2];
418 w3_t[2] = salt_buf_t3[3];
419 w3_t[3] = salt_buf_t3[4];
423 w3_t[3] |= digest_t3[0];
425 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 2 of 5: begins with the remaining bytes of the digest copy started in block 1
445 w0_t[0] = digest_t3[1];
448 w0_t[1] = salt_buf_t0[0];
449 w0_t[2] = salt_buf_t0[1];
450 w0_t[3] = salt_buf_t0[2];
451 w1_t[0] = salt_buf_t0[3];
454 w1_t[1] = digest_t0[0];
455 w1_t[2] = digest_t0[1];
458 w1_t[2] |= salt_buf_t1[0];
459 w1_t[3] = salt_buf_t1[1];
460 w2_t[0] = salt_buf_t1[2];
461 w2_t[1] = salt_buf_t1[3];
462 w2_t[2] = salt_buf_t1[4];
465 w2_t[2] |= digest_t1[0];
466 w2_t[3] = digest_t1[1];
469 w2_t[3] |= salt_buf_t2[0];
470 w3_t[0] = salt_buf_t2[1];
471 w3_t[1] = salt_buf_t2[2];
472 w3_t[2] = salt_buf_t2[3];
473 w3_t[3] = salt_buf_t2[4];
476 w3_t[3] |= digest_t2[0];
478 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 3 of 5
498 w0_t[0] = digest_t2[1];
501 w0_t[0] |= salt_buf_t3[0];
502 w0_t[1] = salt_buf_t3[1];
503 w0_t[2] = salt_buf_t3[2];
504 w0_t[3] = salt_buf_t3[3];
505 w1_t[0] = salt_buf_t3[4];
508 w1_t[0] |= digest_t3[0];
509 w1_t[1] = digest_t3[1];
512 w1_t[2] = salt_buf_t0[0];
513 w1_t[3] = salt_buf_t0[1];
514 w2_t[0] = salt_buf_t0[2];
515 w2_t[1] = salt_buf_t0[3];
518 w2_t[2] = digest_t0[0];
519 w2_t[3] = digest_t0[1];
522 w2_t[3] |= salt_buf_t1[0];
523 w3_t[0] = salt_buf_t1[1];
524 w3_t[1] = salt_buf_t1[2];
525 w3_t[2] = salt_buf_t1[3];
526 w3_t[3] = salt_buf_t1[4];
529 w3_t[3] |= digest_t1[0];
531 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 4 of 5
551 w0_t[0] = digest_t1[1];
554 w0_t[0] |= salt_buf_t2[0];
555 w0_t[1] = salt_buf_t2[1];
556 w0_t[2] = salt_buf_t2[2];
557 w0_t[3] = salt_buf_t2[3];
558 w1_t[0] = salt_buf_t2[4];
561 w1_t[0] |= digest_t2[0];
562 w1_t[1] = digest_t2[1];
565 w1_t[1] |= salt_buf_t3[0];
566 w1_t[2] = salt_buf_t3[1];
567 w1_t[3] = salt_buf_t3[2];
568 w2_t[0] = salt_buf_t3[3];
569 w2_t[1] = salt_buf_t3[4];
572 w2_t[1] |= digest_t3[0];
573 w2_t[2] = digest_t3[1];
576 w2_t[3] = salt_buf_t0[0];
577 w3_t[0] = salt_buf_t0[1];
578 w3_t[1] = salt_buf_t0[2];
579 w3_t[2] = salt_buf_t0[3];
582 w3_t[3] = digest_t0[0];
584 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 5 of 5
604 w0_t[0] = digest_t0[1];
607 w0_t[0] |= salt_buf_t1[0];
608 w0_t[1] = salt_buf_t1[1];
609 w0_t[2] = salt_buf_t1[2];
610 w0_t[3] = salt_buf_t1[3];
611 w1_t[0] = salt_buf_t1[4];
614 w1_t[0] |= digest_t1[0];
615 w1_t[1] = digest_t1[1];
618 w1_t[1] |= salt_buf_t2[0];
619 w1_t[2] = salt_buf_t2[1];
620 w1_t[3] = salt_buf_t2[2];
621 w2_t[0] = salt_buf_t2[3];
622 w2_t[1] = salt_buf_t2[4];
625 w2_t[1] |= digest_t2[0];
626 w2_t[2] = digest_t2[1];
629 w2_t[2] |= salt_buf_t3[0];
630 w2_t[3] = salt_buf_t3[1];
631 w3_t[0] = salt_buf_t3[2];
632 w3_t[1] = salt_buf_t3[3];
633 w3_t[2] = salt_buf_t3[4];
636 w3_t[2] |= digest_t3[0];
637 w3_t[3] = digest_t3[1];
639 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// tail block: the last 16 salt bytes, then (on lines not shown) the remaining words
641 w0_t[0] = salt_buf_t0[0];
642 w0_t[1] = salt_buf_t0[1];
643 w0_t[2] = salt_buf_t0[2];
644 w0_t[3] = salt_buf_t0[3];
// total buffer length (21 * 16 bytes) expressed in bits
655 w3_t[2] = 21 * 16 * 8;
658 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
660 // now the 40 bit input for the MD5 which then will generate the RC4 key, so it's precomputable!
// only the low byte of digest[1] is kept
663 w0_t[1] = digest[1] & 0xff;
684 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// set up this work-item's RC4 state from key (key is filled on lines not shown)
695 rc4_init_16 (rc4_key, key);
// run RC4 from i = 0, j = 0 over the encrypted verifier; keep the returned value as j
699 u8 j = rc4_next_16 (rc4_key, 0, 0, encryptedVerifier, out);
// MD5 over a block prepared on lines not shown
723 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// continue RC4 at i = 16 with the saved j, this time over the digest words
725 rc4_next_16 (rc4_key, 16, j, digest, out);
// hand the four result words to the COMPARE_M_SIMD macro
727 COMPARE_M_SIMD (out[0], out[1], out[2], out[3]);
// Worker called by the m09700_s04/s08/s16 kernels. Same visible computation as m09700m: MD5 of
// the password block, a buffer built from the 5-byte truncated digest and the 16-byte salt,
// MD5 of that buffer, RC4 set up from a derived key; the final four words go to COMPARE_S_SIMD.
// NOTE(review): this excerpt omits many lines (declarations, padding words, key setup, loop
// braces); the comments below describe only what the visible statements show.
731 static void m09700s (__local RC4_KEY *rc4_keys, u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 pw_len, __global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset)
737 const u32 gid = get_global_id (0);
738 const u32 lid = get_local_id (0);
// each work-item uses the RC4 state slot selected by its local id
740 __local RC4_KEY *rc4_key = &rc4_keys[lid];
// digest words of the entry at digests_offset, taken in DGST_R0..DGST_R3 order;
// presumably consumed by COMPARE_S_SIMD at the end
746 const u32 search[4] =
748 digests_buf[digests_offset].digest_buf[DGST_R0],
749 digests_buf[digests_offset].digest_buf[DGST_R1],
750 digests_buf[digests_offset].digest_buf[DGST_R2],
751 digests_buf[digests_offset].digest_buf[DGST_R3]
// the four salt words as stored for this salt_pos
763 salt_buf_t0[0] = salt_bufs[salt_pos].salt_buf[0];
764 salt_buf_t0[1] = salt_bufs[salt_pos].salt_buf[1];
765 salt_buf_t0[2] = salt_bufs[salt_pos].salt_buf[2];
766 salt_buf_t0[3] = salt_bufs[salt_pos].salt_buf[3];
// copy of the salt shifted up by 8 bits, spilling into a fifth word
768 salt_buf_t1[0] = salt_buf_t0[0] << 8;
769 salt_buf_t1[1] = salt_buf_t0[0] >> 24 | salt_buf_t0[1] << 8;
770 salt_buf_t1[2] = salt_buf_t0[1] >> 24 | salt_buf_t0[2] << 8;
771 salt_buf_t1[3] = salt_buf_t0[2] >> 24 | salt_buf_t0[3] << 8;
772 salt_buf_t1[4] = salt_buf_t0[3] >> 24;
// copy shifted up by 16 bits
774 salt_buf_t2[0] = salt_buf_t0[0] << 16;
775 salt_buf_t2[1] = salt_buf_t0[0] >> 16 | salt_buf_t0[1] << 16;
776 salt_buf_t2[2] = salt_buf_t0[1] >> 16 | salt_buf_t0[2] << 16;
777 salt_buf_t2[3] = salt_buf_t0[2] >> 16 | salt_buf_t0[3] << 16;
778 salt_buf_t2[4] = salt_buf_t0[3] >> 16;
// copy shifted up by 24 bits
780 salt_buf_t3[0] = salt_buf_t0[0] << 24;
781 salt_buf_t3[1] = salt_buf_t0[0] >> 8 | salt_buf_t0[1] << 24;
782 salt_buf_t3[2] = salt_buf_t0[1] >> 8 | salt_buf_t0[2] << 24;
783 salt_buf_t3[3] = salt_buf_t0[2] >> 8 | salt_buf_t0[3] << 24;
784 salt_buf_t3[4] = salt_buf_t0[3] >> 8;
// salt length in bytes (four u32 words)
786 const u32 salt_len = 16;
// per-salt data from the oldoffice01_t entry: version and the four encryptedVerifier words
792 const u32 version = oldoffice01_bufs[salt_pos].version;
794 u32 encryptedVerifier[4];
796 encryptedVerifier[0] = oldoffice01_bufs[salt_pos].encryptedVerifier[0];
797 encryptedVerifier[1] = oldoffice01_bufs[salt_pos].encryptedVerifier[1];
798 encryptedVerifier[2] = oldoffice01_bufs[salt_pos].encryptedVerifier[2];
799 encryptedVerifier[3] = oldoffice01_bufs[salt_pos].encryptedVerifier[3];
// walk the inner-loop candidates, VECT_SIZE at a time
807 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
// per-candidate part of word 0 from bfs_buf, OR-ed with w0l (w0l is set on a line not shown)
809 const u32 w0r = ix_create_bft (bfs_buf, il_pos);
811 const u32 w0lr = w0l | w0r;
// password length in bits; presumably MD5's length slot (word 14 of the block)
832 w3_t[2] = pw_len * 8;
836 u32 digest_t1[2]; // only the first 5 bytes are needed
// start from the MD5M_A..MD5M_D initial state and hash the password block
840 digest_t0[0] = MD5M_A;
841 digest_t0[1] = MD5M_B;
842 digest_t0[2] = MD5M_C;
843 digest_t0[3] = MD5M_D;
845 md5_transform (w0_t, w1_t, w2_t, w3_t, digest_t0);
847 // prepare 16 * 21 buffer stuff
// keep only the low 40 bits (5 bytes) of the digest
858 digest_t0[0] &= 0xffffffff;
859 digest_t0[1] &= 0x000000ff;
860 digest_t0[2] &= 0x00000000;
861 digest_t0[3] &= 0x00000000;
// copies of the 5-byte digest shifted up by 8, 16 and 24 bits, for placement at offsets
// that are not word-aligned
863 digest_t1[0] = digest_t0[0] << 8;
864 digest_t1[1] = digest_t0[0] >> 24 | digest_t0[1] << 8;
866 digest_t2[0] = digest_t0[0] << 16;
867 digest_t2[1] = digest_t0[0] >> 16 | digest_t0[1] << 16;
869 digest_t3[0] = digest_t0[0] << 24;
870 digest_t3[1] = digest_t0[0] >> 8 | digest_t0[1] << 24;
872 // generate the 16 * 21 buffer
// The buffer is 16 repetitions of (5 digest bytes + 16 salt bytes) = 336 bytes: five full
// 64-byte blocks plus a 16-byte tail. Each block is assembled by OR-ing the pre-shifted
// digest and salt copies into place, then hashed.
// block 1 of 5
892 w0_t[0] = digest_t0[0];
893 w0_t[1] = digest_t0[1];
896 w0_t[1] |= salt_buf_t1[0];
897 w0_t[2] = salt_buf_t1[1];
898 w0_t[3] = salt_buf_t1[2];
899 w1_t[0] = salt_buf_t1[3];
900 w1_t[1] = salt_buf_t1[4];
903 w1_t[1] |= digest_t1[0];
904 w1_t[2] = digest_t1[1];
907 w1_t[2] |= salt_buf_t2[0];
908 w1_t[3] = salt_buf_t2[1];
909 w2_t[0] = salt_buf_t2[2];
910 w2_t[1] = salt_buf_t2[3];
911 w2_t[2] = salt_buf_t2[4];
914 w2_t[2] |= digest_t2[0];
915 w2_t[3] = digest_t2[1];
918 w2_t[3] |= salt_buf_t3[0];
919 w3_t[0] = salt_buf_t3[1];
920 w3_t[1] = salt_buf_t3[2];
921 w3_t[2] = salt_buf_t3[3];
922 w3_t[3] = salt_buf_t3[4];
926 w3_t[3] |= digest_t3[0];
928 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 2 of 5: begins with the remaining bytes of the digest copy started in block 1
948 w0_t[0] = digest_t3[1];
951 w0_t[1] = salt_buf_t0[0];
952 w0_t[2] = salt_buf_t0[1];
953 w0_t[3] = salt_buf_t0[2];
954 w1_t[0] = salt_buf_t0[3];
957 w1_t[1] = digest_t0[0];
958 w1_t[2] = digest_t0[1];
961 w1_t[2] |= salt_buf_t1[0];
962 w1_t[3] = salt_buf_t1[1];
963 w2_t[0] = salt_buf_t1[2];
964 w2_t[1] = salt_buf_t1[3];
965 w2_t[2] = salt_buf_t1[4];
968 w2_t[2] |= digest_t1[0];
969 w2_t[3] = digest_t1[1];
972 w2_t[3] |= salt_buf_t2[0];
973 w3_t[0] = salt_buf_t2[1];
974 w3_t[1] = salt_buf_t2[2];
975 w3_t[2] = salt_buf_t2[3];
976 w3_t[3] = salt_buf_t2[4];
979 w3_t[3] |= digest_t2[0];
981 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 3 of 5
1001 w0_t[0] = digest_t2[1];
1004 w0_t[0] |= salt_buf_t3[0];
1005 w0_t[1] = salt_buf_t3[1];
1006 w0_t[2] = salt_buf_t3[2];
1007 w0_t[3] = salt_buf_t3[3];
1008 w1_t[0] = salt_buf_t3[4];
1011 w1_t[0] |= digest_t3[0];
1012 w1_t[1] = digest_t3[1];
1015 w1_t[2] = salt_buf_t0[0];
1016 w1_t[3] = salt_buf_t0[1];
1017 w2_t[0] = salt_buf_t0[2];
1018 w2_t[1] = salt_buf_t0[3];
1021 w2_t[2] = digest_t0[0];
1022 w2_t[3] = digest_t0[1];
1025 w2_t[3] |= salt_buf_t1[0];
1026 w3_t[0] = salt_buf_t1[1];
1027 w3_t[1] = salt_buf_t1[2];
1028 w3_t[2] = salt_buf_t1[3];
1029 w3_t[3] = salt_buf_t1[4];
1032 w3_t[3] |= digest_t1[0];
1034 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 4 of 5
1054 w0_t[0] = digest_t1[1];
1057 w0_t[0] |= salt_buf_t2[0];
1058 w0_t[1] = salt_buf_t2[1];
1059 w0_t[2] = salt_buf_t2[2];
1060 w0_t[3] = salt_buf_t2[3];
1061 w1_t[0] = salt_buf_t2[4];
1064 w1_t[0] |= digest_t2[0];
1065 w1_t[1] = digest_t2[1];
1068 w1_t[1] |= salt_buf_t3[0];
1069 w1_t[2] = salt_buf_t3[1];
1070 w1_t[3] = salt_buf_t3[2];
1071 w2_t[0] = salt_buf_t3[3];
1072 w2_t[1] = salt_buf_t3[4];
1075 w2_t[1] |= digest_t3[0];
1076 w2_t[2] = digest_t3[1];
1079 w2_t[3] = salt_buf_t0[0];
1080 w3_t[0] = salt_buf_t0[1];
1081 w3_t[1] = salt_buf_t0[2];
1082 w3_t[2] = salt_buf_t0[3];
1085 w3_t[3] = digest_t0[0];
1087 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// block 5 of 5
1107 w0_t[0] = digest_t0[1];
1110 w0_t[0] |= salt_buf_t1[0];
1111 w0_t[1] = salt_buf_t1[1];
1112 w0_t[2] = salt_buf_t1[2];
1113 w0_t[3] = salt_buf_t1[3];
1114 w1_t[0] = salt_buf_t1[4];
1117 w1_t[0] |= digest_t1[0];
1118 w1_t[1] = digest_t1[1];
1121 w1_t[1] |= salt_buf_t2[0];
1122 w1_t[2] = salt_buf_t2[1];
1123 w1_t[3] = salt_buf_t2[2];
1124 w2_t[0] = salt_buf_t2[3];
1125 w2_t[1] = salt_buf_t2[4];
1128 w2_t[1] |= digest_t2[0];
1129 w2_t[2] = digest_t2[1];
1132 w2_t[2] |= salt_buf_t3[0];
1133 w2_t[3] = salt_buf_t3[1];
1134 w3_t[0] = salt_buf_t3[2];
1135 w3_t[1] = salt_buf_t3[3];
1136 w3_t[2] = salt_buf_t3[4];
1139 w3_t[2] |= digest_t3[0];
1140 w3_t[3] = digest_t3[1];
1142 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// tail block: the last 16 salt bytes, then (on lines not shown) the remaining words
1144 w0_t[0] = salt_buf_t0[0];
1145 w0_t[1] = salt_buf_t0[1];
1146 w0_t[2] = salt_buf_t0[2];
1147 w0_t[3] = salt_buf_t0[3];
// total buffer length (21 * 16 bytes) expressed in bits
1158 w3_t[2] = 21 * 16 * 8;
1161 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
1163 // now the 40 bit input for the MD5 which then will generate the RC4 key, so it's precomputable!
// first word in full plus the low byte of the second: 40 bits of the digest
1165 w0_t[0] = digest[0];
1166 w0_t[1] = digest[1] & 0xff;
1187 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// set up this work-item's RC4 state from key (key is filled on lines not shown)
1198 rc4_init_16 (rc4_key, key);
// run RC4 from i = 0, j = 0 over the encrypted verifier; keep the returned value as j
1202 u8 j = rc4_next_16 (rc4_key, 0, 0, encryptedVerifier, out);
// MD5 over a block prepared on lines not shown
1226 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// continue RC4 at i = 16 with the saved j, this time over the digest words
1228 rc4_next_16 (rc4_key, 16, j, digest, out);
// hand the four result words to the COMPARE_S_SIMD macro
1230 COMPARE_S_SIMD (out[0], out[1], out[2], out[3]);
// Kernel entry point: loads this work-item's password words and length from pws[gid] and runs m09700m.
// Only the loads of words 0-3 (w0) are visible in this excerpt; how w1..w3 are filled is not shown.
1234 __kernel void m09700_m04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1240 const u32 gid = get_global_id (0);
// work-items at or beyond gid_max do nothing
1242 if (gid >= gid_max) return;
// password words 0-3
1246 w0[0] = pws[gid].i[ 0];
1247 w0[1] = pws[gid].i[ 1];
1248 w0[2] = pws[gid].i[ 2];
1249 w0[3] = pws[gid].i[ 3];
1272 const u32 pw_len = pws[gid].pw_len;
// RC4 states in __local memory; the worker picks a slot by get_local_id (0).
// NOTE(review): 64 slots, so the local work size presumably must not exceed 64 — confirm on the host side.
1278 __local RC4_KEY rc4_keys[64];
1280 m09700m (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, il_cnt, digests_cnt, digests_offset);
// Kernel entry point: loads this work-item's password words and length from pws[gid] and runs m09700m.
// Only the loads of words 0-7 (w0, w1) are visible in this excerpt; how w2 and w3 are filled is not shown.
1283 __kernel void m09700_m08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1289 const u32 gid = get_global_id (0);
// work-items at or beyond gid_max do nothing
1291 if (gid >= gid_max) return;
// password words 0-3
1295 w0[0] = pws[gid].i[ 0];
1296 w0[1] = pws[gid].i[ 1];
1297 w0[2] = pws[gid].i[ 2];
1298 w0[3] = pws[gid].i[ 3];
// password words 4-7
1302 w1[0] = pws[gid].i[ 4];
1303 w1[1] = pws[gid].i[ 5];
1304 w1[2] = pws[gid].i[ 6];
1305 w1[3] = pws[gid].i[ 7];
1321 const u32 pw_len = pws[gid].pw_len;
// RC4 states in __local memory; the worker picks a slot by get_local_id (0).
// NOTE(review): 64 slots, so the local work size presumably must not exceed 64 — confirm on the host side.
1327 __local RC4_KEY rc4_keys[64];
1329 m09700m (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, il_cnt, digests_cnt, digests_offset);
// Kernel entry point: loads this work-item's password words and length from pws[gid] and runs m09700m.
// Loads of words 0-13 are visible in this excerpt; how w3[2] and w3[3] are filled is not shown.
1332 __kernel void m09700_m16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1338 const u32 gid = get_global_id (0);
// work-items at or beyond gid_max do nothing
1340 if (gid >= gid_max) return;
// password words 0-3
1344 w0[0] = pws[gid].i[ 0];
1345 w0[1] = pws[gid].i[ 1];
1346 w0[2] = pws[gid].i[ 2];
1347 w0[3] = pws[gid].i[ 3];
// password words 4-7
1351 w1[0] = pws[gid].i[ 4];
1352 w1[1] = pws[gid].i[ 5];
1353 w1[2] = pws[gid].i[ 6];
1354 w1[3] = pws[gid].i[ 7];
// password words 8-11
1358 w2[0] = pws[gid].i[ 8];
1359 w2[1] = pws[gid].i[ 9];
1360 w2[2] = pws[gid].i[10];
1361 w2[3] = pws[gid].i[11];
// password words 12-13
1365 w3[0] = pws[gid].i[12];
1366 w3[1] = pws[gid].i[13];
1370 const u32 pw_len = pws[gid].pw_len;
// RC4 states in __local memory; the worker picks a slot by get_local_id (0).
// NOTE(review): 64 slots, so the local work size presumably must not exceed 64 — confirm on the host side.
1376 __local RC4_KEY rc4_keys[64];
1378 m09700m (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, il_cnt, digests_cnt, digests_offset);
// Kernel entry point: loads this work-item's password words and length from pws[gid] and runs m09700s.
// Only the loads of words 0-3 (w0) are visible in this excerpt; how w1..w3 are filled is not shown.
1381 __kernel void m09700_s04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1387 const u32 gid = get_global_id (0);
// work-items at or beyond gid_max do nothing
1389 if (gid >= gid_max) return;
// password words 0-3
1393 w0[0] = pws[gid].i[ 0];
1394 w0[1] = pws[gid].i[ 1];
1395 w0[2] = pws[gid].i[ 2];
1396 w0[3] = pws[gid].i[ 3];
1419 const u32 pw_len = pws[gid].pw_len;
// RC4 states in __local memory; the worker picks a slot by get_local_id (0).
// NOTE(review): 64 slots, so the local work size presumably must not exceed 64 — confirm on the host side.
1425 __local RC4_KEY rc4_keys[64];
1427 m09700s (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, il_cnt, digests_cnt, digests_offset);
// Kernel entry point: loads this work-item's password words and length from pws[gid] and runs m09700s.
// Only the loads of words 0-7 (w0, w1) are visible in this excerpt; how w2 and w3 are filled is not shown.
1430 __kernel void m09700_s08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1436 const u32 gid = get_global_id (0);
// work-items at or beyond gid_max do nothing
1438 if (gid >= gid_max) return;
// password words 0-3
1442 w0[0] = pws[gid].i[ 0];
1443 w0[1] = pws[gid].i[ 1];
1444 w0[2] = pws[gid].i[ 2];
1445 w0[3] = pws[gid].i[ 3];
// password words 4-7
1449 w1[0] = pws[gid].i[ 4];
1450 w1[1] = pws[gid].i[ 5];
1451 w1[2] = pws[gid].i[ 6];
1452 w1[3] = pws[gid].i[ 7];
1468 const u32 pw_len = pws[gid].pw_len;
// RC4 states in __local memory; the worker picks a slot by get_local_id (0).
// NOTE(review): 64 slots, so the local work size presumably must not exceed 64 — confirm on the host side.
1474 __local RC4_KEY rc4_keys[64];
1476 m09700s (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, il_cnt, digests_cnt, digests_offset);
// Kernel entry point: loads this work-item's password words and length from pws[gid] and runs m09700s.
// Loads of words 0-13 are visible in this excerpt; how w3[2] and w3[3] are filled is not shown.
1479 __kernel void m09700_s16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1485 const u32 gid = get_global_id (0);
// work-items at or beyond gid_max do nothing
1487 if (gid >= gid_max) return;
// password words 0-3
1491 w0[0] = pws[gid].i[ 0];
1492 w0[1] = pws[gid].i[ 1];
1493 w0[2] = pws[gid].i[ 2];
1494 w0[3] = pws[gid].i[ 3];
// password words 4-7
1498 w1[0] = pws[gid].i[ 4];
1499 w1[1] = pws[gid].i[ 5];
1500 w1[2] = pws[gid].i[ 6];
1501 w1[3] = pws[gid].i[ 7];
// password words 8-11
1505 w2[0] = pws[gid].i[ 8];
1506 w2[1] = pws[gid].i[ 9];
1507 w2[2] = pws[gid].i[10];
1508 w2[3] = pws[gid].i[11];
// password words 12-13
1512 w3[0] = pws[gid].i[12];
1513 w3[1] = pws[gid].i[13];
1517 const u32 pw_len = pws[gid].pw_len;
// RC4 states in __local memory; the worker picks a slot by get_local_id (0).
// NOTE(review): 64 slots, so the local work size presumably must not exceed 64 — confirm on the host side.
1523 __local RC4_KEY rc4_keys[64];
1525 m09700s (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, il_cnt, digests_cnt, digests_offset);