2 * Author......: Jens Steube <jens.steube@gmail.com>
8 #include "include/constants.h"
9 #include "include/kernel_vendor.h"
16 #include "include/kernel_functions.c"
17 #include "types_ocl.c"
20 #define COMPARE_S "check_single_comp4.c"
21 #define COMPARE_M "check_multi_comp4.c"
// Helper operating on the state array rc4_key->S at the two byte-sized
// indices i and j.
// NOTE(review): this excerpt shows only the S[i] <- S[j] assignment. Going by
// the function name, the lines that save the old S[i] and store it into S[j]
// are presumably among the omitted ones -- confirm against the full file.
31 static void swap (__local RC4_KEY *rc4_key, const u8 i, const u8 j)
36 rc4_key->S[i] = rc4_key->S[j];
// RC4 key setup for the state in rc4_key, driven by the four u32 words of
// data[] (16 bytes of key material).
// NOTE(review): several lines of this function are not part of this excerpt
// (loop bodies, declarations of j / idx / v, the loads of v). The comments
// below describe only what the visible lines do.
40 static void rc4_init_16 (__local RC4_KEY *rc4_key, const u32 data[4])
// View the state array through a u32 pointer so it can be accessed one word
// at a time.
45 __local u32 *ptr = (__local u32 *) rc4_key->S;
// 64 iterations; the loop body is omitted here. Presumably it fills S through
// ptr (64 words * 4 bytes = 256 bytes) -- TODO confirm.
48 for (u32 i = 0; i < 64; i++)
// 16 passes of 16 unrolled steps = 256 steps. Each step adds S[idx] plus a
// term derived from v to j, calls swap (rc4_key, idx, j) and advances idx.
// The shift amounts 0/8/16/24 walk through the four bytes of v.
// NOTE(review): v is assigned on omitted lines (presumably data[0] .. data[3]
// in turn). Whether (v >> n) contributes a single byte depends on the declared
// type of j, which is not visible here.
56 for (u32 i = 0; i < 16; i++)
64 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
65 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
66 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
67 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
71 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
72 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
73 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
74 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
78 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
79 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
80 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
81 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
85 j += rc4_key->S[idx] + (v >> 0); swap (rc4_key, idx, j); idx++;
86 j += rc4_key->S[idx] + (v >> 8); swap (rc4_key, idx, j); idx++;
87 j += rc4_key->S[idx] + (v >> 16); swap (rc4_key, idx, j); idx++;
88 j += rc4_key->S[idx] + (v >> 24); swap (rc4_key, idx, j); idx++;
// Generates four 32-bit keystream words (16 bytes) from the RC4 state and
// XORs them onto in[], storing the result in out[].
//   rc4_key : RC4 state to read and update
//   i, j    : stream indices supplied by the caller
//   in, out : four input words and four output words
// Returns a u8. The callers in this file pass the value returned by the first
// call as the j argument of the second call, so it is presumably the updated
// j -- the return statement is not part of this excerpt.
// NOTE(review): the updates of i and j between the steps are on omitted lines.
92 static u8 rc4_next_16 (__local RC4_KEY *rc4_key, u8 i, u8 j, const u32 in[4], u32 out[4])
// One output word per iteration, assembled from four state lookups.
95 for (u32 k = 0; k < 4; k++)
// Step 1: looked-up value goes into bits 0..7 of xor4.
104 swap (rc4_key, i, j);
106 idx = rc4_key->S[i] + rc4_key->S[j];
108 xor4 |= rc4_key->S[idx] << 0;
// Step 2: bits 8..15.
113 swap (rc4_key, i, j);
115 idx = rc4_key->S[i] + rc4_key->S[j];
117 xor4 |= rc4_key->S[idx] << 8;
// Step 3: bits 16..23.
122 swap (rc4_key, i, j);
124 idx = rc4_key->S[i] + rc4_key->S[j];
126 xor4 |= rc4_key->S[idx] << 16;
// Step 4: bits 24..31.
131 swap (rc4_key, i, j);
133 idx = rc4_key->S[i] + rc4_key->S[j];
135 xor4 |= rc4_key->S[idx] << 24;
// Apply the assembled keystream word to the k-th input word.
137 out[k] = in[k] ^ xor4;
// MD5 block transform: processes the sixteen message words passed as
// w0[4] .. w3[4] against the four-word state in digest[].
// NOTE(review): only the 64 MD5_STEP invocations are visible in this excerpt.
// The loading of a, b, c, d and of w0_t .. wf_t, and the final update of
// digest[], are on omitted lines. MD5_STEP, the round functions and the
// MD5Cxx / MD5Sxx constants are defined outside this file.
143 static void md5_transform (const u32 w0[4], const u32 w1[4], const u32 w2[4], const u32 w3[4], u32 digest[4])
// Group 1: 16 steps with MD5_Fo, message words taken in order w0_t .. wf_t.
167 MD5_STEP (MD5_Fo, a, b, c, d, w0_t, MD5C00, MD5S00);
168 MD5_STEP (MD5_Fo, d, a, b, c, w1_t, MD5C01, MD5S01);
169 MD5_STEP (MD5_Fo, c, d, a, b, w2_t, MD5C02, MD5S02);
170 MD5_STEP (MD5_Fo, b, c, d, a, w3_t, MD5C03, MD5S03);
171 MD5_STEP (MD5_Fo, a, b, c, d, w4_t, MD5C04, MD5S00);
172 MD5_STEP (MD5_Fo, d, a, b, c, w5_t, MD5C05, MD5S01);
173 MD5_STEP (MD5_Fo, c, d, a, b, w6_t, MD5C06, MD5S02);
174 MD5_STEP (MD5_Fo, b, c, d, a, w7_t, MD5C07, MD5S03);
175 MD5_STEP (MD5_Fo, a, b, c, d, w8_t, MD5C08, MD5S00);
176 MD5_STEP (MD5_Fo, d, a, b, c, w9_t, MD5C09, MD5S01);
177 MD5_STEP (MD5_Fo, c, d, a, b, wa_t, MD5C0a, MD5S02);
178 MD5_STEP (MD5_Fo, b, c, d, a, wb_t, MD5C0b, MD5S03);
179 MD5_STEP (MD5_Fo, a, b, c, d, wc_t, MD5C0c, MD5S00);
180 MD5_STEP (MD5_Fo, d, a, b, c, wd_t, MD5C0d, MD5S01);
181 MD5_STEP (MD5_Fo, c, d, a, b, we_t, MD5C0e, MD5S02);
182 MD5_STEP (MD5_Fo, b, c, d, a, wf_t, MD5C0f, MD5S03);
// Group 2: 16 steps with MD5_Go; message words start at w1_t and advance by
// five positions (mod 16) per step.
184 MD5_STEP (MD5_Go, a, b, c, d, w1_t, MD5C10, MD5S10);
185 MD5_STEP (MD5_Go, d, a, b, c, w6_t, MD5C11, MD5S11);
186 MD5_STEP (MD5_Go, c, d, a, b, wb_t, MD5C12, MD5S12);
187 MD5_STEP (MD5_Go, b, c, d, a, w0_t, MD5C13, MD5S13);
188 MD5_STEP (MD5_Go, a, b, c, d, w5_t, MD5C14, MD5S10);
189 MD5_STEP (MD5_Go, d, a, b, c, wa_t, MD5C15, MD5S11);
190 MD5_STEP (MD5_Go, c, d, a, b, wf_t, MD5C16, MD5S12);
191 MD5_STEP (MD5_Go, b, c, d, a, w4_t, MD5C17, MD5S13);
192 MD5_STEP (MD5_Go, a, b, c, d, w9_t, MD5C18, MD5S10);
193 MD5_STEP (MD5_Go, d, a, b, c, we_t, MD5C19, MD5S11);
194 MD5_STEP (MD5_Go, c, d, a, b, w3_t, MD5C1a, MD5S12);
195 MD5_STEP (MD5_Go, b, c, d, a, w8_t, MD5C1b, MD5S13);
196 MD5_STEP (MD5_Go, a, b, c, d, wd_t, MD5C1c, MD5S10);
197 MD5_STEP (MD5_Go, d, a, b, c, w2_t, MD5C1d, MD5S11);
198 MD5_STEP (MD5_Go, c, d, a, b, w7_t, MD5C1e, MD5S12);
199 MD5_STEP (MD5_Go, b, c, d, a, wc_t, MD5C1f, MD5S13);
// Group 3: 16 steps with MD5_H; message words start at w5_t and advance by
// three positions (mod 16) per step.
201 MD5_STEP (MD5_H , a, b, c, d, w5_t, MD5C20, MD5S20);
202 MD5_STEP (MD5_H , d, a, b, c, w8_t, MD5C21, MD5S21);
203 MD5_STEP (MD5_H , c, d, a, b, wb_t, MD5C22, MD5S22);
204 MD5_STEP (MD5_H , b, c, d, a, we_t, MD5C23, MD5S23);
205 MD5_STEP (MD5_H , a, b, c, d, w1_t, MD5C24, MD5S20);
206 MD5_STEP (MD5_H , d, a, b, c, w4_t, MD5C25, MD5S21);
207 MD5_STEP (MD5_H , c, d, a, b, w7_t, MD5C26, MD5S22);
208 MD5_STEP (MD5_H , b, c, d, a, wa_t, MD5C27, MD5S23);
209 MD5_STEP (MD5_H , a, b, c, d, wd_t, MD5C28, MD5S20);
210 MD5_STEP (MD5_H , d, a, b, c, w0_t, MD5C29, MD5S21);
211 MD5_STEP (MD5_H , c, d, a, b, w3_t, MD5C2a, MD5S22);
212 MD5_STEP (MD5_H , b, c, d, a, w6_t, MD5C2b, MD5S23);
213 MD5_STEP (MD5_H , a, b, c, d, w9_t, MD5C2c, MD5S20);
214 MD5_STEP (MD5_H , d, a, b, c, wc_t, MD5C2d, MD5S21);
215 MD5_STEP (MD5_H , c, d, a, b, wf_t, MD5C2e, MD5S22);
216 MD5_STEP (MD5_H , b, c, d, a, w2_t, MD5C2f, MD5S23);
// Group 4: 16 steps with MD5_I; message words start at w0_t and advance by
// seven positions (mod 16) per step.
218 MD5_STEP (MD5_I , a, b, c, d, w0_t, MD5C30, MD5S30);
219 MD5_STEP (MD5_I , d, a, b, c, w7_t, MD5C31, MD5S31);
220 MD5_STEP (MD5_I , c, d, a, b, we_t, MD5C32, MD5S32);
221 MD5_STEP (MD5_I , b, c, d, a, w5_t, MD5C33, MD5S33);
222 MD5_STEP (MD5_I , a, b, c, d, wc_t, MD5C34, MD5S30);
223 MD5_STEP (MD5_I , d, a, b, c, w3_t, MD5C35, MD5S31);
224 MD5_STEP (MD5_I , c, d, a, b, wa_t, MD5C36, MD5S32);
225 MD5_STEP (MD5_I , b, c, d, a, w1_t, MD5C37, MD5S33);
226 MD5_STEP (MD5_I , a, b, c, d, w8_t, MD5C38, MD5S30);
227 MD5_STEP (MD5_I , d, a, b, c, wf_t, MD5C39, MD5S31);
228 MD5_STEP (MD5_I , c, d, a, b, w6_t, MD5C3a, MD5S32);
229 MD5_STEP (MD5_I , b, c, d, a, wd_t, MD5C3b, MD5S33);
230 MD5_STEP (MD5_I , a, b, c, d, w4_t, MD5C3c, MD5S30);
231 MD5_STEP (MD5_I , d, a, b, c, wb_t, MD5C3d, MD5S31);
232 MD5_STEP (MD5_I , c, d, a, b, w2_t, MD5C3e, MD5S32);
233 MD5_STEP (MD5_I , b, c, d, a, w9_t, MD5C3f, MD5S33);
// Worker shared by the m09700_m04 / m09700_m08 / m09700_m16 kernels.
// For every entry of bfs_buf it: hashes the candidate with md5_transform,
// keeps 5 bytes of that digest, hashes a buffer built from 16 repetitions of
// (5 digest bytes + 16 salt bytes), derives an RC4 key, and runs the stored
// encryptedVerifier and a further MD5 digest through the RC4 stream. The four
// output words end up in r0 .. r3.
// NOTE(review): this excerpt omits many lines of the function (declarations,
// padding words, the code that consumes r0 .. r3). Comments below describe
// only the visible statements; anything else is marked as an assumption.
241 static void m09700m (__local RC4_KEY rc4_keys[64], u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 pw_len, __global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset)
247 const u32 gid = get_global_id (0);
248 const u32 lid = get_local_id (0);
// Each work-item uses the RC4 state slot selected by its local id.
250 __local RC4_KEY *rc4_key = &rc4_keys[lid];
// The four salt words (16 bytes) of the salt selected by salt_pos.
261 salt_buf_t0[0] = salt_bufs[salt_pos].salt_buf[0];
262 salt_buf_t0[1] = salt_bufs[salt_pos].salt_buf[1];
263 salt_buf_t0[2] = salt_bufs[salt_pos].salt_buf[2];
264 salt_buf_t0[3] = salt_bufs[salt_pos].salt_buf[3];
// salt_buf_t1: the same salt shifted up by 8 bits, carrying across word
// boundaries into a fifth word.
266 salt_buf_t1[0] = salt_buf_t0[0] << 8;
267 salt_buf_t1[1] = salt_buf_t0[0] >> 24 | salt_buf_t0[1] << 8;
268 salt_buf_t1[2] = salt_buf_t0[1] >> 24 | salt_buf_t0[2] << 8;
269 salt_buf_t1[3] = salt_buf_t0[2] >> 24 | salt_buf_t0[3] << 8;
270 salt_buf_t1[4] = salt_buf_t0[3] >> 24;
// salt_buf_t2: shifted up by 16 bits.
272 salt_buf_t2[0] = salt_buf_t0[0] << 16;
273 salt_buf_t2[1] = salt_buf_t0[0] >> 16 | salt_buf_t0[1] << 16;
274 salt_buf_t2[2] = salt_buf_t0[1] >> 16 | salt_buf_t0[2] << 16;
275 salt_buf_t2[3] = salt_buf_t0[2] >> 16 | salt_buf_t0[3] << 16;
276 salt_buf_t2[4] = salt_buf_t0[3] >> 16;
// salt_buf_t3: shifted up by 24 bits.
278 salt_buf_t3[0] = salt_buf_t0[0] << 24;
279 salt_buf_t3[1] = salt_buf_t0[0] >> 8 | salt_buf_t0[1] << 24;
280 salt_buf_t3[2] = salt_buf_t0[1] >> 8 | salt_buf_t0[2] << 24;
281 salt_buf_t3[3] = salt_buf_t0[2] >> 8 | salt_buf_t0[3] << 24;
282 salt_buf_t3[4] = salt_buf_t0[3] >> 8;
284 const u32 salt_len = 16;
// Per-salt data: the version field and the four words of the encrypted
// verifier.
290 const u32 version = oldoffice01_bufs[salt_pos].version;
292 u32 encryptedVerifier[4];
294 encryptedVerifier[0] = oldoffice01_bufs[salt_pos].encryptedVerifier[0];
295 encryptedVerifier[1] = oldoffice01_bufs[salt_pos].encryptedVerifier[1];
296 encryptedVerifier[2] = oldoffice01_bufs[salt_pos].encryptedVerifier[2];
297 encryptedVerifier[3] = oldoffice01_bufs[salt_pos].encryptedVerifier[3];
// Inner loop over the bfs_cnt entries of bfs_buf.
305 for (u32 il_pos = 0; il_pos < bfs_cnt; il_pos++)
// NOTE(review): w0r is presumably merged into the first candidate word on
// omitted lines -- confirm against the full file.
307 const u32 w0r = bfs_buf[il_pos].i;
// Candidate length in bits, stored in message word 14.
330 w3_t[2] = pw_len * 8;
334 u32 digest_t1[2]; // need only first 5 byte
// First MD5: start from the constants MD5M_A .. MD5M_D (defined outside this
// file) and process the candidate block.
338 digest_t0[0] = MD5M_A;
339 digest_t0[1] = MD5M_B;
340 digest_t0[2] = MD5M_C;
341 digest_t0[3] = MD5M_D;
343 md5_transform (w0_t, w1_t, w2_t, w3_t, digest_t0);
345 // prepare 16 * 21 buffer stuff
// Keep 40 bits of the digest: all of word 0 plus the low 8 bits of word 1.
356 digest_t0[0] &= 0xffffffff;
357 digest_t0[1] &= 0x000000ff;
358 digest_t0[2] &= 0x00000000;
359 digest_t0[3] &= 0x00000000;
// Copies of the 40-bit value shifted up by 8, 16 and 24 bits, mirroring the
// shifted salt copies above.
361 digest_t1[0] = digest_t0[0] << 8;
362 digest_t1[1] = digest_t0[0] >> 24 | digest_t0[1] << 8;
364 digest_t2[0] = digest_t0[0] << 16;
365 digest_t2[1] = digest_t0[0] >> 16 | digest_t0[1] << 16;
367 digest_t3[0] = digest_t0[0] << 24;
368 digest_t3[1] = digest_t0[0] >> 8 | digest_t0[1] << 24;
370 // generate the 16 * 21 buffer
// The 16 * 21 = 336 byte buffer is fed to md5_transform as five full 16-word
// blocks followed by a final partial block. Each block below is assembled by
// assigning / OR-ing the pre-shifted digest and salt copies into w0_t .. w3_t.
// Block 1.
390 w0_t[0] = digest_t0[0];
391 w0_t[1] = digest_t0[1];
394 w0_t[1] |= salt_buf_t1[0];
395 w0_t[2] = salt_buf_t1[1];
396 w0_t[3] = salt_buf_t1[2];
397 w1_t[0] = salt_buf_t1[3];
398 w1_t[1] = salt_buf_t1[4];
401 w1_t[1] |= digest_t1[0];
402 w1_t[2] = digest_t1[1];
405 w1_t[2] |= salt_buf_t2[0];
406 w1_t[3] = salt_buf_t2[1];
407 w2_t[0] = salt_buf_t2[2];
408 w2_t[1] = salt_buf_t2[3];
409 w2_t[2] = salt_buf_t2[4];
412 w2_t[2] |= digest_t2[0];
413 w2_t[3] = digest_t2[1];
416 w2_t[3] |= salt_buf_t3[0];
417 w3_t[0] = salt_buf_t3[1];
418 w3_t[1] = salt_buf_t3[2];
419 w3_t[2] = salt_buf_t3[3];
420 w3_t[3] = salt_buf_t3[4];
424 w3_t[3] |= digest_t3[0];
426 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 2: continues with the remainder of the 24-bit-shifted digest copy.
446 w0_t[0] = digest_t3[1];
449 w0_t[1] = salt_buf_t0[0];
450 w0_t[2] = salt_buf_t0[1];
451 w0_t[3] = salt_buf_t0[2];
452 w1_t[0] = salt_buf_t0[3];
455 w1_t[1] = digest_t0[0];
456 w1_t[2] = digest_t0[1];
459 w1_t[2] |= salt_buf_t1[0];
460 w1_t[3] = salt_buf_t1[1];
461 w2_t[0] = salt_buf_t1[2];
462 w2_t[1] = salt_buf_t1[3];
463 w2_t[2] = salt_buf_t1[4];
466 w2_t[2] |= digest_t1[0];
467 w2_t[3] = digest_t1[1];
470 w2_t[3] |= salt_buf_t2[0];
471 w3_t[0] = salt_buf_t2[1];
472 w3_t[1] = salt_buf_t2[2];
473 w3_t[2] = salt_buf_t2[3];
474 w3_t[3] = salt_buf_t2[4];
477 w3_t[3] |= digest_t2[0];
479 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 3: continues with the remainder of the 16-bit-shifted digest copy.
499 w0_t[0] = digest_t2[1];
502 w0_t[0] |= salt_buf_t3[0];
503 w0_t[1] = salt_buf_t3[1];
504 w0_t[2] = salt_buf_t3[2];
505 w0_t[3] = salt_buf_t3[3];
506 w1_t[0] = salt_buf_t3[4];
509 w1_t[0] |= digest_t3[0];
510 w1_t[1] = digest_t3[1];
513 w1_t[2] = salt_buf_t0[0];
514 w1_t[3] = salt_buf_t0[1];
515 w2_t[0] = salt_buf_t0[2];
516 w2_t[1] = salt_buf_t0[3];
519 w2_t[2] = digest_t0[0];
520 w2_t[3] = digest_t0[1];
523 w2_t[3] |= salt_buf_t1[0];
524 w3_t[0] = salt_buf_t1[1];
525 w3_t[1] = salt_buf_t1[2];
526 w3_t[2] = salt_buf_t1[3];
527 w3_t[3] = salt_buf_t1[4];
530 w3_t[3] |= digest_t1[0];
532 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 4: continues with the remainder of the 8-bit-shifted digest copy.
552 w0_t[0] = digest_t1[1];
555 w0_t[0] |= salt_buf_t2[0];
556 w0_t[1] = salt_buf_t2[1];
557 w0_t[2] = salt_buf_t2[2];
558 w0_t[3] = salt_buf_t2[3];
559 w1_t[0] = salt_buf_t2[4];
562 w1_t[0] |= digest_t2[0];
563 w1_t[1] = digest_t2[1];
566 w1_t[1] |= salt_buf_t3[0];
567 w1_t[2] = salt_buf_t3[1];
568 w1_t[3] = salt_buf_t3[2];
569 w2_t[0] = salt_buf_t3[3];
570 w2_t[1] = salt_buf_t3[4];
573 w2_t[1] |= digest_t3[0];
574 w2_t[2] = digest_t3[1];
577 w2_t[3] = salt_buf_t0[0];
578 w3_t[0] = salt_buf_t0[1];
579 w3_t[1] = salt_buf_t0[2];
580 w3_t[2] = salt_buf_t0[3];
583 w3_t[3] = digest_t0[0];
585 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 5: continues with the second word of the unshifted digest copy.
605 w0_t[0] = digest_t0[1];
608 w0_t[0] |= salt_buf_t1[0];
609 w0_t[1] = salt_buf_t1[1];
610 w0_t[2] = salt_buf_t1[2];
611 w0_t[3] = salt_buf_t1[3];
612 w1_t[0] = salt_buf_t1[4];
615 w1_t[0] |= digest_t1[0];
616 w1_t[1] = digest_t1[1];
619 w1_t[1] |= salt_buf_t2[0];
620 w1_t[2] = salt_buf_t2[1];
621 w1_t[3] = salt_buf_t2[2];
622 w2_t[0] = salt_buf_t2[3];
623 w2_t[1] = salt_buf_t2[4];
626 w2_t[1] |= digest_t2[0];
627 w2_t[2] = digest_t2[1];
630 w2_t[2] |= salt_buf_t3[0];
631 w2_t[3] = salt_buf_t3[1];
632 w3_t[0] = salt_buf_t3[2];
633 w3_t[1] = salt_buf_t3[3];
634 w3_t[2] = salt_buf_t3[4];
637 w3_t[2] |= digest_t3[0];
638 w3_t[3] = digest_t3[1];
640 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Final block: the last 16 salt bytes, then the total length in bits
// (21 * 16 * 8) in message word 14. The words in between are set on omitted
// lines (presumably padding -- TODO confirm).
642 w0_t[0] = salt_buf_t0[0];
643 w0_t[1] = salt_buf_t0[1];
644 w0_t[2] = salt_buf_t0[2];
645 w0_t[3] = salt_buf_t0[3];
656 w3_t[2] = 21 * 16 * 8;
659 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
661 // now the 40 bit input for the MD5 which then will generate the RC4 key, so it's precomputable!
// NOTE(review): m09700s also shows `w0_t[0] = digest[0];` immediately before
// the next statement; that line is not visible here. Confirm it exists in the
// full file, otherwise w0_t[0] would still hold salt_buf_t0[0].
664 w0_t[1] = digest[1] & 0xff;
685 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Set up the RC4 state from key[] (filled on omitted lines, presumably from
// the digest just computed -- TODO confirm).
696 rc4_init_16 (rc4_key, key);
// First 16 stream bytes (i = 0, j = 0) are XORed onto encryptedVerifier; the
// returned value is kept so the stream can be continued below.
700 u8 j = rc4_next_16 (rc4_key, 0, 0, encryptedVerifier, out);
// MD5 over a block prepared on omitted lines (presumably built from out[]).
724 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Continue the stream at i = 16 with the saved j and XOR it onto that digest.
726 rc4_next_16 (rc4_key, 16, j, digest, out);
// Result words; the comparison code that consumes r0 .. r3 is not part of
// this excerpt.
728 const u32 r0 = out[0];
729 const u32 r1 = out[1];
730 const u32 r2 = out[2];
731 const u32 r3 = out[3];
// Worker shared by the m09700_s04 / m09700_s08 / m09700_s16 kernels.
// The visible statements follow the same sequence as m09700m, with one
// addition: the four target digest words at digests_offset are loaded into
// search[] up front.
// For every entry of bfs_buf it: hashes the candidate with md5_transform,
// keeps 5 bytes of that digest, hashes a buffer built from 16 repetitions of
// (5 digest bytes + 16 salt bytes), derives an RC4 key, and runs the stored
// encryptedVerifier and a further MD5 digest through the RC4 stream. The four
// output words end up in r0 .. r3.
// NOTE(review): this excerpt omits many lines of the function (declarations,
// padding words, the code that consumes r0 .. r3 and search[]). Comments
// below describe only the visible statements.
737 static void m09700s (__local RC4_KEY rc4_keys[64], u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 pw_len, __global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset)
743 const u32 gid = get_global_id (0);
744 const u32 lid = get_local_id (0);
// Each work-item uses the RC4 state slot selected by its local id.
746 __local RC4_KEY *rc4_key = &rc4_keys[lid];
// The four words of the single target digest, in DGST_R0 .. DGST_R3 order.
// NOTE(review): presumably consumed by the comparison code on omitted lines.
752 const u32 search[4] =
754 digests_buf[digests_offset].digest_buf[DGST_R0],
755 digests_buf[digests_offset].digest_buf[DGST_R1],
756 digests_buf[digests_offset].digest_buf[DGST_R2],
757 digests_buf[digests_offset].digest_buf[DGST_R3]
// The four salt words (16 bytes) of the salt selected by salt_pos.
769 salt_buf_t0[0] = salt_bufs[salt_pos].salt_buf[0];
770 salt_buf_t0[1] = salt_bufs[salt_pos].salt_buf[1];
771 salt_buf_t0[2] = salt_bufs[salt_pos].salt_buf[2];
772 salt_buf_t0[3] = salt_bufs[salt_pos].salt_buf[3];
// salt_buf_t1: the same salt shifted up by 8 bits, carrying across word
// boundaries into a fifth word.
774 salt_buf_t1[0] = salt_buf_t0[0] << 8;
775 salt_buf_t1[1] = salt_buf_t0[0] >> 24 | salt_buf_t0[1] << 8;
776 salt_buf_t1[2] = salt_buf_t0[1] >> 24 | salt_buf_t0[2] << 8;
777 salt_buf_t1[3] = salt_buf_t0[2] >> 24 | salt_buf_t0[3] << 8;
778 salt_buf_t1[4] = salt_buf_t0[3] >> 24;
// salt_buf_t2: shifted up by 16 bits.
780 salt_buf_t2[0] = salt_buf_t0[0] << 16;
781 salt_buf_t2[1] = salt_buf_t0[0] >> 16 | salt_buf_t0[1] << 16;
782 salt_buf_t2[2] = salt_buf_t0[1] >> 16 | salt_buf_t0[2] << 16;
783 salt_buf_t2[3] = salt_buf_t0[2] >> 16 | salt_buf_t0[3] << 16;
784 salt_buf_t2[4] = salt_buf_t0[3] >> 16;
// salt_buf_t3: shifted up by 24 bits.
786 salt_buf_t3[0] = salt_buf_t0[0] << 24;
787 salt_buf_t3[1] = salt_buf_t0[0] >> 8 | salt_buf_t0[1] << 24;
788 salt_buf_t3[2] = salt_buf_t0[1] >> 8 | salt_buf_t0[2] << 24;
789 salt_buf_t3[3] = salt_buf_t0[2] >> 8 | salt_buf_t0[3] << 24;
790 salt_buf_t3[4] = salt_buf_t0[3] >> 8;
792 const u32 salt_len = 16;
// Per-salt data: the version field and the four words of the encrypted
// verifier.
798 const u32 version = oldoffice01_bufs[salt_pos].version;
800 u32 encryptedVerifier[4];
802 encryptedVerifier[0] = oldoffice01_bufs[salt_pos].encryptedVerifier[0];
803 encryptedVerifier[1] = oldoffice01_bufs[salt_pos].encryptedVerifier[1];
804 encryptedVerifier[2] = oldoffice01_bufs[salt_pos].encryptedVerifier[2];
805 encryptedVerifier[3] = oldoffice01_bufs[salt_pos].encryptedVerifier[3];
// Inner loop over the bfs_cnt entries of bfs_buf.
813 for (u32 il_pos = 0; il_pos < bfs_cnt; il_pos++)
// NOTE(review): w0r is presumably merged into the first candidate word on
// omitted lines -- confirm against the full file.
815 const u32 w0r = bfs_buf[il_pos].i;
// Candidate length in bits, stored in message word 14.
838 w3_t[2] = pw_len * 8;
842 u32 digest_t1[2]; // need only first 5 byte
// First MD5: start from the constants MD5M_A .. MD5M_D (defined outside this
// file) and process the candidate block.
846 digest_t0[0] = MD5M_A;
847 digest_t0[1] = MD5M_B;
848 digest_t0[2] = MD5M_C;
849 digest_t0[3] = MD5M_D;
851 md5_transform (w0_t, w1_t, w2_t, w3_t, digest_t0);
853 // prepare 16 * 21 buffer stuff
// Keep 40 bits of the digest: all of word 0 plus the low 8 bits of word 1.
864 digest_t0[0] &= 0xffffffff;
865 digest_t0[1] &= 0x000000ff;
866 digest_t0[2] &= 0x00000000;
867 digest_t0[3] &= 0x00000000;
// Copies of the 40-bit value shifted up by 8, 16 and 24 bits, mirroring the
// shifted salt copies above.
869 digest_t1[0] = digest_t0[0] << 8;
870 digest_t1[1] = digest_t0[0] >> 24 | digest_t0[1] << 8;
872 digest_t2[0] = digest_t0[0] << 16;
873 digest_t2[1] = digest_t0[0] >> 16 | digest_t0[1] << 16;
875 digest_t3[0] = digest_t0[0] << 24;
876 digest_t3[1] = digest_t0[0] >> 8 | digest_t0[1] << 24;
878 // generate the 16 * 21 buffer
// The 16 * 21 = 336 byte buffer is fed to md5_transform as five full 16-word
// blocks followed by a final partial block. Each block below is assembled by
// assigning / OR-ing the pre-shifted digest and salt copies into w0_t .. w3_t.
// Block 1.
898 w0_t[0] = digest_t0[0];
899 w0_t[1] = digest_t0[1];
902 w0_t[1] |= salt_buf_t1[0];
903 w0_t[2] = salt_buf_t1[1];
904 w0_t[3] = salt_buf_t1[2];
905 w1_t[0] = salt_buf_t1[3];
906 w1_t[1] = salt_buf_t1[4];
909 w1_t[1] |= digest_t1[0];
910 w1_t[2] = digest_t1[1];
913 w1_t[2] |= salt_buf_t2[0];
914 w1_t[3] = salt_buf_t2[1];
915 w2_t[0] = salt_buf_t2[2];
916 w2_t[1] = salt_buf_t2[3];
917 w2_t[2] = salt_buf_t2[4];
920 w2_t[2] |= digest_t2[0];
921 w2_t[3] = digest_t2[1];
924 w2_t[3] |= salt_buf_t3[0];
925 w3_t[0] = salt_buf_t3[1];
926 w3_t[1] = salt_buf_t3[2];
927 w3_t[2] = salt_buf_t3[3];
928 w3_t[3] = salt_buf_t3[4];
932 w3_t[3] |= digest_t3[0];
934 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 2: continues with the remainder of the 24-bit-shifted digest copy.
954 w0_t[0] = digest_t3[1];
957 w0_t[1] = salt_buf_t0[0];
958 w0_t[2] = salt_buf_t0[1];
959 w0_t[3] = salt_buf_t0[2];
960 w1_t[0] = salt_buf_t0[3];
963 w1_t[1] = digest_t0[0];
964 w1_t[2] = digest_t0[1];
967 w1_t[2] |= salt_buf_t1[0];
968 w1_t[3] = salt_buf_t1[1];
969 w2_t[0] = salt_buf_t1[2];
970 w2_t[1] = salt_buf_t1[3];
971 w2_t[2] = salt_buf_t1[4];
974 w2_t[2] |= digest_t1[0];
975 w2_t[3] = digest_t1[1];
978 w2_t[3] |= salt_buf_t2[0];
979 w3_t[0] = salt_buf_t2[1];
980 w3_t[1] = salt_buf_t2[2];
981 w3_t[2] = salt_buf_t2[3];
982 w3_t[3] = salt_buf_t2[4];
985 w3_t[3] |= digest_t2[0];
987 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 3: continues with the remainder of the 16-bit-shifted digest copy.
1007 w0_t[0] = digest_t2[1];
1010 w0_t[0] |= salt_buf_t3[0];
1011 w0_t[1] = salt_buf_t3[1];
1012 w0_t[2] = salt_buf_t3[2];
1013 w0_t[3] = salt_buf_t3[3];
1014 w1_t[0] = salt_buf_t3[4];
1017 w1_t[0] |= digest_t3[0];
1018 w1_t[1] = digest_t3[1];
1021 w1_t[2] = salt_buf_t0[0];
1022 w1_t[3] = salt_buf_t0[1];
1023 w2_t[0] = salt_buf_t0[2];
1024 w2_t[1] = salt_buf_t0[3];
1027 w2_t[2] = digest_t0[0];
1028 w2_t[3] = digest_t0[1];
1031 w2_t[3] |= salt_buf_t1[0];
1032 w3_t[0] = salt_buf_t1[1];
1033 w3_t[1] = salt_buf_t1[2];
1034 w3_t[2] = salt_buf_t1[3];
1035 w3_t[3] = salt_buf_t1[4];
1038 w3_t[3] |= digest_t1[0];
1040 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 4: continues with the remainder of the 8-bit-shifted digest copy.
1060 w0_t[0] = digest_t1[1];
1063 w0_t[0] |= salt_buf_t2[0];
1064 w0_t[1] = salt_buf_t2[1];
1065 w0_t[2] = salt_buf_t2[2];
1066 w0_t[3] = salt_buf_t2[3];
1067 w1_t[0] = salt_buf_t2[4];
1070 w1_t[0] |= digest_t2[0];
1071 w1_t[1] = digest_t2[1];
1074 w1_t[1] |= salt_buf_t3[0];
1075 w1_t[2] = salt_buf_t3[1];
1076 w1_t[3] = salt_buf_t3[2];
1077 w2_t[0] = salt_buf_t3[3];
1078 w2_t[1] = salt_buf_t3[4];
1081 w2_t[1] |= digest_t3[0];
1082 w2_t[2] = digest_t3[1];
1085 w2_t[3] = salt_buf_t0[0];
1086 w3_t[0] = salt_buf_t0[1];
1087 w3_t[1] = salt_buf_t0[2];
1088 w3_t[2] = salt_buf_t0[3];
1091 w3_t[3] = digest_t0[0];
1093 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Block 5: continues with the second word of the unshifted digest copy.
1113 w0_t[0] = digest_t0[1];
1116 w0_t[0] |= salt_buf_t1[0];
1117 w0_t[1] = salt_buf_t1[1];
1118 w0_t[2] = salt_buf_t1[2];
1119 w0_t[3] = salt_buf_t1[3];
1120 w1_t[0] = salt_buf_t1[4];
1123 w1_t[0] |= digest_t1[0];
1124 w1_t[1] = digest_t1[1];
1127 w1_t[1] |= salt_buf_t2[0];
1128 w1_t[2] = salt_buf_t2[1];
1129 w1_t[3] = salt_buf_t2[2];
1130 w2_t[0] = salt_buf_t2[3];
1131 w2_t[1] = salt_buf_t2[4];
1134 w2_t[1] |= digest_t2[0];
1135 w2_t[2] = digest_t2[1];
1138 w2_t[2] |= salt_buf_t3[0];
1139 w2_t[3] = salt_buf_t3[1];
1140 w3_t[0] = salt_buf_t3[2];
1141 w3_t[1] = salt_buf_t3[3];
1142 w3_t[2] = salt_buf_t3[4];
1145 w3_t[2] |= digest_t3[0];
1146 w3_t[3] = digest_t3[1];
1148 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Final block: the last 16 salt bytes, then the total length in bits
// (21 * 16 * 8) in message word 14. The words in between are set on omitted
// lines (presumably padding -- TODO confirm).
1150 w0_t[0] = salt_buf_t0[0];
1151 w0_t[1] = salt_buf_t0[1];
1152 w0_t[2] = salt_buf_t0[2];
1153 w0_t[3] = salt_buf_t0[3];
1164 w3_t[2] = 21 * 16 * 8;
1167 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
1169 // now the 40 bit input for the MD5 which then will generate the RC4 key, so it's precomputable!
// 40 bits of the digest: word 0 plus the low 8 bits of word 1.
1171 w0_t[0] = digest[0];
1172 w0_t[1] = digest[1] & 0xff;
1193 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Set up the RC4 state from key[] (filled on omitted lines, presumably from
// the digest just computed -- TODO confirm).
1204 rc4_init_16 (rc4_key, key);
// First 16 stream bytes (i = 0, j = 0) are XORed onto encryptedVerifier; the
// returned value is kept so the stream can be continued below.
1208 u8 j = rc4_next_16 (rc4_key, 0, 0, encryptedVerifier, out);
// MD5 over a block prepared on omitted lines (presumably built from out[]).
1232 md5_transform (w0_t, w1_t, w2_t, w3_t, digest);
// Continue the stream at i = 16 with the saved j and XOR it onto that digest.
1234 rc4_next_16 (rc4_key, 16, j, digest, out);
// Result words; the comparison code that consumes r0 .. r3 is not part of
// this excerpt.
1236 const u32 r0 = out[0];
1237 const u32 r1 = out[1];
1238 const u32 r2 = out[2];
1239 const u32 r3 = out[3];
// Kernel entry point (required work-group size 64 x 1 x 1) that forwards to
// m09700m. The visible lines load candidate words i[0] .. i[3] into w0.
// NOTE(review): the declarations and initial values of w1 .. w3 are on omitted
// lines of this excerpt.
1245 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m09700_m04 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1251 const u32 gid = get_global_id (0);
// Work-items whose global id is at or beyond gid_max do nothing.
1253 if (gid >= gid_max) return;
1257 w0[0] = pws[gid].i[ 0];
1258 w0[1] = pws[gid].i[ 1];
1259 w0[2] = pws[gid].i[ 2];
1260 w0[3] = pws[gid].i[ 3];
1283 const u32 pw_len = pws[gid].pw_len;
// One RC4 state per work-item of the 64-wide work-group; m09700m selects the
// slot by local id.
1289 __local RC4_KEY rc4_keys[64];
1291 m09700m (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
// Kernel entry point (required work-group size 64 x 1 x 1) that forwards to
// m09700m. The visible lines load candidate words i[0] .. i[7] into w0 and w1.
// NOTE(review): the declarations and initial values of w2 and w3 are on
// omitted lines of this excerpt.
1294 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m09700_m08 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1300 const u32 gid = get_global_id (0);
// Work-items whose global id is at or beyond gid_max do nothing.
1302 if (gid >= gid_max) return;
1306 w0[0] = pws[gid].i[ 0];
1307 w0[1] = pws[gid].i[ 1];
1308 w0[2] = pws[gid].i[ 2];
1309 w0[3] = pws[gid].i[ 3];
1313 w1[0] = pws[gid].i[ 4];
1314 w1[1] = pws[gid].i[ 5];
1315 w1[2] = pws[gid].i[ 6];
1316 w1[3] = pws[gid].i[ 7];
1332 const u32 pw_len = pws[gid].pw_len;
// One RC4 state per work-item of the 64-wide work-group; m09700m selects the
// slot by local id.
1338 __local RC4_KEY rc4_keys[64];
1340 m09700m (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
// Kernel entry point (required work-group size 64 x 1 x 1) that forwards to
// m09700m. The visible lines load candidate words i[0] .. i[13] into w0, w1,
// w2 and the first two words of w3.
// NOTE(review): the initial values of w3[2] and w3[3] are on omitted lines of
// this excerpt.
1343 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m09700_m16 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1349 const u32 gid = get_global_id (0);
// Work-items whose global id is at or beyond gid_max do nothing.
1351 if (gid >= gid_max) return;
1355 w0[0] = pws[gid].i[ 0];
1356 w0[1] = pws[gid].i[ 1];
1357 w0[2] = pws[gid].i[ 2];
1358 w0[3] = pws[gid].i[ 3];
1362 w1[0] = pws[gid].i[ 4];
1363 w1[1] = pws[gid].i[ 5];
1364 w1[2] = pws[gid].i[ 6];
1365 w1[3] = pws[gid].i[ 7];
1369 w2[0] = pws[gid].i[ 8];
1370 w2[1] = pws[gid].i[ 9];
1371 w2[2] = pws[gid].i[10];
1372 w2[3] = pws[gid].i[11];
1376 w3[0] = pws[gid].i[12];
1377 w3[1] = pws[gid].i[13];
1381 const u32 pw_len = pws[gid].pw_len;
// One RC4 state per work-item of the 64-wide work-group; m09700m selects the
// slot by local id.
1387 __local RC4_KEY rc4_keys[64];
1389 m09700m (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
// Kernel entry point (required work-group size 64 x 1 x 1) that forwards to
// m09700s. The visible lines load candidate words i[0] .. i[3] into w0.
// NOTE(review): the declarations and initial values of w1 .. w3 are on omitted
// lines of this excerpt.
1392 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m09700_s04 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1398 const u32 gid = get_global_id (0);
// Work-items whose global id is at or beyond gid_max do nothing.
1400 if (gid >= gid_max) return;
1404 w0[0] = pws[gid].i[ 0];
1405 w0[1] = pws[gid].i[ 1];
1406 w0[2] = pws[gid].i[ 2];
1407 w0[3] = pws[gid].i[ 3];
1430 const u32 pw_len = pws[gid].pw_len;
// One RC4 state per work-item of the 64-wide work-group; m09700s selects the
// slot by local id.
1436 __local RC4_KEY rc4_keys[64];
1438 m09700s (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
// Kernel entry point (required work-group size 64 x 1 x 1) that forwards to
// m09700s. The visible lines load candidate words i[0] .. i[7] into w0 and w1.
// NOTE(review): the declarations and initial values of w2 and w3 are on
// omitted lines of this excerpt.
1441 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m09700_s08 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1447 const u32 gid = get_global_id (0);
// Work-items whose global id is at or beyond gid_max do nothing.
1449 if (gid >= gid_max) return;
1453 w0[0] = pws[gid].i[ 0];
1454 w0[1] = pws[gid].i[ 1];
1455 w0[2] = pws[gid].i[ 2];
1456 w0[3] = pws[gid].i[ 3];
1460 w1[0] = pws[gid].i[ 4];
1461 w1[1] = pws[gid].i[ 5];
1462 w1[2] = pws[gid].i[ 6];
1463 w1[3] = pws[gid].i[ 7];
1479 const u32 pw_len = pws[gid].pw_len;
// One RC4 state per work-item of the 64-wide work-group; m09700s selects the
// slot by local id.
1485 __local RC4_KEY rc4_keys[64];
1487 m09700s (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
// Kernel entry point (required work-group size 64 x 1 x 1) that forwards to
// m09700s. The visible lines load candidate words i[0] .. i[13] into w0, w1,
// w2 and the first two words of w3.
// NOTE(review): the initial values of w3[2] and w3[3] are on omitted lines of
// this excerpt.
1490 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m09700_s16 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global oldoffice01_t *oldoffice01_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1496 const u32 gid = get_global_id (0);
// Work-items whose global id is at or beyond gid_max do nothing.
1498 if (gid >= gid_max) return;
1502 w0[0] = pws[gid].i[ 0];
1503 w0[1] = pws[gid].i[ 1];
1504 w0[2] = pws[gid].i[ 2];
1505 w0[3] = pws[gid].i[ 3];
1509 w1[0] = pws[gid].i[ 4];
1510 w1[1] = pws[gid].i[ 5];
1511 w1[2] = pws[gid].i[ 6];
1512 w1[3] = pws[gid].i[ 7];
1516 w2[0] = pws[gid].i[ 8];
1517 w2[1] = pws[gid].i[ 9];
1518 w2[2] = pws[gid].i[10];
1519 w2[3] = pws[gid].i[11];
1523 w3[0] = pws[gid].i[12];
1524 w3[1] = pws[gid].i[13];
1528 const u32 pw_len = pws[gid].pw_len;
// One RC4 state per work-item of the 64-wide work-group; m09700s selects the
// slot by local id.
1534 __local RC4_KEY rc4_keys[64];
1536 m09700s (rc4_keys, w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, bfs_buf, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, oldoffice01_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);