2 * Author......: Jens Steube <jens.steube@gmail.com>
10 #include "include/constants.h"
11 #include "include/kernel_vendor.h"
18 #include "include/kernel_functions.c"
20 #include "OpenCL/types_ocl.c"
21 #include "OpenCL/common.c"
22 #include "OpenCL/simd.c"
/* Expands to a plain lookup of entry (i) in l_bin2asc, so a table with that */
/* name must be in scope at every use. The kernels in this file declare it in */
/* __local memory and fill entry i with the two lowercase hex digits of byte i. */
24 #define uint_to_hex_lower8_le(i) l_bin2asc[(i)]
/* Kernel m04700_m04. */
/* For every candidate read from combs_buf, the work-item merges its own pws */
/* entry with that candidate, runs 64 MD5_STEP invocations over the merged */
/* words, turns the resulting a, b, c, d into lowercase hex text through */
/* l_bin2asc, runs 80 SHA1_STEP invocations over that text and finally hands */
/* the state to COMPARE_M_SIMD. */
/* Parameters used by the visible code: pws, combs_buf, combs_cnt, combs_mode */
/* and gid_max. NOTE(review): the remaining parameters are presumably consumed */
/* inside COMPARE_M_SIMD - confirm against its definition. */
26 __kernel void m04700_m04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 combs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Work-item coordinates: global id, id inside the work-group, work-group size. */
32 const u32 gid = get_global_id (0);
33 const u32 lid = get_local_id (0);
34 const u32 lsz = get_local_size (0);
/* Byte-to-hex lookup table kept in __local memory, one entry per byte value. */
40 __local u32 l_bin2asc[256];
/* The table is filled cooperatively: each work-item starts at its local id */
/* and advances by the work-group size. */
42 for (u32 i = lid; i < 256; i += lsz)
/* i0 is the low nibble of i, i1 the high nibble. */
44 const u32 i0 = (i >> 0) & 15;
45 const u32 i1 = (i >> 4) & 15;
/* Low-nibble character lands in bits 0-7, high-nibble character in bits 8-15. */
47 l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 0
48 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 8;
/* Wait until the whole work-group has finished writing the table. */
51 barrier (CLK_LOCAL_MEM_FENCE);
/* The range check comes only after the barrier, so surplus work-items still */
/* take part in the table fill and the barrier before leaving. */
53 if (gid >= gid_max) return;
/* Copy words i[0..7] of this work-item's pws entry into pws0 and pws1. */
62 pws0[0] = pws[gid].i[0];
63 pws0[1] = pws[gid].i[1];
64 pws0[2] = pws[gid].i[2];
65 pws0[3] = pws[gid].i[3];
66 pws1[0] = pws[gid].i[4];
67 pws1[1] = pws[gid].i[5];
68 pws1[2] = pws[gid].i[6];
69 pws1[3] = pws[gid].i[7];
/* pw_len stored with this work-item's pws entry. */
71 const u32 pw_l_len = pws[gid].pw_len;
/* Visit the combs_buf positions 0 .. combs_cnt-1 in strides of VECT_SIZE. */
77 for (u32 il_pos = 0; il_pos < combs_cnt; il_pos += VECT_SIZE)
/* Length obtained from combs_buf for this position, then the combined length. */
79 const u32x pw_r_len = pwlenx_create_combt (combs_buf, il_pos);
81 const u32x pw_len = pw_l_len + pw_r_len;
/* Four zero-initialised buffers; only wordr0 and wordr1 (eight words in */
/* total) are loaded from combs_buf below. */
83 u32x wordr0[4] = { 0 };
84 u32x wordr1[4] = { 0 };
85 u32x wordr2[4] = { 0 };
86 u32x wordr3[4] = { 0 };
88 wordr0[0] = ix_create_combt (combs_buf, il_pos, 0);
89 wordr0[1] = ix_create_combt (combs_buf, il_pos, 1);
90 wordr0[2] = ix_create_combt (combs_buf, il_pos, 2);
91 wordr0[3] = ix_create_combt (combs_buf, il_pos, 3);
92 wordr1[0] = ix_create_combt (combs_buf, il_pos, 4);
93 wordr1[1] = ix_create_combt (combs_buf, il_pos, 5);
94 wordr1[2] = ix_create_combt (combs_buf, il_pos, 6);
95 wordr1[3] = ix_create_combt (combs_buf, il_pos, 7);
/* NOTE(review): going by the helper names, this appends a 0x80 marker after */
/* pw_r_len bytes of the wordr data and then shifts that data by pw_l_len */
/* bytes so it can follow the other word - confirm against the helpers. */
97 if (combs_mode == COMBINATOR_MODE_BASE_LEFT)
99 append_0x80_2x4 (wordr0, wordr1, pw_r_len);
101 switch_buffer_by_offset_le (wordr0, wordr1, wordr2, wordr3, pw_l_len);
/* OR the wordl and wordr buffers together word by word to form w0..w3. */
106 w0[0] = wordl0[0] | wordr0[0];
107 w0[1] = wordl0[1] | wordr0[1];
108 w0[2] = wordl0[2] | wordr0[2];
109 w0[3] = wordl0[3] | wordr0[3];
113 w1[0] = wordl1[0] | wordr1[0];
114 w1[1] = wordl1[1] | wordr1[1];
115 w1[2] = wordl1[2] | wordr1[2];
116 w1[3] = wordl1[3] | wordr1[3];
120 w2[0] = wordl2[0] | wordr2[0];
121 w2[1] = wordl2[1] | wordr2[1];
122 w2[2] = wordl2[2] | wordr2[2];
123 w2[3] = wordl2[3] | wordr2[3];
127 w3[0] = wordl3[0] | wordr3[0];
128 w3[1] = wordl3[1] | wordr3[1];
/* MD5 steps 1-16, using MD5_Fo; the words are consumed in order w0[0]..w3[3]. */
141 MD5_STEP (MD5_Fo, a, b, c, d, w0[0], MD5C00, MD5S00);
142 MD5_STEP (MD5_Fo, d, a, b, c, w0[1], MD5C01, MD5S01);
143 MD5_STEP (MD5_Fo, c, d, a, b, w0[2], MD5C02, MD5S02);
144 MD5_STEP (MD5_Fo, b, c, d, a, w0[3], MD5C03, MD5S03);
145 MD5_STEP (MD5_Fo, a, b, c, d, w1[0], MD5C04, MD5S00);
146 MD5_STEP (MD5_Fo, d, a, b, c, w1[1], MD5C05, MD5S01);
147 MD5_STEP (MD5_Fo, c, d, a, b, w1[2], MD5C06, MD5S02);
148 MD5_STEP (MD5_Fo, b, c, d, a, w1[3], MD5C07, MD5S03);
149 MD5_STEP (MD5_Fo, a, b, c, d, w2[0], MD5C08, MD5S00);
150 MD5_STEP (MD5_Fo, d, a, b, c, w2[1], MD5C09, MD5S01);
151 MD5_STEP (MD5_Fo, c, d, a, b, w2[2], MD5C0a, MD5S02);
152 MD5_STEP (MD5_Fo, b, c, d, a, w2[3], MD5C0b, MD5S03);
153 MD5_STEP (MD5_Fo, a, b, c, d, w3[0], MD5C0c, MD5S00);
154 MD5_STEP (MD5_Fo, d, a, b, c, w3[1], MD5C0d, MD5S01);
155 MD5_STEP (MD5_Fo, c, d, a, b, w3[2], MD5C0e, MD5S02);
156 MD5_STEP (MD5_Fo, b, c, d, a, w3[3], MD5C0f, MD5S03);
/* MD5 steps 17-32, using MD5_Go. */
158 MD5_STEP (MD5_Go, a, b, c, d, w0[1], MD5C10, MD5S10);
159 MD5_STEP (MD5_Go, d, a, b, c, w1[2], MD5C11, MD5S11);
160 MD5_STEP (MD5_Go, c, d, a, b, w2[3], MD5C12, MD5S12);
161 MD5_STEP (MD5_Go, b, c, d, a, w0[0], MD5C13, MD5S13);
162 MD5_STEP (MD5_Go, a, b, c, d, w1[1], MD5C14, MD5S10);
163 MD5_STEP (MD5_Go, d, a, b, c, w2[2], MD5C15, MD5S11);
164 MD5_STEP (MD5_Go, c, d, a, b, w3[3], MD5C16, MD5S12);
165 MD5_STEP (MD5_Go, b, c, d, a, w1[0], MD5C17, MD5S13);
166 MD5_STEP (MD5_Go, a, b, c, d, w2[1], MD5C18, MD5S10);
167 MD5_STEP (MD5_Go, d, a, b, c, w3[2], MD5C19, MD5S11);
168 MD5_STEP (MD5_Go, c, d, a, b, w0[3], MD5C1a, MD5S12);
169 MD5_STEP (MD5_Go, b, c, d, a, w2[0], MD5C1b, MD5S13);
170 MD5_STEP (MD5_Go, a, b, c, d, w3[1], MD5C1c, MD5S10);
171 MD5_STEP (MD5_Go, d, a, b, c, w0[2], MD5C1d, MD5S11);
172 MD5_STEP (MD5_Go, c, d, a, b, w1[3], MD5C1e, MD5S12);
173 MD5_STEP (MD5_Go, b, c, d, a, w3[0], MD5C1f, MD5S13);
/* MD5 steps 33-48, using MD5_H. */
175 MD5_STEP (MD5_H , a, b, c, d, w1[1], MD5C20, MD5S20);
176 MD5_STEP (MD5_H , d, a, b, c, w2[0], MD5C21, MD5S21);
177 MD5_STEP (MD5_H , c, d, a, b, w2[3], MD5C22, MD5S22);
178 MD5_STEP (MD5_H , b, c, d, a, w3[2], MD5C23, MD5S23);
179 MD5_STEP (MD5_H , a, b, c, d, w0[1], MD5C24, MD5S20);
180 MD5_STEP (MD5_H , d, a, b, c, w1[0], MD5C25, MD5S21);
181 MD5_STEP (MD5_H , c, d, a, b, w1[3], MD5C26, MD5S22);
182 MD5_STEP (MD5_H , b, c, d, a, w2[2], MD5C27, MD5S23);
183 MD5_STEP (MD5_H , a, b, c, d, w3[1], MD5C28, MD5S20);
184 MD5_STEP (MD5_H , d, a, b, c, w0[0], MD5C29, MD5S21);
185 MD5_STEP (MD5_H , c, d, a, b, w0[3], MD5C2a, MD5S22);
186 MD5_STEP (MD5_H , b, c, d, a, w1[2], MD5C2b, MD5S23);
187 MD5_STEP (MD5_H , a, b, c, d, w2[1], MD5C2c, MD5S20);
188 MD5_STEP (MD5_H , d, a, b, c, w3[0], MD5C2d, MD5S21);
189 MD5_STEP (MD5_H , c, d, a, b, w3[3], MD5C2e, MD5S22);
190 MD5_STEP (MD5_H , b, c, d, a, w0[2], MD5C2f, MD5S23);
/* MD5 steps 49-64, using MD5_I. */
192 MD5_STEP (MD5_I , a, b, c, d, w0[0], MD5C30, MD5S30);
193 MD5_STEP (MD5_I , d, a, b, c, w1[3], MD5C31, MD5S31);
194 MD5_STEP (MD5_I , c, d, a, b, w3[2], MD5C32, MD5S32);
195 MD5_STEP (MD5_I , b, c, d, a, w1[1], MD5C33, MD5S33);
196 MD5_STEP (MD5_I , a, b, c, d, w3[0], MD5C34, MD5S30);
197 MD5_STEP (MD5_I , d, a, b, c, w0[3], MD5C35, MD5S31);
198 MD5_STEP (MD5_I , c, d, a, b, w2[2], MD5C36, MD5S32);
199 MD5_STEP (MD5_I , b, c, d, a, w0[1], MD5C37, MD5S33);
200 MD5_STEP (MD5_I , a, b, c, d, w2[0], MD5C38, MD5S30);
201 MD5_STEP (MD5_I , d, a, b, c, w3[3], MD5C39, MD5S31);
202 MD5_STEP (MD5_I , c, d, a, b, w1[2], MD5C3a, MD5S32);
203 MD5_STEP (MD5_I , b, c, d, a, w3[1], MD5C3b, MD5S33);
204 MD5_STEP (MD5_I , a, b, c, d, w1[0], MD5C3c, MD5S30);
205 MD5_STEP (MD5_I , d, a, b, c, w2[3], MD5C3d, MD5S31);
206 MD5_STEP (MD5_I , c, d, a, b, w0[2], MD5C3e, MD5S32);
207 MD5_STEP (MD5_I , b, c, d, a, w2[1], MD5C3f, MD5S33);
/* Hex-encode a, b, c, d into eight words. Each word packs two table entries: */
/* the even-numbered word of a pair takes bits 8-15 (low half) and bits 0-7 */
/* (high half) of the source value, the odd-numbered word takes bits 24-31 */
/* (low half) and bits 16-23 (high half). */
218 u32x w0_t = uint_to_hex_lower8_le ((a >> 8) & 255) << 0
219 | uint_to_hex_lower8_le ((a >> 0) & 255) << 16;
220 u32x w1_t = uint_to_hex_lower8_le ((a >> 24) & 255) << 0
221 | uint_to_hex_lower8_le ((a >> 16) & 255) << 16;
222 u32x w2_t = uint_to_hex_lower8_le ((b >> 8) & 255) << 0
223 | uint_to_hex_lower8_le ((b >> 0) & 255) << 16;
224 u32x w3_t = uint_to_hex_lower8_le ((b >> 24) & 255) << 0
225 | uint_to_hex_lower8_le ((b >> 16) & 255) << 16;
226 u32x w4_t = uint_to_hex_lower8_le ((c >> 8) & 255) << 0
227 | uint_to_hex_lower8_le ((c >> 0) & 255) << 16;
228 u32x w5_t = uint_to_hex_lower8_le ((c >> 24) & 255) << 0
229 | uint_to_hex_lower8_le ((c >> 16) & 255) << 16;
230 u32x w6_t = uint_to_hex_lower8_le ((d >> 8) & 255) << 0
231 | uint_to_hex_lower8_le ((d >> 0) & 255) << 16;
232 u32x w7_t = uint_to_hex_lower8_le ((d >> 24) & 255) << 0
233 | uint_to_hex_lower8_le ((d >> 16) & 255) << 16;
/* NOTE(review): top bit set in the ninth word - presumably the padding bit */
/* that follows the 32 hex characters; confirm. */
235 u32x w8_t = 0x80000000;
/* SHA1 steps 1-16 (SHA1_F0o) consume w0_t..wf_t as they stand. */
255 SHA1_STEP (SHA1_F0o, a, b, c, d, e, w0_t);
256 SHA1_STEP (SHA1_F0o, e, a, b, c, d, w1_t);
257 SHA1_STEP (SHA1_F0o, d, e, a, b, c, w2_t);
258 SHA1_STEP (SHA1_F0o, c, d, e, a, b, w3_t);
259 SHA1_STEP (SHA1_F0o, b, c, d, e, a, w4_t);
260 SHA1_STEP (SHA1_F0o, a, b, c, d, e, w5_t);
261 SHA1_STEP (SHA1_F0o, e, a, b, c, d, w6_t);
262 SHA1_STEP (SHA1_F0o, d, e, a, b, c, w7_t);
263 SHA1_STEP (SHA1_F0o, c, d, e, a, b, w8_t);
264 SHA1_STEP (SHA1_F0o, b, c, d, e, a, w9_t);
265 SHA1_STEP (SHA1_F0o, a, b, c, d, e, wa_t);
266 SHA1_STEP (SHA1_F0o, e, a, b, c, d, wb_t);
267 SHA1_STEP (SHA1_F0o, d, e, a, b, c, wc_t);
268 SHA1_STEP (SHA1_F0o, c, d, e, a, b, wd_t);
269 SHA1_STEP (SHA1_F0o, b, c, d, e, a, we_t);
270 SHA1_STEP (SHA1_F0o, a, b, c, d, e, wf_t);
/* From here on every word is recomputed in place, as rotl32 by 1 of the xor */
/* of four schedule words, immediately before the step that uses it. */
/* SHA1 steps 17-20 (SHA1_F0o). */
271 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F0o, e, a, b, c, d, w0_t);
272 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F0o, d, e, a, b, c, w1_t);
273 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F0o, c, d, e, a, b, w2_t);
274 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F0o, b, c, d, e, a, w3_t);
/* SHA1 steps 21-40 (SHA1_F1). */
279 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w4_t);
280 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w5_t);
281 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w6_t);
282 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w7_t);
283 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w8_t);
284 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w9_t);
285 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wa_t);
286 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, wb_t);
287 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, wc_t);
288 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, wd_t);
289 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, we_t);
290 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wf_t);
291 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w0_t);
292 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w1_t);
293 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w2_t);
294 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w3_t);
295 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w4_t);
296 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w5_t);
297 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w6_t);
298 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w7_t);
/* SHA1 steps 41-60 (SHA1_F2o). */
303 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, w8_t);
304 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, w9_t);
305 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, wa_t);
306 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, wb_t);
307 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, wc_t);
308 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, wd_t);
309 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, we_t);
310 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, wf_t);
311 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, w0_t);
312 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, w1_t);
313 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, w2_t);
314 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, w3_t);
315 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, w4_t);
316 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, w5_t);
317 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, w6_t);
318 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, w7_t);
319 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, w8_t);
320 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, w9_t);
321 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, wa_t);
322 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, wb_t);
/* SHA1 steps 61-80 (SHA1_F1 again). */
327 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, wc_t);
328 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wd_t);
329 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, we_t);
330 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, wf_t);
331 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w0_t);
332 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w1_t);
333 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w2_t);
334 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w3_t);
335 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w4_t);
336 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w5_t);
337 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w6_t);
338 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w7_t);
339 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w8_t);
340 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w9_t);
341 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, wa_t);
342 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, wb_t);
343 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wc_t);
344 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, wd_t);
345 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, we_t);
346 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, wf_t);
/* Hand the state to the comparison macro; note the argument order a, d, c, b. */
347 COMPARE_M_SIMD (a, d, c, b);
/* Kernel m04700_m08: declared with the same parameter list as m04700_m04. */
/* NOTE(review): no statements follow this signature here - presumably an */
/* intentionally empty entry point; confirm before relying on it. */
351 __kernel void m04700_m08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 combs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Kernel m04700_m16: declared with the same parameter list as m04700_m04. */
/* NOTE(review): no statements follow this signature here - presumably an */
/* intentionally empty entry point; confirm before relying on it. */
355 __kernel void m04700_m16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 combs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Kernel m04700_s04. */
/* Performs the same per-candidate work as m04700_m04 (merge the pws entry */
/* with a combs_buf candidate, 64 MD5_STEP invocations, hex encoding through */
/* l_bin2asc, SHA1_STEP invocations), but first loads four target words from */
/* digests_buf[digests_offset] into search[], abandons a candidate after SHA1 */
/* step 76 when MATCHES_NONE_VS (e, e_rev) holds, and finishes with */
/* COMPARE_S_SIMD instead of COMPARE_M_SIMD. */
/* Parameters used by the visible code: pws, combs_buf, digests_buf, */
/* digests_offset, combs_cnt, combs_mode and gid_max. NOTE(review): the rest */
/* are presumably consumed inside COMPARE_S_SIMD - confirm. */
359 __kernel void m04700_s04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 combs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Work-item coordinates: global id, id inside the work-group, work-group size. */
365 const u32 gid = get_global_id (0);
366 const u32 lid = get_local_id (0);
367 const u32 lsz = get_local_size (0);
/* Byte-to-hex lookup table kept in __local memory, one entry per byte value. */
373 __local u32 l_bin2asc[256];
/* The table is filled cooperatively: each work-item starts at its local id */
/* and advances by the work-group size. */
375 for (u32 i = lid; i < 256; i += lsz)
/* i0 is the low nibble of i, i1 the high nibble. */
377 const u32 i0 = (i >> 0) & 15;
378 const u32 i1 = (i >> 4) & 15;
/* Low-nibble character lands in bits 0-7, high-nibble character in bits 8-15. */
380 l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 0
381 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 8;
/* Wait until the whole work-group has finished writing the table. */
384 barrier (CLK_LOCAL_MEM_FENCE);
/* The range check comes only after the barrier, so surplus work-items still */
/* take part in the table fill and the barrier before leaving. */
386 if (gid >= gid_max) return;
/* Copy words i[0..7] of this work-item's pws entry into pws0 and pws1. */
395 pws0[0] = pws[gid].i[0];
396 pws0[1] = pws[gid].i[1];
397 pws0[2] = pws[gid].i[2];
398 pws0[3] = pws[gid].i[3];
399 pws1[0] = pws[gid].i[4];
400 pws1[1] = pws[gid].i[5];
401 pws1[2] = pws[gid].i[6];
402 pws1[3] = pws[gid].i[7];
/* pw_len stored with this work-item's pws entry. */
404 const u32 pw_l_len = pws[gid].pw_len;
/* The single target: four words of digests_buf[digests_offset], picked by */
/* the DGST_R0..DGST_R3 indices. */
410 const u32 search[4] =
412 digests_buf[digests_offset].digest_buf[DGST_R0],
413 digests_buf[digests_offset].digest_buf[DGST_R1],
414 digests_buf[digests_offset].digest_buf[DGST_R2],
415 digests_buf[digests_offset].digest_buf[DGST_R3]
/* search[1] rotated left by two bits; the loop compares it with e after */
/* SHA1 step 76. NOTE(review): presumably this pre-compensates for what the */
/* remaining steps do to e - confirm against SHA1_STEP. */
422 const u32 e_rev = rotl32_S (search[1], 2u);
/* Visit the combs_buf positions 0 .. combs_cnt-1 in strides of VECT_SIZE. */
428 for (u32 il_pos = 0; il_pos < combs_cnt; il_pos += VECT_SIZE)
/* Length obtained from combs_buf for this position, then the combined length. */
430 const u32x pw_r_len = pwlenx_create_combt (combs_buf, il_pos);
432 const u32x pw_len = pw_l_len + pw_r_len;
/* Four zero-initialised buffers; only wordr0 and wordr1 (eight words in */
/* total) are loaded from combs_buf below. */
434 u32x wordr0[4] = { 0 };
435 u32x wordr1[4] = { 0 };
436 u32x wordr2[4] = { 0 };
437 u32x wordr3[4] = { 0 };
439 wordr0[0] = ix_create_combt (combs_buf, il_pos, 0);
440 wordr0[1] = ix_create_combt (combs_buf, il_pos, 1);
441 wordr0[2] = ix_create_combt (combs_buf, il_pos, 2);
442 wordr0[3] = ix_create_combt (combs_buf, il_pos, 3);
443 wordr1[0] = ix_create_combt (combs_buf, il_pos, 4);
444 wordr1[1] = ix_create_combt (combs_buf, il_pos, 5);
445 wordr1[2] = ix_create_combt (combs_buf, il_pos, 6);
446 wordr1[3] = ix_create_combt (combs_buf, il_pos, 7);
/* NOTE(review): going by the helper names, this appends a 0x80 marker after */
/* pw_r_len bytes of the wordr data and then shifts that data by pw_l_len */
/* bytes so it can follow the other word - confirm against the helpers. */
448 if (combs_mode == COMBINATOR_MODE_BASE_LEFT)
450 append_0x80_2x4 (wordr0, wordr1, pw_r_len);
452 switch_buffer_by_offset_le (wordr0, wordr1, wordr2, wordr3, pw_l_len);
/* OR the wordl and wordr buffers together word by word to form w0..w3. */
457 w0[0] = wordl0[0] | wordr0[0];
458 w0[1] = wordl0[1] | wordr0[1];
459 w0[2] = wordl0[2] | wordr0[2];
460 w0[3] = wordl0[3] | wordr0[3];
464 w1[0] = wordl1[0] | wordr1[0];
465 w1[1] = wordl1[1] | wordr1[1];
466 w1[2] = wordl1[2] | wordr1[2];
467 w1[3] = wordl1[3] | wordr1[3];
471 w2[0] = wordl2[0] | wordr2[0];
472 w2[1] = wordl2[1] | wordr2[1];
473 w2[2] = wordl2[2] | wordr2[2];
474 w2[3] = wordl2[3] | wordr2[3];
478 w3[0] = wordl3[0] | wordr3[0];
479 w3[1] = wordl3[1] | wordr3[1];
/* MD5 steps 1-16, using MD5_Fo; the words are consumed in order w0[0]..w3[3]. */
492 MD5_STEP (MD5_Fo, a, b, c, d, w0[0], MD5C00, MD5S00);
493 MD5_STEP (MD5_Fo, d, a, b, c, w0[1], MD5C01, MD5S01);
494 MD5_STEP (MD5_Fo, c, d, a, b, w0[2], MD5C02, MD5S02);
495 MD5_STEP (MD5_Fo, b, c, d, a, w0[3], MD5C03, MD5S03);
496 MD5_STEP (MD5_Fo, a, b, c, d, w1[0], MD5C04, MD5S00);
497 MD5_STEP (MD5_Fo, d, a, b, c, w1[1], MD5C05, MD5S01);
498 MD5_STEP (MD5_Fo, c, d, a, b, w1[2], MD5C06, MD5S02);
499 MD5_STEP (MD5_Fo, b, c, d, a, w1[3], MD5C07, MD5S03);
500 MD5_STEP (MD5_Fo, a, b, c, d, w2[0], MD5C08, MD5S00);
501 MD5_STEP (MD5_Fo, d, a, b, c, w2[1], MD5C09, MD5S01);
502 MD5_STEP (MD5_Fo, c, d, a, b, w2[2], MD5C0a, MD5S02);
503 MD5_STEP (MD5_Fo, b, c, d, a, w2[3], MD5C0b, MD5S03);
504 MD5_STEP (MD5_Fo, a, b, c, d, w3[0], MD5C0c, MD5S00);
505 MD5_STEP (MD5_Fo, d, a, b, c, w3[1], MD5C0d, MD5S01);
506 MD5_STEP (MD5_Fo, c, d, a, b, w3[2], MD5C0e, MD5S02);
507 MD5_STEP (MD5_Fo, b, c, d, a, w3[3], MD5C0f, MD5S03);
/* MD5 steps 17-32, using MD5_Go. */
509 MD5_STEP (MD5_Go, a, b, c, d, w0[1], MD5C10, MD5S10);
510 MD5_STEP (MD5_Go, d, a, b, c, w1[2], MD5C11, MD5S11);
511 MD5_STEP (MD5_Go, c, d, a, b, w2[3], MD5C12, MD5S12);
512 MD5_STEP (MD5_Go, b, c, d, a, w0[0], MD5C13, MD5S13);
513 MD5_STEP (MD5_Go, a, b, c, d, w1[1], MD5C14, MD5S10);
514 MD5_STEP (MD5_Go, d, a, b, c, w2[2], MD5C15, MD5S11);
515 MD5_STEP (MD5_Go, c, d, a, b, w3[3], MD5C16, MD5S12);
516 MD5_STEP (MD5_Go, b, c, d, a, w1[0], MD5C17, MD5S13);
517 MD5_STEP (MD5_Go, a, b, c, d, w2[1], MD5C18, MD5S10);
518 MD5_STEP (MD5_Go, d, a, b, c, w3[2], MD5C19, MD5S11);
519 MD5_STEP (MD5_Go, c, d, a, b, w0[3], MD5C1a, MD5S12);
520 MD5_STEP (MD5_Go, b, c, d, a, w2[0], MD5C1b, MD5S13);
521 MD5_STEP (MD5_Go, a, b, c, d, w3[1], MD5C1c, MD5S10);
522 MD5_STEP (MD5_Go, d, a, b, c, w0[2], MD5C1d, MD5S11);
523 MD5_STEP (MD5_Go, c, d, a, b, w1[3], MD5C1e, MD5S12);
524 MD5_STEP (MD5_Go, b, c, d, a, w3[0], MD5C1f, MD5S13);
/* MD5 steps 33-48, using MD5_H. */
526 MD5_STEP (MD5_H , a, b, c, d, w1[1], MD5C20, MD5S20);
527 MD5_STEP (MD5_H , d, a, b, c, w2[0], MD5C21, MD5S21);
528 MD5_STEP (MD5_H , c, d, a, b, w2[3], MD5C22, MD5S22);
529 MD5_STEP (MD5_H , b, c, d, a, w3[2], MD5C23, MD5S23);
530 MD5_STEP (MD5_H , a, b, c, d, w0[1], MD5C24, MD5S20);
531 MD5_STEP (MD5_H , d, a, b, c, w1[0], MD5C25, MD5S21);
532 MD5_STEP (MD5_H , c, d, a, b, w1[3], MD5C26, MD5S22);
533 MD5_STEP (MD5_H , b, c, d, a, w2[2], MD5C27, MD5S23);
534 MD5_STEP (MD5_H , a, b, c, d, w3[1], MD5C28, MD5S20);
535 MD5_STEP (MD5_H , d, a, b, c, w0[0], MD5C29, MD5S21);
536 MD5_STEP (MD5_H , c, d, a, b, w0[3], MD5C2a, MD5S22);
537 MD5_STEP (MD5_H , b, c, d, a, w1[2], MD5C2b, MD5S23);
538 MD5_STEP (MD5_H , a, b, c, d, w2[1], MD5C2c, MD5S20);
539 MD5_STEP (MD5_H , d, a, b, c, w3[0], MD5C2d, MD5S21);
540 MD5_STEP (MD5_H , c, d, a, b, w3[3], MD5C2e, MD5S22);
541 MD5_STEP (MD5_H , b, c, d, a, w0[2], MD5C2f, MD5S23);
/* MD5 steps 49-64, using MD5_I. */
543 MD5_STEP (MD5_I , a, b, c, d, w0[0], MD5C30, MD5S30);
544 MD5_STEP (MD5_I , d, a, b, c, w1[3], MD5C31, MD5S31);
545 MD5_STEP (MD5_I , c, d, a, b, w3[2], MD5C32, MD5S32);
546 MD5_STEP (MD5_I , b, c, d, a, w1[1], MD5C33, MD5S33);
547 MD5_STEP (MD5_I , a, b, c, d, w3[0], MD5C34, MD5S30);
548 MD5_STEP (MD5_I , d, a, b, c, w0[3], MD5C35, MD5S31);
549 MD5_STEP (MD5_I , c, d, a, b, w2[2], MD5C36, MD5S32);
550 MD5_STEP (MD5_I , b, c, d, a, w0[1], MD5C37, MD5S33);
551 MD5_STEP (MD5_I , a, b, c, d, w2[0], MD5C38, MD5S30);
552 MD5_STEP (MD5_I , d, a, b, c, w3[3], MD5C39, MD5S31);
553 MD5_STEP (MD5_I , c, d, a, b, w1[2], MD5C3a, MD5S32);
554 MD5_STEP (MD5_I , b, c, d, a, w3[1], MD5C3b, MD5S33);
555 MD5_STEP (MD5_I , a, b, c, d, w1[0], MD5C3c, MD5S30);
556 MD5_STEP (MD5_I , d, a, b, c, w2[3], MD5C3d, MD5S31);
557 MD5_STEP (MD5_I , c, d, a, b, w0[2], MD5C3e, MD5S32);
558 MD5_STEP (MD5_I , b, c, d, a, w2[1], MD5C3f, MD5S33);
/* Hex-encode a, b, c, d into eight words. Each word packs two table entries: */
/* the even-numbered word of a pair takes bits 8-15 (low half) and bits 0-7 */
/* (high half) of the source value, the odd-numbered word takes bits 24-31 */
/* (low half) and bits 16-23 (high half). */
569 u32x w0_t = uint_to_hex_lower8_le ((a >> 8) & 255) << 0
570 | uint_to_hex_lower8_le ((a >> 0) & 255) << 16;
571 u32x w1_t = uint_to_hex_lower8_le ((a >> 24) & 255) << 0
572 | uint_to_hex_lower8_le ((a >> 16) & 255) << 16;
573 u32x w2_t = uint_to_hex_lower8_le ((b >> 8) & 255) << 0
574 | uint_to_hex_lower8_le ((b >> 0) & 255) << 16;
575 u32x w3_t = uint_to_hex_lower8_le ((b >> 24) & 255) << 0
576 | uint_to_hex_lower8_le ((b >> 16) & 255) << 16;
577 u32x w4_t = uint_to_hex_lower8_le ((c >> 8) & 255) << 0
578 | uint_to_hex_lower8_le ((c >> 0) & 255) << 16;
579 u32x w5_t = uint_to_hex_lower8_le ((c >> 24) & 255) << 0
580 | uint_to_hex_lower8_le ((c >> 16) & 255) << 16;
581 u32x w6_t = uint_to_hex_lower8_le ((d >> 8) & 255) << 0
582 | uint_to_hex_lower8_le ((d >> 0) & 255) << 16;
583 u32x w7_t = uint_to_hex_lower8_le ((d >> 24) & 255) << 0
584 | uint_to_hex_lower8_le ((d >> 16) & 255) << 16;
/* NOTE(review): top bit set in the ninth word - presumably the padding bit */
/* that follows the 32 hex characters; confirm. */
586 u32x w8_t = 0x80000000;
/* SHA1 steps 1-16 (SHA1_F0o) consume w0_t..wf_t as they stand. */
606 SHA1_STEP (SHA1_F0o, a, b, c, d, e, w0_t);
607 SHA1_STEP (SHA1_F0o, e, a, b, c, d, w1_t);
608 SHA1_STEP (SHA1_F0o, d, e, a, b, c, w2_t);
609 SHA1_STEP (SHA1_F0o, c, d, e, a, b, w3_t);
610 SHA1_STEP (SHA1_F0o, b, c, d, e, a, w4_t);
611 SHA1_STEP (SHA1_F0o, a, b, c, d, e, w5_t);
612 SHA1_STEP (SHA1_F0o, e, a, b, c, d, w6_t);
613 SHA1_STEP (SHA1_F0o, d, e, a, b, c, w7_t);
614 SHA1_STEP (SHA1_F0o, c, d, e, a, b, w8_t);
615 SHA1_STEP (SHA1_F0o, b, c, d, e, a, w9_t);
616 SHA1_STEP (SHA1_F0o, a, b, c, d, e, wa_t);
617 SHA1_STEP (SHA1_F0o, e, a, b, c, d, wb_t);
618 SHA1_STEP (SHA1_F0o, d, e, a, b, c, wc_t);
619 SHA1_STEP (SHA1_F0o, c, d, e, a, b, wd_t);
620 SHA1_STEP (SHA1_F0o, b, c, d, e, a, we_t);
621 SHA1_STEP (SHA1_F0o, a, b, c, d, e, wf_t);
/* From here on every word is recomputed in place, as rotl32 by 1 of the xor */
/* of four schedule words, immediately before the step that uses it. */
/* SHA1 steps 17-20 (SHA1_F0o). */
622 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F0o, e, a, b, c, d, w0_t);
623 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F0o, d, e, a, b, c, w1_t);
624 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F0o, c, d, e, a, b, w2_t);
625 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F0o, b, c, d, e, a, w3_t);
/* SHA1 steps 21-40 (SHA1_F1). */
630 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w4_t);
631 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w5_t);
632 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w6_t);
633 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w7_t);
634 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w8_t);
635 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w9_t);
636 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wa_t);
637 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, wb_t);
638 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, wc_t);
639 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, wd_t);
640 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, we_t);
641 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wf_t);
642 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w0_t);
643 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w1_t);
644 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w2_t);
645 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w3_t);
646 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w4_t);
647 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w5_t);
648 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w6_t);
649 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w7_t);
/* SHA1 steps 41-60 (SHA1_F2o). */
654 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, w8_t);
655 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, w9_t);
656 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, wa_t);
657 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, wb_t);
658 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, wc_t);
659 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, wd_t);
660 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, we_t);
661 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, wf_t);
662 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, w0_t);
663 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, w1_t);
664 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, w2_t);
665 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, w3_t);
666 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, w4_t);
667 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, w5_t);
668 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, w6_t);
669 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F2o, a, b, c, d, e, w7_t);
670 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F2o, e, a, b, c, d, w8_t);
671 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F2o, d, e, a, b, c, w9_t);
672 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F2o, c, d, e, a, b, wa_t);
673 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F2o, b, c, d, e, a, wb_t);
/* SHA1 steps 61-76 (SHA1_F1 again). */
678 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, wc_t);
679 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wd_t);
680 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, we_t);
681 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, wf_t);
682 w0_t = rotl32 ((wd_t ^ w8_t ^ w2_t ^ w0_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w0_t);
683 w1_t = rotl32 ((we_t ^ w9_t ^ w3_t ^ w1_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w1_t);
684 w2_t = rotl32 ((wf_t ^ wa_t ^ w4_t ^ w2_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w2_t);
685 w3_t = rotl32 ((w0_t ^ wb_t ^ w5_t ^ w3_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w3_t);
686 w4_t = rotl32 ((w1_t ^ wc_t ^ w6_t ^ w4_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w4_t);
687 w5_t = rotl32 ((w2_t ^ wd_t ^ w7_t ^ w5_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, w5_t);
688 w6_t = rotl32 ((w3_t ^ we_t ^ w8_t ^ w6_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, w6_t);
689 w7_t = rotl32 ((w4_t ^ wf_t ^ w9_t ^ w7_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, w7_t);
690 w8_t = rotl32 ((w5_t ^ w0_t ^ wa_t ^ w8_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, w8_t);
691 w9_t = rotl32 ((w6_t ^ w1_t ^ wb_t ^ w9_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, w9_t);
692 wa_t = rotl32 ((w7_t ^ w2_t ^ wc_t ^ wa_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, wa_t);
693 wb_t = rotl32 ((w8_t ^ w3_t ^ wd_t ^ wb_t), 1u); SHA1_STEP (SHA1_F1, a, b, c, d, e, wb_t);
/* Early exit after step 76: move on to the next candidate without running */
/* the last four steps. NOTE(review): judging by the macro name this fires */
/* when no vector lane of e equals e_rev - confirm against MATCHES_NONE_VS. */
695 if (MATCHES_NONE_VS (e, e_rev)) continue;
/* SHA1 steps 77-80 (SHA1_F1). */
697 wc_t = rotl32 ((w9_t ^ w4_t ^ we_t ^ wc_t), 1u); SHA1_STEP (SHA1_F1, e, a, b, c, d, wc_t);
698 wd_t = rotl32 ((wa_t ^ w5_t ^ wf_t ^ wd_t), 1u); SHA1_STEP (SHA1_F1, d, e, a, b, c, wd_t);
699 we_t = rotl32 ((wb_t ^ w6_t ^ w0_t ^ we_t), 1u); SHA1_STEP (SHA1_F1, c, d, e, a, b, we_t);
700 wf_t = rotl32 ((wc_t ^ w7_t ^ w1_t ^ wf_t), 1u); SHA1_STEP (SHA1_F1, b, c, d, e, a, wf_t);
/* Hand the state to the comparison macro; note the argument order a, d, c, b. */
701 COMPARE_S_SIMD (a, d, c, b);
/* Kernel m04700_s08: declared with the same parameter list as m04700_s04. */
/* NOTE(review): no statements follow this signature here - presumably an */
/* intentionally empty entry point; confirm before relying on it. */
705 __kernel void m04700_s08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 combs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Kernel m04700_s16: declared with the same parameter list as m04700_s04. */
/* NOTE(review): no statements follow this signature here - presumably an */
/* intentionally empty entry point; confirm before relying on it. */
709 __kernel void m04700_s16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 combs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)