2 * Authors.....: Jens Steube <jens.steube@gmail.com>
3 * Gabriele Gristina <matrix@hashcat.net>
4 * magnum <john.magnum@hushmail.com>
12 //#define NEW_SIMD_CODE
14 #include "inc_hash_constants.h"
15 #include "inc_vendor.cl"
22 #include "inc_hash_functions.cl"
23 #include "inc_types.cl"
24 #include "inc_common.cl"
27 #include "inc_simd.cl"
29 #define PERM_OP(a,b,tt,n,m) \
39 #define HPERM_OP(a,tt,n,m) \
45 tt = tt >> (16 + n); \
51 PERM_OP (r, l, tt, 4, 0x0f0f0f0f); \
52 PERM_OP (l, r, tt, 16, 0x0000ffff); \
53 PERM_OP (r, l, tt, 2, 0x33333333); \
54 PERM_OP (l, r, tt, 8, 0x00ff00ff); \
55 PERM_OP (r, l, tt, 1, 0x55555555); \
60 PERM_OP (l, r, tt, 1, 0x55555555); \
61 PERM_OP (r, l, tt, 8, 0x00ff00ff); \
62 PERM_OP (l, r, tt, 2, 0x33333333); \
63 PERM_OP (r, l, tt, 16, 0x0000ffff); \
64 PERM_OP (l, r, tt, 4, 0x0f0f0f0f); \
// c_SPtrans: table of 8 x 64 32-bit words held in the __constant address space.
// The kernels in this file copy it into a __local array (s_SPtrans), and
// _des_crypt_encrypt reads that copy through BOX with indices masked to 0x3f.
// NOTE(review): presumably the combined DES S-box / P-permutation lookup
// tables - confirm against a reference DES implementation.
67 __constant u32 c_SPtrans[8][64] =
70 0x02080800, 0x00080000, 0x02000002, 0x02080802,
71 0x02000000, 0x00080802, 0x00080002, 0x02000002,
72 0x00080802, 0x02080800, 0x02080000, 0x00000802,
73 0x02000802, 0x02000000, 0x00000000, 0x00080002,
74 0x00080000, 0x00000002, 0x02000800, 0x00080800,
75 0x02080802, 0x02080000, 0x00000802, 0x02000800,
76 0x00000002, 0x00000800, 0x00080800, 0x02080002,
77 0x00000800, 0x02000802, 0x02080002, 0x00000000,
78 0x00000000, 0x02080802, 0x02000800, 0x00080002,
79 0x02080800, 0x00080000, 0x00000802, 0x02000800,
80 0x02080002, 0x00000800, 0x00080800, 0x02000002,
81 0x00080802, 0x00000002, 0x02000002, 0x02080000,
82 0x02080802, 0x00080800, 0x02080000, 0x02000802,
83 0x02000000, 0x00000802, 0x00080002, 0x00000000,
84 0x00080000, 0x02000000, 0x02000802, 0x02080800,
85 0x00000002, 0x02080002, 0x00000800, 0x00080802,
88 0x40108010, 0x00000000, 0x00108000, 0x40100000,
89 0x40000010, 0x00008010, 0x40008000, 0x00108000,
90 0x00008000, 0x40100010, 0x00000010, 0x40008000,
91 0x00100010, 0x40108000, 0x40100000, 0x00000010,
92 0x00100000, 0x40008010, 0x40100010, 0x00008000,
93 0x00108010, 0x40000000, 0x00000000, 0x00100010,
94 0x40008010, 0x00108010, 0x40108000, 0x40000010,
95 0x40000000, 0x00100000, 0x00008010, 0x40108010,
96 0x00100010, 0x40108000, 0x40008000, 0x00108010,
97 0x40108010, 0x00100010, 0x40000010, 0x00000000,
98 0x40000000, 0x00008010, 0x00100000, 0x40100010,
99 0x00008000, 0x40000000, 0x00108010, 0x40008010,
100 0x40108000, 0x00008000, 0x00000000, 0x40000010,
101 0x00000010, 0x40108010, 0x00108000, 0x40100000,
102 0x40100010, 0x00100000, 0x00008010, 0x40008000,
103 0x40008010, 0x00000010, 0x40100000, 0x00108000,
106 0x04000001, 0x04040100, 0x00000100, 0x04000101,
107 0x00040001, 0x04000000, 0x04000101, 0x00040100,
108 0x04000100, 0x00040000, 0x04040000, 0x00000001,
109 0x04040101, 0x00000101, 0x00000001, 0x04040001,
110 0x00000000, 0x00040001, 0x04040100, 0x00000100,
111 0x00000101, 0x04040101, 0x00040000, 0x04000001,
112 0x04040001, 0x04000100, 0x00040101, 0x04040000,
113 0x00040100, 0x00000000, 0x04000000, 0x00040101,
114 0x04040100, 0x00000100, 0x00000001, 0x00040000,
115 0x00000101, 0x00040001, 0x04040000, 0x04000101,
116 0x00000000, 0x04040100, 0x00040100, 0x04040001,
117 0x00040001, 0x04000000, 0x04040101, 0x00000001,
118 0x00040101, 0x04000001, 0x04000000, 0x04040101,
119 0x00040000, 0x04000100, 0x04000101, 0x00040100,
120 0x04000100, 0x00000000, 0x04040001, 0x00000101,
121 0x04000001, 0x00040101, 0x00000100, 0x04040000,
124 0x00401008, 0x10001000, 0x00000008, 0x10401008,
125 0x00000000, 0x10400000, 0x10001008, 0x00400008,
126 0x10401000, 0x10000008, 0x10000000, 0x00001008,
127 0x10000008, 0x00401008, 0x00400000, 0x10000000,
128 0x10400008, 0x00401000, 0x00001000, 0x00000008,
129 0x00401000, 0x10001008, 0x10400000, 0x00001000,
130 0x00001008, 0x00000000, 0x00400008, 0x10401000,
131 0x10001000, 0x10400008, 0x10401008, 0x00400000,
132 0x10400008, 0x00001008, 0x00400000, 0x10000008,
133 0x00401000, 0x10001000, 0x00000008, 0x10400000,
134 0x10001008, 0x00000000, 0x00001000, 0x00400008,
135 0x00000000, 0x10400008, 0x10401000, 0x00001000,
136 0x10000000, 0x10401008, 0x00401008, 0x00400000,
137 0x10401008, 0x00000008, 0x10001000, 0x00401008,
138 0x00400008, 0x00401000, 0x10400000, 0x10001008,
139 0x00001008, 0x10000000, 0x10000008, 0x10401000,
142 0x08000000, 0x00010000, 0x00000400, 0x08010420,
143 0x08010020, 0x08000400, 0x00010420, 0x08010000,
144 0x00010000, 0x00000020, 0x08000020, 0x00010400,
145 0x08000420, 0x08010020, 0x08010400, 0x00000000,
146 0x00010400, 0x08000000, 0x00010020, 0x00000420,
147 0x08000400, 0x00010420, 0x00000000, 0x08000020,
148 0x00000020, 0x08000420, 0x08010420, 0x00010020,
149 0x08010000, 0x00000400, 0x00000420, 0x08010400,
150 0x08010400, 0x08000420, 0x00010020, 0x08010000,
151 0x00010000, 0x00000020, 0x08000020, 0x08000400,
152 0x08000000, 0x00010400, 0x08010420, 0x00000000,
153 0x00010420, 0x08000000, 0x00000400, 0x00010020,
154 0x08000420, 0x00000400, 0x00000000, 0x08010420,
155 0x08010020, 0x08010400, 0x00000420, 0x00010000,
156 0x00010400, 0x08010020, 0x08000400, 0x00000420,
157 0x00000020, 0x00010420, 0x08010000, 0x08000020,
160 0x80000040, 0x00200040, 0x00000000, 0x80202000,
161 0x00200040, 0x00002000, 0x80002040, 0x00200000,
162 0x00002040, 0x80202040, 0x00202000, 0x80000000,
163 0x80002000, 0x80000040, 0x80200000, 0x00202040,
164 0x00200000, 0x80002040, 0x80200040, 0x00000000,
165 0x00002000, 0x00000040, 0x80202000, 0x80200040,
166 0x80202040, 0x80200000, 0x80000000, 0x00002040,
167 0x00000040, 0x00202000, 0x00202040, 0x80002000,
168 0x00002040, 0x80000000, 0x80002000, 0x00202040,
169 0x80202000, 0x00200040, 0x00000000, 0x80002000,
170 0x80000000, 0x00002000, 0x80200040, 0x00200000,
171 0x00200040, 0x80202040, 0x00202000, 0x00000040,
172 0x80202040, 0x00202000, 0x00200000, 0x80002040,
173 0x80000040, 0x80200000, 0x00202040, 0x00000000,
174 0x00002000, 0x80000040, 0x80002040, 0x80202000,
175 0x80200000, 0x00002040, 0x00000040, 0x80200040,
178 0x00004000, 0x00000200, 0x01000200, 0x01000004,
179 0x01004204, 0x00004004, 0x00004200, 0x00000000,
180 0x01000000, 0x01000204, 0x00000204, 0x01004000,
181 0x00000004, 0x01004200, 0x01004000, 0x00000204,
182 0x01000204, 0x00004000, 0x00004004, 0x01004204,
183 0x00000000, 0x01000200, 0x01000004, 0x00004200,
184 0x01004004, 0x00004204, 0x01004200, 0x00000004,
185 0x00004204, 0x01004004, 0x00000200, 0x01000000,
186 0x00004204, 0x01004000, 0x01004004, 0x00000204,
187 0x00004000, 0x00000200, 0x01000000, 0x01004004,
188 0x01000204, 0x00004204, 0x00004200, 0x00000000,
189 0x00000200, 0x01000004, 0x00000004, 0x01000200,
190 0x00000000, 0x01000204, 0x01000200, 0x00004200,
191 0x00000204, 0x00004000, 0x01004204, 0x01000000,
192 0x01004200, 0x00000004, 0x00004004, 0x01004204,
193 0x01000004, 0x01004200, 0x01004000, 0x00004004,
196 0x20800080, 0x20820000, 0x00020080, 0x00000000,
197 0x20020000, 0x00800080, 0x20800000, 0x20820080,
198 0x00000080, 0x20000000, 0x00820000, 0x00020080,
199 0x00820080, 0x20020080, 0x20000080, 0x20800000,
200 0x00020000, 0x00820080, 0x00800080, 0x20020000,
201 0x20820080, 0x20000080, 0x00000000, 0x00820000,
202 0x20000000, 0x00800000, 0x20020080, 0x20800080,
203 0x00800000, 0x00020000, 0x20820000, 0x00000080,
204 0x00800000, 0x00020000, 0x20000080, 0x20820080,
205 0x00020080, 0x20000000, 0x00000000, 0x00820000,
206 0x20800080, 0x20020080, 0x20020000, 0x00800080,
207 0x20820000, 0x00000080, 0x00800080, 0x20020000,
208 0x20820080, 0x00800000, 0x20800000, 0x20000080,
209 0x00820000, 0x00020080, 0x20020080, 0x20800000,
210 0x00000080, 0x20820000, 0x00820080, 0x00000000,
211 0x20000000, 0x20800080, 0x00020000, 0x00820080,
// c_skb: table of 8 x 64 32-bit words held in the __constant address space.
// The kernels in this file copy it into a __local array (s_skb), and
// _des_crypt_keysetup reads that copy through BOX: sub-tables 0-3 are indexed
// from the c half and sub-tables 4-7 from the d half of the key state.
// NOTE(review): presumably the DES key-schedule (PC-2) lookup tables - confirm.
215 __constant u32 c_skb[8][64] =
218 0x00000000, 0x00000010, 0x20000000, 0x20000010,
219 0x00010000, 0x00010010, 0x20010000, 0x20010010,
220 0x00000800, 0x00000810, 0x20000800, 0x20000810,
221 0x00010800, 0x00010810, 0x20010800, 0x20010810,
222 0x00000020, 0x00000030, 0x20000020, 0x20000030,
223 0x00010020, 0x00010030, 0x20010020, 0x20010030,
224 0x00000820, 0x00000830, 0x20000820, 0x20000830,
225 0x00010820, 0x00010830, 0x20010820, 0x20010830,
226 0x00080000, 0x00080010, 0x20080000, 0x20080010,
227 0x00090000, 0x00090010, 0x20090000, 0x20090010,
228 0x00080800, 0x00080810, 0x20080800, 0x20080810,
229 0x00090800, 0x00090810, 0x20090800, 0x20090810,
230 0x00080020, 0x00080030, 0x20080020, 0x20080030,
231 0x00090020, 0x00090030, 0x20090020, 0x20090030,
232 0x00080820, 0x00080830, 0x20080820, 0x20080830,
233 0x00090820, 0x00090830, 0x20090820, 0x20090830,
236 0x00000000, 0x02000000, 0x00002000, 0x02002000,
237 0x00200000, 0x02200000, 0x00202000, 0x02202000,
238 0x00000004, 0x02000004, 0x00002004, 0x02002004,
239 0x00200004, 0x02200004, 0x00202004, 0x02202004,
240 0x00000400, 0x02000400, 0x00002400, 0x02002400,
241 0x00200400, 0x02200400, 0x00202400, 0x02202400,
242 0x00000404, 0x02000404, 0x00002404, 0x02002404,
243 0x00200404, 0x02200404, 0x00202404, 0x02202404,
244 0x10000000, 0x12000000, 0x10002000, 0x12002000,
245 0x10200000, 0x12200000, 0x10202000, 0x12202000,
246 0x10000004, 0x12000004, 0x10002004, 0x12002004,
247 0x10200004, 0x12200004, 0x10202004, 0x12202004,
248 0x10000400, 0x12000400, 0x10002400, 0x12002400,
249 0x10200400, 0x12200400, 0x10202400, 0x12202400,
250 0x10000404, 0x12000404, 0x10002404, 0x12002404,
251 0x10200404, 0x12200404, 0x10202404, 0x12202404,
254 0x00000000, 0x00000001, 0x00040000, 0x00040001,
255 0x01000000, 0x01000001, 0x01040000, 0x01040001,
256 0x00000002, 0x00000003, 0x00040002, 0x00040003,
257 0x01000002, 0x01000003, 0x01040002, 0x01040003,
258 0x00000200, 0x00000201, 0x00040200, 0x00040201,
259 0x01000200, 0x01000201, 0x01040200, 0x01040201,
260 0x00000202, 0x00000203, 0x00040202, 0x00040203,
261 0x01000202, 0x01000203, 0x01040202, 0x01040203,
262 0x08000000, 0x08000001, 0x08040000, 0x08040001,
263 0x09000000, 0x09000001, 0x09040000, 0x09040001,
264 0x08000002, 0x08000003, 0x08040002, 0x08040003,
265 0x09000002, 0x09000003, 0x09040002, 0x09040003,
266 0x08000200, 0x08000201, 0x08040200, 0x08040201,
267 0x09000200, 0x09000201, 0x09040200, 0x09040201,
268 0x08000202, 0x08000203, 0x08040202, 0x08040203,
269 0x09000202, 0x09000203, 0x09040202, 0x09040203,
272 0x00000000, 0x00100000, 0x00000100, 0x00100100,
273 0x00000008, 0x00100008, 0x00000108, 0x00100108,
274 0x00001000, 0x00101000, 0x00001100, 0x00101100,
275 0x00001008, 0x00101008, 0x00001108, 0x00101108,
276 0x04000000, 0x04100000, 0x04000100, 0x04100100,
277 0x04000008, 0x04100008, 0x04000108, 0x04100108,
278 0x04001000, 0x04101000, 0x04001100, 0x04101100,
279 0x04001008, 0x04101008, 0x04001108, 0x04101108,
280 0x00020000, 0x00120000, 0x00020100, 0x00120100,
281 0x00020008, 0x00120008, 0x00020108, 0x00120108,
282 0x00021000, 0x00121000, 0x00021100, 0x00121100,
283 0x00021008, 0x00121008, 0x00021108, 0x00121108,
284 0x04020000, 0x04120000, 0x04020100, 0x04120100,
285 0x04020008, 0x04120008, 0x04020108, 0x04120108,
286 0x04021000, 0x04121000, 0x04021100, 0x04121100,
287 0x04021008, 0x04121008, 0x04021108, 0x04121108,
290 0x00000000, 0x10000000, 0x00010000, 0x10010000,
291 0x00000004, 0x10000004, 0x00010004, 0x10010004,
292 0x20000000, 0x30000000, 0x20010000, 0x30010000,
293 0x20000004, 0x30000004, 0x20010004, 0x30010004,
294 0x00100000, 0x10100000, 0x00110000, 0x10110000,
295 0x00100004, 0x10100004, 0x00110004, 0x10110004,
296 0x20100000, 0x30100000, 0x20110000, 0x30110000,
297 0x20100004, 0x30100004, 0x20110004, 0x30110004,
298 0x00001000, 0x10001000, 0x00011000, 0x10011000,
299 0x00001004, 0x10001004, 0x00011004, 0x10011004,
300 0x20001000, 0x30001000, 0x20011000, 0x30011000,
301 0x20001004, 0x30001004, 0x20011004, 0x30011004,
302 0x00101000, 0x10101000, 0x00111000, 0x10111000,
303 0x00101004, 0x10101004, 0x00111004, 0x10111004,
304 0x20101000, 0x30101000, 0x20111000, 0x30111000,
305 0x20101004, 0x30101004, 0x20111004, 0x30111004,
308 0x00000000, 0x08000000, 0x00000008, 0x08000008,
309 0x00000400, 0x08000400, 0x00000408, 0x08000408,
310 0x00020000, 0x08020000, 0x00020008, 0x08020008,
311 0x00020400, 0x08020400, 0x00020408, 0x08020408,
312 0x00000001, 0x08000001, 0x00000009, 0x08000009,
313 0x00000401, 0x08000401, 0x00000409, 0x08000409,
314 0x00020001, 0x08020001, 0x00020009, 0x08020009,
315 0x00020401, 0x08020401, 0x00020409, 0x08020409,
316 0x02000000, 0x0A000000, 0x02000008, 0x0A000008,
317 0x02000400, 0x0A000400, 0x02000408, 0x0A000408,
318 0x02020000, 0x0A020000, 0x02020008, 0x0A020008,
319 0x02020400, 0x0A020400, 0x02020408, 0x0A020408,
320 0x02000001, 0x0A000001, 0x02000009, 0x0A000009,
321 0x02000401, 0x0A000401, 0x02000409, 0x0A000409,
322 0x02020001, 0x0A020001, 0x02020009, 0x0A020009,
323 0x02020401, 0x0A020401, 0x02020409, 0x0A020409,
326 0x00000000, 0x00000100, 0x00080000, 0x00080100,
327 0x01000000, 0x01000100, 0x01080000, 0x01080100,
328 0x00000010, 0x00000110, 0x00080010, 0x00080110,
329 0x01000010, 0x01000110, 0x01080010, 0x01080110,
330 0x00200000, 0x00200100, 0x00280000, 0x00280100,
331 0x01200000, 0x01200100, 0x01280000, 0x01280100,
332 0x00200010, 0x00200110, 0x00280010, 0x00280110,
333 0x01200010, 0x01200110, 0x01280010, 0x01280110,
334 0x00000200, 0x00000300, 0x00080200, 0x00080300,
335 0x01000200, 0x01000300, 0x01080200, 0x01080300,
336 0x00000210, 0x00000310, 0x00080210, 0x00080310,
337 0x01000210, 0x01000310, 0x01080210, 0x01080310,
338 0x00200200, 0x00200300, 0x00280200, 0x00280300,
339 0x01200200, 0x01200300, 0x01280200, 0x01280300,
340 0x00200210, 0x00200310, 0x00280210, 0x00280310,
341 0x01200210, 0x01200310, 0x01280210, 0x01280310,
344 0x00000000, 0x04000000, 0x00040000, 0x04040000,
345 0x00000002, 0x04000002, 0x00040002, 0x04040002,
346 0x00002000, 0x04002000, 0x00042000, 0x04042000,
347 0x00002002, 0x04002002, 0x00042002, 0x04042002,
348 0x00000020, 0x04000020, 0x00040020, 0x04040020,
349 0x00000022, 0x04000022, 0x00040022, 0x04040022,
350 0x00002020, 0x04002020, 0x00042020, 0x04042020,
351 0x00002022, 0x04002022, 0x00042022, 0x04042022,
352 0x00000800, 0x04000800, 0x00040800, 0x04040800,
353 0x00000802, 0x04000802, 0x00040802, 0x04040802,
354 0x00002800, 0x04002800, 0x00042800, 0x04042800,
355 0x00002802, 0x04002802, 0x00042802, 0x04042802,
356 0x00000820, 0x04000820, 0x00040820, 0x04040820,
357 0x00000822, 0x04000822, 0x00040822, 0x04040822,
358 0x00002820, 0x04002820, 0x00042820, 0x04042820,
359 0x00002822, 0x04002822, 0x00042822, 0x04042822
// BOX(i,n,S): look up entry i of sub-table n in the two-dimensional table S.
// Scalar form: a plain S[n][i] index.
364 #define BOX(i,n,S) (S)[(n)][(i)]
// Vector forms: i is a vector, so each lane (.s0, .s1, ...) is looked up
// separately and the results are packed into a u32x.
// NOTE(review): the following variants have 2, 4, 8 and 16 lanes; presumably
// each is selected by a matching VECT_SIZE test, as the 16-lane one is - confirm.
366 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1])
368 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3])
370 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7])
371 #elif VECT_SIZE == 16
372 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7], (S)[(n)][(i).s8], (S)[(n)][(i).s9], (S)[(n)][(i).sa], (S)[(n)][(i).sb], (S)[(n)][(i).sc], (S)[(n)][(i).sd], (S)[(n)][(i).se], (S)[(n)][(i).sf])
// _des_crypt_encrypt: block transform driven by the 16-entry subkey arrays
// Kc and Kd, using the local-memory table s_SPtrans for all lookups.
//   iv        - two-word array; the kernels pass it as the first argument and
//               read iv[0] / iv[1] after the call, so it carries the output
//   data      - two-word input block
//   Kc, Kd    - 16 subkey words each (filled by _des_crypt_keysetup or by the caller)
//   s_SPtrans - pointer to rows of 64 u32 words in __local memory
// NOTE(review): presumably a standard 16-round DES encryption - confirm.
375 void _des_crypt_encrypt (u32x iv[2], u32x data[2], u32x Kc[16], u32x Kd[16], __local u32 (*s_SPtrans)[64])
// Each loop iteration handles two rounds (i and i + 1): first l is updated
// from r, then r is updated from the new l.
390 for (u32 i = 0; i < 16; i += 2)
// t mixes subkey word Kd[i] with r rotated left by 28 bits.
396 t = Kd[i + 0] ^ rotl32 (r, 28u);
// Eight 6-bit fields (mask 0x3f) select one entry per sub-table: even
// sub-tables 0,2,4,6 are indexed from u, odd sub-tables 1,3,5,7 from t.
// The eight results are ORed together and XORed into l.
398 l ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
399 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
400 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
401 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
402 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
403 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
404 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
405 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
// Second round of the pair: same pattern with the roles of l and r swapped
// and subkey word Kd[i + 1].
408 t = Kd[i + 1] ^ rotl32 (l, 28u);
410 r ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
411 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
412 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
413 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
414 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
415 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
416 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
417 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
// _des_crypt_keysetup: expands the two key words c and d into the 16-entry
// subkey arrays Kc and Kd, using the local-memory table s_skb for lookups.
//   c, d   - the two 32-bit halves of the key (passed by value, modified locally)
//   Kc, Kd - output arrays, one word each per round i = 0..15
//   s_skb  - pointer to rows of 64 u32 words in __local memory
// NOTE(review): presumably the standard DES key schedule (PC-1, per-round
// rotations, PC-2 via tables) - confirm.
429 void _des_crypt_keysetup (u32x c, u32x d, u32x Kc[16], u32x Kd[16], __local u32 (*s_skb)[64])
// Initial bit permutation of c and d through a fixed sequence of swap macros.
433 PERM_OP (d, c, tt, 4, 0x0f0f0f0f);
434 HPERM_OP (c, tt, 2, 0xcccc0000);
435 HPERM_OP (d, tt, 2, 0xcccc0000);
436 PERM_OP (d, c, tt, 1, 0x55555555);
437 PERM_OP (c, d, tt, 8, 0x00ff00ff);
438 PERM_OP (d, c, tt, 1, 0x55555555);
// Rebuild d: swap its byte 0 and byte 2, keep byte 1 in place, and move the
// top nibble of c down by four bits into bits 24-27.
440 d = ((d & 0x000000ff) << 16)
441 | ((d & 0x0000ff00) << 0)
442 | ((d & 0x00ff0000) >> 16)
443 | ((c & 0xf0000000) >> 4);
// One subkey pair per round.
450 for (u32 i = 0; i < 16; i++)
// Rounds 0, 1, 8 and 15 use the one-position shift pair below.
// NOTE(review): the two-position pair after it is presumably the else
// branch, and both presumably act as 28-bit rotations - confirm.
452 if ((i < 2) || (i == 8) || (i == 15))
454 c = ((c >> 1) | (c << 27));
455 d = ((d >> 1) | (d << 27));
459 c = ((c >> 2) | (c << 26));
460 d = ((d >> 2) | (d << 26));
// Gather scattered bit groups of c into small fields used as table indices.
466 const u32x c00 = (c >> 0) & 0x0000003f;
467 const u32x c06 = (c >> 6) & 0x00383003;
468 const u32x c07 = (c >> 7) & 0x0000003c;
469 const u32x c13 = (c >> 13) & 0x0000060f;
470 const u32x c20 = (c >> 20) & 0x00000001;
// s: OR of lookups in sub-tables 0-3, each indexed by fields derived from c.
472 u32x s = BOX (((c00 >> 0) & 0xff), 0, s_skb)
473 | BOX (((c06 >> 0) & 0xff)
474 |((c07 >> 0) & 0xff), 1, s_skb)
475 | BOX (((c13 >> 0) & 0xff)
476 |((c06 >> 8) & 0xff), 2, s_skb)
477 | BOX (((c20 >> 0) & 0xff)
479 |((c06 >> 16) & 0xff), 3, s_skb);
// Same gathering step for d.
481 const u32x d00 = (d >> 0) & 0x00003c3f;
482 const u32x d07 = (d >> 7) & 0x00003f03;
483 const u32x d21 = (d >> 21) & 0x0000000f;
484 const u32x d22 = (d >> 22) & 0x00000030;
// t: OR of lookups in sub-tables 4-7, each indexed by fields derived from d.
486 u32x t = BOX (((d00 >> 0) & 0xff), 4, s_skb)
487 | BOX (((d07 >> 0) & 0xff)
488 |((d00 >> 8) & 0xff), 5, s_skb)
489 | BOX (((d07 >> 8) & 0xff), 6, s_skb)
490 | BOX (((d21 >> 0) & 0xff)
491 |((d22 >> 0) & 0xff), 7, s_skb);
// Interleave the 16-bit halves of s and t: Kc gets the low halves
// (t low in the upper 16 bits, s low in the lower 16 bits), Kd the high halves.
493 Kc[i] = ((t << 16) | (s & 0x0000ffff));
494 Kd[i] = ((s >> 16) | (t & 0xffff0000));
// Store both subkey words rotated left by two bits.
496 Kc[i] = rotl32 (Kc[i], 2u);
497 Kd[i] = rotl32 (Kd[i], 2u);
// m03100_m04: kernel entry point. For every rule-modified password candidate
// it combines the candidate with the salt, runs two chained passes of
// _des_crypt_encrypt over the combined buffer, and hands the final iv words
// to COMPARE_M_SIMD.
// Arguments read in this body: pws, rules_buf, salt_bufs, salt_pos, il_cnt
// and gid_max; the COMPARE_M_SIMD macro may reference further arguments.
501 __kernel void m03100_m04 (__global pw_t *pws, __global kernel_rule_t * rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Work-item coordinates: global id, id within the work-group, work-group size.
507 const u32 gid = get_global_id (0);
508 const u32 lid = get_local_id (0);
509 const u32 lsz = get_local_size (0);
// Work-group-local copies of the two constant tables.
515 __local u32 s_SPtrans[8][64];
516 __local u32 s_skb[8][64];
// Cooperative copy: each work-item starts at column lid and strides by the
// work-group size, copying that column of all 8 rows of both tables.
518 for (u32 i = lid; i < 64; i += lsz)
520 s_SPtrans[0][i] = c_SPtrans[0][i];
521 s_SPtrans[1][i] = c_SPtrans[1][i];
522 s_SPtrans[2][i] = c_SPtrans[2][i];
523 s_SPtrans[3][i] = c_SPtrans[3][i];
524 s_SPtrans[4][i] = c_SPtrans[4][i];
525 s_SPtrans[5][i] = c_SPtrans[5][i];
526 s_SPtrans[6][i] = c_SPtrans[6][i];
527 s_SPtrans[7][i] = c_SPtrans[7][i];
529 s_skb[0][i] = c_skb[0][i];
530 s_skb[1][i] = c_skb[1][i];
531 s_skb[2][i] = c_skb[2][i];
532 s_skb[3][i] = c_skb[3][i];
533 s_skb[4][i] = c_skb[4][i];
534 s_skb[5][i] = c_skb[5][i];
535 s_skb[6][i] = c_skb[6][i];
536 s_skb[7][i] = c_skb[7][i];
// Wait until the local tables are fully written. The gid bounds check comes
// only after the barrier, so out-of-range work-items still take part in the
// copy and reach the barrier before returning.
539 barrier (CLK_LOCAL_MEM_FENCE);
541 if (gid >= gid_max) return;
// Load the first eight 32-bit words of this work-item's password and its length.
550 pw_buf0[0] = pws[gid].i[0];
551 pw_buf0[1] = pws[gid].i[1];
552 pw_buf0[2] = pws[gid].i[2];
553 pw_buf0[3] = pws[gid].i[3];
554 pw_buf1[0] = pws[gid].i[4];
555 pw_buf1[1] = pws[gid].i[5];
556 pw_buf1[2] = pws[gid].i[6];
557 pw_buf1[3] = pws[gid].i[7];
559 const u32 pw_len = pws[gid].pw_len;
// Load the first eight 32-bit words of the selected salt and its length.
568 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
569 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
570 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
571 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
572 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
573 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
574 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
575 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
577 const u32 salt_len = salt_bufs[salt_pos].salt_len;
// Inner loop over il_cnt positions, VECT_SIZE at a time.
583 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
// Apply the rule(s) at il_pos to the password; the result goes to w0/w1 and
// its length is returned.
590 const u32x out_len = apply_rules_vect (pw_buf0, pw_buf1, pw_len, rules_buf, il_pos, w0, w1);
// Loop bound for the passes below: twice the combined salt + candidate length.
592 const u32x salt_word_len = (salt_len + out_len) * 2;
// NOTE(review): presumably shifts the candidate up by salt_len bytes so the
// salt can be ORed in front of it - confirm against the helper definition.
598 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
// Merge salt words and candidate words into dst.
602 dst[ 0] = w0[0] | salt_buf0[0];
603 dst[ 1] = w0[1] | salt_buf0[1];
604 dst[ 2] = w0[2] | salt_buf0[2];
605 dst[ 3] = w0[3] | salt_buf0[3];
606 dst[ 4] = w1[0] | salt_buf1[0];
607 dst[ 5] = w1[1] | salt_buf1[1];
608 dst[ 6] = w1[2] | salt_buf1[2];
609 dst[ 7] = w1[3] | salt_buf1[3];
620 * precompute key1 since key is static: 0x0123456789abcdef
621 * plus LEFT_ROTATE by 2
663 * key1 (generate key)
// First pass: j advances by 8 while k advances by 1, so each iteration
// consumes one 32-bit word of dst.
671 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
// Spread the four bytes of dst[k] over two words: data[0] gets byte 1 in
// bits 24-31 and byte 0 in bits 8-15; data[1] gets byte 3 in bits 24-31 and
// byte 2 in bits 8-15. All other bits are zero.
675 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
676 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
681 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
685 * key2 (generate hash)
// The iv words left by the first pass become the key for the second pass.
688 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
// Second pass over the same dst words with the newly derived subkeys.
693 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
697 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
698 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
703 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
// Hand the two final iv words (plus two placeholder z values) to the compare macro.
712 COMPARE_M_SIMD (iv[0], iv[1], z, z);
716 __kernel void m03100_m08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
720 __kernel void m03100_m16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// m03100_s04: kernel entry point. Performs the same computation as m03100_m04
// (salt + rule-modified candidate, two chained passes of _des_crypt_encrypt)
// but additionally loads a search[] array from digests_buf[digests_offset]
// and finishes with COMPARE_S_SIMD instead of COMPARE_M_SIMD.
// Arguments read in this body: pws, rules_buf, salt_bufs, salt_pos,
// digests_buf, digests_offset, il_cnt and gid_max; the COMPARE_S_SIMD macro
// may reference further arguments.
724 __kernel void m03100_s04 (__global pw_t *pws, __global kernel_rule_t * rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Work-item coordinates: global id, id within the work-group, work-group size.
730 const u32 gid = get_global_id (0);
731 const u32 lid = get_local_id (0);
732 const u32 lsz = get_local_size (0);
// Work-group-local copies of the two constant tables.
738 __local u32 s_SPtrans[8][64];
739 __local u32 s_skb[8][64];
// Cooperative copy: each work-item starts at column lid and strides by the
// work-group size, copying that column of all 8 rows of both tables.
741 for (u32 i = lid; i < 64; i += lsz)
743 s_SPtrans[0][i] = c_SPtrans[0][i];
744 s_SPtrans[1][i] = c_SPtrans[1][i];
745 s_SPtrans[2][i] = c_SPtrans[2][i];
746 s_SPtrans[3][i] = c_SPtrans[3][i];
747 s_SPtrans[4][i] = c_SPtrans[4][i];
748 s_SPtrans[5][i] = c_SPtrans[5][i];
749 s_SPtrans[6][i] = c_SPtrans[6][i];
750 s_SPtrans[7][i] = c_SPtrans[7][i];
752 s_skb[0][i] = c_skb[0][i];
753 s_skb[1][i] = c_skb[1][i];
754 s_skb[2][i] = c_skb[2][i];
755 s_skb[3][i] = c_skb[3][i];
756 s_skb[4][i] = c_skb[4][i];
757 s_skb[5][i] = c_skb[5][i];
758 s_skb[6][i] = c_skb[6][i];
759 s_skb[7][i] = c_skb[7][i];
// Wait until the local tables are fully written. The gid bounds check comes
// only after the barrier, so out-of-range work-items still take part in the
// copy and reach the barrier before returning.
762 barrier (CLK_LOCAL_MEM_FENCE);
764 if (gid >= gid_max) return;
// Load the first eight 32-bit words of this work-item's password and its length.
773 pw_buf0[0] = pws[gid].i[0];
774 pw_buf0[1] = pws[gid].i[1];
775 pw_buf0[2] = pws[gid].i[2];
776 pw_buf0[3] = pws[gid].i[3];
777 pw_buf1[0] = pws[gid].i[4];
778 pw_buf1[1] = pws[gid].i[5];
779 pw_buf1[2] = pws[gid].i[6];
780 pw_buf1[3] = pws[gid].i[7];
782 const u32 pw_len = pws[gid].pw_len;
// Load the first eight 32-bit words of the selected salt and its length.
791 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
792 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
793 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
794 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
795 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
796 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
797 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
798 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
800 const u32 salt_len = salt_bufs[salt_pos].salt_len;
// Digest words of the entry at digests_offset, selected by DGST_R0 / DGST_R1.
// NOTE(review): presumably consumed by COMPARE_S_SIMD as the single target
// digest - confirm against the macro definition.
806 const u32 search[4] =
808 digests_buf[digests_offset].digest_buf[DGST_R0],
809 digests_buf[digests_offset].digest_buf[DGST_R1],
// Inner loop over il_cnt positions, VECT_SIZE at a time.
818 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
// Apply the rule(s) at il_pos to the password; the result goes to w0/w1 and
// its length is returned.
825 const u32x out_len = apply_rules_vect (pw_buf0, pw_buf1, pw_len, rules_buf, il_pos, w0, w1);
// Loop bound for the passes below: twice the combined salt + candidate length.
827 const u32x salt_word_len = (salt_len + out_len) * 2;
// NOTE(review): presumably shifts the candidate up by salt_len bytes so the
// salt can be ORed in front of it - confirm against the helper definition.
833 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
// Merge salt words and candidate words into dst.
837 dst[ 0] = w0[0] | salt_buf0[0];
838 dst[ 1] = w0[1] | salt_buf0[1];
839 dst[ 2] = w0[2] | salt_buf0[2];
840 dst[ 3] = w0[3] | salt_buf0[3];
841 dst[ 4] = w1[0] | salt_buf1[0];
842 dst[ 5] = w1[1] | salt_buf1[1];
843 dst[ 6] = w1[2] | salt_buf1[2];
844 dst[ 7] = w1[3] | salt_buf1[3];
855 * precompute key1 since key is static: 0x0123456789abcdef
856 * plus LEFT_ROTATE by 2
898 * key1 (generate key)
// First pass: j advances by 8 while k advances by 1, so each iteration
// consumes one 32-bit word of dst.
906 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
// Spread the four bytes of dst[k] over two words: data[0] gets byte 1 in
// bits 24-31 and byte 0 in bits 8-15; data[1] gets byte 3 in bits 24-31 and
// byte 2 in bits 8-15. All other bits are zero.
910 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
911 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
916 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
920 * key2 (generate hash)
// The iv words left by the first pass become the key for the second pass.
923 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
// Second pass over the same dst words with the newly derived subkeys.
928 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
932 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
933 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
938 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
// Hand the two final iv words (plus two placeholder z values) to the compare macro.
947 COMPARE_S_SIMD (iv[0], iv[1], z, z);
951 __kernel void m03100_s08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
955 __kernel void m03100_s16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)