2 * Authors.....: Jens Steube <jens.steube@gmail.com>
3 * Gabriele Gristina <matrix@hashcat.net>
4 * magnum <john.magnum@hushmail.com>
12 //#define NEW_SIMD_CODE
14 #include "inc_vendor.cl"
15 #include "inc_hash_constants.h"
16 #include "inc_hash_functions.cl"
17 #include "inc_types.cl"
18 #include "inc_common.cl"
21 #include "inc_simd.cl"
// Bit-permutation helper macros used by the DES routines further down.
// NOTE(review): this view of the file is missing lines (the macro bodies and
// the #define lines that own the two PERM_OP sequences below), so these notes
// only describe what is visible.
//  - PERM_OP(a,b,tt,n,m): two operands, scratch tt, shift n, mask m (body not visible).
//  - HPERM_OP(a,tt,n,m): one operand; the one visible step shifts tt right by (16 + n).
//  - First sequence: PERM_OP with (n,m) = (4,0x0f0f0f0f), (16,0x0000ffff),
//    (2,0x33333333), (8,0x00ff00ff), (1,0x55555555), alternating (r,l) / (l,r).
//  - Second sequence: the same (n,m) pairs in reverse order with the operands
//    swapped; presumably the inverse of the first (DES initial/final
//    permutation?) -- TODO confirm against the full file.
23 #define PERM_OP(a,b,tt,n,m) \
33 #define HPERM_OP(a,tt,n,m) \
39 tt = tt >> (16 + n); \
45 PERM_OP (r, l, tt, 4, 0x0f0f0f0f); \
46 PERM_OP (l, r, tt, 16, 0x0000ffff); \
47 PERM_OP (r, l, tt, 2, 0x33333333); \
48 PERM_OP (l, r, tt, 8, 0x00ff00ff); \
49 PERM_OP (r, l, tt, 1, 0x55555555); \
54 PERM_OP (l, r, tt, 1, 0x55555555); \
55 PERM_OP (r, l, tt, 8, 0x00ff00ff); \
56 PERM_OP (l, r, tt, 2, 0x33333333); \
57 PERM_OP (r, l, tt, 16, 0x0000ffff); \
58 PERM_OP (l, r, tt, 4, 0x0f0f0f0f); \
// 8 x 64 table of 32-bit words in __constant memory. The kernels copy it into
// a __local s_SPtrans array, and _des_crypt_encrypt reads it through BOX()
// using 6-bit indexes. The name suggests combined DES S-box / P-permutation
// outputs -- TODO confirm.
// NOTE(review): the brace lines are not visible in this view; the row markers
// below are inferred from the 16-lines-of-4 (= 64 words) grouping.
61 __constant u32 c_SPtrans[8][64] =
// c_SPtrans[0]
64 0x02080800, 0x00080000, 0x02000002, 0x02080802,
65 0x02000000, 0x00080802, 0x00080002, 0x02000002,
66 0x00080802, 0x02080800, 0x02080000, 0x00000802,
67 0x02000802, 0x02000000, 0x00000000, 0x00080002,
68 0x00080000, 0x00000002, 0x02000800, 0x00080800,
69 0x02080802, 0x02080000, 0x00000802, 0x02000800,
70 0x00000002, 0x00000800, 0x00080800, 0x02080002,
71 0x00000800, 0x02000802, 0x02080002, 0x00000000,
72 0x00000000, 0x02080802, 0x02000800, 0x00080002,
73 0x02080800, 0x00080000, 0x00000802, 0x02000800,
74 0x02080002, 0x00000800, 0x00080800, 0x02000002,
75 0x00080802, 0x00000002, 0x02000002, 0x02080000,
76 0x02080802, 0x00080800, 0x02080000, 0x02000802,
77 0x02000000, 0x00000802, 0x00080002, 0x00000000,
78 0x00080000, 0x02000000, 0x02000802, 0x02080800,
79 0x00000002, 0x02080002, 0x00000800, 0x00080802,
// c_SPtrans[1]
82 0x40108010, 0x00000000, 0x00108000, 0x40100000,
83 0x40000010, 0x00008010, 0x40008000, 0x00108000,
84 0x00008000, 0x40100010, 0x00000010, 0x40008000,
85 0x00100010, 0x40108000, 0x40100000, 0x00000010,
86 0x00100000, 0x40008010, 0x40100010, 0x00008000,
87 0x00108010, 0x40000000, 0x00000000, 0x00100010,
88 0x40008010, 0x00108010, 0x40108000, 0x40000010,
89 0x40000000, 0x00100000, 0x00008010, 0x40108010,
90 0x00100010, 0x40108000, 0x40008000, 0x00108010,
91 0x40108010, 0x00100010, 0x40000010, 0x00000000,
92 0x40000000, 0x00008010, 0x00100000, 0x40100010,
93 0x00008000, 0x40000000, 0x00108010, 0x40008010,
94 0x40108000, 0x00008000, 0x00000000, 0x40000010,
95 0x00000010, 0x40108010, 0x00108000, 0x40100000,
96 0x40100010, 0x00100000, 0x00008010, 0x40008000,
97 0x40008010, 0x00000010, 0x40100000, 0x00108000,
// c_SPtrans[2]
100 0x04000001, 0x04040100, 0x00000100, 0x04000101,
101 0x00040001, 0x04000000, 0x04000101, 0x00040100,
102 0x04000100, 0x00040000, 0x04040000, 0x00000001,
103 0x04040101, 0x00000101, 0x00000001, 0x04040001,
104 0x00000000, 0x00040001, 0x04040100, 0x00000100,
105 0x00000101, 0x04040101, 0x00040000, 0x04000001,
106 0x04040001, 0x04000100, 0x00040101, 0x04040000,
107 0x00040100, 0x00000000, 0x04000000, 0x00040101,
108 0x04040100, 0x00000100, 0x00000001, 0x00040000,
109 0x00000101, 0x00040001, 0x04040000, 0x04000101,
110 0x00000000, 0x04040100, 0x00040100, 0x04040001,
111 0x00040001, 0x04000000, 0x04040101, 0x00000001,
112 0x00040101, 0x04000001, 0x04000000, 0x04040101,
113 0x00040000, 0x04000100, 0x04000101, 0x00040100,
114 0x04000100, 0x00000000, 0x04040001, 0x00000101,
115 0x04000001, 0x00040101, 0x00000100, 0x04040000,
// c_SPtrans[3]
118 0x00401008, 0x10001000, 0x00000008, 0x10401008,
119 0x00000000, 0x10400000, 0x10001008, 0x00400008,
120 0x10401000, 0x10000008, 0x10000000, 0x00001008,
121 0x10000008, 0x00401008, 0x00400000, 0x10000000,
122 0x10400008, 0x00401000, 0x00001000, 0x00000008,
123 0x00401000, 0x10001008, 0x10400000, 0x00001000,
124 0x00001008, 0x00000000, 0x00400008, 0x10401000,
125 0x10001000, 0x10400008, 0x10401008, 0x00400000,
126 0x10400008, 0x00001008, 0x00400000, 0x10000008,
127 0x00401000, 0x10001000, 0x00000008, 0x10400000,
128 0x10001008, 0x00000000, 0x00001000, 0x00400008,
129 0x00000000, 0x10400008, 0x10401000, 0x00001000,
130 0x10000000, 0x10401008, 0x00401008, 0x00400000,
131 0x10401008, 0x00000008, 0x10001000, 0x00401008,
132 0x00400008, 0x00401000, 0x10400000, 0x10001008,
133 0x00001008, 0x10000000, 0x10000008, 0x10401000,
// c_SPtrans[4]
136 0x08000000, 0x00010000, 0x00000400, 0x08010420,
137 0x08010020, 0x08000400, 0x00010420, 0x08010000,
138 0x00010000, 0x00000020, 0x08000020, 0x00010400,
139 0x08000420, 0x08010020, 0x08010400, 0x00000000,
140 0x00010400, 0x08000000, 0x00010020, 0x00000420,
141 0x08000400, 0x00010420, 0x00000000, 0x08000020,
142 0x00000020, 0x08000420, 0x08010420, 0x00010020,
143 0x08010000, 0x00000400, 0x00000420, 0x08010400,
144 0x08010400, 0x08000420, 0x00010020, 0x08010000,
145 0x00010000, 0x00000020, 0x08000020, 0x08000400,
146 0x08000000, 0x00010400, 0x08010420, 0x00000000,
147 0x00010420, 0x08000000, 0x00000400, 0x00010020,
148 0x08000420, 0x00000400, 0x00000000, 0x08010420,
149 0x08010020, 0x08010400, 0x00000420, 0x00010000,
150 0x00010400, 0x08010020, 0x08000400, 0x00000420,
151 0x00000020, 0x00010420, 0x08010000, 0x08000020,
// c_SPtrans[5]
154 0x80000040, 0x00200040, 0x00000000, 0x80202000,
155 0x00200040, 0x00002000, 0x80002040, 0x00200000,
156 0x00002040, 0x80202040, 0x00202000, 0x80000000,
157 0x80002000, 0x80000040, 0x80200000, 0x00202040,
158 0x00200000, 0x80002040, 0x80200040, 0x00000000,
159 0x00002000, 0x00000040, 0x80202000, 0x80200040,
160 0x80202040, 0x80200000, 0x80000000, 0x00002040,
161 0x00000040, 0x00202000, 0x00202040, 0x80002000,
162 0x00002040, 0x80000000, 0x80002000, 0x00202040,
163 0x80202000, 0x00200040, 0x00000000, 0x80002000,
164 0x80000000, 0x00002000, 0x80200040, 0x00200000,
165 0x00200040, 0x80202040, 0x00202000, 0x00000040,
166 0x80202040, 0x00202000, 0x00200000, 0x80002040,
167 0x80000040, 0x80200000, 0x00202040, 0x00000000,
168 0x00002000, 0x80000040, 0x80002040, 0x80202000,
169 0x80200000, 0x00002040, 0x00000040, 0x80200040,
// c_SPtrans[6]
172 0x00004000, 0x00000200, 0x01000200, 0x01000004,
173 0x01004204, 0x00004004, 0x00004200, 0x00000000,
174 0x01000000, 0x01000204, 0x00000204, 0x01004000,
175 0x00000004, 0x01004200, 0x01004000, 0x00000204,
176 0x01000204, 0x00004000, 0x00004004, 0x01004204,
177 0x00000000, 0x01000200, 0x01000004, 0x00004200,
178 0x01004004, 0x00004204, 0x01004200, 0x00000004,
179 0x00004204, 0x01004004, 0x00000200, 0x01000000,
180 0x00004204, 0x01004000, 0x01004004, 0x00000204,
181 0x00004000, 0x00000200, 0x01000000, 0x01004004,
182 0x01000204, 0x00004204, 0x00004200, 0x00000000,
183 0x00000200, 0x01000004, 0x00000004, 0x01000200,
184 0x00000000, 0x01000204, 0x01000200, 0x00004200,
185 0x00000204, 0x00004000, 0x01004204, 0x01000000,
186 0x01004200, 0x00000004, 0x00004004, 0x01004204,
187 0x01000004, 0x01004200, 0x01004000, 0x00004004,
// c_SPtrans[7]
190 0x20800080, 0x20820000, 0x00020080, 0x00000000,
191 0x20020000, 0x00800080, 0x20800000, 0x20820080,
192 0x00000080, 0x20000000, 0x00820000, 0x00020080,
193 0x00820080, 0x20020080, 0x20000080, 0x20800000,
194 0x00020000, 0x00820080, 0x00800080, 0x20020000,
195 0x20820080, 0x20000080, 0x00000000, 0x00820000,
196 0x20000000, 0x00800000, 0x20020080, 0x20800080,
197 0x00800000, 0x00020000, 0x20820000, 0x00000080,
198 0x00800000, 0x00020000, 0x20000080, 0x20820080,
199 0x00020080, 0x20000000, 0x00000000, 0x00820000,
200 0x20800080, 0x20020080, 0x20020000, 0x00800080,
201 0x20820000, 0x00000080, 0x00800080, 0x20020000,
202 0x20820080, 0x00800000, 0x20800000, 0x20000080,
203 0x00820000, 0x00020080, 0x20020080, 0x20800000,
204 0x00000080, 0x20820000, 0x00820080, 0x00000000,
205 0x20000000, 0x20800080, 0x00020000, 0x00820080,
// 8 x 64 table of 32-bit words in __constant memory. The kernels copy it into
// a __local s_skb array, and _des_crypt_keysetup reads it through BOX() to
// assemble the per-round subkey words (rows 0..3 are indexed from c, rows
// 4..7 from d).
// NOTE(review): the brace lines are not visible in this view; the row markers
// below are inferred from the 16-lines-of-4 (= 64 words) grouping.
209 __constant u32 c_skb[8][64] =
// c_skb[0]
212 0x00000000, 0x00000010, 0x20000000, 0x20000010,
213 0x00010000, 0x00010010, 0x20010000, 0x20010010,
214 0x00000800, 0x00000810, 0x20000800, 0x20000810,
215 0x00010800, 0x00010810, 0x20010800, 0x20010810,
216 0x00000020, 0x00000030, 0x20000020, 0x20000030,
217 0x00010020, 0x00010030, 0x20010020, 0x20010030,
218 0x00000820, 0x00000830, 0x20000820, 0x20000830,
219 0x00010820, 0x00010830, 0x20010820, 0x20010830,
220 0x00080000, 0x00080010, 0x20080000, 0x20080010,
221 0x00090000, 0x00090010, 0x20090000, 0x20090010,
222 0x00080800, 0x00080810, 0x20080800, 0x20080810,
223 0x00090800, 0x00090810, 0x20090800, 0x20090810,
224 0x00080020, 0x00080030, 0x20080020, 0x20080030,
225 0x00090020, 0x00090030, 0x20090020, 0x20090030,
226 0x00080820, 0x00080830, 0x20080820, 0x20080830,
227 0x00090820, 0x00090830, 0x20090820, 0x20090830,
// c_skb[1]
230 0x00000000, 0x02000000, 0x00002000, 0x02002000,
231 0x00200000, 0x02200000, 0x00202000, 0x02202000,
232 0x00000004, 0x02000004, 0x00002004, 0x02002004,
233 0x00200004, 0x02200004, 0x00202004, 0x02202004,
234 0x00000400, 0x02000400, 0x00002400, 0x02002400,
235 0x00200400, 0x02200400, 0x00202400, 0x02202400,
236 0x00000404, 0x02000404, 0x00002404, 0x02002404,
237 0x00200404, 0x02200404, 0x00202404, 0x02202404,
238 0x10000000, 0x12000000, 0x10002000, 0x12002000,
239 0x10200000, 0x12200000, 0x10202000, 0x12202000,
240 0x10000004, 0x12000004, 0x10002004, 0x12002004,
241 0x10200004, 0x12200004, 0x10202004, 0x12202004,
242 0x10000400, 0x12000400, 0x10002400, 0x12002400,
243 0x10200400, 0x12200400, 0x10202400, 0x12202400,
244 0x10000404, 0x12000404, 0x10002404, 0x12002404,
245 0x10200404, 0x12200404, 0x10202404, 0x12202404,
// c_skb[2]
248 0x00000000, 0x00000001, 0x00040000, 0x00040001,
249 0x01000000, 0x01000001, 0x01040000, 0x01040001,
250 0x00000002, 0x00000003, 0x00040002, 0x00040003,
251 0x01000002, 0x01000003, 0x01040002, 0x01040003,
252 0x00000200, 0x00000201, 0x00040200, 0x00040201,
253 0x01000200, 0x01000201, 0x01040200, 0x01040201,
254 0x00000202, 0x00000203, 0x00040202, 0x00040203,
255 0x01000202, 0x01000203, 0x01040202, 0x01040203,
256 0x08000000, 0x08000001, 0x08040000, 0x08040001,
257 0x09000000, 0x09000001, 0x09040000, 0x09040001,
258 0x08000002, 0x08000003, 0x08040002, 0x08040003,
259 0x09000002, 0x09000003, 0x09040002, 0x09040003,
260 0x08000200, 0x08000201, 0x08040200, 0x08040201,
261 0x09000200, 0x09000201, 0x09040200, 0x09040201,
262 0x08000202, 0x08000203, 0x08040202, 0x08040203,
263 0x09000202, 0x09000203, 0x09040202, 0x09040203,
// c_skb[3]
266 0x00000000, 0x00100000, 0x00000100, 0x00100100,
267 0x00000008, 0x00100008, 0x00000108, 0x00100108,
268 0x00001000, 0x00101000, 0x00001100, 0x00101100,
269 0x00001008, 0x00101008, 0x00001108, 0x00101108,
270 0x04000000, 0x04100000, 0x04000100, 0x04100100,
271 0x04000008, 0x04100008, 0x04000108, 0x04100108,
272 0x04001000, 0x04101000, 0x04001100, 0x04101100,
273 0x04001008, 0x04101008, 0x04001108, 0x04101108,
274 0x00020000, 0x00120000, 0x00020100, 0x00120100,
275 0x00020008, 0x00120008, 0x00020108, 0x00120108,
276 0x00021000, 0x00121000, 0x00021100, 0x00121100,
277 0x00021008, 0x00121008, 0x00021108, 0x00121108,
278 0x04020000, 0x04120000, 0x04020100, 0x04120100,
279 0x04020008, 0x04120008, 0x04020108, 0x04120108,
280 0x04021000, 0x04121000, 0x04021100, 0x04121100,
281 0x04021008, 0x04121008, 0x04021108, 0x04121108,
// c_skb[4]
284 0x00000000, 0x10000000, 0x00010000, 0x10010000,
285 0x00000004, 0x10000004, 0x00010004, 0x10010004,
286 0x20000000, 0x30000000, 0x20010000, 0x30010000,
287 0x20000004, 0x30000004, 0x20010004, 0x30010004,
288 0x00100000, 0x10100000, 0x00110000, 0x10110000,
289 0x00100004, 0x10100004, 0x00110004, 0x10110004,
290 0x20100000, 0x30100000, 0x20110000, 0x30110000,
291 0x20100004, 0x30100004, 0x20110004, 0x30110004,
292 0x00001000, 0x10001000, 0x00011000, 0x10011000,
293 0x00001004, 0x10001004, 0x00011004, 0x10011004,
294 0x20001000, 0x30001000, 0x20011000, 0x30011000,
295 0x20001004, 0x30001004, 0x20011004, 0x30011004,
296 0x00101000, 0x10101000, 0x00111000, 0x10111000,
297 0x00101004, 0x10101004, 0x00111004, 0x10111004,
298 0x20101000, 0x30101000, 0x20111000, 0x30111000,
299 0x20101004, 0x30101004, 0x20111004, 0x30111004,
// c_skb[5]
302 0x00000000, 0x08000000, 0x00000008, 0x08000008,
303 0x00000400, 0x08000400, 0x00000408, 0x08000408,
304 0x00020000, 0x08020000, 0x00020008, 0x08020008,
305 0x00020400, 0x08020400, 0x00020408, 0x08020408,
306 0x00000001, 0x08000001, 0x00000009, 0x08000009,
307 0x00000401, 0x08000401, 0x00000409, 0x08000409,
308 0x00020001, 0x08020001, 0x00020009, 0x08020009,
309 0x00020401, 0x08020401, 0x00020409, 0x08020409,
310 0x02000000, 0x0A000000, 0x02000008, 0x0A000008,
311 0x02000400, 0x0A000400, 0x02000408, 0x0A000408,
312 0x02020000, 0x0A020000, 0x02020008, 0x0A020008,
313 0x02020400, 0x0A020400, 0x02020408, 0x0A020408,
314 0x02000001, 0x0A000001, 0x02000009, 0x0A000009,
315 0x02000401, 0x0A000401, 0x02000409, 0x0A000409,
316 0x02020001, 0x0A020001, 0x02020009, 0x0A020009,
317 0x02020401, 0x0A020401, 0x02020409, 0x0A020409,
// c_skb[6]
320 0x00000000, 0x00000100, 0x00080000, 0x00080100,
321 0x01000000, 0x01000100, 0x01080000, 0x01080100,
322 0x00000010, 0x00000110, 0x00080010, 0x00080110,
323 0x01000010, 0x01000110, 0x01080010, 0x01080110,
324 0x00200000, 0x00200100, 0x00280000, 0x00280100,
325 0x01200000, 0x01200100, 0x01280000, 0x01280100,
326 0x00200010, 0x00200110, 0x00280010, 0x00280110,
327 0x01200010, 0x01200110, 0x01280010, 0x01280110,
328 0x00000200, 0x00000300, 0x00080200, 0x00080300,
329 0x01000200, 0x01000300, 0x01080200, 0x01080300,
330 0x00000210, 0x00000310, 0x00080210, 0x00080310,
331 0x01000210, 0x01000310, 0x01080210, 0x01080310,
332 0x00200200, 0x00200300, 0x00280200, 0x00280300,
333 0x01200200, 0x01200300, 0x01280200, 0x01280300,
334 0x00200210, 0x00200310, 0x00280210, 0x00280310,
335 0x01200210, 0x01200310, 0x01280210, 0x01280310,
// c_skb[7]
338 0x00000000, 0x04000000, 0x00040000, 0x04040000,
339 0x00000002, 0x04000002, 0x00040002, 0x04040002,
340 0x00002000, 0x04002000, 0x00042000, 0x04042000,
341 0x00002002, 0x04002002, 0x00042002, 0x04042002,
342 0x00000020, 0x04000020, 0x00040020, 0x04040020,
343 0x00000022, 0x04000022, 0x00040022, 0x04040022,
344 0x00002020, 0x04002020, 0x00042020, 0x04042020,
345 0x00002022, 0x04002022, 0x00042022, 0x04042022,
346 0x00000800, 0x04000800, 0x00040800, 0x04040800,
347 0x00000802, 0x04000802, 0x00040802, 0x04040802,
348 0x00002800, 0x04002800, 0x00042800, 0x04042800,
349 0x00002802, 0x04002802, 0x00042802, 0x04042802,
350 0x00000820, 0x04000820, 0x00040820, 0x04040820,
351 0x00000822, 0x04000822, 0x00040822, 0x04040822,
352 0x00002820, 0x04002820, 0x00042820, 0x04042820,
353 0x00002822, 0x04002822, 0x00042822, 0x04042822
// BOX(i,n,S): table lookup S[n][i], provided in one variant per vector width.
// NOTE(review): only the "#elif VECT_SIZE == 16" guard is visible in this
// view; the other variants are presumably selected by VECT_SIZE == 1/2/4/8
// -- TODO confirm.
// Scalar variant: i is used directly as the column index.
358 #define BOX(i,n,S) (S)[(n)][(i)]
// 2-component variant: one lookup per component (.s0, .s1), packed into a u32x.
360 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1])
// 4-component variant (.s0 .. .s3).
362 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3])
// 8-component variant (.s0 .. .s7).
364 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7])
365 #elif VECT_SIZE == 16
// 16-component variant (.s0 .. .sf).
366 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7], (S)[(n)][(i).s8], (S)[(n)][(i).s9], (S)[(n)][(i).sa], (S)[(n)][(i).sb], (S)[(n)][(i).sc], (S)[(n)][(i).sd], (S)[(n)][(i).se], (S)[(n)][(i).sf])
// DES block encryption helper (per its name).
//   iv        - two-word buffer; the callers pass the same buffer on every call
//               and later use it as the result (how it is written is not
//               visible in this view)
//   data      - two-word input block
//   Kc, Kd    - 16 round-subkey words each
//   s_SPtrans - __local 8x64 lookup table read through BOX()
// NOTE(review): lines are missing from this view (declarations, the
// assignments to u, the load of data[] and the store to iv[]); the comments
// below only describe the visible statements.
369 void _des_crypt_encrypt (u32x iv[2], u32x data[2], u32x Kc[16], u32x Kd[16], __local u32 (*s_SPtrans)[64])
// 16 rounds, two per loop iteration: the first half updates l from r, the
// second half updates r from l.
384 for (u32 i = 0; i < 16; i += 2)
// t mixes the Kd subkey with r rotated left by 28 bits.
390 t = Kd[i + 0] ^ rotl32 (r, 28u);
// XOR into l the OR of eight lookups: 6-bit fields taken at bit offsets
// 2/10/18/26 of u index the even rows (0,2,4,6), the same fields of t index
// the odd rows (1,3,5,7).
392 l ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
393 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
394 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
395 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
396 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
397 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
398 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
399 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
// Second round of the pair: same structure with l and r exchanged and the
// next subkey (i + 1).
402 t = Kd[i + 1] ^ rotl32 (l, 28u);
404 r ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
405 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
406 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
407 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
408 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
409 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
410 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
411 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
// DES key schedule helper (per its name): fills Kc[0..15] and Kd[0..15] from
// the two key words c and d.
//   c, d   - key halves, passed by value and modified locally
//   Kc, Kd - output arrays, one word each per round
//   s_skb  - __local 8x64 lookup table read through BOX()
// NOTE(review): lines are missing from this view (declarations, braces, the
// else keyword and possibly masking statements); the comments below only
// describe the visible statements.
423 void _des_crypt_keysetup (u32x c, u32x d, u32x Kc[16], u32x Kd[16], __local u32 (*s_skb)[64])
// Initial bit shuffling of the key words with the permutation macros.
427 PERM_OP (d, c, tt, 4, 0x0f0f0f0f);
428 HPERM_OP (c, tt, 2, 0xcccc0000);
429 HPERM_OP (d, tt, 2, 0xcccc0000);
430 PERM_OP (d, c, tt, 1, 0x55555555);
431 PERM_OP (c, d, tt, 8, 0x00ff00ff);
432 PERM_OP (d, c, tt, 1, 0x55555555);
// Rebuild d: swap its bytes 0 and 2, keep byte 1, and move the top nibble of
// c into bits 24..27.
434 d = ((d & 0x000000ff) << 16)
435 | ((d & 0x0000ff00) << 0)
436 | ((d & 0x00ff0000) >> 16)
437 | ((c & 0xf0000000) >> 4);
// One iteration per round subkey.
444 for (u32 i = 0; i < 16; i++)
// Rounds 0, 1, 8 and 15 shift both halves by one position, every other round
// by two. The (x >> k) | (x << (28 - k)) form is a rotation if c and d are
// treated as 28-bit values -- the masking is not visible here, TODO confirm.
446 if ((i < 2) || (i == 8) || (i == 15))
448 c = ((c >> 1) | (c << 27));
449 d = ((d >> 1) | (d << 27));
// Two-position variant for the remaining rounds.
453 c = ((c >> 2) | (c << 26));
454 d = ((d >> 2) | (d << 26));
// Pre-extract the bit fields of c that form the indexes into rows 0..3.
460 const u32x c00 = (c >> 0) & 0x0000003f;
461 const u32x c06 = (c >> 6) & 0x00383003;
462 const u32x c07 = (c >> 7) & 0x0000003c;
463 const u32x c13 = (c >> 13) & 0x0000060f;
464 const u32x c20 = (c >> 20) & 0x00000001;
// s: OR of the lookups in rows 0..3, indexed by the c-derived fields.
466 u32x s = BOX (((c00 >> 0) & 0xff), 0, s_skb)
467 | BOX (((c06 >> 0) & 0xff)
468 |((c07 >> 0) & 0xff), 1, s_skb)
469 | BOX (((c13 >> 0) & 0xff)
470 |((c06 >> 8) & 0xff), 2, s_skb)
471 | BOX (((c20 >> 0) & 0xff)
473 |((c06 >> 16) & 0xff), 3, s_skb);
// Pre-extract the bit fields of d that form the indexes into rows 4..7.
475 const u32x d00 = (d >> 0) & 0x00003c3f;
476 const u32x d07 = (d >> 7) & 0x00003f03;
477 const u32x d21 = (d >> 21) & 0x0000000f;
478 const u32x d22 = (d >> 22) & 0x00000030;
// t: OR of the lookups in rows 4..7, indexed by the d-derived fields.
480 u32x t = BOX (((d00 >> 0) & 0xff), 4, s_skb)
481 | BOX (((d07 >> 0) & 0xff)
482 |((d00 >> 8) & 0xff), 5, s_skb)
483 | BOX (((d07 >> 8) & 0xff), 6, s_skb)
484 | BOX (((d21 >> 0) & 0xff)
485 |((d22 >> 0) & 0xff), 7, s_skb);
// Interleave the halves: Kc takes the low 16 bits of s and of t, Kd takes the
// high 16 bits of s and of t.
487 Kc[i] = ((t << 16) | (s & 0x0000ffff));
488 Kd[i] = ((s >> 16) | (t & 0xffff0000));
// Store both subkey words rotated left by 2.
490 Kc[i] = rotl32 (Kc[i], 2u);
491 Kd[i] = rotl32 (Kd[i], 2u);
// Multi-hash kernel entry point (result check via COMPARE_M_SIMD).
// Visible flow: stage the DES tables in __local memory, load this work-item's
// password words and the salt, then for each rule position build the salted
// buffer, run two chained DES passes over it and compare the result.
// NOTE(review): lines are missing from this view (declarations of pw_buf*,
// salt_buf*, w0..w3, dst, iv, data, Kc, Kd, and the key1 precompute); the
// comments below only describe the visible statements.
495 __kernel void m03100_m04 (__global pw_t *pws, __global kernel_rule_t * rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Work-item identifiers: global id, id within the work-group, work-group size.
501 const u32 gid = get_global_id (0);
502 const u32 lid = get_local_id (0);
503 const u32 lsz = get_local_size (0);
// Work-group-local copies of the two constant tables.
509 __local u32 s_SPtrans[8][64];
510 __local u32 s_skb[8][64];
// Each work-item copies columns lid, lid + lsz, ... of all eight rows of both
// tables.
512 for (u32 i = lid; i < 64; i += lsz)
514 s_SPtrans[0][i] = c_SPtrans[0][i];
515 s_SPtrans[1][i] = c_SPtrans[1][i];
516 s_SPtrans[2][i] = c_SPtrans[2][i];
517 s_SPtrans[3][i] = c_SPtrans[3][i];
518 s_SPtrans[4][i] = c_SPtrans[4][i];
519 s_SPtrans[5][i] = c_SPtrans[5][i];
520 s_SPtrans[6][i] = c_SPtrans[6][i];
521 s_SPtrans[7][i] = c_SPtrans[7][i];
523 s_skb[0][i] = c_skb[0][i];
524 s_skb[1][i] = c_skb[1][i];
525 s_skb[2][i] = c_skb[2][i];
526 s_skb[3][i] = c_skb[3][i];
527 s_skb[4][i] = c_skb[4][i];
528 s_skb[5][i] = c_skb[5][i];
529 s_skb[6][i] = c_skb[6][i];
530 s_skb[7][i] = c_skb[7][i];
// Local-memory barrier after the copy; the out-of-range early return comes
// only after it, so out-of-range work-items still take part in the copy.
533 barrier (CLK_LOCAL_MEM_FENCE);
535 if (gid >= gid_max) return;
// Load the eight password words and the password length for this work-item.
544 pw_buf0[0] = pws[gid].i[0];
545 pw_buf0[1] = pws[gid].i[1];
546 pw_buf0[2] = pws[gid].i[2];
547 pw_buf0[3] = pws[gid].i[3];
548 pw_buf1[0] = pws[gid].i[4];
549 pw_buf1[1] = pws[gid].i[5];
550 pw_buf1[2] = pws[gid].i[6];
551 pw_buf1[3] = pws[gid].i[7];
553 const u32 pw_len = pws[gid].pw_len;
// Load the eight salt words and the salt length for the salt at salt_pos.
562 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
563 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
564 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
565 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
566 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
567 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
568 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
569 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
571 const u32 salt_len = salt_bufs[salt_pos].salt_len;
// Main loop over rule positions, VECT_SIZE at a time.
577 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
// Apply the rules at il_pos to the base password; the result goes to w0/w1 and
// its length to out_len.
584 const u32x out_len = apply_rules_vect (pw_buf0, pw_buf1, pw_len, rules_buf, il_pos, w0, w1);
// Twice the combined length: every input byte is widened to two bytes further
// down.
586 const u32x salt_word_len = (salt_len + out_len) * 2;
// Offset the candidate by salt_len (presumably making room for the salt in
// front -- TODO confirm the helper's semantics), then OR the salt words in.
592 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
596 dst[ 0] = w0[0] | salt_buf0[0];
597 dst[ 1] = w0[1] | salt_buf0[1];
598 dst[ 2] = w0[2] | salt_buf0[2];
599 dst[ 3] = w0[3] | salt_buf0[3];
600 dst[ 4] = w1[0] | salt_buf1[0];
601 dst[ 5] = w1[1] | salt_buf1[1];
602 dst[ 6] = w1[2] | salt_buf1[2];
603 dst[ 7] = w1[3] | salt_buf1[3];
614 * precompute key1 since key is static: 0x0123456789abcdef
615 * plus LEFT_ROTATE by 2
657 * key1 (generate key)
// First pass: one dst word (4 input bytes -> 8 widened bytes) per iteration.
665 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
// Widen dst[k]: each of its four bytes lands in the upper byte of a 16-bit
// half of data[0] / data[1]; the lower byte of each half is zero.
669 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
670 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
675 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
679 * key2 (generate hash)
// The iv produced by the first pass becomes the key for the second pass.
682 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
// Second pass over the same widened input with the new key schedule.
687 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
691 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
692 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
697 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
// Compare the two result words; z fills the remaining two digest slots.
706 COMPARE_M_SIMD (iv[0], iv[1], z, z);
// Multi-hash kernel entry point, _m08 variant.
// NOTE(review): only the signature is visible in this view and no body
// statements appear before the next kernel; presumably an empty stub --
// TODO confirm.
710 __kernel void m03100_m08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Multi-hash kernel entry point, _m16 variant.
// NOTE(review): only the signature is visible in this view and no body
// statements appear before the next kernel; presumably an empty stub --
// TODO confirm.
714 __kernel void m03100_m16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Single-hash kernel entry point (result check via COMPARE_S_SIMD against the
// digest at digests_offset).
// Visible flow: stage the DES tables in __local memory, load this work-item's
// password words, the salt and the target digest words, then for each rule
// position build the salted buffer, run two chained DES passes over it and
// compare the result.
// NOTE(review): lines are missing from this view (declarations of pw_buf*,
// salt_buf*, w0..w3, dst, iv, data, Kc, Kd, the remaining search[] entries and
// the key1 precompute); the comments below only describe the visible
// statements.
718 __kernel void m03100_s04 (__global pw_t *pws, __global kernel_rule_t * rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Work-item identifiers: global id, id within the work-group, work-group size.
724 const u32 gid = get_global_id (0);
725 const u32 lid = get_local_id (0);
726 const u32 lsz = get_local_size (0);
// Work-group-local copies of the two constant tables.
732 __local u32 s_SPtrans[8][64];
733 __local u32 s_skb[8][64];
// Each work-item copies columns lid, lid + lsz, ... of all eight rows of both
// tables.
735 for (u32 i = lid; i < 64; i += lsz)
737 s_SPtrans[0][i] = c_SPtrans[0][i];
738 s_SPtrans[1][i] = c_SPtrans[1][i];
739 s_SPtrans[2][i] = c_SPtrans[2][i];
740 s_SPtrans[3][i] = c_SPtrans[3][i];
741 s_SPtrans[4][i] = c_SPtrans[4][i];
742 s_SPtrans[5][i] = c_SPtrans[5][i];
743 s_SPtrans[6][i] = c_SPtrans[6][i];
744 s_SPtrans[7][i] = c_SPtrans[7][i];
746 s_skb[0][i] = c_skb[0][i];
747 s_skb[1][i] = c_skb[1][i];
748 s_skb[2][i] = c_skb[2][i];
749 s_skb[3][i] = c_skb[3][i];
750 s_skb[4][i] = c_skb[4][i];
751 s_skb[5][i] = c_skb[5][i];
752 s_skb[6][i] = c_skb[6][i];
753 s_skb[7][i] = c_skb[7][i];
// Local-memory barrier after the copy; the out-of-range early return comes
// only after it, so out-of-range work-items still take part in the copy.
756 barrier (CLK_LOCAL_MEM_FENCE);
758 if (gid >= gid_max) return;
// Load the eight password words and the password length for this work-item.
767 pw_buf0[0] = pws[gid].i[0];
768 pw_buf0[1] = pws[gid].i[1];
769 pw_buf0[2] = pws[gid].i[2];
770 pw_buf0[3] = pws[gid].i[3];
771 pw_buf1[0] = pws[gid].i[4];
772 pw_buf1[1] = pws[gid].i[5];
773 pw_buf1[2] = pws[gid].i[6];
774 pw_buf1[3] = pws[gid].i[7];
776 const u32 pw_len = pws[gid].pw_len;
// Load the eight salt words and the salt length for the salt at salt_pos.
785 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
786 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
787 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
788 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
789 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
790 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
791 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
792 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
794 const u32 salt_len = salt_bufs[salt_pos].salt_len;
// Target digest words for the single-hash comparison (only the first two of
// the four entries are visible in this view).
800 const u32 search[4] =
802 digests_buf[digests_offset].digest_buf[DGST_R0],
803 digests_buf[digests_offset].digest_buf[DGST_R1],
// Main loop over rule positions, VECT_SIZE at a time.
812 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
// Apply the rules at il_pos to the base password; the result goes to w0/w1 and
// its length to out_len.
819 const u32x out_len = apply_rules_vect (pw_buf0, pw_buf1, pw_len, rules_buf, il_pos, w0, w1);
// Twice the combined length: every input byte is widened to two bytes further
// down.
821 const u32x salt_word_len = (salt_len + out_len) * 2;
// Offset the candidate by salt_len (presumably making room for the salt in
// front -- TODO confirm the helper's semantics), then OR the salt words in.
827 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
831 dst[ 0] = w0[0] | salt_buf0[0];
832 dst[ 1] = w0[1] | salt_buf0[1];
833 dst[ 2] = w0[2] | salt_buf0[2];
834 dst[ 3] = w0[3] | salt_buf0[3];
835 dst[ 4] = w1[0] | salt_buf1[0];
836 dst[ 5] = w1[1] | salt_buf1[1];
837 dst[ 6] = w1[2] | salt_buf1[2];
838 dst[ 7] = w1[3] | salt_buf1[3];
849 * precompute key1 since key is static: 0x0123456789abcdef
850 * plus LEFT_ROTATE by 2
892 * key1 (generate key)
// First pass: one dst word (4 input bytes -> 8 widened bytes) per iteration.
900 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
// Widen dst[k]: each of its four bytes lands in the upper byte of a 16-bit
// half of data[0] / data[1]; the lower byte of each half is zero.
904 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
905 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
910 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
914 * key2 (generate hash)
// The iv produced by the first pass becomes the key for the second pass.
917 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
// Second pass over the same widened input with the new key schedule.
922 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
926 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
927 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
932 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
// Compare the two result words; z fills the remaining two digest slots.
941 COMPARE_S_SIMD (iv[0], iv[1], z, z);
// Single-hash kernel entry point, _s08 variant.
// NOTE(review): only the signature is visible in this view and no body
// statements appear before the next kernel; presumably an empty stub --
// TODO confirm.
945 __kernel void m03100_s08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Single-hash kernel entry point, _s16 variant.
// NOTE(review): only the signature is visible in this view; the body (if any)
// is past the end of the visible source -- presumably an empty stub, TODO
// confirm.
949 __kernel void m03100_s16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)