2 * Authors.....: Jens Steube <jens.steube@gmail.com>
3 * Gabriele Gristina <matrix@hashcat.net>
11 //#define NEW_SIMD_CODE
13 #include "include/constants.h"
14 #include "include/kernel_vendor.h"
21 #include "include/kernel_functions.c"
22 #include "OpenCL/types_ocl.c"
23 #include "OpenCL/common.c"
24 #include "OpenCL/simd.c"
26 #define PERM_OP(a,b,tt,n,m) \
36 #define HPERM_OP(a,tt,n,m) \
42 tt = tt >> (16 + n); \
48 PERM_OP (r, l, tt, 4, 0x0f0f0f0f); \
49 PERM_OP (l, r, tt, 16, 0x0000ffff); \
50 PERM_OP (r, l, tt, 2, 0x33333333); \
51 PERM_OP (l, r, tt, 8, 0x00ff00ff); \
52 PERM_OP (r, l, tt, 1, 0x55555555); \
57 PERM_OP (l, r, tt, 1, 0x55555555); \
58 PERM_OP (r, l, tt, 8, 0x00ff00ff); \
59 PERM_OP (l, r, tt, 2, 0x33333333); \
60 PERM_OP (r, l, tt, 16, 0x0000ffff); \
61 PERM_OP (l, r, tt, 4, 0x0f0f0f0f); \
64 __constant u32 c_SPtrans[8][64] =
67 0x02080800, 0x00080000, 0x02000002, 0x02080802,
68 0x02000000, 0x00080802, 0x00080002, 0x02000002,
69 0x00080802, 0x02080800, 0x02080000, 0x00000802,
70 0x02000802, 0x02000000, 0x00000000, 0x00080002,
71 0x00080000, 0x00000002, 0x02000800, 0x00080800,
72 0x02080802, 0x02080000, 0x00000802, 0x02000800,
73 0x00000002, 0x00000800, 0x00080800, 0x02080002,
74 0x00000800, 0x02000802, 0x02080002, 0x00000000,
75 0x00000000, 0x02080802, 0x02000800, 0x00080002,
76 0x02080800, 0x00080000, 0x00000802, 0x02000800,
77 0x02080002, 0x00000800, 0x00080800, 0x02000002,
78 0x00080802, 0x00000002, 0x02000002, 0x02080000,
79 0x02080802, 0x00080800, 0x02080000, 0x02000802,
80 0x02000000, 0x00000802, 0x00080002, 0x00000000,
81 0x00080000, 0x02000000, 0x02000802, 0x02080800,
82 0x00000002, 0x02080002, 0x00000800, 0x00080802,
85 0x40108010, 0x00000000, 0x00108000, 0x40100000,
86 0x40000010, 0x00008010, 0x40008000, 0x00108000,
87 0x00008000, 0x40100010, 0x00000010, 0x40008000,
88 0x00100010, 0x40108000, 0x40100000, 0x00000010,
89 0x00100000, 0x40008010, 0x40100010, 0x00008000,
90 0x00108010, 0x40000000, 0x00000000, 0x00100010,
91 0x40008010, 0x00108010, 0x40108000, 0x40000010,
92 0x40000000, 0x00100000, 0x00008010, 0x40108010,
93 0x00100010, 0x40108000, 0x40008000, 0x00108010,
94 0x40108010, 0x00100010, 0x40000010, 0x00000000,
95 0x40000000, 0x00008010, 0x00100000, 0x40100010,
96 0x00008000, 0x40000000, 0x00108010, 0x40008010,
97 0x40108000, 0x00008000, 0x00000000, 0x40000010,
98 0x00000010, 0x40108010, 0x00108000, 0x40100000,
99 0x40100010, 0x00100000, 0x00008010, 0x40008000,
100 0x40008010, 0x00000010, 0x40100000, 0x00108000,
103 0x04000001, 0x04040100, 0x00000100, 0x04000101,
104 0x00040001, 0x04000000, 0x04000101, 0x00040100,
105 0x04000100, 0x00040000, 0x04040000, 0x00000001,
106 0x04040101, 0x00000101, 0x00000001, 0x04040001,
107 0x00000000, 0x00040001, 0x04040100, 0x00000100,
108 0x00000101, 0x04040101, 0x00040000, 0x04000001,
109 0x04040001, 0x04000100, 0x00040101, 0x04040000,
110 0x00040100, 0x00000000, 0x04000000, 0x00040101,
111 0x04040100, 0x00000100, 0x00000001, 0x00040000,
112 0x00000101, 0x00040001, 0x04040000, 0x04000101,
113 0x00000000, 0x04040100, 0x00040100, 0x04040001,
114 0x00040001, 0x04000000, 0x04040101, 0x00000001,
115 0x00040101, 0x04000001, 0x04000000, 0x04040101,
116 0x00040000, 0x04000100, 0x04000101, 0x00040100,
117 0x04000100, 0x00000000, 0x04040001, 0x00000101,
118 0x04000001, 0x00040101, 0x00000100, 0x04040000,
121 0x00401008, 0x10001000, 0x00000008, 0x10401008,
122 0x00000000, 0x10400000, 0x10001008, 0x00400008,
123 0x10401000, 0x10000008, 0x10000000, 0x00001008,
124 0x10000008, 0x00401008, 0x00400000, 0x10000000,
125 0x10400008, 0x00401000, 0x00001000, 0x00000008,
126 0x00401000, 0x10001008, 0x10400000, 0x00001000,
127 0x00001008, 0x00000000, 0x00400008, 0x10401000,
128 0x10001000, 0x10400008, 0x10401008, 0x00400000,
129 0x10400008, 0x00001008, 0x00400000, 0x10000008,
130 0x00401000, 0x10001000, 0x00000008, 0x10400000,
131 0x10001008, 0x00000000, 0x00001000, 0x00400008,
132 0x00000000, 0x10400008, 0x10401000, 0x00001000,
133 0x10000000, 0x10401008, 0x00401008, 0x00400000,
134 0x10401008, 0x00000008, 0x10001000, 0x00401008,
135 0x00400008, 0x00401000, 0x10400000, 0x10001008,
136 0x00001008, 0x10000000, 0x10000008, 0x10401000,
139 0x08000000, 0x00010000, 0x00000400, 0x08010420,
140 0x08010020, 0x08000400, 0x00010420, 0x08010000,
141 0x00010000, 0x00000020, 0x08000020, 0x00010400,
142 0x08000420, 0x08010020, 0x08010400, 0x00000000,
143 0x00010400, 0x08000000, 0x00010020, 0x00000420,
144 0x08000400, 0x00010420, 0x00000000, 0x08000020,
145 0x00000020, 0x08000420, 0x08010420, 0x00010020,
146 0x08010000, 0x00000400, 0x00000420, 0x08010400,
147 0x08010400, 0x08000420, 0x00010020, 0x08010000,
148 0x00010000, 0x00000020, 0x08000020, 0x08000400,
149 0x08000000, 0x00010400, 0x08010420, 0x00000000,
150 0x00010420, 0x08000000, 0x00000400, 0x00010020,
151 0x08000420, 0x00000400, 0x00000000, 0x08010420,
152 0x08010020, 0x08010400, 0x00000420, 0x00010000,
153 0x00010400, 0x08010020, 0x08000400, 0x00000420,
154 0x00000020, 0x00010420, 0x08010000, 0x08000020,
157 0x80000040, 0x00200040, 0x00000000, 0x80202000,
158 0x00200040, 0x00002000, 0x80002040, 0x00200000,
159 0x00002040, 0x80202040, 0x00202000, 0x80000000,
160 0x80002000, 0x80000040, 0x80200000, 0x00202040,
161 0x00200000, 0x80002040, 0x80200040, 0x00000000,
162 0x00002000, 0x00000040, 0x80202000, 0x80200040,
163 0x80202040, 0x80200000, 0x80000000, 0x00002040,
164 0x00000040, 0x00202000, 0x00202040, 0x80002000,
165 0x00002040, 0x80000000, 0x80002000, 0x00202040,
166 0x80202000, 0x00200040, 0x00000000, 0x80002000,
167 0x80000000, 0x00002000, 0x80200040, 0x00200000,
168 0x00200040, 0x80202040, 0x00202000, 0x00000040,
169 0x80202040, 0x00202000, 0x00200000, 0x80002040,
170 0x80000040, 0x80200000, 0x00202040, 0x00000000,
171 0x00002000, 0x80000040, 0x80002040, 0x80202000,
172 0x80200000, 0x00002040, 0x00000040, 0x80200040,
175 0x00004000, 0x00000200, 0x01000200, 0x01000004,
176 0x01004204, 0x00004004, 0x00004200, 0x00000000,
177 0x01000000, 0x01000204, 0x00000204, 0x01004000,
178 0x00000004, 0x01004200, 0x01004000, 0x00000204,
179 0x01000204, 0x00004000, 0x00004004, 0x01004204,
180 0x00000000, 0x01000200, 0x01000004, 0x00004200,
181 0x01004004, 0x00004204, 0x01004200, 0x00000004,
182 0x00004204, 0x01004004, 0x00000200, 0x01000000,
183 0x00004204, 0x01004000, 0x01004004, 0x00000204,
184 0x00004000, 0x00000200, 0x01000000, 0x01004004,
185 0x01000204, 0x00004204, 0x00004200, 0x00000000,
186 0x00000200, 0x01000004, 0x00000004, 0x01000200,
187 0x00000000, 0x01000204, 0x01000200, 0x00004200,
188 0x00000204, 0x00004000, 0x01004204, 0x01000000,
189 0x01004200, 0x00000004, 0x00004004, 0x01004204,
190 0x01000004, 0x01004200, 0x01004000, 0x00004004,
193 0x20800080, 0x20820000, 0x00020080, 0x00000000,
194 0x20020000, 0x00800080, 0x20800000, 0x20820080,
195 0x00000080, 0x20000000, 0x00820000, 0x00020080,
196 0x00820080, 0x20020080, 0x20000080, 0x20800000,
197 0x00020000, 0x00820080, 0x00800080, 0x20020000,
198 0x20820080, 0x20000080, 0x00000000, 0x00820000,
199 0x20000000, 0x00800000, 0x20020080, 0x20800080,
200 0x00800000, 0x00020000, 0x20820000, 0x00000080,
201 0x00800000, 0x00020000, 0x20000080, 0x20820080,
202 0x00020080, 0x20000000, 0x00000000, 0x00820000,
203 0x20800080, 0x20020080, 0x20020000, 0x00800080,
204 0x20820000, 0x00000080, 0x00800080, 0x20020000,
205 0x20820080, 0x00800000, 0x20800000, 0x20000080,
206 0x00820000, 0x00020080, 0x20020080, 0x20800000,
207 0x00000080, 0x20820000, 0x00820080, 0x00000000,
208 0x20000000, 0x20800080, 0x00020000, 0x00820080,
212 __constant u32 c_skb[8][64] =
215 0x00000000, 0x00000010, 0x20000000, 0x20000010,
216 0x00010000, 0x00010010, 0x20010000, 0x20010010,
217 0x00000800, 0x00000810, 0x20000800, 0x20000810,
218 0x00010800, 0x00010810, 0x20010800, 0x20010810,
219 0x00000020, 0x00000030, 0x20000020, 0x20000030,
220 0x00010020, 0x00010030, 0x20010020, 0x20010030,
221 0x00000820, 0x00000830, 0x20000820, 0x20000830,
222 0x00010820, 0x00010830, 0x20010820, 0x20010830,
223 0x00080000, 0x00080010, 0x20080000, 0x20080010,
224 0x00090000, 0x00090010, 0x20090000, 0x20090010,
225 0x00080800, 0x00080810, 0x20080800, 0x20080810,
226 0x00090800, 0x00090810, 0x20090800, 0x20090810,
227 0x00080020, 0x00080030, 0x20080020, 0x20080030,
228 0x00090020, 0x00090030, 0x20090020, 0x20090030,
229 0x00080820, 0x00080830, 0x20080820, 0x20080830,
230 0x00090820, 0x00090830, 0x20090820, 0x20090830,
233 0x00000000, 0x02000000, 0x00002000, 0x02002000,
234 0x00200000, 0x02200000, 0x00202000, 0x02202000,
235 0x00000004, 0x02000004, 0x00002004, 0x02002004,
236 0x00200004, 0x02200004, 0x00202004, 0x02202004,
237 0x00000400, 0x02000400, 0x00002400, 0x02002400,
238 0x00200400, 0x02200400, 0x00202400, 0x02202400,
239 0x00000404, 0x02000404, 0x00002404, 0x02002404,
240 0x00200404, 0x02200404, 0x00202404, 0x02202404,
241 0x10000000, 0x12000000, 0x10002000, 0x12002000,
242 0x10200000, 0x12200000, 0x10202000, 0x12202000,
243 0x10000004, 0x12000004, 0x10002004, 0x12002004,
244 0x10200004, 0x12200004, 0x10202004, 0x12202004,
245 0x10000400, 0x12000400, 0x10002400, 0x12002400,
246 0x10200400, 0x12200400, 0x10202400, 0x12202400,
247 0x10000404, 0x12000404, 0x10002404, 0x12002404,
248 0x10200404, 0x12200404, 0x10202404, 0x12202404,
251 0x00000000, 0x00000001, 0x00040000, 0x00040001,
252 0x01000000, 0x01000001, 0x01040000, 0x01040001,
253 0x00000002, 0x00000003, 0x00040002, 0x00040003,
254 0x01000002, 0x01000003, 0x01040002, 0x01040003,
255 0x00000200, 0x00000201, 0x00040200, 0x00040201,
256 0x01000200, 0x01000201, 0x01040200, 0x01040201,
257 0x00000202, 0x00000203, 0x00040202, 0x00040203,
258 0x01000202, 0x01000203, 0x01040202, 0x01040203,
259 0x08000000, 0x08000001, 0x08040000, 0x08040001,
260 0x09000000, 0x09000001, 0x09040000, 0x09040001,
261 0x08000002, 0x08000003, 0x08040002, 0x08040003,
262 0x09000002, 0x09000003, 0x09040002, 0x09040003,
263 0x08000200, 0x08000201, 0x08040200, 0x08040201,
264 0x09000200, 0x09000201, 0x09040200, 0x09040201,
265 0x08000202, 0x08000203, 0x08040202, 0x08040203,
266 0x09000202, 0x09000203, 0x09040202, 0x09040203,
269 0x00000000, 0x00100000, 0x00000100, 0x00100100,
270 0x00000008, 0x00100008, 0x00000108, 0x00100108,
271 0x00001000, 0x00101000, 0x00001100, 0x00101100,
272 0x00001008, 0x00101008, 0x00001108, 0x00101108,
273 0x04000000, 0x04100000, 0x04000100, 0x04100100,
274 0x04000008, 0x04100008, 0x04000108, 0x04100108,
275 0x04001000, 0x04101000, 0x04001100, 0x04101100,
276 0x04001008, 0x04101008, 0x04001108, 0x04101108,
277 0x00020000, 0x00120000, 0x00020100, 0x00120100,
278 0x00020008, 0x00120008, 0x00020108, 0x00120108,
279 0x00021000, 0x00121000, 0x00021100, 0x00121100,
280 0x00021008, 0x00121008, 0x00021108, 0x00121108,
281 0x04020000, 0x04120000, 0x04020100, 0x04120100,
282 0x04020008, 0x04120008, 0x04020108, 0x04120108,
283 0x04021000, 0x04121000, 0x04021100, 0x04121100,
284 0x04021008, 0x04121008, 0x04021108, 0x04121108,
287 0x00000000, 0x10000000, 0x00010000, 0x10010000,
288 0x00000004, 0x10000004, 0x00010004, 0x10010004,
289 0x20000000, 0x30000000, 0x20010000, 0x30010000,
290 0x20000004, 0x30000004, 0x20010004, 0x30010004,
291 0x00100000, 0x10100000, 0x00110000, 0x10110000,
292 0x00100004, 0x10100004, 0x00110004, 0x10110004,
293 0x20100000, 0x30100000, 0x20110000, 0x30110000,
294 0x20100004, 0x30100004, 0x20110004, 0x30110004,
295 0x00001000, 0x10001000, 0x00011000, 0x10011000,
296 0x00001004, 0x10001004, 0x00011004, 0x10011004,
297 0x20001000, 0x30001000, 0x20011000, 0x30011000,
298 0x20001004, 0x30001004, 0x20011004, 0x30011004,
299 0x00101000, 0x10101000, 0x00111000, 0x10111000,
300 0x00101004, 0x10101004, 0x00111004, 0x10111004,
301 0x20101000, 0x30101000, 0x20111000, 0x30111000,
302 0x20101004, 0x30101004, 0x20111004, 0x30111004,
305 0x00000000, 0x08000000, 0x00000008, 0x08000008,
306 0x00000400, 0x08000400, 0x00000408, 0x08000408,
307 0x00020000, 0x08020000, 0x00020008, 0x08020008,
308 0x00020400, 0x08020400, 0x00020408, 0x08020408,
309 0x00000001, 0x08000001, 0x00000009, 0x08000009,
310 0x00000401, 0x08000401, 0x00000409, 0x08000409,
311 0x00020001, 0x08020001, 0x00020009, 0x08020009,
312 0x00020401, 0x08020401, 0x00020409, 0x08020409,
313 0x02000000, 0x0A000000, 0x02000008, 0x0A000008,
314 0x02000400, 0x0A000400, 0x02000408, 0x0A000408,
315 0x02020000, 0x0A020000, 0x02020008, 0x0A020008,
316 0x02020400, 0x0A020400, 0x02020408, 0x0A020408,
317 0x02000001, 0x0A000001, 0x02000009, 0x0A000009,
318 0x02000401, 0x0A000401, 0x02000409, 0x0A000409,
319 0x02020001, 0x0A020001, 0x02020009, 0x0A020009,
320 0x02020401, 0x0A020401, 0x02020409, 0x0A020409,
323 0x00000000, 0x00000100, 0x00080000, 0x00080100,
324 0x01000000, 0x01000100, 0x01080000, 0x01080100,
325 0x00000010, 0x00000110, 0x00080010, 0x00080110,
326 0x01000010, 0x01000110, 0x01080010, 0x01080110,
327 0x00200000, 0x00200100, 0x00280000, 0x00280100,
328 0x01200000, 0x01200100, 0x01280000, 0x01280100,
329 0x00200010, 0x00200110, 0x00280010, 0x00280110,
330 0x01200010, 0x01200110, 0x01280010, 0x01280110,
331 0x00000200, 0x00000300, 0x00080200, 0x00080300,
332 0x01000200, 0x01000300, 0x01080200, 0x01080300,
333 0x00000210, 0x00000310, 0x00080210, 0x00080310,
334 0x01000210, 0x01000310, 0x01080210, 0x01080310,
335 0x00200200, 0x00200300, 0x00280200, 0x00280300,
336 0x01200200, 0x01200300, 0x01280200, 0x01280300,
337 0x00200210, 0x00200310, 0x00280210, 0x00280310,
338 0x01200210, 0x01200310, 0x01280210, 0x01280310,
341 0x00000000, 0x04000000, 0x00040000, 0x04040000,
342 0x00000002, 0x04000002, 0x00040002, 0x04040002,
343 0x00002000, 0x04002000, 0x00042000, 0x04042000,
344 0x00002002, 0x04002002, 0x00042002, 0x04042002,
345 0x00000020, 0x04000020, 0x00040020, 0x04040020,
346 0x00000022, 0x04000022, 0x00040022, 0x04040022,
347 0x00002020, 0x04002020, 0x00042020, 0x04042020,
348 0x00002022, 0x04002022, 0x00042022, 0x04042022,
349 0x00000800, 0x04000800, 0x00040800, 0x04040800,
350 0x00000802, 0x04000802, 0x00040802, 0x04040802,
351 0x00002800, 0x04002800, 0x00042800, 0x04042800,
352 0x00002802, 0x04002802, 0x00042802, 0x04042802,
353 0x00000820, 0x04000820, 0x00040820, 0x04040820,
354 0x00000822, 0x04000822, 0x00040822, 0x04040822,
355 0x00002820, 0x04002820, 0x00042820, 0x04042820,
356 0x00002822, 0x04002822, 0x00042822, 0x04042822
361 #define BOX(i,n,S) (S)[(n)][(i)]
363 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1])
365 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3])
367 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7])
368 #elif VECT_SIZE == 16
369 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7], (S)[(n)][(i).s8], (S)[(n)][(i).s9], (S)[(n)][(i).sa], (S)[(n)][(i).sb], (S)[(n)][(i).sc], (S)[(n)][(i).sd], (S)[(n)][(i).se], (S)[(n)][(i).sf])
372 static void _des_crypt_encrypt (u32x iv[2], u32x data[2], u32x Kc[16], u32x Kd[16], __local u32 (*s_SPtrans)[64])
385 for (u32 i = 0; i < 16; i += 2)
391 t = Kd[i + 0] ^ rotl32 (r, 28u);
393 l ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
394 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
395 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
396 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
397 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
398 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
399 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
400 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
403 t = Kd[i + 1] ^ rotl32 (l, 28u);
405 r ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
406 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
407 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
408 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
409 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
410 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
411 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
412 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
424 static void _des_crypt_keysetup (u32x c, u32x d, u32x Kc[16], u32x Kd[16], __local u32 (*s_skb)[64])
428 PERM_OP (d, c, tt, 4, 0x0f0f0f0f);
429 HPERM_OP (c, tt, 2, 0xcccc0000);
430 HPERM_OP (d, tt, 2, 0xcccc0000);
431 PERM_OP (d, c, tt, 1, 0x55555555);
432 PERM_OP (c, d, tt, 8, 0x00ff00ff);
433 PERM_OP (d, c, tt, 1, 0x55555555);
435 d = ((d & 0x000000ff) << 16)
436 | ((d & 0x0000ff00) << 0)
437 | ((d & 0x00ff0000) >> 16)
438 | ((c & 0xf0000000) >> 4);
443 for (u32 i = 0; i < 16; i++)
445 if ((i < 2) || (i == 8) || (i == 15))
447 c = ((c >> 1) | (c << 27));
448 d = ((d >> 1) | (d << 27));
452 c = ((c >> 2) | (c << 26));
453 d = ((d >> 2) | (d << 26));
459 const u32x c00 = (c >> 0) & 0x0000003f;
460 const u32x c06 = (c >> 6) & 0x00383003;
461 const u32x c07 = (c >> 7) & 0x0000003c;
462 const u32x c13 = (c >> 13) & 0x0000060f;
463 const u32x c20 = (c >> 20) & 0x00000001;
465 u32x s = BOX (((c00 >> 0) & 0xff), 0, s_skb)
466 | BOX (((c06 >> 0) & 0xff)
467 |((c07 >> 0) & 0xff), 1, s_skb)
468 | BOX (((c13 >> 0) & 0xff)
469 |((c06 >> 8) & 0xff), 2, s_skb)
470 | BOX (((c20 >> 0) & 0xff)
472 |((c06 >> 16) & 0xff), 3, s_skb);
474 const u32x d00 = (d >> 0) & 0x00003c3f;
475 const u32x d07 = (d >> 7) & 0x00003f03;
476 const u32x d21 = (d >> 21) & 0x0000000f;
477 const u32x d22 = (d >> 22) & 0x00000030;
479 u32x t = BOX (((d00 >> 0) & 0xff), 4, s_skb)
480 | BOX (((d07 >> 0) & 0xff)
481 |((d00 >> 8) & 0xff), 5, s_skb)
482 | BOX (((d07 >> 8) & 0xff), 6, s_skb)
483 | BOX (((d21 >> 0) & 0xff)
484 |((d22 >> 0) & 0xff), 7, s_skb);
486 Kc[i] = ((t << 16) | (s & 0x0000ffff));
487 Kd[i] = ((s >> 16) | (t & 0xffff0000));
489 Kc[i] = rotl32 (Kc[i], 2u);
490 Kd[i] = rotl32 (Kd[i], 2u);
494 __kernel void m03100_m04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
500 const u32 gid = get_global_id (0);
501 const u32 lid = get_local_id (0);
502 const u32 lsz = get_local_size (0);
508 __local u32 s_SPtrans[8][64];
509 __local u32 s_skb[8][64];
511 for (u32 i = lid; i < 64; i += lsz)
513 s_SPtrans[0][i] = c_SPtrans[0][i];
514 s_SPtrans[1][i] = c_SPtrans[1][i];
515 s_SPtrans[2][i] = c_SPtrans[2][i];
516 s_SPtrans[3][i] = c_SPtrans[3][i];
517 s_SPtrans[4][i] = c_SPtrans[4][i];
518 s_SPtrans[5][i] = c_SPtrans[5][i];
519 s_SPtrans[6][i] = c_SPtrans[6][i];
520 s_SPtrans[7][i] = c_SPtrans[7][i];
522 s_skb[0][i] = c_skb[0][i];
523 s_skb[1][i] = c_skb[1][i];
524 s_skb[2][i] = c_skb[2][i];
525 s_skb[3][i] = c_skb[3][i];
526 s_skb[4][i] = c_skb[4][i];
527 s_skb[5][i] = c_skb[5][i];
528 s_skb[6][i] = c_skb[6][i];
529 s_skb[7][i] = c_skb[7][i];
532 barrier (CLK_LOCAL_MEM_FENCE);
534 if (gid >= gid_max) return;
543 pw_buf0[0] = pws[gid].i[0];
544 pw_buf0[1] = pws[gid].i[1];
545 pw_buf0[2] = pws[gid].i[2];
546 pw_buf0[3] = pws[gid].i[3];
547 pw_buf1[0] = pws[gid].i[4];
548 pw_buf1[1] = pws[gid].i[5];
549 pw_buf1[2] = pws[gid].i[6];
550 pw_buf1[3] = pws[gid].i[7];
552 const u32 pw_l_len = pws[gid].pw_len;
561 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
562 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
563 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
564 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
565 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
566 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
567 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
568 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
570 const u32 salt_len = salt_bufs[salt_pos].salt_len;
576 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
578 const u32x pw_r_len = pwlenx_create_combt (combs_buf, il_pos);
580 const u32x pw_len = pw_l_len + pw_r_len;
582 const u32x salt_word_len = (salt_len + pw_len) * 2;
585 * concat password candidate
588 u32x wordl0[4] = { 0 };
589 u32x wordl1[4] = { 0 };
590 u32x wordl2[4] = { 0 };
591 u32x wordl3[4] = { 0 };
593 wordl0[0] = pw_buf0[0];
594 wordl0[1] = pw_buf0[1];
595 wordl0[2] = pw_buf0[2];
596 wordl0[3] = pw_buf0[3];
597 wordl1[0] = pw_buf1[0];
598 wordl1[1] = pw_buf1[1];
599 wordl1[2] = pw_buf1[2];
600 wordl1[3] = pw_buf1[3];
602 u32x wordr0[4] = { 0 };
603 u32x wordr1[4] = { 0 };
604 u32x wordr2[4] = { 0 };
605 u32x wordr3[4] = { 0 };
607 wordr0[0] = ix_create_combt (combs_buf, il_pos, 0);
608 wordr0[1] = ix_create_combt (combs_buf, il_pos, 1);
609 wordr0[2] = ix_create_combt (combs_buf, il_pos, 2);
610 wordr0[3] = ix_create_combt (combs_buf, il_pos, 3);
611 wordr1[0] = ix_create_combt (combs_buf, il_pos, 4);
612 wordr1[1] = ix_create_combt (combs_buf, il_pos, 5);
613 wordr1[2] = ix_create_combt (combs_buf, il_pos, 6);
614 wordr1[3] = ix_create_combt (combs_buf, il_pos, 7);
616 if (combs_mode == COMBINATOR_MODE_BASE_LEFT)
618 switch_buffer_by_offset_le_VV (wordr0, wordr1, wordr2, wordr3, pw_l_len);
622 switch_buffer_by_offset_le_VV (wordl0, wordl1, wordl2, wordl3, pw_r_len);
630 w0[0] = wordl0[0] | wordr0[0];
631 w0[1] = wordl0[1] | wordr0[1];
632 w0[2] = wordl0[2] | wordr0[2];
633 w0[3] = wordl0[3] | wordr0[3];
634 w1[0] = wordl1[0] | wordr1[0];
635 w1[1] = wordl1[1] | wordr1[1];
636 w1[2] = wordl1[2] | wordr1[2];
637 w1[3] = wordl1[3] | wordr1[3];
638 w2[0] = wordl2[0] | wordr2[0];
639 w2[1] = wordl2[1] | wordr2[1];
640 w2[2] = wordl2[2] | wordr2[2];
641 w2[3] = wordl2[3] | wordr2[3];
642 w3[0] = wordl3[0] | wordr3[0];
643 w3[1] = wordl3[1] | wordr3[1];
644 w3[2] = wordl3[2] | wordr3[2];
645 w3[3] = wordl3[3] | wordr3[3];
651 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
655 dst[ 0] = w0[0] | salt_buf0[0];
656 dst[ 1] = w0[1] | salt_buf0[1];
657 dst[ 2] = w0[2] | salt_buf0[2];
658 dst[ 3] = w0[3] | salt_buf0[3];
659 dst[ 4] = w1[0] | salt_buf1[0];
660 dst[ 5] = w1[1] | salt_buf1[1];
661 dst[ 6] = w1[2] | salt_buf1[2];
662 dst[ 7] = w1[3] | salt_buf1[3];
673 * precompute key1 since key is static: 0x0123456789abcdef
674 * plus LEFT_ROTATE by 2
716 * key1 (generate key)
724 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
728 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
729 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
734 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
738 * key2 (generate hash)
741 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
746 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
750 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
751 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
756 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
763 const u32x r0 = iv[0];
764 const u32x r1 = iv[1];
768 COMPARE_M_SIMD (r0, r1, r2, r3);
772 __kernel void m03100_m08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
776 __kernel void m03100_m16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
780 __kernel void m03100_s04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
786 const u32 gid = get_global_id (0);
787 const u32 lid = get_local_id (0);
788 const u32 lsz = get_local_size (0);
794 __local u32 s_SPtrans[8][64];
795 __local u32 s_skb[8][64];
797 for (u32 i = lid; i < 64; i += lsz)
799 s_SPtrans[0][i] = c_SPtrans[0][i];
800 s_SPtrans[1][i] = c_SPtrans[1][i];
801 s_SPtrans[2][i] = c_SPtrans[2][i];
802 s_SPtrans[3][i] = c_SPtrans[3][i];
803 s_SPtrans[4][i] = c_SPtrans[4][i];
804 s_SPtrans[5][i] = c_SPtrans[5][i];
805 s_SPtrans[6][i] = c_SPtrans[6][i];
806 s_SPtrans[7][i] = c_SPtrans[7][i];
808 s_skb[0][i] = c_skb[0][i];
809 s_skb[1][i] = c_skb[1][i];
810 s_skb[2][i] = c_skb[2][i];
811 s_skb[3][i] = c_skb[3][i];
812 s_skb[4][i] = c_skb[4][i];
813 s_skb[5][i] = c_skb[5][i];
814 s_skb[6][i] = c_skb[6][i];
815 s_skb[7][i] = c_skb[7][i];
818 barrier (CLK_LOCAL_MEM_FENCE);
820 if (gid >= gid_max) return;
829 pw_buf0[0] = pws[gid].i[0];
830 pw_buf0[1] = pws[gid].i[1];
831 pw_buf0[2] = pws[gid].i[2];
832 pw_buf0[3] = pws[gid].i[3];
833 pw_buf1[0] = pws[gid].i[4];
834 pw_buf1[1] = pws[gid].i[5];
835 pw_buf1[2] = pws[gid].i[6];
836 pw_buf1[3] = pws[gid].i[7];
838 const u32 pw_l_len = pws[gid].pw_len;
847 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
848 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
849 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
850 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
851 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
852 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
853 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
854 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
856 const u32 salt_len = salt_bufs[salt_pos].salt_len;
862 const u32 search[4] =
864 digests_buf[digests_offset].digest_buf[DGST_R0],
865 digests_buf[digests_offset].digest_buf[DGST_R1],
866 digests_buf[digests_offset].digest_buf[DGST_R2],
867 digests_buf[digests_offset].digest_buf[DGST_R3]
874 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
876 const u32x pw_r_len = pwlenx_create_combt (combs_buf, il_pos);
878 const u32x pw_len = pw_l_len + pw_r_len;
880 const u32x salt_word_len = (salt_len + pw_len) * 2;
883 * concat password candidate
886 u32x wordl0[4] = { 0 };
887 u32x wordl1[4] = { 0 };
888 u32x wordl2[4] = { 0 };
889 u32x wordl3[4] = { 0 };
891 wordl0[0] = pw_buf0[0];
892 wordl0[1] = pw_buf0[1];
893 wordl0[2] = pw_buf0[2];
894 wordl0[3] = pw_buf0[3];
895 wordl1[0] = pw_buf1[0];
896 wordl1[1] = pw_buf1[1];
897 wordl1[2] = pw_buf1[2];
898 wordl1[3] = pw_buf1[3];
900 u32x wordr0[4] = { 0 };
901 u32x wordr1[4] = { 0 };
902 u32x wordr2[4] = { 0 };
903 u32x wordr3[4] = { 0 };
905 wordr0[0] = ix_create_combt (combs_buf, il_pos, 0);
906 wordr0[1] = ix_create_combt (combs_buf, il_pos, 1);
907 wordr0[2] = ix_create_combt (combs_buf, il_pos, 2);
908 wordr0[3] = ix_create_combt (combs_buf, il_pos, 3);
909 wordr1[0] = ix_create_combt (combs_buf, il_pos, 4);
910 wordr1[1] = ix_create_combt (combs_buf, il_pos, 5);
911 wordr1[2] = ix_create_combt (combs_buf, il_pos, 6);
912 wordr1[3] = ix_create_combt (combs_buf, il_pos, 7);
914 if (combs_mode == COMBINATOR_MODE_BASE_LEFT)
916 switch_buffer_by_offset_le_VV (wordr0, wordr1, wordr2, wordr3, pw_l_len);
920 switch_buffer_by_offset_le_VV (wordl0, wordl1, wordl2, wordl3, pw_r_len);
928 w0[0] = wordl0[0] | wordr0[0];
929 w0[1] = wordl0[1] | wordr0[1];
930 w0[2] = wordl0[2] | wordr0[2];
931 w0[3] = wordl0[3] | wordr0[3];
932 w1[0] = wordl1[0] | wordr1[0];
933 w1[1] = wordl1[1] | wordr1[1];
934 w1[2] = wordl1[2] | wordr1[2];
935 w1[3] = wordl1[3] | wordr1[3];
936 w2[0] = wordl2[0] | wordr2[0];
937 w2[1] = wordl2[1] | wordr2[1];
938 w2[2] = wordl2[2] | wordr2[2];
939 w2[3] = wordl2[3] | wordr2[3];
940 w3[0] = wordl3[0] | wordr3[0];
941 w3[1] = wordl3[1] | wordr3[1];
942 w3[2] = wordl3[2] | wordr3[2];
943 w3[3] = wordl3[3] | wordr3[3];
949 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
953 dst[ 0] = w0[0] | salt_buf0[0];
954 dst[ 1] = w0[1] | salt_buf0[1];
955 dst[ 2] = w0[2] | salt_buf0[2];
956 dst[ 3] = w0[3] | salt_buf0[3];
957 dst[ 4] = w1[0] | salt_buf1[0];
958 dst[ 5] = w1[1] | salt_buf1[1];
959 dst[ 6] = w1[2] | salt_buf1[2];
960 dst[ 7] = w1[3] | salt_buf1[3];
971 * precompute key1 since key is static: 0x0123456789abcdef
972 * plus LEFT_ROTATE by 2
1000 Kd[ 4] = 0x405cc070;
1001 Kd[ 5] = 0xa010784c;
1002 Kd[ 6] = 0x6074a800;
1003 Kd[ 7] = 0x80701c1c;
1004 Kd[ 8] = 0x9cd49430;
1005 Kd[ 9] = 0x4c8ce078;
1006 Kd[10] = 0x5c18c088;
1007 Kd[11] = 0x28a8a4c8;
1008 Kd[12] = 0x3c180838;
1009 Kd[13] = 0xb0b86c20;
1010 Kd[14] = 0xac84a094;
1011 Kd[15] = 0x4ce0c0c4;
1014 * key1 (generate key)
1022 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
1026 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
1027 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
1032 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
1036 * key2 (generate hash)
1039 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
1044 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
1048 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
1049 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
1054 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
1061 const u32x r0 = iv[0];
1062 const u32x r1 = iv[1];
1066 COMPARE_S_SIMD (r0, r1, r2, r3);
1070 __kernel void m03100_s08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
1074 __kernel void m03100_s16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)