2 * Authors.....: Jens Steube <jens.steube@gmail.com>
3 * Gabriele Gristina <matrix@hashcat.net>
11 //#define NEW_SIMD_CODE
13 #include "include/constants.h"
14 #include "include/kernel_vendor.h"
21 #include "include/kernel_functions.c"
22 #include "OpenCL/types_ocl.c"
23 #include "OpenCL/common.c"
24 #include "OpenCL/simd.c"
/**
 * Bit-permutation helper macros.
 *
 * PERM_OP (a, b, tt, n, m) and HPERM_OP (a, tt, n, m) take `n` as a shift
 * count and `m` as a bit mask; `tt` is a caller-supplied variable that the
 * macro assigns to (see the `tt = tt >> (16 + n)` step of HPERM_OP).
 * Only part of each macro body is visible in this excerpt, so the exact
 * exchange they perform must be confirmed against the full definitions.
 *
 * The two PERM_OP sequences that follow use the same five (shift, mask)
 * pairs: (4, 0x0f0f0f0f), (16, 0x0000ffff), (2, 0x33333333),
 * (8, 0x00ff00ff) and (1, 0x55555555). The second sequence applies them in
 * the reverse order with the l / r operands exchanged.
 * NOTE(review): presumably these are the DES initial and final
 * permutations - confirm against the macro names that wrap them.
 */
26 #define PERM_OP(a,b,tt,n,m) \
36 #define HPERM_OP(a,tt,n,m) \
42 tt = tt >> (16 + n); \
48 PERM_OP (r, l, tt, 4, 0x0f0f0f0f); \
49 PERM_OP (l, r, tt, 16, 0x0000ffff); \
50 PERM_OP (r, l, tt, 2, 0x33333333); \
51 PERM_OP (l, r, tt, 8, 0x00ff00ff); \
52 PERM_OP (r, l, tt, 1, 0x55555555); \
57 PERM_OP (l, r, tt, 1, 0x55555555); \
58 PERM_OP (r, l, tt, 8, 0x00ff00ff); \
59 PERM_OP (l, r, tt, 2, 0x33333333); \
60 PERM_OP (r, l, tt, 16, 0x0000ffff); \
61 PERM_OP (l, r, tt, 4, 0x0f0f0f0f); \
/**
 * c_SPtrans: eight tables of 64 32-bit words in __constant memory.
 *
 * The kernels in this file copy it into the __local array s_SPtrans, and
 * _des_crypt_encrypt reads that copy through BOX () with 6-bit indices
 * (values masked with 0x3f), one table per lookup.
 */
64 __constant u32 c_SPtrans[8][64] =
/* c_SPtrans[0][0..63] */
67 0x02080800, 0x00080000, 0x02000002, 0x02080802,
68 0x02000000, 0x00080802, 0x00080002, 0x02000002,
69 0x00080802, 0x02080800, 0x02080000, 0x00000802,
70 0x02000802, 0x02000000, 0x00000000, 0x00080002,
71 0x00080000, 0x00000002, 0x02000800, 0x00080800,
72 0x02080802, 0x02080000, 0x00000802, 0x02000800,
73 0x00000002, 0x00000800, 0x00080800, 0x02080002,
74 0x00000800, 0x02000802, 0x02080002, 0x00000000,
75 0x00000000, 0x02080802, 0x02000800, 0x00080002,
76 0x02080800, 0x00080000, 0x00000802, 0x02000800,
77 0x02080002, 0x00000800, 0x00080800, 0x02000002,
78 0x00080802, 0x00000002, 0x02000002, 0x02080000,
79 0x02080802, 0x00080800, 0x02080000, 0x02000802,
80 0x02000000, 0x00000802, 0x00080002, 0x00000000,
81 0x00080000, 0x02000000, 0x02000802, 0x02080800,
82 0x00000002, 0x02080002, 0x00000800, 0x00080802,
/* c_SPtrans[1][0..63] */
85 0x40108010, 0x00000000, 0x00108000, 0x40100000,
86 0x40000010, 0x00008010, 0x40008000, 0x00108000,
87 0x00008000, 0x40100010, 0x00000010, 0x40008000,
88 0x00100010, 0x40108000, 0x40100000, 0x00000010,
89 0x00100000, 0x40008010, 0x40100010, 0x00008000,
90 0x00108010, 0x40000000, 0x00000000, 0x00100010,
91 0x40008010, 0x00108010, 0x40108000, 0x40000010,
92 0x40000000, 0x00100000, 0x00008010, 0x40108010,
93 0x00100010, 0x40108000, 0x40008000, 0x00108010,
94 0x40108010, 0x00100010, 0x40000010, 0x00000000,
95 0x40000000, 0x00008010, 0x00100000, 0x40100010,
96 0x00008000, 0x40000000, 0x00108010, 0x40008010,
97 0x40108000, 0x00008000, 0x00000000, 0x40000010,
98 0x00000010, 0x40108010, 0x00108000, 0x40100000,
99 0x40100010, 0x00100000, 0x00008010, 0x40008000,
100 0x40008010, 0x00000010, 0x40100000, 0x00108000,
/* c_SPtrans[2][0..63] */
103 0x04000001, 0x04040100, 0x00000100, 0x04000101,
104 0x00040001, 0x04000000, 0x04000101, 0x00040100,
105 0x04000100, 0x00040000, 0x04040000, 0x00000001,
106 0x04040101, 0x00000101, 0x00000001, 0x04040001,
107 0x00000000, 0x00040001, 0x04040100, 0x00000100,
108 0x00000101, 0x04040101, 0x00040000, 0x04000001,
109 0x04040001, 0x04000100, 0x00040101, 0x04040000,
110 0x00040100, 0x00000000, 0x04000000, 0x00040101,
111 0x04040100, 0x00000100, 0x00000001, 0x00040000,
112 0x00000101, 0x00040001, 0x04040000, 0x04000101,
113 0x00000000, 0x04040100, 0x00040100, 0x04040001,
114 0x00040001, 0x04000000, 0x04040101, 0x00000001,
115 0x00040101, 0x04000001, 0x04000000, 0x04040101,
116 0x00040000, 0x04000100, 0x04000101, 0x00040100,
117 0x04000100, 0x00000000, 0x04040001, 0x00000101,
118 0x04000001, 0x00040101, 0x00000100, 0x04040000,
/* c_SPtrans[3][0..63] */
121 0x00401008, 0x10001000, 0x00000008, 0x10401008,
122 0x00000000, 0x10400000, 0x10001008, 0x00400008,
123 0x10401000, 0x10000008, 0x10000000, 0x00001008,
124 0x10000008, 0x00401008, 0x00400000, 0x10000000,
125 0x10400008, 0x00401000, 0x00001000, 0x00000008,
126 0x00401000, 0x10001008, 0x10400000, 0x00001000,
127 0x00001008, 0x00000000, 0x00400008, 0x10401000,
128 0x10001000, 0x10400008, 0x10401008, 0x00400000,
129 0x10400008, 0x00001008, 0x00400000, 0x10000008,
130 0x00401000, 0x10001000, 0x00000008, 0x10400000,
131 0x10001008, 0x00000000, 0x00001000, 0x00400008,
132 0x00000000, 0x10400008, 0x10401000, 0x00001000,
133 0x10000000, 0x10401008, 0x00401008, 0x00400000,
134 0x10401008, 0x00000008, 0x10001000, 0x00401008,
135 0x00400008, 0x00401000, 0x10400000, 0x10001008,
136 0x00001008, 0x10000000, 0x10000008, 0x10401000,
/* c_SPtrans[4][0..63] */
139 0x08000000, 0x00010000, 0x00000400, 0x08010420,
140 0x08010020, 0x08000400, 0x00010420, 0x08010000,
141 0x00010000, 0x00000020, 0x08000020, 0x00010400,
142 0x08000420, 0x08010020, 0x08010400, 0x00000000,
143 0x00010400, 0x08000000, 0x00010020, 0x00000420,
144 0x08000400, 0x00010420, 0x00000000, 0x08000020,
145 0x00000020, 0x08000420, 0x08010420, 0x00010020,
146 0x08010000, 0x00000400, 0x00000420, 0x08010400,
147 0x08010400, 0x08000420, 0x00010020, 0x08010000,
148 0x00010000, 0x00000020, 0x08000020, 0x08000400,
149 0x08000000, 0x00010400, 0x08010420, 0x00000000,
150 0x00010420, 0x08000000, 0x00000400, 0x00010020,
151 0x08000420, 0x00000400, 0x00000000, 0x08010420,
152 0x08010020, 0x08010400, 0x00000420, 0x00010000,
153 0x00010400, 0x08010020, 0x08000400, 0x00000420,
154 0x00000020, 0x00010420, 0x08010000, 0x08000020,
/* c_SPtrans[5][0..63] */
157 0x80000040, 0x00200040, 0x00000000, 0x80202000,
158 0x00200040, 0x00002000, 0x80002040, 0x00200000,
159 0x00002040, 0x80202040, 0x00202000, 0x80000000,
160 0x80002000, 0x80000040, 0x80200000, 0x00202040,
161 0x00200000, 0x80002040, 0x80200040, 0x00000000,
162 0x00002000, 0x00000040, 0x80202000, 0x80200040,
163 0x80202040, 0x80200000, 0x80000000, 0x00002040,
164 0x00000040, 0x00202000, 0x00202040, 0x80002000,
165 0x00002040, 0x80000000, 0x80002000, 0x00202040,
166 0x80202000, 0x00200040, 0x00000000, 0x80002000,
167 0x80000000, 0x00002000, 0x80200040, 0x00200000,
168 0x00200040, 0x80202040, 0x00202000, 0x00000040,
169 0x80202040, 0x00202000, 0x00200000, 0x80002040,
170 0x80000040, 0x80200000, 0x00202040, 0x00000000,
171 0x00002000, 0x80000040, 0x80002040, 0x80202000,
172 0x80200000, 0x00002040, 0x00000040, 0x80200040,
/* c_SPtrans[6][0..63] */
175 0x00004000, 0x00000200, 0x01000200, 0x01000004,
176 0x01004204, 0x00004004, 0x00004200, 0x00000000,
177 0x01000000, 0x01000204, 0x00000204, 0x01004000,
178 0x00000004, 0x01004200, 0x01004000, 0x00000204,
179 0x01000204, 0x00004000, 0x00004004, 0x01004204,
180 0x00000000, 0x01000200, 0x01000004, 0x00004200,
181 0x01004004, 0x00004204, 0x01004200, 0x00000004,
182 0x00004204, 0x01004004, 0x00000200, 0x01000000,
183 0x00004204, 0x01004000, 0x01004004, 0x00000204,
184 0x00004000, 0x00000200, 0x01000000, 0x01004004,
185 0x01000204, 0x00004204, 0x00004200, 0x00000000,
186 0x00000200, 0x01000004, 0x00000004, 0x01000200,
187 0x00000000, 0x01000204, 0x01000200, 0x00004200,
188 0x00000204, 0x00004000, 0x01004204, 0x01000000,
189 0x01004200, 0x00000004, 0x00004004, 0x01004204,
190 0x01000004, 0x01004200, 0x01004000, 0x00004004,
/* c_SPtrans[7][0..63] */
193 0x20800080, 0x20820000, 0x00020080, 0x00000000,
194 0x20020000, 0x00800080, 0x20800000, 0x20820080,
195 0x00000080, 0x20000000, 0x00820000, 0x00020080,
196 0x00820080, 0x20020080, 0x20000080, 0x20800000,
197 0x00020000, 0x00820080, 0x00800080, 0x20020000,
198 0x20820080, 0x20000080, 0x00000000, 0x00820000,
199 0x20000000, 0x00800000, 0x20020080, 0x20800080,
200 0x00800000, 0x00020000, 0x20820000, 0x00000080,
201 0x00800000, 0x00020000, 0x20000080, 0x20820080,
202 0x00020080, 0x20000000, 0x00000000, 0x00820000,
203 0x20800080, 0x20020080, 0x20020000, 0x00800080,
204 0x20820000, 0x00000080, 0x00800080, 0x20020000,
205 0x20820080, 0x00800000, 0x20800000, 0x20000080,
206 0x00820000, 0x00020080, 0x20020080, 0x20800000,
207 0x00000080, 0x20820000, 0x00820080, 0x00000000,
208 0x20000000, 0x20800080, 0x00020000, 0x00820080,
/**
 * c_skb: eight tables of 64 32-bit words in __constant memory.
 *
 * The kernels in this file copy it into the __local array s_skb, and
 * _des_crypt_keysetup reads that copy through BOX (): tables 0-3 are
 * indexed with fields taken from `c`, tables 4-7 with fields taken from `d`.
 */
212 __constant u32 c_skb[8][64] =
/* c_skb[0][0..63] */
215 0x00000000, 0x00000010, 0x20000000, 0x20000010,
216 0x00010000, 0x00010010, 0x20010000, 0x20010010,
217 0x00000800, 0x00000810, 0x20000800, 0x20000810,
218 0x00010800, 0x00010810, 0x20010800, 0x20010810,
219 0x00000020, 0x00000030, 0x20000020, 0x20000030,
220 0x00010020, 0x00010030, 0x20010020, 0x20010030,
221 0x00000820, 0x00000830, 0x20000820, 0x20000830,
222 0x00010820, 0x00010830, 0x20010820, 0x20010830,
223 0x00080000, 0x00080010, 0x20080000, 0x20080010,
224 0x00090000, 0x00090010, 0x20090000, 0x20090010,
225 0x00080800, 0x00080810, 0x20080800, 0x20080810,
226 0x00090800, 0x00090810, 0x20090800, 0x20090810,
227 0x00080020, 0x00080030, 0x20080020, 0x20080030,
228 0x00090020, 0x00090030, 0x20090020, 0x20090030,
229 0x00080820, 0x00080830, 0x20080820, 0x20080830,
230 0x00090820, 0x00090830, 0x20090820, 0x20090830,
/* c_skb[1][0..63] */
233 0x00000000, 0x02000000, 0x00002000, 0x02002000,
234 0x00200000, 0x02200000, 0x00202000, 0x02202000,
235 0x00000004, 0x02000004, 0x00002004, 0x02002004,
236 0x00200004, 0x02200004, 0x00202004, 0x02202004,
237 0x00000400, 0x02000400, 0x00002400, 0x02002400,
238 0x00200400, 0x02200400, 0x00202400, 0x02202400,
239 0x00000404, 0x02000404, 0x00002404, 0x02002404,
240 0x00200404, 0x02200404, 0x00202404, 0x02202404,
241 0x10000000, 0x12000000, 0x10002000, 0x12002000,
242 0x10200000, 0x12200000, 0x10202000, 0x12202000,
243 0x10000004, 0x12000004, 0x10002004, 0x12002004,
244 0x10200004, 0x12200004, 0x10202004, 0x12202004,
245 0x10000400, 0x12000400, 0x10002400, 0x12002400,
246 0x10200400, 0x12200400, 0x10202400, 0x12202400,
247 0x10000404, 0x12000404, 0x10002404, 0x12002404,
248 0x10200404, 0x12200404, 0x10202404, 0x12202404,
/* c_skb[2][0..63] */
251 0x00000000, 0x00000001, 0x00040000, 0x00040001,
252 0x01000000, 0x01000001, 0x01040000, 0x01040001,
253 0x00000002, 0x00000003, 0x00040002, 0x00040003,
254 0x01000002, 0x01000003, 0x01040002, 0x01040003,
255 0x00000200, 0x00000201, 0x00040200, 0x00040201,
256 0x01000200, 0x01000201, 0x01040200, 0x01040201,
257 0x00000202, 0x00000203, 0x00040202, 0x00040203,
258 0x01000202, 0x01000203, 0x01040202, 0x01040203,
259 0x08000000, 0x08000001, 0x08040000, 0x08040001,
260 0x09000000, 0x09000001, 0x09040000, 0x09040001,
261 0x08000002, 0x08000003, 0x08040002, 0x08040003,
262 0x09000002, 0x09000003, 0x09040002, 0x09040003,
263 0x08000200, 0x08000201, 0x08040200, 0x08040201,
264 0x09000200, 0x09000201, 0x09040200, 0x09040201,
265 0x08000202, 0x08000203, 0x08040202, 0x08040203,
266 0x09000202, 0x09000203, 0x09040202, 0x09040203,
/* c_skb[3][0..63] */
269 0x00000000, 0x00100000, 0x00000100, 0x00100100,
270 0x00000008, 0x00100008, 0x00000108, 0x00100108,
271 0x00001000, 0x00101000, 0x00001100, 0x00101100,
272 0x00001008, 0x00101008, 0x00001108, 0x00101108,
273 0x04000000, 0x04100000, 0x04000100, 0x04100100,
274 0x04000008, 0x04100008, 0x04000108, 0x04100108,
275 0x04001000, 0x04101000, 0x04001100, 0x04101100,
276 0x04001008, 0x04101008, 0x04001108, 0x04101108,
277 0x00020000, 0x00120000, 0x00020100, 0x00120100,
278 0x00020008, 0x00120008, 0x00020108, 0x00120108,
279 0x00021000, 0x00121000, 0x00021100, 0x00121100,
280 0x00021008, 0x00121008, 0x00021108, 0x00121108,
281 0x04020000, 0x04120000, 0x04020100, 0x04120100,
282 0x04020008, 0x04120008, 0x04020108, 0x04120108,
283 0x04021000, 0x04121000, 0x04021100, 0x04121100,
284 0x04021008, 0x04121008, 0x04021108, 0x04121108,
/* c_skb[4][0..63] */
287 0x00000000, 0x10000000, 0x00010000, 0x10010000,
288 0x00000004, 0x10000004, 0x00010004, 0x10010004,
289 0x20000000, 0x30000000, 0x20010000, 0x30010000,
290 0x20000004, 0x30000004, 0x20010004, 0x30010004,
291 0x00100000, 0x10100000, 0x00110000, 0x10110000,
292 0x00100004, 0x10100004, 0x00110004, 0x10110004,
293 0x20100000, 0x30100000, 0x20110000, 0x30110000,
294 0x20100004, 0x30100004, 0x20110004, 0x30110004,
295 0x00001000, 0x10001000, 0x00011000, 0x10011000,
296 0x00001004, 0x10001004, 0x00011004, 0x10011004,
297 0x20001000, 0x30001000, 0x20011000, 0x30011000,
298 0x20001004, 0x30001004, 0x20011004, 0x30011004,
299 0x00101000, 0x10101000, 0x00111000, 0x10111000,
300 0x00101004, 0x10101004, 0x00111004, 0x10111004,
301 0x20101000, 0x30101000, 0x20111000, 0x30111000,
302 0x20101004, 0x30101004, 0x20111004, 0x30111004,
/* c_skb[5][0..63] */
305 0x00000000, 0x08000000, 0x00000008, 0x08000008,
306 0x00000400, 0x08000400, 0x00000408, 0x08000408,
307 0x00020000, 0x08020000, 0x00020008, 0x08020008,
308 0x00020400, 0x08020400, 0x00020408, 0x08020408,
309 0x00000001, 0x08000001, 0x00000009, 0x08000009,
310 0x00000401, 0x08000401, 0x00000409, 0x08000409,
311 0x00020001, 0x08020001, 0x00020009, 0x08020009,
312 0x00020401, 0x08020401, 0x00020409, 0x08020409,
313 0x02000000, 0x0A000000, 0x02000008, 0x0A000008,
314 0x02000400, 0x0A000400, 0x02000408, 0x0A000408,
315 0x02020000, 0x0A020000, 0x02020008, 0x0A020008,
316 0x02020400, 0x0A020400, 0x02020408, 0x0A020408,
317 0x02000001, 0x0A000001, 0x02000009, 0x0A000009,
318 0x02000401, 0x0A000401, 0x02000409, 0x0A000409,
319 0x02020001, 0x0A020001, 0x02020009, 0x0A020009,
320 0x02020401, 0x0A020401, 0x02020409, 0x0A020409,
/* c_skb[6][0..63] */
323 0x00000000, 0x00000100, 0x00080000, 0x00080100,
324 0x01000000, 0x01000100, 0x01080000, 0x01080100,
325 0x00000010, 0x00000110, 0x00080010, 0x00080110,
326 0x01000010, 0x01000110, 0x01080010, 0x01080110,
327 0x00200000, 0x00200100, 0x00280000, 0x00280100,
328 0x01200000, 0x01200100, 0x01280000, 0x01280100,
329 0x00200010, 0x00200110, 0x00280010, 0x00280110,
330 0x01200010, 0x01200110, 0x01280010, 0x01280110,
331 0x00000200, 0x00000300, 0x00080200, 0x00080300,
332 0x01000200, 0x01000300, 0x01080200, 0x01080300,
333 0x00000210, 0x00000310, 0x00080210, 0x00080310,
334 0x01000210, 0x01000310, 0x01080210, 0x01080310,
335 0x00200200, 0x00200300, 0x00280200, 0x00280300,
336 0x01200200, 0x01200300, 0x01280200, 0x01280300,
337 0x00200210, 0x00200310, 0x00280210, 0x00280310,
338 0x01200210, 0x01200310, 0x01280210, 0x01280310,
/* c_skb[7][0..63] */
341 0x00000000, 0x04000000, 0x00040000, 0x04040000,
342 0x00000002, 0x04000002, 0x00040002, 0x04040002,
343 0x00002000, 0x04002000, 0x00042000, 0x04042000,
344 0x00002002, 0x04002002, 0x00042002, 0x04042002,
345 0x00000020, 0x04000020, 0x00040020, 0x04040020,
346 0x00000022, 0x04000022, 0x00040022, 0x04040022,
347 0x00002020, 0x04002020, 0x00042020, 0x04042020,
348 0x00002022, 0x04002022, 0x00042022, 0x04042022,
349 0x00000800, 0x04000800, 0x00040800, 0x04040800,
350 0x00000802, 0x04000802, 0x00040802, 0x04040802,
351 0x00002800, 0x04002800, 0x00042800, 0x04042800,
352 0x00002802, 0x04002802, 0x00042802, 0x04042802,
353 0x00000820, 0x04000820, 0x00040820, 0x04040820,
354 0x00000822, 0x04000822, 0x00040822, 0x04040822,
355 0x00002820, 0x04002820, 0x00042820, 0x04042820,
356 0x00002822, 0x04002822, 0x00042822, 0x04042822
/**
 * BOX (i, n, S): look up element `i` of table `n` in the two-dimensional
 * table `S`.
 *
 * The first form is a plain scalar access S[n][i]. The remaining forms
 * build a u32x from one scalar lookup per vector component of `i`
 * (.s0/.s1, .s0-.s3, .s0-.s7 and .s0-.sf, i.e. 2, 4, 8 and 16 components).
 * The 16-component form is selected by `#elif VECT_SIZE == 16`; the guards
 * choosing the other forms are not visible in this excerpt (presumably the
 * matching VECT_SIZE values - confirm).
 * Note that `i` is expanded once per component, so it should be free of
 * side effects.
 */
361 #define BOX(i,n,S) (S)[(n)][(i)]
363 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1])
365 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3])
367 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7])
368 #elif VECT_SIZE == 16
369 #define BOX(i,n,S) (u32x) ((S)[(n)][(i).s0], (S)[(n)][(i).s1], (S)[(n)][(i).s2], (S)[(n)][(i).s3], (S)[(n)][(i).s4], (S)[(n)][(i).s5], (S)[(n)][(i).s6], (S)[(n)][(i).s7], (S)[(n)][(i).s8], (S)[(n)][(i).s9], (S)[(n)][(i).sa], (S)[(n)][(i).sb], (S)[(n)][(i).sc], (S)[(n)][(i).sd], (S)[(n)][(i).se], (S)[(n)][(i).sf])
/**
 * Block-encryption helper used by the m03100 kernels.
 *
 * iv        - two-word vector buffer; the kernels read it back after the
 *             call (how it is written is not visible in this excerpt)
 * data      - two-word vector input block
 * Kc, Kd    - 16-entry key schedule halves
 * s_SPtrans - __local copy of c_SPtrans (8 tables of 64 words)
 *
 * The visible loop runs i = 0, 2, ..., 14 and updates `l` and then `r` once
 * per iteration, so 16 updates in total. Each update XORs in the OR of
 * eight table lookups: 6-bit fields of `u` at bit offsets 2/10/18/26 select
 * from the even tables 0/2/4/6, and the same fields of `t` select from the
 * odd tables 1/3/5/7. The assignment of `u` is not visible here.
 */
372 void _des_crypt_encrypt (u32x iv[2], u32x data[2], u32x Kc[16], u32x Kd[16], __local u32 (*s_SPtrans)[64])
385 for (u32 i = 0; i < 16; i += 2)
/* first half-step: key word Kd[i] mixed with r rotated left by 28 */
391 t = Kd[i + 0] ^ rotl32 (r, 28u);
393 l ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
394 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
395 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
396 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
397 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
398 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
399 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
400 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
/* second half-step: same shape with l and r exchanged and key word Kd[i + 1] */
403 t = Kd[i + 1] ^ rotl32 (l, 28u);
405 r ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
406 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
407 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
408 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
409 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
410 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
411 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
412 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
/**
 * Key-schedule helper: expands the two key words (c, d) into the 16-entry
 * schedule halves Kc[] and Kd[] consumed by _des_crypt_encrypt.
 *
 * c, d   - the two input key words (taken by value, modified locally)
 * Kc, Kd - output arrays, 16 entries each; every entry is written once
 * s_skb  - __local copy of c_skb (8 tables of 64 words)
 *
 * Steps visible in this excerpt:
 *  1. a fixed PERM_OP / HPERM_OP sequence mixes c and d;
 *  2. d is rebuilt from its three low bytes (bytes 0 and 2 exchanged) plus
 *     the top nibble of c moved down by four bits;
 *  3. for each of the 16 entries, c and d are shifted by 1 (i = 0, 1, 8, 15)
 *     or by 2 (all other i) using a `>> k | << (28 - k)` pattern
 *     (presumably a 28-bit rotate; the masking step is not visible -
 *     confirm), bit fields are gathered into table indices, and the
 *     s_skb lookups are ORed into s (tables 0-3) and t (tables 4-7);
 *  4. the low half of s with the low half of t forms Kc[i], the high halves
 *     form Kd[i], and both are finally rotated left by 2.
 */
424 void _des_crypt_keysetup (u32x c, u32x d, u32x Kc[16], u32x Kd[16], __local u32 (*s_skb)[64])
428 PERM_OP (d, c, tt, 4, 0x0f0f0f0f);
429 HPERM_OP (c, tt, 2, 0xcccc0000);
430 HPERM_OP (d, tt, 2, 0xcccc0000);
431 PERM_OP (d, c, tt, 1, 0x55555555);
432 PERM_OP (c, d, tt, 8, 0x00ff00ff);
433 PERM_OP (d, c, tt, 1, 0x55555555);
435 d = ((d & 0x000000ff) << 16)
436 | ((d & 0x0000ff00) << 0)
437 | ((d & 0x00ff0000) >> 16)
438 | ((c & 0xf0000000) >> 4);
443 for (u32 i = 0; i < 16; i++)
/* single-bit shift for entries 0, 1, 8 and 15; two-bit shift otherwise */
445 if ((i < 2) || (i == 8) || (i == 15))
447 c = ((c >> 1) | (c << 27));
448 d = ((d >> 1) | (d << 27));
452 c = ((c >> 2) | (c << 26));
453 d = ((d >> 2) | (d << 26));
/* gather the scattered bits of c that feed tables 0-3 */
459 const u32x c00 = (c >> 0) & 0x0000003f;
460 const u32x c06 = (c >> 6) & 0x00383003;
461 const u32x c07 = (c >> 7) & 0x0000003c;
462 const u32x c13 = (c >> 13) & 0x0000060f;
463 const u32x c20 = (c >> 20) & 0x00000001;
465 u32x s = BOX (((c00 >> 0) & 0xff), 0, s_skb)
466 | BOX (((c06 >> 0) & 0xff)
467 |((c07 >> 0) & 0xff), 1, s_skb)
468 | BOX (((c13 >> 0) & 0xff)
469 |((c06 >> 8) & 0xff), 2, s_skb)
/* NOTE(review): c13 keeps bits 9-10 (mask 0x0000060f) but no visible lookup
 * consumes them, and this table-3 index only shows the c20 and c06 >> 16
 * terms. Confirm that a `c13 >> 8` term is not missing here. */
470 | BOX (((c20 >> 0) & 0xff)
472 |((c06 >> 16) & 0xff), 3, s_skb);
/* gather the scattered bits of d that feed tables 4-7 */
474 const u32x d00 = (d >> 0) & 0x00003c3f;
475 const u32x d07 = (d >> 7) & 0x00003f03;
476 const u32x d21 = (d >> 21) & 0x0000000f;
477 const u32x d22 = (d >> 22) & 0x00000030;
479 u32x t = BOX (((d00 >> 0) & 0xff), 4, s_skb)
480 | BOX (((d07 >> 0) & 0xff)
481 |((d00 >> 8) & 0xff), 5, s_skb)
482 | BOX (((d07 >> 8) & 0xff), 6, s_skb)
483 | BOX (((d21 >> 0) & 0xff)
484 |((d22 >> 0) & 0xff), 7, s_skb);
/* interleave the 16-bit halves of s and t into the two schedule words */
486 Kc[i] = ((t << 16) | (s & 0x0000ffff));
487 Kd[i] = ((s >> 16) | (t & 0xffff0000));
489 Kc[i] = rotl32 (Kc[i], 2u);
490 Kd[i] = rotl32 (Kd[i], 2u);
/**
 * Kernel entry point m03100_m04 (combinator attack; result checked with
 * COMPARE_M_SIMD).
 *
 * Parameters referenced in the visible lines:
 *   pws        - per-work-item left-hand candidate (words i[0..7], pw_len)
 *   combs_buf  - right-hand candidates, read through ix_create_combt /
 *                pwlenx_create_combt
 *   salt_bufs  - salt words salt_buf[0..7] and salt_len at index salt_pos
 *   il_cnt     - number of right-hand candidates; stepped by VECT_SIZE
 *   combs_mode - selects which side is shifted when joining the two halves
 *   gid_max    - work-items with gid >= gid_max exit after the table copy
 * The other parameters are not referenced in the visible lines (they may be
 * consumed inside COMPARE_M_SIMD - confirm).
 *
 * Flow, as far as this excerpt shows:
 *   1. the work-group copies c_SPtrans and c_skb into __local memory;
 *   2. per right-hand candidate, left and right words are joined, moved by
 *      salt_len and ORed with the salt into dst[];
 *   3. dst[] is fed, one word per step, through _des_crypt_encrypt using a
 *      precomputed schedule (its Kc/Kd constants are not visible here);
 *   4. the resulting iv is expanded with _des_crypt_keysetup and dst[] is
 *      processed a second time with that schedule;
 *   5. iv[0] / iv[1] are handed to COMPARE_M_SIMD.
 */
494 __kernel void m03100_m04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
500 const u32 gid = get_global_id (0);
501 const u32 lid = get_local_id (0);
502 const u32 lsz = get_local_size (0);
508 __local u32 s_SPtrans[8][64];
509 __local u32 s_skb[8][64];
/* each work-item copies columns lid, lid + lsz, ... of all 16 tables */
511 for (u32 i = lid; i < 64; i += lsz)
513 s_SPtrans[0][i] = c_SPtrans[0][i];
514 s_SPtrans[1][i] = c_SPtrans[1][i];
515 s_SPtrans[2][i] = c_SPtrans[2][i];
516 s_SPtrans[3][i] = c_SPtrans[3][i];
517 s_SPtrans[4][i] = c_SPtrans[4][i];
518 s_SPtrans[5][i] = c_SPtrans[5][i];
519 s_SPtrans[6][i] = c_SPtrans[6][i];
520 s_SPtrans[7][i] = c_SPtrans[7][i];
522 s_skb[0][i] = c_skb[0][i];
523 s_skb[1][i] = c_skb[1][i];
524 s_skb[2][i] = c_skb[2][i];
525 s_skb[3][i] = c_skb[3][i];
526 s_skb[4][i] = c_skb[4][i];
527 s_skb[5][i] = c_skb[5][i];
528 s_skb[6][i] = c_skb[6][i];
529 s_skb[7][i] = c_skb[7][i];
/* the range check comes after the barrier so that every work-item of the
 * group takes part in the copy and reaches the barrier */
532 barrier (CLK_LOCAL_MEM_FENCE);
534 if (gid >= gid_max) return;
543 pw_buf0[0] = pws[gid].i[0];
544 pw_buf0[1] = pws[gid].i[1];
545 pw_buf0[2] = pws[gid].i[2];
546 pw_buf0[3] = pws[gid].i[3];
547 pw_buf1[0] = pws[gid].i[4];
548 pw_buf1[1] = pws[gid].i[5];
549 pw_buf1[2] = pws[gid].i[6];
550 pw_buf1[3] = pws[gid].i[7];
552 const u32 pw_l_len = pws[gid].pw_len;
561 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
562 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
563 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
564 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
565 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
566 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
567 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
568 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
570 const u32 salt_len = salt_bufs[salt_pos].salt_len;
576 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
578 const u32x pw_r_len = pwlenx_create_combt (combs_buf, il_pos);
580 const u32x pw_len = pw_l_len + pw_r_len;
/* twice the combined salt + password length; bounds the loops over dst[]
 * below, which widen every input byte to 16 bits */
582 const u32x salt_word_len = (salt_len + pw_len) * 2;
585 * concat password candidate
588 u32x wordl0[4] = { 0 };
589 u32x wordl1[4] = { 0 };
590 u32x wordl2[4] = { 0 };
591 u32x wordl3[4] = { 0 };
593 wordl0[0] = pw_buf0[0];
594 wordl0[1] = pw_buf0[1];
595 wordl0[2] = pw_buf0[2];
596 wordl0[3] = pw_buf0[3];
597 wordl1[0] = pw_buf1[0];
598 wordl1[1] = pw_buf1[1];
599 wordl1[2] = pw_buf1[2];
600 wordl1[3] = pw_buf1[3];
602 u32x wordr0[4] = { 0 };
603 u32x wordr1[4] = { 0 };
604 u32x wordr2[4] = { 0 };
605 u32x wordr3[4] = { 0 };
607 wordr0[0] = ix_create_combt (combs_buf, il_pos, 0);
608 wordr0[1] = ix_create_combt (combs_buf, il_pos, 1);
609 wordr0[2] = ix_create_combt (combs_buf, il_pos, 2);
610 wordr0[3] = ix_create_combt (combs_buf, il_pos, 3);
611 wordr1[0] = ix_create_combt (combs_buf, il_pos, 4);
612 wordr1[1] = ix_create_combt (combs_buf, il_pos, 5);
613 wordr1[2] = ix_create_combt (combs_buf, il_pos, 6);
614 wordr1[3] = ix_create_combt (combs_buf, il_pos, 7);
/* base-left mode moves the right-hand word by the left length; the second
 * call moves the left-hand word by the right length (presumably the else
 * branch, whose keyword is not visible here) */
616 if (combs_mode == COMBINATOR_MODE_BASE_LEFT)
618 switch_buffer_by_offset_le_VV (wordr0, wordr1, wordr2, wordr3, pw_l_len);
622 switch_buffer_by_offset_le_VV (wordl0, wordl1, wordl2, wordl3, pw_r_len);
/* OR the two halves together into the 16-word candidate w0..w3 */
630 w0[0] = wordl0[0] | wordr0[0];
631 w0[1] = wordl0[1] | wordr0[1];
632 w0[2] = wordl0[2] | wordr0[2];
633 w0[3] = wordl0[3] | wordr0[3];
634 w1[0] = wordl1[0] | wordr1[0];
635 w1[1] = wordl1[1] | wordr1[1];
636 w1[2] = wordl1[2] | wordr1[2];
637 w1[3] = wordl1[3] | wordr1[3];
638 w2[0] = wordl2[0] | wordr2[0];
639 w2[1] = wordl2[1] | wordr2[1];
640 w2[2] = wordl2[2] | wordr2[2];
641 w2[3] = wordl2[3] | wordr2[3];
642 w3[0] = wordl3[0] | wordr3[0];
643 w3[1] = wordl3[1] | wordr3[1];
644 w3[2] = wordl3[2] | wordr3[2];
645 w3[3] = wordl3[3] | wordr3[3];
/* move the candidate by salt_len, then OR the salt words into dst[0..7] */
651 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
655 dst[ 0] = w0[0] | salt_buf0[0];
656 dst[ 1] = w0[1] | salt_buf0[1];
657 dst[ 2] = w0[2] | salt_buf0[2];
658 dst[ 3] = w0[3] | salt_buf0[3];
659 dst[ 4] = w1[0] | salt_buf1[0];
660 dst[ 5] = w1[1] | salt_buf1[1];
661 dst[ 6] = w1[2] | salt_buf1[2];
662 dst[ 7] = w1[3] | salt_buf1[3];
673 * precompute key1 since key is static: 0x0123456789abcdef
674 * plus LEFT_ROTATE by 2
716 * key1 (generate key)
724 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
/* spread the four bytes of dst[k] over two words: bytes 1 and 0 land in
 * bits 31-24 and 15-8 of data[0], bytes 3 and 2 in the same positions of
 * data[1]; the remaining bits are zero */
728 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
729 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
734 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
738 * key2 (generate hash)
741 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
746 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
/* same byte spreading as in the first pass */
750 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
751 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
756 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
765 COMPARE_M_SIMD (iv[0], iv[1], z, z);
/**
 * Kernel entry point m03100_m08; takes the same parameter list as
 * m03100_m04.
 * NOTE(review): no body lines are visible in this excerpt - presumably an
 * empty stub kept so the entry point exists; confirm against the full file.
 */
769 __kernel void m03100_m08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/**
 * Kernel entry point m03100_m16; takes the same parameter list as
 * m03100_m04.
 * NOTE(review): no body lines are visible in this excerpt - presumably an
 * empty stub kept so the entry point exists; confirm against the full file.
 */
773 __kernel void m03100_m16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/**
 * Kernel entry point m03100_s04 (combinator attack; result checked with
 * COMPARE_S_SIMD against the digest selected by digests_offset).
 *
 * Parameters referenced in the visible lines:
 *   pws            - per-work-item left-hand candidate (words i[0..7], pw_len)
 *   combs_buf      - right-hand candidates, read through ix_create_combt /
 *                    pwlenx_create_combt
 *   salt_bufs      - salt words salt_buf[0..7] and salt_len at index salt_pos
 *   digests_buf    - source of the search[] words (DGST_R0, DGST_R1 visible)
 *   digests_offset - index of the digest to search for
 *   il_cnt         - number of right-hand candidates; stepped by VECT_SIZE
 *   combs_mode     - selects which side is shifted when joining the halves
 *   gid_max        - work-items with gid >= gid_max exit after the table copy
 * The other parameters are not referenced in the visible lines (they may be
 * consumed inside COMPARE_S_SIMD - confirm).
 *
 * Flow, as far as this excerpt shows:
 *   1. the work-group copies c_SPtrans and c_skb into __local memory;
 *   2. per right-hand candidate, left and right words are joined, moved by
 *      salt_len and ORed with the salt into dst[];
 *   3. dst[] is fed, one word per step, through _des_crypt_encrypt using a
 *      hard-coded schedule (only Kd[7..15] are visible here);
 *   4. the resulting iv is expanded with _des_crypt_keysetup and dst[] is
 *      processed a second time with that schedule;
 *   5. iv[0] / iv[1] are handed to COMPARE_S_SIMD.
 */
777 __kernel void m03100_s04 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
783 const u32 gid = get_global_id (0);
784 const u32 lid = get_local_id (0);
785 const u32 lsz = get_local_size (0);
791 __local u32 s_SPtrans[8][64];
792 __local u32 s_skb[8][64];
/* each work-item copies columns lid, lid + lsz, ... of all 16 tables */
794 for (u32 i = lid; i < 64; i += lsz)
796 s_SPtrans[0][i] = c_SPtrans[0][i];
797 s_SPtrans[1][i] = c_SPtrans[1][i];
798 s_SPtrans[2][i] = c_SPtrans[2][i];
799 s_SPtrans[3][i] = c_SPtrans[3][i];
800 s_SPtrans[4][i] = c_SPtrans[4][i];
801 s_SPtrans[5][i] = c_SPtrans[5][i];
802 s_SPtrans[6][i] = c_SPtrans[6][i];
803 s_SPtrans[7][i] = c_SPtrans[7][i];
805 s_skb[0][i] = c_skb[0][i];
806 s_skb[1][i] = c_skb[1][i];
807 s_skb[2][i] = c_skb[2][i];
808 s_skb[3][i] = c_skb[3][i];
809 s_skb[4][i] = c_skb[4][i];
810 s_skb[5][i] = c_skb[5][i];
811 s_skb[6][i] = c_skb[6][i];
812 s_skb[7][i] = c_skb[7][i];
/* the range check comes after the barrier so that every work-item of the
 * group takes part in the copy and reaches the barrier */
815 barrier (CLK_LOCAL_MEM_FENCE);
817 if (gid >= gid_max) return;
826 pw_buf0[0] = pws[gid].i[0];
827 pw_buf0[1] = pws[gid].i[1];
828 pw_buf0[2] = pws[gid].i[2];
829 pw_buf0[3] = pws[gid].i[3];
830 pw_buf1[0] = pws[gid].i[4];
831 pw_buf1[1] = pws[gid].i[5];
832 pw_buf1[2] = pws[gid].i[6];
833 pw_buf1[3] = pws[gid].i[7];
835 const u32 pw_l_len = pws[gid].pw_len;
844 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
845 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
846 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
847 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
848 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
849 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
850 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
851 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
853 const u32 salt_len = salt_bufs[salt_pos].salt_len;
/* digest words of the single target hash this kernel searches for */
859 const u32 search[4] =
861 digests_buf[digests_offset].digest_buf[DGST_R0],
862 digests_buf[digests_offset].digest_buf[DGST_R1],
871 for (u32 il_pos = 0; il_pos < il_cnt; il_pos += VECT_SIZE)
873 const u32x pw_r_len = pwlenx_create_combt (combs_buf, il_pos);
875 const u32x pw_len = pw_l_len + pw_r_len;
/* twice the combined salt + password length; bounds the loops over dst[]
 * below, which widen every input byte to 16 bits */
877 const u32x salt_word_len = (salt_len + pw_len) * 2;
880 * concat password candidate
883 u32x wordl0[4] = { 0 };
884 u32x wordl1[4] = { 0 };
885 u32x wordl2[4] = { 0 };
886 u32x wordl3[4] = { 0 };
888 wordl0[0] = pw_buf0[0];
889 wordl0[1] = pw_buf0[1];
890 wordl0[2] = pw_buf0[2];
891 wordl0[3] = pw_buf0[3];
892 wordl1[0] = pw_buf1[0];
893 wordl1[1] = pw_buf1[1];
894 wordl1[2] = pw_buf1[2];
895 wordl1[3] = pw_buf1[3];
897 u32x wordr0[4] = { 0 };
898 u32x wordr1[4] = { 0 };
899 u32x wordr2[4] = { 0 };
900 u32x wordr3[4] = { 0 };
902 wordr0[0] = ix_create_combt (combs_buf, il_pos, 0);
903 wordr0[1] = ix_create_combt (combs_buf, il_pos, 1);
904 wordr0[2] = ix_create_combt (combs_buf, il_pos, 2);
905 wordr0[3] = ix_create_combt (combs_buf, il_pos, 3);
906 wordr1[0] = ix_create_combt (combs_buf, il_pos, 4);
907 wordr1[1] = ix_create_combt (combs_buf, il_pos, 5);
908 wordr1[2] = ix_create_combt (combs_buf, il_pos, 6);
909 wordr1[3] = ix_create_combt (combs_buf, il_pos, 7);
/* base-left mode moves the right-hand word by the left length; the second
 * call moves the left-hand word by the right length (presumably the else
 * branch, whose keyword is not visible here) */
911 if (combs_mode == COMBINATOR_MODE_BASE_LEFT)
913 switch_buffer_by_offset_le_VV (wordr0, wordr1, wordr2, wordr3, pw_l_len);
917 switch_buffer_by_offset_le_VV (wordl0, wordl1, wordl2, wordl3, pw_r_len);
/* OR the two halves together into the 16-word candidate w0..w3 */
925 w0[0] = wordl0[0] | wordr0[0];
926 w0[1] = wordl0[1] | wordr0[1];
927 w0[2] = wordl0[2] | wordr0[2];
928 w0[3] = wordl0[3] | wordr0[3];
929 w1[0] = wordl1[0] | wordr1[0];
930 w1[1] = wordl1[1] | wordr1[1];
931 w1[2] = wordl1[2] | wordr1[2];
932 w1[3] = wordl1[3] | wordr1[3];
933 w2[0] = wordl2[0] | wordr2[0];
934 w2[1] = wordl2[1] | wordr2[1];
935 w2[2] = wordl2[2] | wordr2[2];
936 w2[3] = wordl2[3] | wordr2[3];
937 w3[0] = wordl3[0] | wordr3[0];
938 w3[1] = wordl3[1] | wordr3[1];
939 w3[2] = wordl3[2] | wordr3[2];
940 w3[3] = wordl3[3] | wordr3[3];
/* move the candidate by salt_len, then OR the salt words into dst[0..7] */
946 switch_buffer_by_offset_le (w0, w1, w2, w3, salt_len);
950 dst[ 0] = w0[0] | salt_buf0[0];
951 dst[ 1] = w0[1] | salt_buf0[1];
952 dst[ 2] = w0[2] | salt_buf0[2];
953 dst[ 3] = w0[3] | salt_buf0[3];
954 dst[ 4] = w1[0] | salt_buf1[0];
955 dst[ 5] = w1[1] | salt_buf1[1];
956 dst[ 6] = w1[2] | salt_buf1[2];
957 dst[ 7] = w1[3] | salt_buf1[3];
968 * precompute key1 since key is static: 0x0123456789abcdef
969 * plus LEFT_ROTATE by 2
1000 Kd[ 7] = 0x80701c1c;
1001 Kd[ 8] = 0x9cd49430;
1002 Kd[ 9] = 0x4c8ce078;
1003 Kd[10] = 0x5c18c088;
1004 Kd[11] = 0x28a8a4c8;
1005 Kd[12] = 0x3c180838;
1006 Kd[13] = 0xb0b86c20;
1007 Kd[14] = 0xac84a094;
1008 Kd[15] = 0x4ce0c0c4;
1011 * key1 (generate key)
1019 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
/* spread the four bytes of dst[k] over two words: bytes 1 and 0 land in
 * bits 31-24 and 15-8 of data[0], bytes 3 and 2 in the same positions of
 * data[1]; the remaining bits are zero */
1023 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
1024 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
1029 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
1033 * key2 (generate hash)
1036 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
1041 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
/* same byte spreading as in the first pass */
1045 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
1046 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
1051 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
1060 COMPARE_S_SIMD (iv[0], iv[1], z, z);
/**
 * Kernel entry point m03100_s08; takes the same parameter list as
 * m03100_s04.
 * NOTE(review): no body lines are visible in this excerpt - presumably an
 * empty stub kept so the entry point exists; confirm against the full file.
 */
1064 __kernel void m03100_s08 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/**
 * Kernel entry point m03100_s16; takes the same parameter list as
 * m03100_s04.
 * NOTE(review): no body lines are visible in this excerpt - presumably an
 * empty stub kept so the entry point exists; confirm against the full file.
 */
1068 __kernel void m03100_s16 (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global comb_t *combs_buf, __global bf_t *bfs_buf, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)