2 * Author......: Jens Steube <jens.steube@gmail.com>
8 #include "include/constants.h"
9 #include "include/kernel_vendor.h"
16 #include "include/kernel_functions.c"
17 #include "types_ocl.c"
20 #define COMPARE_S "check_single_comp4.c"
21 #define COMPARE_M "check_multi_comp4.c"
// PERM_OP (a, b, tt, n, m) and HPERM_OP (a, tt, n, m) are multi-line macros;
// only fragments of their bodies are visible in this view.
// The two runs of PERM_OP invocations further down apply the same five
// (shift, mask) pairs: the first run in the order 4, 16, 2, 8, 1 starting
// with (r, l), the second in the order 1, 8, 2, 16, 4 starting with (l, r).
// NOTE(review): the runs presumably belong to the initial and final
// permutation macros of DES; their #define lines are not visible here - confirm.
23 #define PERM_OP(a,b,tt,n,m) \
33 #define HPERM_OP(a,tt,n,m) \
39 tt = tt >> (16 + n); \
45 PERM_OP (r, l, tt, 4, 0x0f0f0f0f); \
46 PERM_OP (l, r, tt, 16, 0x0000ffff); \
47 PERM_OP (r, l, tt, 2, 0x33333333); \
48 PERM_OP (l, r, tt, 8, 0x00ff00ff); \
49 PERM_OP (r, l, tt, 1, 0x55555555); \
54 PERM_OP (l, r, tt, 1, 0x55555555); \
55 PERM_OP (r, l, tt, 8, 0x00ff00ff); \
56 PERM_OP (l, r, tt, 2, 0x33333333); \
57 PERM_OP (r, l, tt, 16, 0x0000ffff); \
58 PERM_OP (l, r, tt, 4, 0x0f0f0f0f); \
// c_SPtrans: 8 x 64 table of u32 values in the __constant address space.
// The kernels in this file copy it, row by row, into a __local s_SPtrans
// array; _des_crypt_encrypt then reads that copy through BOX using 6-bit
// indices.
// NOTE(review): presumably the combined DES S-box / P-permutation table - confirm.
61 __constant u32 c_SPtrans[8][64] =
64 0x02080800, 0x00080000, 0x02000002, 0x02080802,
65 0x02000000, 0x00080802, 0x00080002, 0x02000002,
66 0x00080802, 0x02080800, 0x02080000, 0x00000802,
67 0x02000802, 0x02000000, 0x00000000, 0x00080002,
68 0x00080000, 0x00000002, 0x02000800, 0x00080800,
69 0x02080802, 0x02080000, 0x00000802, 0x02000800,
70 0x00000002, 0x00000800, 0x00080800, 0x02080002,
71 0x00000800, 0x02000802, 0x02080002, 0x00000000,
72 0x00000000, 0x02080802, 0x02000800, 0x00080002,
73 0x02080800, 0x00080000, 0x00000802, 0x02000800,
74 0x02080002, 0x00000800, 0x00080800, 0x02000002,
75 0x00080802, 0x00000002, 0x02000002, 0x02080000,
76 0x02080802, 0x00080800, 0x02080000, 0x02000802,
77 0x02000000, 0x00000802, 0x00080002, 0x00000000,
78 0x00080000, 0x02000000, 0x02000802, 0x02080800,
79 0x00000002, 0x02080002, 0x00000800, 0x00080802,
82 0x40108010, 0x00000000, 0x00108000, 0x40100000,
83 0x40000010, 0x00008010, 0x40008000, 0x00108000,
84 0x00008000, 0x40100010, 0x00000010, 0x40008000,
85 0x00100010, 0x40108000, 0x40100000, 0x00000010,
86 0x00100000, 0x40008010, 0x40100010, 0x00008000,
87 0x00108010, 0x40000000, 0x00000000, 0x00100010,
88 0x40008010, 0x00108010, 0x40108000, 0x40000010,
89 0x40000000, 0x00100000, 0x00008010, 0x40108010,
90 0x00100010, 0x40108000, 0x40008000, 0x00108010,
91 0x40108010, 0x00100010, 0x40000010, 0x00000000,
92 0x40000000, 0x00008010, 0x00100000, 0x40100010,
93 0x00008000, 0x40000000, 0x00108010, 0x40008010,
94 0x40108000, 0x00008000, 0x00000000, 0x40000010,
95 0x00000010, 0x40108010, 0x00108000, 0x40100000,
96 0x40100010, 0x00100000, 0x00008010, 0x40008000,
97 0x40008010, 0x00000010, 0x40100000, 0x00108000,
100 0x04000001, 0x04040100, 0x00000100, 0x04000101,
101 0x00040001, 0x04000000, 0x04000101, 0x00040100,
102 0x04000100, 0x00040000, 0x04040000, 0x00000001,
103 0x04040101, 0x00000101, 0x00000001, 0x04040001,
104 0x00000000, 0x00040001, 0x04040100, 0x00000100,
105 0x00000101, 0x04040101, 0x00040000, 0x04000001,
106 0x04040001, 0x04000100, 0x00040101, 0x04040000,
107 0x00040100, 0x00000000, 0x04000000, 0x00040101,
108 0x04040100, 0x00000100, 0x00000001, 0x00040000,
109 0x00000101, 0x00040001, 0x04040000, 0x04000101,
110 0x00000000, 0x04040100, 0x00040100, 0x04040001,
111 0x00040001, 0x04000000, 0x04040101, 0x00000001,
112 0x00040101, 0x04000001, 0x04000000, 0x04040101,
113 0x00040000, 0x04000100, 0x04000101, 0x00040100,
114 0x04000100, 0x00000000, 0x04040001, 0x00000101,
115 0x04000001, 0x00040101, 0x00000100, 0x04040000,
118 0x00401008, 0x10001000, 0x00000008, 0x10401008,
119 0x00000000, 0x10400000, 0x10001008, 0x00400008,
120 0x10401000, 0x10000008, 0x10000000, 0x00001008,
121 0x10000008, 0x00401008, 0x00400000, 0x10000000,
122 0x10400008, 0x00401000, 0x00001000, 0x00000008,
123 0x00401000, 0x10001008, 0x10400000, 0x00001000,
124 0x00001008, 0x00000000, 0x00400008, 0x10401000,
125 0x10001000, 0x10400008, 0x10401008, 0x00400000,
126 0x10400008, 0x00001008, 0x00400000, 0x10000008,
127 0x00401000, 0x10001000, 0x00000008, 0x10400000,
128 0x10001008, 0x00000000, 0x00001000, 0x00400008,
129 0x00000000, 0x10400008, 0x10401000, 0x00001000,
130 0x10000000, 0x10401008, 0x00401008, 0x00400000,
131 0x10401008, 0x00000008, 0x10001000, 0x00401008,
132 0x00400008, 0x00401000, 0x10400000, 0x10001008,
133 0x00001008, 0x10000000, 0x10000008, 0x10401000,
136 0x08000000, 0x00010000, 0x00000400, 0x08010420,
137 0x08010020, 0x08000400, 0x00010420, 0x08010000,
138 0x00010000, 0x00000020, 0x08000020, 0x00010400,
139 0x08000420, 0x08010020, 0x08010400, 0x00000000,
140 0x00010400, 0x08000000, 0x00010020, 0x00000420,
141 0x08000400, 0x00010420, 0x00000000, 0x08000020,
142 0x00000020, 0x08000420, 0x08010420, 0x00010020,
143 0x08010000, 0x00000400, 0x00000420, 0x08010400,
144 0x08010400, 0x08000420, 0x00010020, 0x08010000,
145 0x00010000, 0x00000020, 0x08000020, 0x08000400,
146 0x08000000, 0x00010400, 0x08010420, 0x00000000,
147 0x00010420, 0x08000000, 0x00000400, 0x00010020,
148 0x08000420, 0x00000400, 0x00000000, 0x08010420,
149 0x08010020, 0x08010400, 0x00000420, 0x00010000,
150 0x00010400, 0x08010020, 0x08000400, 0x00000420,
151 0x00000020, 0x00010420, 0x08010000, 0x08000020,
154 0x80000040, 0x00200040, 0x00000000, 0x80202000,
155 0x00200040, 0x00002000, 0x80002040, 0x00200000,
156 0x00002040, 0x80202040, 0x00202000, 0x80000000,
157 0x80002000, 0x80000040, 0x80200000, 0x00202040,
158 0x00200000, 0x80002040, 0x80200040, 0x00000000,
159 0x00002000, 0x00000040, 0x80202000, 0x80200040,
160 0x80202040, 0x80200000, 0x80000000, 0x00002040,
161 0x00000040, 0x00202000, 0x00202040, 0x80002000,
162 0x00002040, 0x80000000, 0x80002000, 0x00202040,
163 0x80202000, 0x00200040, 0x00000000, 0x80002000,
164 0x80000000, 0x00002000, 0x80200040, 0x00200000,
165 0x00200040, 0x80202040, 0x00202000, 0x00000040,
166 0x80202040, 0x00202000, 0x00200000, 0x80002040,
167 0x80000040, 0x80200000, 0x00202040, 0x00000000,
168 0x00002000, 0x80000040, 0x80002040, 0x80202000,
169 0x80200000, 0x00002040, 0x00000040, 0x80200040,
172 0x00004000, 0x00000200, 0x01000200, 0x01000004,
173 0x01004204, 0x00004004, 0x00004200, 0x00000000,
174 0x01000000, 0x01000204, 0x00000204, 0x01004000,
175 0x00000004, 0x01004200, 0x01004000, 0x00000204,
176 0x01000204, 0x00004000, 0x00004004, 0x01004204,
177 0x00000000, 0x01000200, 0x01000004, 0x00004200,
178 0x01004004, 0x00004204, 0x01004200, 0x00000004,
179 0x00004204, 0x01004004, 0x00000200, 0x01000000,
180 0x00004204, 0x01004000, 0x01004004, 0x00000204,
181 0x00004000, 0x00000200, 0x01000000, 0x01004004,
182 0x01000204, 0x00004204, 0x00004200, 0x00000000,
183 0x00000200, 0x01000004, 0x00000004, 0x01000200,
184 0x00000000, 0x01000204, 0x01000200, 0x00004200,
185 0x00000204, 0x00004000, 0x01004204, 0x01000000,
186 0x01004200, 0x00000004, 0x00004004, 0x01004204,
187 0x01000004, 0x01004200, 0x01004000, 0x00004004,
190 0x20800080, 0x20820000, 0x00020080, 0x00000000,
191 0x20020000, 0x00800080, 0x20800000, 0x20820080,
192 0x00000080, 0x20000000, 0x00820000, 0x00020080,
193 0x00820080, 0x20020080, 0x20000080, 0x20800000,
194 0x00020000, 0x00820080, 0x00800080, 0x20020000,
195 0x20820080, 0x20000080, 0x00000000, 0x00820000,
196 0x20000000, 0x00800000, 0x20020080, 0x20800080,
197 0x00800000, 0x00020000, 0x20820000, 0x00000080,
198 0x00800000, 0x00020000, 0x20000080, 0x20820080,
199 0x00020080, 0x20000000, 0x00000000, 0x00820000,
200 0x20800080, 0x20020080, 0x20020000, 0x00800080,
201 0x20820000, 0x00000080, 0x00800080, 0x20020000,
202 0x20820080, 0x00800000, 0x20800000, 0x20000080,
203 0x00820000, 0x00020080, 0x20020080, 0x20800000,
204 0x00000080, 0x20820000, 0x00820080, 0x00000000,
205 0x20000000, 0x20800080, 0x00020000, 0x00820080,
// c_skb: 8 x 64 table of u32 values in the __constant address space.
// The kernels in this file copy it, row by row, into a __local s_skb array;
// _des_crypt_keysetup reads that copy through BOX while filling Kc[] and Kd[].
// NOTE(review): presumably the DES key-schedule (PC-2) lookup table - confirm.
209 __constant u32 c_skb[8][64] =
212 0x00000000, 0x00000010, 0x20000000, 0x20000010,
213 0x00010000, 0x00010010, 0x20010000, 0x20010010,
214 0x00000800, 0x00000810, 0x20000800, 0x20000810,
215 0x00010800, 0x00010810, 0x20010800, 0x20010810,
216 0x00000020, 0x00000030, 0x20000020, 0x20000030,
217 0x00010020, 0x00010030, 0x20010020, 0x20010030,
218 0x00000820, 0x00000830, 0x20000820, 0x20000830,
219 0x00010820, 0x00010830, 0x20010820, 0x20010830,
220 0x00080000, 0x00080010, 0x20080000, 0x20080010,
221 0x00090000, 0x00090010, 0x20090000, 0x20090010,
222 0x00080800, 0x00080810, 0x20080800, 0x20080810,
223 0x00090800, 0x00090810, 0x20090800, 0x20090810,
224 0x00080020, 0x00080030, 0x20080020, 0x20080030,
225 0x00090020, 0x00090030, 0x20090020, 0x20090030,
226 0x00080820, 0x00080830, 0x20080820, 0x20080830,
227 0x00090820, 0x00090830, 0x20090820, 0x20090830,
230 0x00000000, 0x02000000, 0x00002000, 0x02002000,
231 0x00200000, 0x02200000, 0x00202000, 0x02202000,
232 0x00000004, 0x02000004, 0x00002004, 0x02002004,
233 0x00200004, 0x02200004, 0x00202004, 0x02202004,
234 0x00000400, 0x02000400, 0x00002400, 0x02002400,
235 0x00200400, 0x02200400, 0x00202400, 0x02202400,
236 0x00000404, 0x02000404, 0x00002404, 0x02002404,
237 0x00200404, 0x02200404, 0x00202404, 0x02202404,
238 0x10000000, 0x12000000, 0x10002000, 0x12002000,
239 0x10200000, 0x12200000, 0x10202000, 0x12202000,
240 0x10000004, 0x12000004, 0x10002004, 0x12002004,
241 0x10200004, 0x12200004, 0x10202004, 0x12202004,
242 0x10000400, 0x12000400, 0x10002400, 0x12002400,
243 0x10200400, 0x12200400, 0x10202400, 0x12202400,
244 0x10000404, 0x12000404, 0x10002404, 0x12002404,
245 0x10200404, 0x12200404, 0x10202404, 0x12202404,
248 0x00000000, 0x00000001, 0x00040000, 0x00040001,
249 0x01000000, 0x01000001, 0x01040000, 0x01040001,
250 0x00000002, 0x00000003, 0x00040002, 0x00040003,
251 0x01000002, 0x01000003, 0x01040002, 0x01040003,
252 0x00000200, 0x00000201, 0x00040200, 0x00040201,
253 0x01000200, 0x01000201, 0x01040200, 0x01040201,
254 0x00000202, 0x00000203, 0x00040202, 0x00040203,
255 0x01000202, 0x01000203, 0x01040202, 0x01040203,
256 0x08000000, 0x08000001, 0x08040000, 0x08040001,
257 0x09000000, 0x09000001, 0x09040000, 0x09040001,
258 0x08000002, 0x08000003, 0x08040002, 0x08040003,
259 0x09000002, 0x09000003, 0x09040002, 0x09040003,
260 0x08000200, 0x08000201, 0x08040200, 0x08040201,
261 0x09000200, 0x09000201, 0x09040200, 0x09040201,
262 0x08000202, 0x08000203, 0x08040202, 0x08040203,
263 0x09000202, 0x09000203, 0x09040202, 0x09040203,
266 0x00000000, 0x00100000, 0x00000100, 0x00100100,
267 0x00000008, 0x00100008, 0x00000108, 0x00100108,
268 0x00001000, 0x00101000, 0x00001100, 0x00101100,
269 0x00001008, 0x00101008, 0x00001108, 0x00101108,
270 0x04000000, 0x04100000, 0x04000100, 0x04100100,
271 0x04000008, 0x04100008, 0x04000108, 0x04100108,
272 0x04001000, 0x04101000, 0x04001100, 0x04101100,
273 0x04001008, 0x04101008, 0x04001108, 0x04101108,
274 0x00020000, 0x00120000, 0x00020100, 0x00120100,
275 0x00020008, 0x00120008, 0x00020108, 0x00120108,
276 0x00021000, 0x00121000, 0x00021100, 0x00121100,
277 0x00021008, 0x00121008, 0x00021108, 0x00121108,
278 0x04020000, 0x04120000, 0x04020100, 0x04120100,
279 0x04020008, 0x04120008, 0x04020108, 0x04120108,
280 0x04021000, 0x04121000, 0x04021100, 0x04121100,
281 0x04021008, 0x04121008, 0x04021108, 0x04121108,
284 0x00000000, 0x10000000, 0x00010000, 0x10010000,
285 0x00000004, 0x10000004, 0x00010004, 0x10010004,
286 0x20000000, 0x30000000, 0x20010000, 0x30010000,
287 0x20000004, 0x30000004, 0x20010004, 0x30010004,
288 0x00100000, 0x10100000, 0x00110000, 0x10110000,
289 0x00100004, 0x10100004, 0x00110004, 0x10110004,
290 0x20100000, 0x30100000, 0x20110000, 0x30110000,
291 0x20100004, 0x30100004, 0x20110004, 0x30110004,
292 0x00001000, 0x10001000, 0x00011000, 0x10011000,
293 0x00001004, 0x10001004, 0x00011004, 0x10011004,
294 0x20001000, 0x30001000, 0x20011000, 0x30011000,
295 0x20001004, 0x30001004, 0x20011004, 0x30011004,
296 0x00101000, 0x10101000, 0x00111000, 0x10111000,
297 0x00101004, 0x10101004, 0x00111004, 0x10111004,
298 0x20101000, 0x30101000, 0x20111000, 0x30111000,
299 0x20101004, 0x30101004, 0x20111004, 0x30111004,
302 0x00000000, 0x08000000, 0x00000008, 0x08000008,
303 0x00000400, 0x08000400, 0x00000408, 0x08000408,
304 0x00020000, 0x08020000, 0x00020008, 0x08020008,
305 0x00020400, 0x08020400, 0x00020408, 0x08020408,
306 0x00000001, 0x08000001, 0x00000009, 0x08000009,
307 0x00000401, 0x08000401, 0x00000409, 0x08000409,
308 0x00020001, 0x08020001, 0x00020009, 0x08020009,
309 0x00020401, 0x08020401, 0x00020409, 0x08020409,
310 0x02000000, 0x0A000000, 0x02000008, 0x0A000008,
311 0x02000400, 0x0A000400, 0x02000408, 0x0A000408,
312 0x02020000, 0x0A020000, 0x02020008, 0x0A020008,
313 0x02020400, 0x0A020400, 0x02020408, 0x0A020408,
314 0x02000001, 0x0A000001, 0x02000009, 0x0A000009,
315 0x02000401, 0x0A000401, 0x02000409, 0x0A000409,
316 0x02020001, 0x0A020001, 0x02020009, 0x0A020009,
317 0x02020401, 0x0A020401, 0x02020409, 0x0A020409,
320 0x00000000, 0x00000100, 0x00080000, 0x00080100,
321 0x01000000, 0x01000100, 0x01080000, 0x01080100,
322 0x00000010, 0x00000110, 0x00080010, 0x00080110,
323 0x01000010, 0x01000110, 0x01080010, 0x01080110,
324 0x00200000, 0x00200100, 0x00280000, 0x00280100,
325 0x01200000, 0x01200100, 0x01280000, 0x01280100,
326 0x00200010, 0x00200110, 0x00280010, 0x00280110,
327 0x01200010, 0x01200110, 0x01280010, 0x01280110,
328 0x00000200, 0x00000300, 0x00080200, 0x00080300,
329 0x01000200, 0x01000300, 0x01080200, 0x01080300,
330 0x00000210, 0x00000310, 0x00080210, 0x00080310,
331 0x01000210, 0x01000310, 0x01080210, 0x01080310,
332 0x00200200, 0x00200300, 0x00280200, 0x00280300,
333 0x01200200, 0x01200300, 0x01280200, 0x01280300,
334 0x00200210, 0x00200310, 0x00280210, 0x00280310,
335 0x01200210, 0x01200310, 0x01280210, 0x01280310,
338 0x00000000, 0x04000000, 0x00040000, 0x04040000,
339 0x00000002, 0x04000002, 0x00040002, 0x04040002,
340 0x00002000, 0x04002000, 0x00042000, 0x04042000,
341 0x00002002, 0x04002002, 0x00042002, 0x04042002,
342 0x00000020, 0x04000020, 0x00040020, 0x04040020,
343 0x00000022, 0x04000022, 0x00040022, 0x04040022,
344 0x00002020, 0x04002020, 0x00042020, 0x04042020,
345 0x00002022, 0x04002022, 0x00042022, 0x04042022,
346 0x00000800, 0x04000800, 0x00040800, 0x04040800,
347 0x00000802, 0x04000802, 0x00040802, 0x04040802,
348 0x00002800, 0x04002800, 0x00042800, 0x04042800,
349 0x00002802, 0x04002802, 0x00042802, 0x04042802,
350 0x00000820, 0x04000820, 0x00040820, 0x04040820,
351 0x00000822, 0x04000822, 0x00040822, 0x04040822,
352 0x00002820, 0x04002820, 0x00042820, 0x04042820,
353 0x00002822, 0x04002822, 0x00042822, 0x04042822
// BOX (i, n, S): element i of row n of the two-dimensional table S.
// Note the argument order (column first, row second) is the reverse of the
// subscript order in the expansion.
357 #define BOX(i,n,S) (S)[(n)][(i)]
// _des_crypt_encrypt: block transform driven by the Kc[] and Kd[] subkey
// arrays and the s_SPtrans lookup table. Only part of the body is visible in
// this view (the loads into r / l and the stores of the result are not shown).
//   iv        - u32[2]; callers read iv[0] and iv[1] after the call, so it
//               presumably receives the result - TODO confirm
//   data      - u32[2] input block prepared by the caller
//   Kc, Kd    - 16-entry subkey arrays
//   s_SPtrans - __local 8 x 64 lookup table
359 static void _des_crypt_encrypt (u32 iv[2], u32 data[2], u32 Kc[16], u32 Kd[16], __local u32 s_SPtrans[8][64])
// Two subkeys are consumed per iteration: index i updates l, index i + 1
// updates r.
372 for (u32 i = 0; i < 16; i += 2)
// t combines Kd[i] with r passed through rotl32 (r, 28u); u is assigned on a
// line that is not visible here.
378 t = Kd[i + 0] ^ rotl32 (r, 28u);
// The four 6-bit fields of u (bit offsets 2, 10, 18, 26) select from the even
// rows 0, 2, 4, 6 and the four 6-bit fields of t from the odd rows 1, 3, 5, 7;
// the eight entries are OR-ed together and XOR-ed into l.
380 l ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
381 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
382 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
383 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
384 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
385 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
386 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
387 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
// Same step with the roles of l and r exchanged, using subkey index i + 1.
390 t = Kd[i + 1] ^ rotl32 (l, 28u);
392 r ^= BOX (((u >> 2) & 0x3f), 0, s_SPtrans)
393 | BOX (((u >> 10) & 0x3f), 2, s_SPtrans)
394 | BOX (((u >> 18) & 0x3f), 4, s_SPtrans)
395 | BOX (((u >> 26) & 0x3f), 6, s_SPtrans)
396 | BOX (((t >> 2) & 0x3f), 1, s_SPtrans)
397 | BOX (((t >> 10) & 0x3f), 3, s_SPtrans)
398 | BOX (((t >> 18) & 0x3f), 5, s_SPtrans)
399 | BOX (((t >> 26) & 0x3f), 7, s_SPtrans);
// _des_crypt_keysetup: fills Kc[0..15] and Kd[0..15] from the two 32-bit key
// halves c and d, using the s_skb lookup table. Only part of the body is
// visible in this view.
//   c, d   - key halves (passed by value; modified locally)
//   Kc, Kd - 16-entry output arrays
//   s_skb  - __local 8 x 64 lookup table
411 static void _des_crypt_keysetup (u32 c, u32 d, u32 Kc[16], u32 Kd[16], __local u32 s_skb[8][64])
// Bit-permute c and d; tt is the scratch argument the macros expect.
415 PERM_OP (d, c, tt, 4, 0x0f0f0f0f);
416 HPERM_OP (c, tt, 2, 0xcccc0000);
417 HPERM_OP (d, tt, 2, 0xcccc0000);
418 PERM_OP (d, c, tt, 1, 0x55555555);
419 PERM_OP (c, d, tt, 8, 0x00ff00ff);
420 PERM_OP (d, c, tt, 1, 0x55555555);
// Rebuild d: swap its bytes 0 and 2, keep byte 1, and move the top nibble of
// c (bits 28..31) into bits 24..27.
422 d = ((d & 0x000000ff) << 16)
423 | ((d & 0x0000ff00) << 0)
424 | ((d & 0x00ff0000) >> 16)
425 | ((c & 0xf0000000) >> 4);
// One Kc / Kd pair is produced per iteration.
430 for (u32 i = 0; i < 16; i++)
// Iterations 0, 1, 8 and 15 are singled out. The 1-bit form follows the
// test and the 2-bit form presumably sits in the else branch (the else line
// and any masking of c / d are not visible here).
432 if ((i < 2) || (i == 8) || (i == 15))
// Shift right by 1; the left shift by 27 places the old bit 0 at bit 27.
434 c = ((c >> 1) | (c << 27));
435 d = ((d >> 1) | (d << 27));
// Shift right by 2; the left shift by 26 places the old bits 0..1 at bits 26..27.
439 c = ((c >> 2) | (c << 26));
440 d = ((d >> 2) | (d << 26));
// Slice c into the bit groups used to index s_skb rows 0..3.
446 const u32 c00 = (c >> 0) & 0x0000003f;
447 const u32 c06 = (c >> 6) & 0x00383003;
448 const u32 c07 = (c >> 7) & 0x0000003c;
449 const u32 c13 = (c >> 13) & 0x0000060f;
450 const u32 c20 = (c >> 20) & 0x00000001;
// s: OR of the four lookups from rows 0..3 (one operand of the row 3 index
// is on a line that is not visible here).
452 u32 s = BOX (((c00 >> 0) & 0xff), 0, s_skb)
453 | BOX (((c06 >> 0) & 0xff)
454 |((c07 >> 0) & 0xff), 1, s_skb)
455 | BOX (((c13 >> 0) & 0xff)
456 |((c06 >> 8) & 0xff), 2, s_skb)
457 | BOX (((c20 >> 0) & 0xff)
459 |((c06 >> 16) & 0xff), 3, s_skb);
// Slice d into the bit groups used to index s_skb rows 4..7.
461 const u32 d00 = (d >> 0) & 0x00003c3f;
462 const u32 d07 = (d >> 7) & 0x00003f03;
463 const u32 d21 = (d >> 21) & 0x0000000f;
464 const u32 d22 = (d >> 22) & 0x00000030;
// t: OR of the four lookups from rows 4..7.
466 u32 t = BOX (((d00 >> 0) & 0xff), 4, s_skb)
467 | BOX (((d07 >> 0) & 0xff)
468 |((d00 >> 8) & 0xff), 5, s_skb)
469 | BOX (((d07 >> 8) & 0xff), 6, s_skb)
470 | BOX (((d21 >> 0) & 0xff)
471 |((d22 >> 0) & 0xff), 7, s_skb);
// Kc[i]: low 16 bits of s, with the low 16 bits of t placed above them.
// Kd[i]: high 16 bits of s moved down, with the high 16 bits of t kept on top.
473 Kc[i] = ((t << 16) | (s & 0x0000ffff));
474 Kd[i] = ((s >> 16) | (t & 0xffff0000));
// Both subkeys are finally passed through rotl32 (x, 2u).
476 Kc[i] = rotl32 (Kc[i], 2u);
477 Kd[i] = rotl32 (Kd[i], 2u);
// overwrite_at: merges the 32-bit word w0 into sw[] across two neighbouring
// words. The switch statement, the break statements and the cases for
// multiples of 4 are not visible in this view; the case labels presumably
// select on salt_len - TODO confirm.
//   sw       - word buffer, modified in place (indices 0..8 are touched below)
//   w0       - word to insert
//   salt_len - offset selector, see above
481 static void overwrite_at (u32 sw[16], const u32 w0, const u32 salt_len)
// Variant built on amd_bytealign, compiled when cl_amd_media_ops is defined.
483 #if defined cl_amd_media_ops
488 case 1: sw[0] = amd_bytealign (w0, sw[0] << 24, 3);
489 sw[1] = amd_bytealign (sw[1] >> 8, w0, 3);
491 case 2: sw[0] = amd_bytealign (w0, sw[0] << 16, 2);
492 sw[1] = amd_bytealign (sw[1] >> 16, w0, 2);
494 case 3: sw[0] = amd_bytealign (w0, sw[0] << 8, 1);
495 sw[1] = amd_bytealign (sw[1] >> 24, w0, 1);
499 case 5: sw[1] = amd_bytealign (w0, sw[1] << 24, 3);
500 sw[2] = amd_bytealign (sw[2] >> 8, w0, 3);
502 case 6: sw[1] = amd_bytealign (w0, sw[1] << 16, 2);
503 sw[2] = amd_bytealign (sw[2] >> 16, w0, 2);
505 case 7: sw[1] = amd_bytealign (w0, sw[1] << 8, 1);
506 sw[2] = amd_bytealign (sw[2] >> 24, w0, 1);
510 case 9: sw[2] = amd_bytealign (w0, sw[2] << 24, 3);
511 sw[3] = amd_bytealign (sw[3] >> 8, w0, 3);
513 case 10: sw[2] = amd_bytealign (w0, sw[2] << 16, 2);
514 sw[3] = amd_bytealign (sw[3] >> 16, w0, 2);
516 case 11: sw[2] = amd_bytealign (w0, sw[2] << 8, 1);
517 sw[3] = amd_bytealign (sw[3] >> 24, w0, 1);
521 case 13: sw[3] = amd_bytealign (w0, sw[3] << 24, 3);
522 sw[4] = amd_bytealign (sw[4] >> 8, w0, 3);
524 case 14: sw[3] = amd_bytealign (w0, sw[3] << 16, 2);
525 sw[4] = amd_bytealign (sw[4] >> 16, w0, 2);
527 case 15: sw[3] = amd_bytealign (w0, sw[3] << 8, 1);
528 sw[4] = amd_bytealign (sw[4] >> 24, w0, 1);
532 case 17: sw[4] = amd_bytealign (w0, sw[4] << 24, 3);
533 sw[5] = amd_bytealign (sw[5] >> 8, w0, 3);
535 case 18: sw[4] = amd_bytealign (w0, sw[4] << 16, 2);
536 sw[5] = amd_bytealign (sw[5] >> 16, w0, 2);
538 case 19: sw[4] = amd_bytealign (w0, sw[4] << 8, 1);
539 sw[5] = amd_bytealign (sw[5] >> 24, w0, 1);
543 case 21: sw[5] = amd_bytealign (w0, sw[5] << 24, 3);
544 sw[6] = amd_bytealign (sw[6] >> 8, w0, 3);
546 case 22: sw[5] = amd_bytealign (w0, sw[5] << 16, 2);
547 sw[6] = amd_bytealign (sw[6] >> 16, w0, 2);
549 case 23: sw[5] = amd_bytealign (w0, sw[5] << 8, 1);
550 sw[6] = amd_bytealign (sw[6] >> 24, w0, 1);
554 case 25: sw[6] = amd_bytealign (w0, sw[6] << 24, 3);
555 sw[7] = amd_bytealign (sw[7] >> 8, w0, 3);
557 case 26: sw[6] = amd_bytealign (w0, sw[6] << 16, 2);
558 sw[7] = amd_bytealign (sw[7] >> 16, w0, 2);
560 case 27: sw[6] = amd_bytealign (w0, sw[6] << 8, 1);
561 sw[7] = amd_bytealign (sw[7] >> 24, w0, 1);
565 case 29: sw[7] = amd_bytealign (w0, sw[7] << 24, 3);
566 sw[8] = amd_bytealign (sw[8] >> 8, w0, 3);
568 case 30: sw[7] = amd_bytealign (w0, sw[7] << 16, 2);
569 sw[8] = amd_bytealign (sw[8] >> 16, w0, 2);
571 case 31: sw[7] = amd_bytealign (w0, sw[7] << 8, 1);
572 sw[8] = amd_bytealign (sw[8] >> 24, w0, 1);
// Variant built on plain shifts and masks (presumably the alternative branch
// of the conditional above; the directive is not visible here).
// For case N: word N / 4 keeps its low N % 4 bytes and takes the low bytes of
// w0 above them; the following word keeps its high bytes and takes the
// remaining high bytes of w0 in its low end.
580 case 1: sw[0] = (sw[0] & 0x000000ff) | (w0 << 8);
581 sw[1] = (sw[1] & 0xffffff00) | (w0 >> 24);
583 case 2: sw[0] = (sw[0] & 0x0000ffff) | (w0 << 16);
584 sw[1] = (sw[1] & 0xffff0000) | (w0 >> 16);
586 case 3: sw[0] = (sw[0] & 0x00ffffff) | (w0 << 24);
587 sw[1] = (sw[1] & 0xff000000) | (w0 >> 8);
591 case 5: sw[1] = (sw[1] & 0x000000ff) | (w0 << 8);
592 sw[2] = (sw[2] & 0xffffff00) | (w0 >> 24);
594 case 6: sw[1] = (sw[1] & 0x0000ffff) | (w0 << 16);
595 sw[2] = (sw[2] & 0xffff0000) | (w0 >> 16);
597 case 7: sw[1] = (sw[1] & 0x00ffffff) | (w0 << 24);
598 sw[2] = (sw[2] & 0xff000000) | (w0 >> 8);
602 case 9: sw[2] = (sw[2] & 0x000000ff) | (w0 << 8);
603 sw[3] = (sw[3] & 0xffffff00) | (w0 >> 24);
605 case 10: sw[2] = (sw[2] & 0x0000ffff) | (w0 << 16);
606 sw[3] = (sw[3] & 0xffff0000) | (w0 >> 16);
608 case 11: sw[2] = (sw[2] & 0x00ffffff) | (w0 << 24);
609 sw[3] = (sw[3] & 0xff000000) | (w0 >> 8);
613 case 13: sw[3] = (sw[3] & 0x000000ff) | (w0 << 8);
614 sw[4] = (sw[4] & 0xffffff00) | (w0 >> 24);
616 case 14: sw[3] = (sw[3] & 0x0000ffff) | (w0 << 16);
617 sw[4] = (sw[4] & 0xffff0000) | (w0 >> 16);
619 case 15: sw[3] = (sw[3] & 0x00ffffff) | (w0 << 24);
620 sw[4] = (sw[4] & 0xff000000) | (w0 >> 8);
624 case 17: sw[4] = (sw[4] & 0x000000ff) | (w0 << 8);
625 sw[5] = (sw[5] & 0xffffff00) | (w0 >> 24);
627 case 18: sw[4] = (sw[4] & 0x0000ffff) | (w0 << 16);
628 sw[5] = (sw[5] & 0xffff0000) | (w0 >> 16);
630 case 19: sw[4] = (sw[4] & 0x00ffffff) | (w0 << 24);
631 sw[5] = (sw[5] & 0xff000000) | (w0 >> 8);
635 case 21: sw[5] = (sw[5] & 0x000000ff) | (w0 << 8);
636 sw[6] = (sw[6] & 0xffffff00) | (w0 >> 24);
638 case 22: sw[5] = (sw[5] & 0x0000ffff) | (w0 << 16);
639 sw[6] = (sw[6] & 0xffff0000) | (w0 >> 16);
641 case 23: sw[5] = (sw[5] & 0x00ffffff) | (w0 << 24);
642 sw[6] = (sw[6] & 0xff000000) | (w0 >> 8);
646 case 25: sw[6] = (sw[6] & 0x000000ff) | (w0 << 8);
647 sw[7] = (sw[7] & 0xffffff00) | (w0 >> 24);
649 case 26: sw[6] = (sw[6] & 0x0000ffff) | (w0 << 16);
650 sw[7] = (sw[7] & 0xffff0000) | (w0 >> 16);
652 case 27: sw[6] = (sw[6] & 0x00ffffff) | (w0 << 24);
653 sw[7] = (sw[7] & 0xff000000) | (w0 >> 8);
657 case 29: sw[7] = (sw[7] & 0x000000ff) | (w0 << 8);
658 sw[8] = (sw[8] & 0xffffff00) | (w0 >> 24);
660 case 30: sw[7] = (sw[7] & 0x0000ffff) | (w0 << 16);
661 sw[8] = (sw[8] & 0xffff0000) | (w0 >> 16);
663 case 31: sw[7] = (sw[7] & 0x00ffffff) | (w0 << 24);
664 sw[8] = (sw[8] & 0xff000000) | (w0 >> 8);
// m03100m: per-work-item worker invoked by the m03100_m04 and m03100_m08
// kernels. Many lines of the body (declarations, the Kc / Kd setup, the final
// comparison) are not visible in this view.
// Parameters read on the visible lines:
//   s_SPtrans, s_skb - __local lookup tables prepared by the calling kernel
//   pw_len           - candidate length, combined with salt_len below
//   words_buf_r      - per-candidate words, one per loop step (bfs_cnt entries)
//   salt_bufs        - salt records, indexed by salt_pos
670 static void m03100m (__local u32 s_SPtrans[8][64], __local u32 s_skb[8][64], u32 w[16], const u32 pw_len, __global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset)
// Global and local work-item ids.
676 const u32 gid = get_global_id (0);
677 const u32 lid = get_local_id (0);
// Copy salt words 0..7 of the selected salt into two private 4-word arrays.
685 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
686 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
687 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
688 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
692 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
693 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
694 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
695 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
704 const u32 salt_len = salt_bufs[salt_pos].salt_len;
// Twice the combined salt + password length; it bounds the two block loops
// below, which advance j by 8 per step.
706 const u32 salt_word_len = (salt_len + pw_len) * 2;
// switch_buffer_by_offset is defined elsewhere; presumably it moves the
// password words up by salt_len bytes so the salt fits in front - TODO confirm.
734 switch_buffer_by_offset (w0_t, w1_t, w2_t, w3_t, salt_len);
// OR the salt words into the first twelve buffer words (salt_buf2 is filled
// on lines that are not visible here).
736 w0_t[0] |= salt_buf0[0];
737 w0_t[1] |= salt_buf0[1];
738 w0_t[2] |= salt_buf0[2];
739 w0_t[3] |= salt_buf0[3];
740 w1_t[0] |= salt_buf1[0];
741 w1_t[1] |= salt_buf1[1];
742 w1_t[2] |= salt_buf1[2];
743 w1_t[3] |= salt_buf1[3];
744 w2_t[0] |= salt_buf2[0];
745 w2_t[1] |= salt_buf2[1];
746 w2_t[2] |= salt_buf2[2];
747 w2_t[3] |= salt_buf2[3];
// One candidate per entry of words_buf_r.
778 for (u32 il_pos = 0; il_pos < bfs_cnt; il_pos++)
780 const u32 w0r = words_buf_r[il_pos];
// w0l is set on a line that is not visible here.
782 const u32 w0 = w0l | w0r;
// Merge the candidate word into dst via overwrite_at, selected by salt_len.
784 overwrite_at (dst, w0, salt_len);
787 * precompute key1 since key is static: 0x0123456789abcdef
788 * plus LEFT_ROTATE by 2
830 * key1 (generate key)
// First pass: one _des_crypt_encrypt call per dst word.
838 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
// Spread the four bytes of dst[k] over data[0] and data[1]: each byte lands in
// the upper byte of a 16-bit half and the lower byte of that half stays zero.
842 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
843 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
848 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
852 * key2 (generate hash)
// Build a new Kc / Kd schedule from the iv left by the first pass.
855 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
// Second pass over the same dst words with the new schedule.
860 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
864 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
865 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
870 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
// r0 and r1 are presumably consumed by comparison code that follows on lines
// not visible here - TODO confirm.
877 const u32 r0 = iv[0];
878 const u32 r1 = iv[1];
// m03100s: per-work-item worker with the same visible structure as m03100m,
// plus a search[] array holding the four digest words at digests_offset.
// Many lines of the body (declarations, the final comparison) are not visible
// in this view; its callers are also outside the visible lines.
// Parameters read on the visible lines:
//   s_SPtrans, s_skb - __local lookup tables
//   pw_len           - candidate length, combined with salt_len below
//   words_buf_r      - per-candidate words, one per loop step (bfs_cnt entries)
//   salt_bufs        - salt records, indexed by salt_pos
//   digests_buf      - digest records, indexed by digests_offset
886 static void m03100s (__local u32 s_SPtrans[8][64], __local u32 s_skb[8][64], u32 w[16], const u32 pw_len, __global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset)
// Global and local work-item ids.
892 const u32 gid = get_global_id (0);
893 const u32 lid = get_local_id (0);
// Copy salt words 0..7 of the selected salt into two private 4-word arrays.
901 salt_buf0[0] = salt_bufs[salt_pos].salt_buf[0];
902 salt_buf0[1] = salt_bufs[salt_pos].salt_buf[1];
903 salt_buf0[2] = salt_bufs[salt_pos].salt_buf[2];
904 salt_buf0[3] = salt_bufs[salt_pos].salt_buf[3];
908 salt_buf1[0] = salt_bufs[salt_pos].salt_buf[4];
909 salt_buf1[1] = salt_bufs[salt_pos].salt_buf[5];
910 salt_buf1[2] = salt_bufs[salt_pos].salt_buf[6];
911 salt_buf1[3] = salt_bufs[salt_pos].salt_buf[7];
920 const u32 salt_len = salt_bufs[salt_pos].salt_len;
// Twice the combined salt + password length; it bounds the two block loops
// below, which advance j by 8 per step.
922 const u32 salt_word_len = (salt_len + pw_len) * 2;
// switch_buffer_by_offset is defined elsewhere; presumably it moves the
// password words up by salt_len bytes so the salt fits in front - TODO confirm.
950 switch_buffer_by_offset (w0_t, w1_t, w2_t, w3_t, salt_len);
// OR the salt words into the first twelve buffer words (salt_buf2 is filled
// on lines that are not visible here).
952 w0_t[0] |= salt_buf0[0];
953 w0_t[1] |= salt_buf0[1];
954 w0_t[2] |= salt_buf0[2];
955 w0_t[3] |= salt_buf0[3];
956 w1_t[0] |= salt_buf1[0];
957 w1_t[1] |= salt_buf1[1];
958 w1_t[2] |= salt_buf1[2];
959 w1_t[3] |= salt_buf1[3];
960 w2_t[0] |= salt_buf2[0];
961 w2_t[1] |= salt_buf2[1];
962 w2_t[2] |= salt_buf2[2];
963 w2_t[3] |= salt_buf2[3];
// The four digest words of the entry at digests_offset.
992 const u32 search[4] =
994 digests_buf[digests_offset].digest_buf[DGST_R0],
995 digests_buf[digests_offset].digest_buf[DGST_R1],
996 digests_buf[digests_offset].digest_buf[DGST_R2],
997 digests_buf[digests_offset].digest_buf[DGST_R3]
// One candidate per entry of words_buf_r.
1006 for (u32 il_pos = 0; il_pos < bfs_cnt; il_pos++)
1008 const u32 w0r = words_buf_r[il_pos];
// w0l is set on a line that is not visible here.
1010 const u32 w0 = w0l | w0r;
// Merge the candidate word into dst via overwrite_at, selected by salt_len.
1012 overwrite_at (dst, w0, salt_len);
1015 * precompute key1 since key is static: 0x0123456789abcdef
1016 * plus LEFT_ROTATE by 2
// Hard-coded Kc[] values for the first pass (see the note on the static key
// just above).
1021 Kc[ 0] = 0x64649040;
1022 Kc[ 1] = 0x14909858;
1023 Kc[ 2] = 0xc4b44888;
1024 Kc[ 3] = 0x9094e438;
1025 Kc[ 4] = 0xd8a004f0;
1026 Kc[ 5] = 0xa8f02810;
1027 Kc[ 6] = 0xc84048d8;
1028 Kc[ 7] = 0x68d804a8;
1029 Kc[ 8] = 0x0490e40c;
1030 Kc[ 9] = 0xac183024;
1031 Kc[10] = 0x24c07c10;
1032 Kc[11] = 0x8c88c038;
1033 Kc[12] = 0xc048c824;
1034 Kc[13] = 0x4c0470a8;
1035 Kc[14] = 0x584020b4;
1036 Kc[15] = 0x00742c4c;
// Hard-coded Kd[] values for the first pass.
1040 Kd[ 0] = 0xa42ce40c;
1041 Kd[ 1] = 0x64689858;
1042 Kd[ 2] = 0x484050b8;
1043 Kd[ 3] = 0xe8184814;
1044 Kd[ 4] = 0x405cc070;
1045 Kd[ 5] = 0xa010784c;
1046 Kd[ 6] = 0x6074a800;
1047 Kd[ 7] = 0x80701c1c;
1048 Kd[ 8] = 0x9cd49430;
1049 Kd[ 9] = 0x4c8ce078;
1050 Kd[10] = 0x5c18c088;
1051 Kd[11] = 0x28a8a4c8;
1052 Kd[12] = 0x3c180838;
1053 Kd[13] = 0xb0b86c20;
1054 Kd[14] = 0xac84a094;
1055 Kd[15] = 0x4ce0c0c4;
1058 * key1 (generate key)
// First pass: one _des_crypt_encrypt call per dst word.
1066 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
// Spread the four bytes of dst[k] over data[0] and data[1]: each byte lands in
// the upper byte of a 16-bit half and the lower byte of that half stays zero.
1070 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
1071 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
1076 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
1080 * key2 (generate hash)
// Build a new Kc / Kd schedule from the iv left by the first pass.
1083 _des_crypt_keysetup (iv[0], iv[1], Kc, Kd, s_skb);
// Second pass over the same dst words with the new schedule.
1088 for (u32 j = 0, k = 0; j < salt_word_len; j += 8, k++)
1092 data[0] = ((dst[k] << 16) & 0xff000000) | ((dst[k] << 8) & 0x0000ff00);
1093 data[1] = ((dst[k] >> 0) & 0xff000000) | ((dst[k] >> 8) & 0x0000ff00);
1098 _des_crypt_encrypt (iv, data, Kc, Kd, s_SPtrans);
// r0 and r1 are presumably compared against search[] by code on lines that
// are not visible here - TODO confirm.
1105 const u32 r0 = iv[0];
1106 const u32 r1 = iv[1];
// m03100_m04: kernel entry point with a required work-group size of 64 x 1 x 1.
// It stages the two lookup tables in __local memory, loads this work-item's
// candidate words and hands over to m03100m. Parts of the body are not
// visible in this view.
1114 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m03100_m04 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Work-group-local copies of the two constant tables.
1116 __local u32 s_SPtrans[8][64];
1118 __local u32 s_skb[8][64];
1124 const u32 gid = get_global_id (0);
1125 const u32 lid = get_local_id (0);
// Load the first four candidate words of this work-item (how the remaining
// entries of w are set is not visible here).
// NOTE(review): pws[gid] is read before the gid_max check further down -
// confirm the buffer is large enough for work-items with gid >= gid_max.
1129 w[ 0] = pws[gid].i[ 0];
1130 w[ 1] = pws[gid].i[ 1];
1131 w[ 2] = pws[gid].i[ 2];
1132 w[ 3] = pws[gid].i[ 3];
1146 const u32 pw_len = pws[gid].pw_len;
// Each of the 64 work-items copies column lid of every row, so together the
// group fills both 8 x 64 tables.
1152 s_SPtrans[0][lid] = c_SPtrans[0][lid];
1153 s_SPtrans[1][lid] = c_SPtrans[1][lid];
1154 s_SPtrans[2][lid] = c_SPtrans[2][lid];
1155 s_SPtrans[3][lid] = c_SPtrans[3][lid];
1156 s_SPtrans[4][lid] = c_SPtrans[4][lid];
1157 s_SPtrans[5][lid] = c_SPtrans[5][lid];
1158 s_SPtrans[6][lid] = c_SPtrans[6][lid];
1159 s_SPtrans[7][lid] = c_SPtrans[7][lid];
1161 s_skb[0][lid] = c_skb[0][lid];
1162 s_skb[1][lid] = c_skb[1][lid];
1163 s_skb[2][lid] = c_skb[2][lid];
1164 s_skb[3][lid] = c_skb[3][lid];
1165 s_skb[4][lid] = c_skb[4][lid];
1166 s_skb[5][lid] = c_skb[5][lid];
1167 s_skb[6][lid] = c_skb[6][lid];
1168 s_skb[7][lid] = c_skb[7][lid];
// Wait until every work-item of the group has written its table columns.
1170 barrier (CLK_LOCAL_MEM_FENCE);
// Surplus work-items leave only after the barrier, so all of them reach it.
1172 if (gid >= gid_max) return;
// Hand over to the worker; combs_mode and gid_max are not forwarded.
1178 m03100m (s_SPtrans, s_skb, w, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
// m03100_m08: kernel entry point with a required work-group size of 64 x 1 x 1.
// Same visible structure as m03100_m04, except that eight candidate words
// (w[0..7]) are loaded from pws[gid] before handing over to m03100m. Parts of
// the body are not visible in this view.
1181 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m03100_m08 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
// Work-group-local copies of the two constant tables.
1183 __local u32 s_SPtrans[8][64];
1185 __local u32 s_skb[8][64];
1191 const u32 gid = get_global_id (0);
1192 const u32 lid = get_local_id (0);
// Load the first eight candidate words of this work-item (how the remaining
// entries of w are set is not visible here).
// NOTE(review): pws[gid] is read before the gid_max check further down -
// confirm the buffer is large enough for work-items with gid >= gid_max.
1196 w[ 0] = pws[gid].i[ 0];
1197 w[ 1] = pws[gid].i[ 1];
1198 w[ 2] = pws[gid].i[ 2];
1199 w[ 3] = pws[gid].i[ 3];
1200 w[ 4] = pws[gid].i[ 4];
1201 w[ 5] = pws[gid].i[ 5];
1202 w[ 6] = pws[gid].i[ 6];
1203 w[ 7] = pws[gid].i[ 7];
1213 const u32 pw_len = pws[gid].pw_len;
// Each of the 64 work-items copies column lid of every row, so together the
// group fills both 8 x 64 tables.
1219 s_SPtrans[0][lid] = c_SPtrans[0][lid];
1220 s_SPtrans[1][lid] = c_SPtrans[1][lid];
1221 s_SPtrans[2][lid] = c_SPtrans[2][lid];
1222 s_SPtrans[3][lid] = c_SPtrans[3][lid];
1223 s_SPtrans[4][lid] = c_SPtrans[4][lid];
1224 s_SPtrans[5][lid] = c_SPtrans[5][lid];
1225 s_SPtrans[6][lid] = c_SPtrans[6][lid];
1226 s_SPtrans[7][lid] = c_SPtrans[7][lid];
1228 s_skb[0][lid] = c_skb[0][lid];
1229 s_skb[1][lid] = c_skb[1][lid];
1230 s_skb[2][lid] = c_skb[2][lid];
1231 s_skb[3][lid] = c_skb[3][lid];
1232 s_skb[4][lid] = c_skb[4][lid];
1233 s_skb[5][lid] = c_skb[5][lid];
1234 s_skb[6][lid] = c_skb[6][lid];
1235 s_skb[7][lid] = c_skb[7][lid];
// Wait until every work-item of the group has written its table columns.
1237 barrier (CLK_LOCAL_MEM_FENCE);
// Surplus work-items leave only after the barrier, so all of them reach it.
1239 if (gid >= gid_max) return;
// Hand over to the worker; combs_mode and gid_max are not forwarded.
1245 m03100m (s_SPtrans, s_skb, w, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
/*
 * m03100_m16: kernel entry point, declared with a required work-group size
 * of 64 x 1 x 1.
 * NOTE(review): no statements follow this signature before the next kernel;
 * presumably an intentionally empty stub - confirm.
 */
1248 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m03100_m16 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/*
 * m03100_s04: kernel entry point, declared with a required work-group size
 * of 64 x 1 x 1.
 *
 * Each work-item copies one column (index lid) of every row of c_SPtrans and
 * c_skb into work-group-local tables, reads elements 0..3 of i[] and the
 * pw_len field from its own pws entry, and then calls m03100s ().
 * combs_mode is accepted but not forwarded to m03100s (); gid_max is only
 * used for the bounds check after the barrier.
 */
1252 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m03100_s04 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Work-group-local copies of the two lookup tables; filled further down before m03100s () is called. */
1254 __local u32 s_SPtrans[8][64];
1256 __local u32 s_skb[8][64];
/* gid selects this work-item's pws entry; lid selects the table column it copies. */
1262 const u32 gid = get_global_id (0);
1263 const u32 lid = get_local_id (0);
/* Only elements 0..3 of the pws entry's i[] array are read by this variant. */
1267 w[ 0] = pws[gid].i[ 0];
1268 w[ 1] = pws[gid].i[ 1];
1269 w[ 2] = pws[gid].i[ 2];
1270 w[ 3] = pws[gid].i[ 3];
1284 const u32 pw_len = pws[gid].pw_len;
/*
 * One column per work-item: the required work-group size of 64 matches the
 * 64 columns, so the group as a whole fills all 8 x 64 entries of each table.
 */
1290 s_SPtrans[0][lid] = c_SPtrans[0][lid];
1291 s_SPtrans[1][lid] = c_SPtrans[1][lid];
1292 s_SPtrans[2][lid] = c_SPtrans[2][lid];
1293 s_SPtrans[3][lid] = c_SPtrans[3][lid];
1294 s_SPtrans[4][lid] = c_SPtrans[4][lid];
1295 s_SPtrans[5][lid] = c_SPtrans[5][lid];
1296 s_SPtrans[6][lid] = c_SPtrans[6][lid];
1297 s_SPtrans[7][lid] = c_SPtrans[7][lid];
1299 s_skb[0][lid] = c_skb[0][lid];
1300 s_skb[1][lid] = c_skb[1][lid];
1301 s_skb[2][lid] = c_skb[2][lid];
1302 s_skb[3][lid] = c_skb[3][lid];
1303 s_skb[4][lid] = c_skb[4][lid];
1304 s_skb[5][lid] = c_skb[5][lid];
1305 s_skb[6][lid] = c_skb[6][lid];
1306 s_skb[7][lid] = c_skb[7][lid];
/* Work-group barrier with a local-memory fence: the table copies above must be complete before any work-item goes on to use them. */
1308 barrier (CLK_LOCAL_MEM_FENCE);
/*
 * The bounds check comes after the barrier, so work-items with
 * gid >= gid_max still take part in the table copy and reach the barrier.
 * NOTE(review): pws[gid] has already been read above for those work-items;
 * presumably the pws buffer covers the whole launch - confirm.
 */
1310 if (gid >= gid_max) return;
/* All kernel parameters except combs_mode and gid_max are forwarded, after the local tables, w and pw_len. */
1316 m03100s (s_SPtrans, s_skb, w, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
/*
 * m03100_s08: kernel entry point, declared with a required work-group size
 * of 64 x 1 x 1.
 *
 * Each work-item copies one column (index lid) of every row of c_SPtrans and
 * c_skb into work-group-local tables, reads elements 0..7 of i[] and the
 * pw_len field from its own pws entry, and then calls m03100s ().
 * combs_mode is accepted but not forwarded to m03100s (); gid_max is only
 * used for the bounds check after the barrier.
 */
1319 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m03100_s08 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
/* Work-group-local copies of the two lookup tables; filled further down before m03100s () is called. */
1321 __local u32 s_SPtrans[8][64];
1323 __local u32 s_skb[8][64];
/* gid selects this work-item's pws entry; lid selects the table column it copies. */
1329 const u32 gid = get_global_id (0);
1330 const u32 lid = get_local_id (0);
/* Elements 0..7 of the pws entry's i[] array are copied into w. */
1334 w[ 0] = pws[gid].i[ 0];
1335 w[ 1] = pws[gid].i[ 1];
1336 w[ 2] = pws[gid].i[ 2];
1337 w[ 3] = pws[gid].i[ 3];
1338 w[ 4] = pws[gid].i[ 4];
1339 w[ 5] = pws[gid].i[ 5];
1340 w[ 6] = pws[gid].i[ 6];
1341 w[ 7] = pws[gid].i[ 7];
1351 const u32 pw_len = pws[gid].pw_len;
/*
 * One column per work-item: the required work-group size of 64 matches the
 * 64 columns, so the group as a whole fills all 8 x 64 entries of each table.
 */
1357 s_SPtrans[0][lid] = c_SPtrans[0][lid];
1358 s_SPtrans[1][lid] = c_SPtrans[1][lid];
1359 s_SPtrans[2][lid] = c_SPtrans[2][lid];
1360 s_SPtrans[3][lid] = c_SPtrans[3][lid];
1361 s_SPtrans[4][lid] = c_SPtrans[4][lid];
1362 s_SPtrans[5][lid] = c_SPtrans[5][lid];
1363 s_SPtrans[6][lid] = c_SPtrans[6][lid];
1364 s_SPtrans[7][lid] = c_SPtrans[7][lid];
1366 s_skb[0][lid] = c_skb[0][lid];
1367 s_skb[1][lid] = c_skb[1][lid];
1368 s_skb[2][lid] = c_skb[2][lid];
1369 s_skb[3][lid] = c_skb[3][lid];
1370 s_skb[4][lid] = c_skb[4][lid];
1371 s_skb[5][lid] = c_skb[5][lid];
1372 s_skb[6][lid] = c_skb[6][lid];
1373 s_skb[7][lid] = c_skb[7][lid];
/* Work-group barrier with a local-memory fence: the table copies above must be complete before any work-item goes on to use them. */
1375 barrier (CLK_LOCAL_MEM_FENCE);
/*
 * The bounds check comes after the barrier, so work-items with
 * gid >= gid_max still take part in the table copy and reach the barrier.
 * NOTE(review): pws[gid] has already been read above for those work-items;
 * presumably the pws buffer covers the whole launch - confirm.
 */
1377 if (gid >= gid_max) return;
/* All kernel parameters except combs_mode and gid_max are forwarded, after the local tables, w and pw_len. */
1383 m03100s (s_SPtrans, s_skb, w, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_scryptV_buf, bitmap_mask, bitmap_shift1, bitmap_shift2, salt_pos, loop_pos, loop_cnt, bfs_cnt, digests_cnt, digests_offset);
1386 __kernel void __attribute__((reqd_work_group_size (64, 1, 1))) m03100_s16 (__global pw_t *pws, __global gpu_rule_t *rules_buf, __global comb_t *combs_buf, __constant u32 * words_buf_r, __global void *tmps, __global void *hooks, __global u32 *bitmaps_buf_s1_a, __global u32 *bitmaps_buf_s1_b, __global u32 *bitmaps_buf_s1_c, __global u32 *bitmaps_buf_s1_d, __global u32 *bitmaps_buf_s2_a, __global u32 *bitmaps_buf_s2_b, __global u32 *bitmaps_buf_s2_c, __global u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global digest_t *digests_buf, __global u32 *hashes_shown, __global salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 bfs_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)