/**
 * Author......: See docs/credits.txt
 * License.....: MIT
 */

#include "inc_vendor.cl"
#include "inc_hash_constants.h"
#include "inc_hash_functions.cl"
#include "inc_types.cl"
#include "inc_common.cl"
#include "inc_hash_sha256.cl"

/**
 * Merge the 32-bit word `append` into the 64-byte block w0..w3 at byte
 * offset (len & 63) and account for an 8-byte advance of the stream.
 *
 * The word that contains the offset is OR-ed with the leading part of
 * `append`; the following word is overwritten with the trailing part (which
 * is zero when the offset is word-aligned). Only `append` is stored here; the
 * rest of the 8-byte advance is whatever the block already holds.
 *
 * If the offset plus 8 reaches or passes 64, the block is run through
 * sha256_transform() into `digest`, then reset to all zeros except w0[0],
 * which receives the part of `append` that spilled past word 15 (if any).
 *
 * The caller is responsible for adding 8 to its own length counter; this
 * function does not modify `len`.
 */
void memcat8c_be (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 len, const u32 append, u32 digest[8])
{
  const u32 func_len = len & 63;   // byte offset inside the current block

  const u32 div = func_len / 4;    // index of the word holding that offset

  u32 tmp0;
  u32 tmp1;

  #ifdef IS_NV
  const int selector = (0x76543210 >> ((func_len & 3) * 4)) & 0xffff;

  tmp0 = __byte_perm (append, 0, selector);
  tmp1 = __byte_perm (0, append, selector);
  #endif

  #if defined IS_AMD || defined IS_GENERIC
  tmp0 = amd_bytealign (0, append, func_len);
  tmp1 = amd_bytealign (append, 0, func_len);
  #endif

  // Only set when the trailing part falls outside of this block (div == 15).
  u32 carry = 0;

  switch (div)
  {
    case  0:  w0[0] |= tmp0;
              w0[1]  = tmp1;
              break;
    case  1:  w0[1] |= tmp0;
              w0[2]  = tmp1;
              break;
    case  2:  w0[2] |= tmp0;
              w0[3]  = tmp1;
              break;
    case  3:  w0[3] |= tmp0;
              w1[0]  = tmp1;
              break;
    case  4:  w1[0] |= tmp0;
              w1[1]  = tmp1;
              break;
    case  5:  w1[1] |= tmp0;
              w1[2]  = tmp1;
              break;
    case  6:  w1[2] |= tmp0;
              w1[3]  = tmp1;
              break;
    case  7:  w1[3] |= tmp0;
              w2[0]  = tmp1;
              break;
    case  8:  w2[0] |= tmp0;
              w2[1]  = tmp1;
              break;
    case  9:  w2[1] |= tmp0;
              w2[2]  = tmp1;
              break;
    case 10:  w2[2] |= tmp0;
              w2[3]  = tmp1;
              break;
    case 11:  w2[3] |= tmp0;
              w3[0]  = tmp1;
              break;
    case 12:  w3[0] |= tmp0;
              w3[1]  = tmp1;
              break;
    case 13:  w3[1] |= tmp0;
              w3[2]  = tmp1;
              break;
    case 14:  w3[2] |= tmp0;
              w3[3]  = tmp1;
              break;
    case 15:  w3[3] |= tmp0;
              carry  = tmp1;
              break;
  }

  const u32 new_len = func_len + 8;

  if (new_len >= 64)
  {
    sha256_transform (w0, w1, w2, w3, digest);

    // Start the next block: spilled bytes first, everything else cleared.
    w0[0] = carry;
    w0[1] = 0;
    w0[2] = 0;
    w0[3] = 0;
    w1[0] = 0;
    w1[1] = 0;
    w1[2] = 0;
    w1[3] = 0;
    w2[0] = 0;
    w2[1] = 0;
    w2[2] = 0;
    w2[3] = 0;
    w3[0] = 0;
    w3[1] = 0;
    w3[2] = 0;
    w3[3] = 0;
  }
}

/**
 * Init kernel: initialise a SHA-256 context with sha256_init() and store it
 * in tmps[gid] so that the loop kernel can continue from it.
 */
__kernel void m11600_init (__global pw_t *pws, __global const kernel_rule_t *rules_buf, __global const pw_t *combs_buf, __global const bf_t *bfs_buf, __global seven_zip_tmp_t *tmps, __global seven_zip_hook_t *seven_zip_hook, __global const u32 *bitmaps_buf_s1_a, __global const u32 *bitmaps_buf_s1_b, __global const u32 *bitmaps_buf_s1_c, __global const u32 *bitmaps_buf_s1_d, __global const u32 *bitmaps_buf_s2_a, __global const u32 *bitmaps_buf_s2_b, __global const u32 *bitmaps_buf_s2_c, __global const u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global const digest_t *digests_buf, __global u32 *hashes_shown, __global const salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
{
  /**
   * base
   */

  const u32 gid = get_global_id (0);

  if (gid >= gid_max) return;

  /**
   * context save
   */

  sha256_ctx_t ctx;

  sha256_init (&ctx);

  tmps[gid].h[0] = ctx.h[0];
  tmps[gid].h[1] = ctx.h[1];
  tmps[gid].h[2] = ctx.h[2];
  tmps[gid].h[3] = ctx.h[3];
  tmps[gid].h[4] = ctx.h[4];
  tmps[gid].h[5] = ctx.h[5];
  tmps[gid].h[6] = ctx.h[6];
  tmps[gid].h[7] = ctx.h[7];

  tmps[gid].w0[0] = ctx.w0[0];
  tmps[gid].w0[1] = ctx.w0[1];
  tmps[gid].w0[2] = ctx.w0[2];
  tmps[gid].w0[3] = ctx.w0[3];
  tmps[gid].w1[0] = ctx.w1[0];
  tmps[gid].w1[1] = ctx.w1[1];
  tmps[gid].w1[2] = ctx.w1[2];
  tmps[gid].w1[3] = ctx.w1[3];
  tmps[gid].w2[0] = ctx.w2[0];
  tmps[gid].w2[1] = ctx.w2[1];
  tmps[gid].w2[2] = ctx.w2[2];
  tmps[gid].w2[3] = ctx.w2[3];
  tmps[gid].w3[0] = ctx.w3[0];
  tmps[gid].w3[1] = ctx.w3[1];
  tmps[gid].w3[2] = ctx.w3[2];
  tmps[gid].w3[3] = ctx.w3[3];

  tmps[gid].len = ctx.len;
}

/**
 * Loop kernel: resume the SHA-256 context stored in tmps[gid], and for each
 * of the loop_cnt iterations feed the password through
 * sha256_update_utf16le_swap() followed by an 8-byte counter slot whose
 * stored word is swap32_S (loop_pos + i). The updated context is written
 * back to tmps[gid].
 */
__kernel void m11600_loop (__global pw_t *pws, __global const kernel_rule_t *rules_buf, __global const pw_t *combs_buf, __global const bf_t *bfs_buf, __global seven_zip_tmp_t *tmps, __global seven_zip_hook_t *seven_zip_hook, __global const u32 *bitmaps_buf_s1_a, __global const u32 *bitmaps_buf_s1_b, __global const u32 *bitmaps_buf_s1_c, __global const u32 *bitmaps_buf_s1_d, __global const u32 *bitmaps_buf_s2_a, __global const u32 *bitmaps_buf_s2_b, __global const u32 *bitmaps_buf_s2_c, __global const u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global const digest_t *digests_buf, __global u32 *hashes_shown, __global const salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
{
  /**
   * base
   */

  const u32 gid = get_global_id (0);

  if (gid >= gid_max) return;

  const u32 pw_len = pws[gid].pw_len;

  // Number of 32-bit words needed to hold pw_len bytes (integer round-up).
  const u32 pw_lenv = (pw_len + 3) / 4;

  // NOTE(review): assumes pw_len <= 256 so that `w` is not overrun --
  // confirm against the size of pw_t.i.
  u32 w[64] = { 0 };

  // No barrier in this loop: the trip count differs per work-item and some
  // work-items have already returned above, so a barrier here would not be
  // reached uniformly by the work-group. Each work-item only touches its own
  // pws[gid] entry, so no synchronisation is needed.
  for (u32 idx = 0; idx < pw_lenv; idx++)
  {
    w[idx] = pws[gid].i[idx];
  }

  /**
   * context load
   */

  sha256_ctx_t ctx;

  ctx.h[0] = tmps[gid].h[0];
  ctx.h[1] = tmps[gid].h[1];
  ctx.h[2] = tmps[gid].h[2];
  ctx.h[3] = tmps[gid].h[3];
  ctx.h[4] = tmps[gid].h[4];
  ctx.h[5] = tmps[gid].h[5];
  ctx.h[6] = tmps[gid].h[6];
  ctx.h[7] = tmps[gid].h[7];

  ctx.w0[0] = tmps[gid].w0[0];
  ctx.w0[1] = tmps[gid].w0[1];
  ctx.w0[2] = tmps[gid].w0[2];
  ctx.w0[3] = tmps[gid].w0[3];
  ctx.w1[0] = tmps[gid].w1[0];
  ctx.w1[1] = tmps[gid].w1[1];
  ctx.w1[2] = tmps[gid].w1[2];
  ctx.w1[3] = tmps[gid].w1[3];
  ctx.w2[0] = tmps[gid].w2[0];
  ctx.w2[1] = tmps[gid].w2[1];
  ctx.w2[2] = tmps[gid].w2[2];
  ctx.w2[3] = tmps[gid].w2[3];
  ctx.w3[0] = tmps[gid].w3[0];
  ctx.w3[1] = tmps[gid].w3[1];
  ctx.w3[2] = tmps[gid].w3[2];
  ctx.w3[3] = tmps[gid].w3[3];

  ctx.len = tmps[gid].len;

  /**
   * base
   */

  for (u32 i = 0, j = loop_pos; i < loop_cnt; i++, j++)
  {
    sha256_update_utf16le_swap (&ctx, w, pw_len);

    memcat8c_be (ctx.w0, ctx.w1, ctx.w2, ctx.w3, ctx.len, swap32_S (j), ctx.h);

    // memcat8c_be() does not update the length itself.
    ctx.len += 8;
  }

  /**
   * context save
   */

  tmps[gid].h[0] = ctx.h[0];
  tmps[gid].h[1] = ctx.h[1];
  tmps[gid].h[2] = ctx.h[2];
  tmps[gid].h[3] = ctx.h[3];
  tmps[gid].h[4] = ctx.h[4];
  tmps[gid].h[5] = ctx.h[5];
  tmps[gid].h[6] = ctx.h[6];
  tmps[gid].h[7] = ctx.h[7];

  tmps[gid].w0[0] = ctx.w0[0];
  tmps[gid].w0[1] = ctx.w0[1];
  tmps[gid].w0[2] = ctx.w0[2];
  tmps[gid].w0[3] = ctx.w0[3];
  tmps[gid].w1[0] = ctx.w1[0];
  tmps[gid].w1[1] = ctx.w1[1];
  tmps[gid].w1[2] = ctx.w1[2];
  tmps[gid].w1[3] = ctx.w1[3];
  tmps[gid].w2[0] = ctx.w2[0];
  tmps[gid].w2[1] = ctx.w2[1];
  tmps[gid].w2[2] = ctx.w2[2];
  tmps[gid].w2[3] = ctx.w2[3];
  tmps[gid].w3[0] = ctx.w3[0];
  tmps[gid].w3[1] = ctx.w3[1];
  tmps[gid].w3[2] = ctx.w3[2];
  tmps[gid].w3[3] = ctx.w3[3];

  tmps[gid].len = ctx.len;
}

/**
 * Hook kernel: load the SHA-256 context from tmps[gid], finalise it with
 * sha256_final() and store the eight digest words, each passed through
 * swap32(), into seven_zip_hook[gid].ukey.
 */
__kernel void m11600_hook23 (__global pw_t *pws, __global const kernel_rule_t *rules_buf, __global const pw_t *combs_buf, __global const bf_t *bfs_buf, __global seven_zip_tmp_t *tmps, __global seven_zip_hook_t *seven_zip_hook, __global const u32 *bitmaps_buf_s1_a, __global const u32 *bitmaps_buf_s1_b, __global const u32 *bitmaps_buf_s1_c, __global const u32 *bitmaps_buf_s1_d, __global const u32 *bitmaps_buf_s2_a, __global const u32 *bitmaps_buf_s2_b, __global const u32 *bitmaps_buf_s2_c, __global const u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global const digest_t *digests_buf, __global u32 *hashes_shown, __global const salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
{
  const u32 gid = get_global_id (0);

  if (gid >= gid_max) return;

  /**
   * context load
   */

  sha256_ctx_t ctx;

  ctx.h[0] = tmps[gid].h[0];
  ctx.h[1] = tmps[gid].h[1];
  ctx.h[2] = tmps[gid].h[2];
  ctx.h[3] = tmps[gid].h[3];
  ctx.h[4] = tmps[gid].h[4];
  ctx.h[5] = tmps[gid].h[5];
  ctx.h[6] = tmps[gid].h[6];
  ctx.h[7] = tmps[gid].h[7];

  ctx.w0[0] = tmps[gid].w0[0];
  ctx.w0[1] = tmps[gid].w0[1];
  ctx.w0[2] = tmps[gid].w0[2];
  ctx.w0[3] = tmps[gid].w0[3];
  ctx.w1[0] = tmps[gid].w1[0];
  ctx.w1[1] = tmps[gid].w1[1];
  ctx.w1[2] = tmps[gid].w1[2];
  ctx.w1[3] = tmps[gid].w1[3];
  ctx.w2[0] = tmps[gid].w2[0];
  ctx.w2[1] = tmps[gid].w2[1];
  ctx.w2[2] = tmps[gid].w2[2];
  ctx.w2[3] = tmps[gid].w2[3];
  ctx.w3[0] = tmps[gid].w3[0];
  ctx.w3[1] = tmps[gid].w3[1];
  ctx.w3[2] = tmps[gid].w3[2];
  ctx.w3[3] = tmps[gid].w3[3];

  ctx.len = tmps[gid].len;

  sha256_final (&ctx);

  seven_zip_hook[gid].ukey[0] = swap32 (ctx.h[0]);
  seven_zip_hook[gid].ukey[1] = swap32 (ctx.h[1]);
  seven_zip_hook[gid].ukey[2] = swap32 (ctx.h[2]);
  seven_zip_hook[gid].ukey[3] = swap32 (ctx.h[3]);
  seven_zip_hook[gid].ukey[4] = swap32 (ctx.h[4]);
  seven_zip_hook[gid].ukey[5] = swap32 (ctx.h[5]);
  seven_zip_hook[gid].ukey[6] = swap32 (ctx.h[6]);
  seven_zip_hook[gid].ukey[7] = swap32 (ctx.h[7]);
}

/**
 * Compare kernel: if seven_zip_hook[gid].hook_success is 1, report the
 * candidate through mark_hash(). The atomic increment of
 * hashes_shown[digests_offset] lets only the first work-item that sees a
 * zero counter do the reporting.
 */
__kernel void m11600_comp (__global pw_t *pws, __global const kernel_rule_t *rules_buf, __global const pw_t *combs_buf, __global const bf_t *bfs_buf, __global seven_zip_tmp_t *tmps, __global seven_zip_hook_t *seven_zip_hook, __global const u32 *bitmaps_buf_s1_a, __global const u32 *bitmaps_buf_s1_b, __global const u32 *bitmaps_buf_s1_c, __global const u32 *bitmaps_buf_s1_d, __global const u32 *bitmaps_buf_s2_a, __global const u32 *bitmaps_buf_s2_b, __global const u32 *bitmaps_buf_s2_c, __global const u32 *bitmaps_buf_s2_d, __global plain_t *plains_buf, __global const digest_t *digests_buf, __global u32 *hashes_shown, __global const salt_t *salt_bufs, __global void *esalt_bufs, __global u32 *d_return_buf, __global u32 *d_scryptV0_buf, __global u32 *d_scryptV1_buf, __global u32 *d_scryptV2_buf, __global u32 *d_scryptV3_buf, const u32 bitmap_mask, const u32 bitmap_shift1, const u32 bitmap_shift2, const u32 salt_pos, const u32 loop_pos, const u32 loop_cnt, const u32 il_cnt, const u32 digests_cnt, const u32 digests_offset, const u32 combs_mode, const u32 gid_max)
{
  /**
   * base
   */

  const u32 gid = get_global_id (0);

  if (gid >= gid_max) return;

  if (seven_zip_hook[gid].hook_success == 1)
  {
    if (atomic_inc (&hashes_shown[digests_offset]) == 0)
    {
      mark_hash (plains_buf, d_return_buf, salt_pos, digests_cnt, 0, digests_offset + 0, gid, 0);
    }
  }
}