/** * Author......: See docs/credits.txt * License.....: MIT */ #define NEW_SIMD_CODE #ifdef KERNEL_STATIC #include M2S(INCLUDE_PATH/inc_vendor.h) #include M2S(INCLUDE_PATH/inc_types.h) #include M2S(INCLUDE_PATH/inc_platform.cl) #include M2S(INCLUDE_PATH/inc_common.cl) #include M2S(INCLUDE_PATH/inc_simd.cl) #include M2S(INCLUDE_PATH/inc_hash_md5.cl) #endif #if VECT_SIZE == 1 #define uint_to_hex_lower8(i) make_u32x (l_bin2asc[(i)]) #elif VECT_SIZE == 2 #define uint_to_hex_lower8(i) make_u32x (l_bin2asc[(i).s0], l_bin2asc[(i).s1]) #elif VECT_SIZE == 4 #define uint_to_hex_lower8(i) make_u32x (l_bin2asc[(i).s0], l_bin2asc[(i).s1], l_bin2asc[(i).s2], l_bin2asc[(i).s3]) #elif VECT_SIZE == 8 #define uint_to_hex_lower8(i) make_u32x (l_bin2asc[(i).s0], l_bin2asc[(i).s1], l_bin2asc[(i).s2], l_bin2asc[(i).s3], l_bin2asc[(i).s4], l_bin2asc[(i).s5], l_bin2asc[(i).s6], l_bin2asc[(i).s7]) #elif VECT_SIZE == 16 #define uint_to_hex_lower8(i) make_u32x (l_bin2asc[(i).s0], l_bin2asc[(i).s1], l_bin2asc[(i).s2], l_bin2asc[(i).s3], l_bin2asc[(i).s4], l_bin2asc[(i).s5], l_bin2asc[(i).s6], l_bin2asc[(i).s7], l_bin2asc[(i).s8], l_bin2asc[(i).s9], l_bin2asc[(i).sa], l_bin2asc[(i).sb], l_bin2asc[(i).sc], l_bin2asc[(i).sd], l_bin2asc[(i).se], l_bin2asc[(i).sf]) #endif typedef struct md5_triple_salt { u32 salt1_buf[64]; int salt1_len; u32 salt2_buf[64]; int salt2_len; u32 salt3_buf[64]; int salt3_len; } md5_triple_salt_t; DECLSPEC void m32300m (PRIVATE_AS u32 *w0, PRIVATE_AS u32 *w1, PRIVATE_AS u32 *w2, PRIVATE_AS u32 *w3, const u32 pw_len, KERN_ATTR_FUNC_VECTOR_ESALT (md5_triple_salt_t), LOCAL_AS u32 *l_bin2asc) { /** * modifiers are taken from args */ /** * salt1 */ const u32 salt1_len = esalt_bufs[DIGESTS_OFFSET_HOST].salt1_len; u32x salt1_buf[64] = { 0 }; for (u32 i = 0, idx = 0; i < salt1_len; i += 4, idx += 1) { salt1_buf[idx] = esalt_bufs[DIGESTS_OFFSET_HOST].salt1_buf[idx]; } /** * salt2 */ const u32 salt2_len = esalt_bufs[DIGESTS_OFFSET_HOST].salt2_len; u32x salt2_buf[64] = { 0 }; for (u32 i = 0, idx = 0; i < salt2_len; i += 4, idx += 1) { salt2_buf[idx] = esalt_bufs[DIGESTS_OFFSET_HOST].salt2_buf[idx]; } /** * salt3 */ const u32 salt3_len = esalt_bufs[DIGESTS_OFFSET_HOST].salt3_len; u32x salt3_buf[64] = { 0 }; for (u32 i = 0, idx = 0; i < salt3_len; i += 4, idx += 1) { salt3_buf[idx] = esalt_bufs[DIGESTS_OFFSET_HOST].salt3_buf[idx]; } /** * loop */ u32 w0l = w0[0]; for (u32 il_pos = 0; il_pos < IL_CNT; il_pos += VECT_SIZE) { const u32x w0r = words_buf_r[il_pos / VECT_SIZE]; const u32x w0lr = w0l | w0r; u32x w0_t[4]; u32x w1_t[4]; u32x w2_t[4]; u32x w3_t[4]; w0_t[0] = w0lr; w0_t[1] = w0[1]; w0_t[2] = w0[2]; w0_t[3] = w0[3]; w1_t[0] = w1[0]; w1_t[1] = w1[1]; w1_t[2] = w1[2]; w1_t[3] = w1[3]; w2_t[0] = w2[0]; w2_t[1] = w2[1]; w2_t[2] = w2[2]; w2_t[3] = w2[3]; w3_t[0] = w3[0]; w3_t[1] = w3[1]; w3_t[2] = w3[2]; w3_t[3] = w3[3]; /** * md5 */ u32x a = MD5M_A; u32x b = MD5M_B; u32x c = MD5M_C; u32x d = MD5M_D; MD5_STEP (MD5_Fo, a, b, c, d, w0_t[0], MD5C00, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w0_t[1], MD5C01, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w0_t[2], MD5C02, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w0_t[3], MD5C03, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, w1_t[0], MD5C04, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w1_t[1], MD5C05, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w1_t[2], MD5C06, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w1_t[3], MD5C07, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, w2_t[0], MD5C08, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w2_t[1], MD5C09, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w2_t[2], MD5C0a, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w2_t[3], MD5C0b, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, w3_t[0], MD5C0c, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w3_t[1], MD5C0d, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w3_t[2], MD5C0e, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w3_t[3], MD5C0f, MD5S03); MD5_STEP (MD5_Go, a, b, c, d, w0_t[1], MD5C10, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w1_t[2], MD5C11, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w2_t[3], MD5C12, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w0_t[0], MD5C13, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, w1_t[1], MD5C14, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w2_t[2], MD5C15, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w3_t[3], MD5C16, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w1_t[0], MD5C17, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, w2_t[1], MD5C18, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w3_t[2], MD5C19, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w0_t[3], MD5C1a, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w2_t[0], MD5C1b, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, w3_t[1], MD5C1c, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w0_t[2], MD5C1d, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w1_t[3], MD5C1e, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w3_t[0], MD5C1f, MD5S13); u32x t; MD5_STEP (MD5_H1, a, b, c, d, w1_t[1], MD5C20, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w2_t[0], MD5C21, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w2_t[3], MD5C22, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w3_t[2], MD5C23, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, w0_t[1], MD5C24, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w1_t[0], MD5C25, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w1_t[3], MD5C26, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w2_t[2], MD5C27, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, w3_t[1], MD5C28, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w0_t[0], MD5C29, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w0_t[3], MD5C2a, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w1_t[2], MD5C2b, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, w2_t[1], MD5C2c, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w3_t[0], MD5C2d, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w3_t[3], MD5C2e, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w0_t[2], MD5C2f, MD5S23); MD5_STEP (MD5_I , a, b, c, d, w0_t[0], MD5C30, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w1_t[3], MD5C31, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w3_t[2], MD5C32, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w1_t[1], MD5C33, MD5S33); MD5_STEP (MD5_I , a, b, c, d, w3_t[0], MD5C34, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w0_t[3], MD5C35, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w2_t[2], MD5C36, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w0_t[1], MD5C37, MD5S33); MD5_STEP (MD5_I , a, b, c, d, w2_t[0], MD5C38, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w3_t[3], MD5C39, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w1_t[2], MD5C3a, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w3_t[1], MD5C3b, MD5S33); MD5_STEP (MD5_I , a, b, c, d, w1_t[0], MD5C3c, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w2_t[3], MD5C3d, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w0_t[2], MD5C3e, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w2_t[1], MD5C3f, MD5S33); a += make_u32x (MD5M_A); b += make_u32x (MD5M_B); c += make_u32x (MD5M_C); d += make_u32x (MD5M_D); md5_ctx_vector_t ctx; md5_init_vector (&ctx); ctx.w0[0] = uint_to_hex_lower8 ((a >> 0) & 255) << 0 | uint_to_hex_lower8 ((a >> 8) & 255) << 16; ctx.w0[1] = uint_to_hex_lower8 ((a >> 16) & 255) << 0 | uint_to_hex_lower8 ((a >> 24) & 255) << 16; ctx.w0[2] = uint_to_hex_lower8 ((b >> 0) & 255) << 0 | uint_to_hex_lower8 ((b >> 8) & 255) << 16; ctx.w0[3] = uint_to_hex_lower8 ((b >> 16) & 255) << 0 | uint_to_hex_lower8 ((b >> 24) & 255) << 16; ctx.w1[0] = uint_to_hex_lower8 ((c >> 0) & 255) << 0 | uint_to_hex_lower8 ((c >> 8) & 255) << 16; ctx.w1[1] = uint_to_hex_lower8 ((c >> 16) & 255) << 0 | uint_to_hex_lower8 ((c >> 24) & 255) << 16; ctx.w1[2] = uint_to_hex_lower8 ((d >> 0) & 255) << 0 | uint_to_hex_lower8 ((d >> 8) & 255) << 16; ctx.w1[3] = uint_to_hex_lower8 ((d >> 16) & 255) << 0 | uint_to_hex_lower8 ((d >> 24) & 255) << 16; ctx.len = 32; md5_update_vector (&ctx, salt1_buf, salt1_len); md5_final_vector (&ctx); a = ctx.h[0]; b = ctx.h[1]; c = ctx.h[2]; d = ctx.h[3]; md5_init_vector (&ctx); md5_update_vector (&ctx, salt2_buf, salt2_len); u32x ww0[4]; u32x ww1[4]; u32x ww2[4]; u32x ww3[4]; ww0[0] = uint_to_hex_lower8 ((a >> 0) & 255) << 0 | uint_to_hex_lower8 ((a >> 8) & 255) << 16; ww0[1] = uint_to_hex_lower8 ((a >> 16) & 255) << 0 | uint_to_hex_lower8 ((a >> 24) & 255) << 16; ww0[2] = uint_to_hex_lower8 ((b >> 0) & 255) << 0 | uint_to_hex_lower8 ((b >> 8) & 255) << 16; ww0[3] = uint_to_hex_lower8 ((b >> 16) & 255) << 0 | uint_to_hex_lower8 ((b >> 24) & 255) << 16; ww1[0] = uint_to_hex_lower8 ((c >> 0) & 255) << 0 | uint_to_hex_lower8 ((c >> 8) & 255) << 16; ww1[1] = uint_to_hex_lower8 ((c >> 16) & 255) << 0 | uint_to_hex_lower8 ((c >> 24) & 255) << 16; ww1[2] = uint_to_hex_lower8 ((d >> 0) & 255) << 0 | uint_to_hex_lower8 ((d >> 8) & 255) << 16; ww1[3] = uint_to_hex_lower8 ((d >> 16) & 255) << 0 | uint_to_hex_lower8 ((d >> 24) & 255) << 16; ww2[0] = 0; ww2[1] = 0; ww2[2] = 0; ww2[3] = 0; ww3[0] = 0; ww3[1] = 0; ww3[2] = 0; ww3[3] = 0; md5_update_vector_64 (&ctx, ww0, ww1, ww2, ww3, 32); md5_update_vector (&ctx, salt3_buf, salt3_len); // md5_final_vector const int pos = ctx.len & 63; append_0x80_4x4 (ctx.w0, ctx.w1, ctx.w2, ctx.w3, pos); if (pos >= 56) { md5_transform_vector (ctx.w0, ctx.w1, ctx.w2, ctx.w3, ctx.h); ctx.w0[0] = 0; ctx.w0[1] = 0; ctx.w0[2] = 0; ctx.w0[3] = 0; ctx.w1[0] = 0; ctx.w1[1] = 0; ctx.w1[2] = 0; ctx.w1[3] = 0; ctx.w2[0] = 0; ctx.w2[1] = 0; ctx.w2[2] = 0; ctx.w2[3] = 0; ctx.w3[0] = 0; ctx.w3[1] = 0; ctx.w3[2] = 0; ctx.w3[3] = 0; } ctx.w3[2] = ctx.len * 8; ctx.w3[3] = 0; a = ctx.h[0]; b = ctx.h[1]; c = ctx.h[2]; d = ctx.h[3]; MD5_STEP (MD5_Fo, a, b, c, d, ctx.w0[0], MD5C00, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w0[1], MD5C01, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w0[2], MD5C02, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w0[3], MD5C03, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, ctx.w1[0], MD5C04, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w1[1], MD5C05, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w1[2], MD5C06, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w1[3], MD5C07, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, ctx.w2[0], MD5C08, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w2[1], MD5C09, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w2[2], MD5C0a, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w2[3], MD5C0b, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, ctx.w3[0], MD5C0c, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w3[1], MD5C0d, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w3[2], MD5C0e, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w3[3], MD5C0f, MD5S03); MD5_STEP (MD5_Go, a, b, c, d, ctx.w0[1], MD5C10, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w1[2], MD5C11, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w2[3], MD5C12, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w0[0], MD5C13, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, ctx.w1[1], MD5C14, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w2[2], MD5C15, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w3[3], MD5C16, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w1[0], MD5C17, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, ctx.w2[1], MD5C18, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w3[2], MD5C19, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w0[3], MD5C1a, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w2[0], MD5C1b, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, ctx.w3[1], MD5C1c, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w0[2], MD5C1d, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w1[3], MD5C1e, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w3[0], MD5C1f, MD5S13); MD5_STEP (MD5_H1, a, b, c, d, ctx.w1[1], MD5C20, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w2[0], MD5C21, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w2[3], MD5C22, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w3[2], MD5C23, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, ctx.w0[1], MD5C24, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w1[0], MD5C25, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w1[3], MD5C26, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w2[2], MD5C27, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, ctx.w3[1], MD5C28, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w0[0], MD5C29, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w0[3], MD5C2a, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w1[2], MD5C2b, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, ctx.w2[1], MD5C2c, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w3[0], MD5C2d, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w3[3], MD5C2e, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w0[2], MD5C2f, MD5S23); MD5_STEP (MD5_I , a, b, c, d, ctx.w0[0], MD5C30, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w1[3], MD5C31, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w3[2], MD5C32, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w1[1], MD5C33, MD5S33); MD5_STEP (MD5_I , a, b, c, d, ctx.w3[0], MD5C34, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w0[3], MD5C35, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w2[2], MD5C36, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w0[1], MD5C37, MD5S33); MD5_STEP (MD5_I , a, b, c, d, ctx.w2[0], MD5C38, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w3[3], MD5C39, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w1[2], MD5C3a, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w3[1], MD5C3b, MD5S33); MD5_STEP (MD5_I , a, b, c, d, ctx.w1[0], MD5C3c, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w2[3], MD5C3d, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w0[2], MD5C3e, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w2[1], MD5C3f, MD5S33); a += ctx.h[0] - make_u32x (MD5M_A); b += ctx.h[1] - make_u32x (MD5M_B); c += ctx.h[2] - make_u32x (MD5M_C); d += ctx.h[3] - make_u32x (MD5M_D); COMPARE_M_SIMD (a, d, c, b); } } DECLSPEC void m32300s (PRIVATE_AS u32 *w0, PRIVATE_AS u32 *w1, PRIVATE_AS u32 *w2, PRIVATE_AS u32 *w3, const u32 pw_len, KERN_ATTR_FUNC_VECTOR_ESALT (md5_triple_salt_t), LOCAL_AS u32 *l_bin2asc) { /** * modifiers are taken from args */ /** * salt1 */ const u32 salt1_len = esalt_bufs[DIGESTS_OFFSET_HOST].salt1_len; u32x salt1_buf[64] = { 0 }; for (u32 i = 0, idx = 0; i < salt1_len; i += 4, idx += 1) { salt1_buf[idx] = esalt_bufs[DIGESTS_OFFSET_HOST].salt1_buf[idx]; } /** * salt2 */ const u32 salt2_len = esalt_bufs[DIGESTS_OFFSET_HOST].salt2_len; u32x salt2_buf[64] = { 0 }; for (u32 i = 0, idx = 0; i < salt2_len; i += 4, idx += 1) { salt2_buf[idx] = esalt_bufs[DIGESTS_OFFSET_HOST].salt2_buf[idx]; } /** * salt3 */ const u32 salt3_len = esalt_bufs[DIGESTS_OFFSET_HOST].salt3_len; u32x salt3_buf[64] = { 0 }; for (u32 i = 0, idx = 0; i < salt3_len; i += 4, idx += 1) { salt3_buf[idx] = esalt_bufs[DIGESTS_OFFSET_HOST].salt3_buf[idx]; } /** * digest */ const u32 search[4] = { digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R0], digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R1], digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R2], digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R3] }; /** * loop */ u32 w0l = w0[0]; for (u32 il_pos = 0; il_pos < IL_CNT; il_pos += VECT_SIZE) { const u32x w0r = words_buf_r[il_pos / VECT_SIZE]; const u32x w0lr = w0l | w0r; u32x w0_t[4]; u32x w1_t[4]; u32x w2_t[4]; u32x w3_t[4]; w0_t[0] = w0lr; w0_t[1] = w0[1]; w0_t[2] = w0[2]; w0_t[3] = w0[3]; w1_t[0] = w1[0]; w1_t[1] = w1[1]; w1_t[2] = w1[2]; w1_t[3] = w1[3]; w2_t[0] = w2[0]; w2_t[1] = w2[1]; w2_t[2] = w2[2]; w2_t[3] = w2[3]; w3_t[0] = w3[0]; w3_t[1] = w3[1]; w3_t[2] = w3[2]; w3_t[3] = w3[3]; /** * md5 */ u32x a = MD5M_A; u32x b = MD5M_B; u32x c = MD5M_C; u32x d = MD5M_D; MD5_STEP (MD5_Fo, a, b, c, d, w0_t[0], MD5C00, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w0_t[1], MD5C01, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w0_t[2], MD5C02, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w0_t[3], MD5C03, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, w1_t[0], MD5C04, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w1_t[1], MD5C05, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w1_t[2], MD5C06, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w1_t[3], MD5C07, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, w2_t[0], MD5C08, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w2_t[1], MD5C09, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w2_t[2], MD5C0a, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w2_t[3], MD5C0b, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, w3_t[0], MD5C0c, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, w3_t[1], MD5C0d, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, w3_t[2], MD5C0e, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, w3_t[3], MD5C0f, MD5S03); MD5_STEP (MD5_Go, a, b, c, d, w0_t[1], MD5C10, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w1_t[2], MD5C11, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w2_t[3], MD5C12, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w0_t[0], MD5C13, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, w1_t[1], MD5C14, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w2_t[2], MD5C15, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w3_t[3], MD5C16, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w1_t[0], MD5C17, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, w2_t[1], MD5C18, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w3_t[2], MD5C19, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w0_t[3], MD5C1a, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w2_t[0], MD5C1b, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, w3_t[1], MD5C1c, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, w0_t[2], MD5C1d, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, w1_t[3], MD5C1e, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, w3_t[0], MD5C1f, MD5S13); u32x t; MD5_STEP (MD5_H1, a, b, c, d, w1_t[1], MD5C20, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w2_t[0], MD5C21, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w2_t[3], MD5C22, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w3_t[2], MD5C23, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, w0_t[1], MD5C24, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w1_t[0], MD5C25, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w1_t[3], MD5C26, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w2_t[2], MD5C27, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, w3_t[1], MD5C28, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w0_t[0], MD5C29, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w0_t[3], MD5C2a, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w1_t[2], MD5C2b, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, w2_t[1], MD5C2c, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, w3_t[0], MD5C2d, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, w3_t[3], MD5C2e, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, w0_t[2], MD5C2f, MD5S23); MD5_STEP (MD5_I , a, b, c, d, w0_t[0], MD5C30, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w1_t[3], MD5C31, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w3_t[2], MD5C32, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w1_t[1], MD5C33, MD5S33); MD5_STEP (MD5_I , a, b, c, d, w3_t[0], MD5C34, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w0_t[3], MD5C35, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w2_t[2], MD5C36, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w0_t[1], MD5C37, MD5S33); MD5_STEP (MD5_I , a, b, c, d, w2_t[0], MD5C38, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w3_t[3], MD5C39, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w1_t[2], MD5C3a, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w3_t[1], MD5C3b, MD5S33); MD5_STEP (MD5_I , a, b, c, d, w1_t[0], MD5C3c, MD5S30); MD5_STEP (MD5_I , d, a, b, c, w2_t[3], MD5C3d, MD5S31); MD5_STEP (MD5_I , c, d, a, b, w0_t[2], MD5C3e, MD5S32); MD5_STEP (MD5_I , b, c, d, a, w2_t[1], MD5C3f, MD5S33); a += make_u32x (MD5M_A); b += make_u32x (MD5M_B); c += make_u32x (MD5M_C); d += make_u32x (MD5M_D); md5_ctx_vector_t ctx; md5_init_vector (&ctx); ctx.w0[0] = uint_to_hex_lower8 ((a >> 0) & 255) << 0 | uint_to_hex_lower8 ((a >> 8) & 255) << 16; ctx.w0[1] = uint_to_hex_lower8 ((a >> 16) & 255) << 0 | uint_to_hex_lower8 ((a >> 24) & 255) << 16; ctx.w0[2] = uint_to_hex_lower8 ((b >> 0) & 255) << 0 | uint_to_hex_lower8 ((b >> 8) & 255) << 16; ctx.w0[3] = uint_to_hex_lower8 ((b >> 16) & 255) << 0 | uint_to_hex_lower8 ((b >> 24) & 255) << 16; ctx.w1[0] = uint_to_hex_lower8 ((c >> 0) & 255) << 0 | uint_to_hex_lower8 ((c >> 8) & 255) << 16; ctx.w1[1] = uint_to_hex_lower8 ((c >> 16) & 255) << 0 | uint_to_hex_lower8 ((c >> 24) & 255) << 16; ctx.w1[2] = uint_to_hex_lower8 ((d >> 0) & 255) << 0 | uint_to_hex_lower8 ((d >> 8) & 255) << 16; ctx.w1[3] = uint_to_hex_lower8 ((d >> 16) & 255) << 0 | uint_to_hex_lower8 ((d >> 24) & 255) << 16; ctx.len = 32; md5_update_vector (&ctx, salt1_buf, salt1_len); md5_final_vector (&ctx); a = ctx.h[0]; b = ctx.h[1]; c = ctx.h[2]; d = ctx.h[3]; md5_init_vector (&ctx); md5_update_vector (&ctx, salt2_buf, salt2_len); u32x ww0[4]; u32x ww1[4]; u32x ww2[4]; u32x ww3[4]; ww0[0] = uint_to_hex_lower8 ((a >> 0) & 255) << 0 | uint_to_hex_lower8 ((a >> 8) & 255) << 16; ww0[1] = uint_to_hex_lower8 ((a >> 16) & 255) << 0 | uint_to_hex_lower8 ((a >> 24) & 255) << 16; ww0[2] = uint_to_hex_lower8 ((b >> 0) & 255) << 0 | uint_to_hex_lower8 ((b >> 8) & 255) << 16; ww0[3] = uint_to_hex_lower8 ((b >> 16) & 255) << 0 | uint_to_hex_lower8 ((b >> 24) & 255) << 16; ww1[0] = uint_to_hex_lower8 ((c >> 0) & 255) << 0 | uint_to_hex_lower8 ((c >> 8) & 255) << 16; ww1[1] = uint_to_hex_lower8 ((c >> 16) & 255) << 0 | uint_to_hex_lower8 ((c >> 24) & 255) << 16; ww1[2] = uint_to_hex_lower8 ((d >> 0) & 255) << 0 | uint_to_hex_lower8 ((d >> 8) & 255) << 16; ww1[3] = uint_to_hex_lower8 ((d >> 16) & 255) << 0 | uint_to_hex_lower8 ((d >> 24) & 255) << 16; ww2[0] = 0; ww2[1] = 0; ww2[2] = 0; ww2[3] = 0; ww3[0] = 0; ww3[1] = 0; ww3[2] = 0; ww3[3] = 0; md5_update_vector_64 (&ctx, ww0, ww1, ww2, ww3, 32); md5_update_vector (&ctx, salt3_buf, salt3_len); // md5_final_vector const int pos = ctx.len & 63; append_0x80_4x4 (ctx.w0, ctx.w1, ctx.w2, ctx.w3, pos); if (pos >= 56) { md5_transform_vector (ctx.w0, ctx.w1, ctx.w2, ctx.w3, ctx.h); ctx.w0[0] = 0; ctx.w0[1] = 0; ctx.w0[2] = 0; ctx.w0[3] = 0; ctx.w1[0] = 0; ctx.w1[1] = 0; ctx.w1[2] = 0; ctx.w1[3] = 0; ctx.w2[0] = 0; ctx.w2[1] = 0; ctx.w2[2] = 0; ctx.w2[3] = 0; ctx.w3[0] = 0; ctx.w3[1] = 0; ctx.w3[2] = 0; ctx.w3[3] = 0; } ctx.w3[2] = ctx.len * 8; ctx.w3[3] = 0; a = ctx.h[0]; b = ctx.h[1]; c = ctx.h[2]; d = ctx.h[3]; MD5_STEP (MD5_Fo, a, b, c, d, ctx.w0[0], MD5C00, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w0[1], MD5C01, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w0[2], MD5C02, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w0[3], MD5C03, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, ctx.w1[0], MD5C04, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w1[1], MD5C05, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w1[2], MD5C06, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w1[3], MD5C07, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, ctx.w2[0], MD5C08, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w2[1], MD5C09, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w2[2], MD5C0a, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w2[3], MD5C0b, MD5S03); MD5_STEP (MD5_Fo, a, b, c, d, ctx.w3[0], MD5C0c, MD5S00); MD5_STEP (MD5_Fo, d, a, b, c, ctx.w3[1], MD5C0d, MD5S01); MD5_STEP (MD5_Fo, c, d, a, b, ctx.w3[2], MD5C0e, MD5S02); MD5_STEP (MD5_Fo, b, c, d, a, ctx.w3[3], MD5C0f, MD5S03); MD5_STEP (MD5_Go, a, b, c, d, ctx.w0[1], MD5C10, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w1[2], MD5C11, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w2[3], MD5C12, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w0[0], MD5C13, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, ctx.w1[1], MD5C14, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w2[2], MD5C15, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w3[3], MD5C16, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w1[0], MD5C17, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, ctx.w2[1], MD5C18, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w3[2], MD5C19, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w0[3], MD5C1a, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w2[0], MD5C1b, MD5S13); MD5_STEP (MD5_Go, a, b, c, d, ctx.w3[1], MD5C1c, MD5S10); MD5_STEP (MD5_Go, d, a, b, c, ctx.w0[2], MD5C1d, MD5S11); MD5_STEP (MD5_Go, c, d, a, b, ctx.w1[3], MD5C1e, MD5S12); MD5_STEP (MD5_Go, b, c, d, a, ctx.w3[0], MD5C1f, MD5S13); MD5_STEP (MD5_H1, a, b, c, d, ctx.w1[1], MD5C20, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w2[0], MD5C21, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w2[3], MD5C22, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w3[2], MD5C23, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, ctx.w0[1], MD5C24, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w1[0], MD5C25, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w1[3], MD5C26, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w2[2], MD5C27, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, ctx.w3[1], MD5C28, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w0[0], MD5C29, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w0[3], MD5C2a, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w1[2], MD5C2b, MD5S23); MD5_STEP (MD5_H1, a, b, c, d, ctx.w2[1], MD5C2c, MD5S20); MD5_STEP (MD5_H2, d, a, b, c, ctx.w3[0], MD5C2d, MD5S21); MD5_STEP (MD5_H1, c, d, a, b, ctx.w3[3], MD5C2e, MD5S22); MD5_STEP (MD5_H2, b, c, d, a, ctx.w0[2], MD5C2f, MD5S23); MD5_STEP (MD5_I , a, b, c, d, ctx.w0[0], MD5C30, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w1[3], MD5C31, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w3[2], MD5C32, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w1[1], MD5C33, MD5S33); MD5_STEP (MD5_I , a, b, c, d, ctx.w3[0], MD5C34, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w0[3], MD5C35, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w2[2], MD5C36, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w0[1], MD5C37, MD5S33); MD5_STEP (MD5_I , a, b, c, d, ctx.w2[0], MD5C38, MD5S30); MD5_STEP (MD5_I , d, a, b, c, ctx.w3[3], MD5C39, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w1[2], MD5C3a, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w3[1], MD5C3b, MD5S33); MD5_STEP (MD5_I , a, b, c, d, ctx.w1[0], MD5C3c, MD5S30); if (MATCHES_NONE_VS ((a + ctx.h[0] - make_u32x (MD5M_A)), search[0])) continue; MD5_STEP (MD5_I , d, a, b, c, ctx.w2[3], MD5C3d, MD5S31); MD5_STEP (MD5_I , c, d, a, b, ctx.w0[2], MD5C3e, MD5S32); MD5_STEP (MD5_I , b, c, d, a, ctx.w2[1], MD5C3f, MD5S33); a += ctx.h[0] - make_u32x (MD5M_A); b += ctx.h[1] - make_u32x (MD5M_B); c += ctx.h[2] - make_u32x (MD5M_C); d += ctx.h[3] - make_u32x (MD5M_D); COMPARE_S_SIMD (a, d, c, b); } } KERNEL_FQ void m32300_m04 (KERN_ATTR_VECTOR_ESALT (md5_triple_salt_t)) { /** * base */ const u64 lid = get_local_id (0); const u64 gid = get_global_id (0); const u64 lsz = get_local_size (0); /** * bin2asc table */ LOCAL_VK u32 l_bin2asc[256]; for (u32 i = lid; i < 256; i += lsz) { const u32 i0 = (i >> 0) & 15; const u32 i1 = (i >> 4) & 15; l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 8 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 0; } SYNC_THREADS (); if (gid >= GID_CNT) return; /** * modifier */ u32 w0[4]; w0[0] = pws[gid].i[ 0]; w0[1] = pws[gid].i[ 1]; w0[2] = pws[gid].i[ 2]; w0[3] = pws[gid].i[ 3]; u32 w1[4]; w1[0] = 0; w1[1] = 0; w1[2] = 0; w1[3] = 0; u32 w2[4]; w2[0] = 0; w2[1] = 0; w2[2] = 0; w2[3] = 0; u32 w3[4]; w3[0] = 0; w3[1] = 0; w3[2] = pws[gid].i[14]; w3[3] = 0; const u32 pw_len = pws[gid].pw_len & 63; /** * main */ m32300m (w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_extra0_buf, d_extra1_buf, d_extra2_buf, d_extra3_buf, kernel_param, gid, lid, lsz, l_bin2asc); } KERNEL_FQ void m32300_m08 (KERN_ATTR_VECTOR_ESALT (md5_triple_salt_t)) { /** * base */ const u64 lid = get_local_id (0); const u64 gid = get_global_id (0); const u64 lsz = get_local_size (0); /** * modifier */ u32 w0[4]; w0[0] = pws[gid].i[ 0]; w0[1] = pws[gid].i[ 1]; w0[2] = pws[gid].i[ 2]; w0[3] = pws[gid].i[ 3]; u32 w1[4]; w1[0] = pws[gid].i[ 4]; w1[1] = pws[gid].i[ 5]; w1[2] = pws[gid].i[ 6]; w1[3] = pws[gid].i[ 7]; u32 w2[4]; w2[0] = 0; w2[1] = 0; w2[2] = 0; w2[3] = 0; u32 w3[4]; w3[0] = 0; w3[1] = 0; w3[2] = pws[gid].i[14]; w3[3] = 0; const u32 pw_len = pws[gid].pw_len & 63; /** * bin2asc table */ LOCAL_VK u32 l_bin2asc[256]; for (u32 i = lid; i < 256; i += lsz) { const u32 i0 = (i >> 0) & 15; const u32 i1 = (i >> 4) & 15; l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 8 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 0; } SYNC_THREADS (); if (gid >= GID_CNT) return; /** * main */ m32300m (w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_extra0_buf, d_extra1_buf, d_extra2_buf, d_extra3_buf, kernel_param, gid, lid, lsz, l_bin2asc); } KERNEL_FQ void m32300_m16 (KERN_ATTR_VECTOR_ESALT (md5_triple_salt_t)) { /** * base */ const u64 lid = get_local_id (0); const u64 gid = get_global_id (0); const u64 lsz = get_local_size (0); /** * modifier */ u32 w0[4]; w0[0] = pws[gid].i[ 0]; w0[1] = pws[gid].i[ 1]; w0[2] = pws[gid].i[ 2]; w0[3] = pws[gid].i[ 3]; u32 w1[4]; w1[0] = pws[gid].i[ 4]; w1[1] = pws[gid].i[ 5]; w1[2] = pws[gid].i[ 6]; w1[3] = pws[gid].i[ 7]; u32 w2[4]; w2[0] = pws[gid].i[ 8]; w2[1] = pws[gid].i[ 9]; w2[2] = pws[gid].i[10]; w2[3] = pws[gid].i[11]; u32 w3[4]; w3[0] = pws[gid].i[12]; w3[1] = pws[gid].i[13]; w3[2] = pws[gid].i[14]; w3[3] = pws[gid].i[15]; const u32 pw_len = pws[gid].pw_len & 63; /** * bin2asc table */ LOCAL_VK u32 l_bin2asc[256]; for (u32 i = lid; i < 256; i += lsz) { const u32 i0 = (i >> 0) & 15; const u32 i1 = (i >> 4) & 15; l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 8 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 0; } SYNC_THREADS (); if (gid >= GID_CNT) return; /** * main */ m32300m (w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_extra0_buf, d_extra1_buf, d_extra2_buf, d_extra3_buf, kernel_param, gid, lid, lsz, l_bin2asc); } KERNEL_FQ void m32300_s04 (KERN_ATTR_VECTOR_ESALT (md5_triple_salt_t)) { /** * base */ const u64 lid = get_local_id (0); const u64 gid = get_global_id (0); const u64 lsz = get_local_size (0); /** * modifier */ u32 w0[4]; w0[0] = pws[gid].i[ 0]; w0[1] = pws[gid].i[ 1]; w0[2] = pws[gid].i[ 2]; w0[3] = pws[gid].i[ 3]; u32 w1[4]; w1[0] = 0; w1[1] = 0; w1[2] = 0; w1[3] = 0; u32 w2[4]; w2[0] = 0; w2[1] = 0; w2[2] = 0; w2[3] = 0; u32 w3[4]; w3[0] = 0; w3[1] = 0; w3[2] = pws[gid].i[14]; w3[3] = 0; const u32 pw_len = pws[gid].pw_len & 63; /** * bin2asc table */ LOCAL_VK u32 l_bin2asc[256]; for (u32 i = lid; i < 256; i += lsz) { const u32 i0 = (i >> 0) & 15; const u32 i1 = (i >> 4) & 15; l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 8 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 0; } SYNC_THREADS (); if (gid >= GID_CNT) return; /** * main */ m32300s (w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_extra0_buf, d_extra1_buf, d_extra2_buf, d_extra3_buf, kernel_param, gid, lid, lsz, l_bin2asc); } KERNEL_FQ void m32300_s08 (KERN_ATTR_VECTOR_ESALT (md5_triple_salt_t)) { /** * base */ const u64 lid = get_local_id (0); const u64 gid = get_global_id (0); const u64 lsz = get_local_size (0); /** * modifier */ u32 w0[4]; w0[0] = pws[gid].i[ 0]; w0[1] = pws[gid].i[ 1]; w0[2] = pws[gid].i[ 2]; w0[3] = pws[gid].i[ 3]; u32 w1[4]; w1[0] = pws[gid].i[ 4]; w1[1] = pws[gid].i[ 5]; w1[2] = pws[gid].i[ 6]; w1[3] = pws[gid].i[ 7]; u32 w2[4]; w2[0] = 0; w2[1] = 0; w2[2] = 0; w2[3] = 0; u32 w3[4]; w3[0] = 0; w3[1] = 0; w3[2] = pws[gid].i[14]; w3[3] = 0; const u32 pw_len = pws[gid].pw_len & 63; /** * bin2asc table */ LOCAL_VK u32 l_bin2asc[256]; for (u32 i = lid; i < 256; i += lsz) { const u32 i0 = (i >> 0) & 15; const u32 i1 = (i >> 4) & 15; l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 8 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 0; } SYNC_THREADS (); if (gid >= GID_CNT) return; /** * main */ m32300s (w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_extra0_buf, d_extra1_buf, d_extra2_buf, d_extra3_buf, kernel_param, gid, lid, lsz, l_bin2asc); } KERNEL_FQ void m32300_s16 (KERN_ATTR_VECTOR_ESALT (md5_triple_salt_t)) { /** * base */ const u64 lid = get_local_id (0); const u64 gid = get_global_id (0); const u64 lsz = get_local_size (0); /** * bin2asc table */ LOCAL_VK u32 l_bin2asc[256]; for (u32 i = lid; i < 256; i += lsz) { const u32 i0 = (i >> 0) & 15; const u32 i1 = (i >> 4) & 15; l_bin2asc[i] = ((i0 < 10) ? '0' + i0 : 'a' - 10 + i0) << 8 | ((i1 < 10) ? '0' + i1 : 'a' - 10 + i1) << 0; } SYNC_THREADS (); if (gid >= GID_CNT) return; /** * modifier */ u32 w0[4]; w0[0] = pws[gid].i[ 0]; w0[1] = pws[gid].i[ 1]; w0[2] = pws[gid].i[ 2]; w0[3] = pws[gid].i[ 3]; u32 w1[4]; w1[0] = pws[gid].i[ 4]; w1[1] = pws[gid].i[ 5]; w1[2] = pws[gid].i[ 6]; w1[3] = pws[gid].i[ 7]; u32 w2[4]; w2[0] = pws[gid].i[ 8]; w2[1] = pws[gid].i[ 9]; w2[2] = pws[gid].i[10]; w2[3] = pws[gid].i[11]; u32 w3[4]; w3[0] = pws[gid].i[12]; w3[1] = pws[gid].i[13]; w3[2] = pws[gid].i[14]; w3[3] = pws[gid].i[15]; const u32 pw_len = pws[gid].pw_len & 63; /** * main */ m32300s (w0, w1, w2, w3, pw_len, pws, rules_buf, combs_buf, words_buf_r, tmps, hooks, bitmaps_buf_s1_a, bitmaps_buf_s1_b, bitmaps_buf_s1_c, bitmaps_buf_s1_d, bitmaps_buf_s2_a, bitmaps_buf_s2_b, bitmaps_buf_s2_c, bitmaps_buf_s2_d, plains_buf, digests_buf, hashes_shown, salt_bufs, esalt_bufs, d_return_buf, d_extra0_buf, d_extra1_buf, d_extra2_buf, d_extra3_buf, kernel_param, gid, lid, lsz, l_bin2asc); }