/** * Author......: See docs/credits.txt * License.....: MIT */ //#define NEW_SIMD_CODE #define XSTR(x) #x #define STR(x) XSTR(x) #ifdef KERNEL_STATIC #include STR(INCLUDE_PATH/inc_vendor.h) #include STR(INCLUDE_PATH/inc_types.h) #include STR(INCLUDE_PATH/inc_platform.cl) #include STR(INCLUDE_PATH/inc_common.cl) #include STR(INCLUDE_PATH/inc_scalar.cl) #include STR(INCLUDE_PATH/inc_hash_sha512.cl) #include STR(INCLUDE_PATH/inc_cipher_twofish.cl) #endif typedef struct cryptoapi { u32 kern_type; u32 key_size; } cryptoapi_t; KERNEL_FQ void m14533_mxx (KERN_ATTR_VECTOR_ESALT (cryptoapi_t)) { /** * modifier */ const u64 gid = get_global_id (0); if (gid >= GID_CNT) return; /** * base */ u32 twofish_key_len = esalt_bufs[DIGESTS_OFFSET_HOST].key_size; const u32 pw_len = pws[gid].pw_len; u32x w[64] = { 0 }; for (u32 i = 0, idx = 0; i < pw_len; i += 4, idx += 1) { w[idx] = pws[gid].i[idx]; } /** * loop */ u32x w0l = w[0]; for (u32 il_pos = 0; il_pos < IL_CNT; il_pos += VECT_SIZE) { const u32x w0r = words_buf_r[il_pos / VECT_SIZE]; const u32x w0 = w0l | w0r; w[0] = w0; sha512_ctx_t ctx0; sha512_init (&ctx0); sha512_update_swap (&ctx0, w, pw_len); sha512_final (&ctx0); const u32 k0 = h32_from_64_S (ctx0.h[0]); const u32 k1 = l32_from_64_S (ctx0.h[0]); const u32 k2 = h32_from_64_S (ctx0.h[1]); const u32 k3 = l32_from_64_S (ctx0.h[1]); u32 k4 = 0, k5 = 0, k6 = 0, k7 = 0; if (twofish_key_len > 128) { k4 = h32_from_64_S (ctx0.h[2]); k5 = l32_from_64_S (ctx0.h[2]); if (twofish_key_len > 192) { k6 = h32_from_64_S (ctx0.h[3]); k7 = l32_from_64_S (ctx0.h[3]); } } // key u32 ukey[8] = { 0 }; ukey[0] = hc_swap32_S (k0); ukey[1] = hc_swap32_S (k1); ukey[2] = hc_swap32_S (k2); ukey[3] = hc_swap32_S (k3); if (twofish_key_len > 128) { ukey[4] = hc_swap32_S (k4); ukey[5] = hc_swap32_S (k5); if (twofish_key_len > 192) { ukey[6] = hc_swap32_S (k6); ukey[7] = hc_swap32_S (k7); } } // IV const u32 iv[4] = { salt_bufs[SALT_POS_HOST].salt_buf[0], salt_bufs[SALT_POS_HOST].salt_buf[1], salt_bufs[SALT_POS_HOST].salt_buf[2], salt_bufs[SALT_POS_HOST].salt_buf[3] }; // CT u32 CT[4] = { 0 }; // twofish u32 sk1[4] = { 0 }; u32 lk1[40] = { 0 }; if (twofish_key_len == 128) { twofish128_set_key (sk1, lk1, ukey); twofish128_encrypt (sk1, lk1, iv, CT); } else if (twofish_key_len == 192) { twofish192_set_key (sk1, lk1, ukey); twofish192_encrypt (sk1, lk1, iv, CT); } else { twofish256_set_key (sk1, lk1, ukey); twofish256_encrypt (sk1, lk1, iv, CT); } const u32 r0 = hc_swap32_S (CT[0]); const u32 r1 = hc_swap32_S (CT[1]); const u32 r2 = hc_swap32_S (CT[2]); const u32 r3 = hc_swap32_S (CT[3]); COMPARE_M_SCALAR (r0, r1, r2, r3); } } KERNEL_FQ void m14533_sxx (KERN_ATTR_VECTOR_ESALT (cryptoapi_t)) { /** * modifier */ const u64 gid = get_global_id (0); if (gid >= GID_CNT) return; /** * digest */ const u32 search[4] = { digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R0], digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R1], digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R2], digests_buf[DIGESTS_OFFSET_HOST].digest_buf[DGST_R3] }; /** * base */ u32 twofish_key_len = esalt_bufs[DIGESTS_OFFSET_HOST].key_size; const u32 pw_len = pws[gid].pw_len; u32x w[64] = { 0 }; for (u32 i = 0, idx = 0; i < pw_len; i += 4, idx += 1) { w[idx] = pws[gid].i[idx]; } /** * loop */ u32x w0l = w[0]; for (u32 il_pos = 0; il_pos < IL_CNT; il_pos += VECT_SIZE) { const u32x w0r = words_buf_r[il_pos / VECT_SIZE]; const u32x w0 = w0l | w0r; w[0] = w0; sha512_ctx_t ctx0; sha512_init (&ctx0); sha512_update_swap (&ctx0, w, pw_len); sha512_final (&ctx0); const u32 k0 = h32_from_64_S (ctx0.h[0]); const u32 k1 = l32_from_64_S (ctx0.h[0]); const u32 k2 = h32_from_64_S (ctx0.h[1]); const u32 k3 = l32_from_64_S (ctx0.h[1]); u32 k4 = 0, k5 = 0, k6 = 0, k7 = 0; if (twofish_key_len > 128) { k4 = h32_from_64_S (ctx0.h[2]); k5 = l32_from_64_S (ctx0.h[2]); if (twofish_key_len > 192) { k6 = h32_from_64_S (ctx0.h[3]); k7 = l32_from_64_S (ctx0.h[3]); } } // key u32 ukey[8] = { 0 }; ukey[0] = hc_swap32_S (k0); ukey[1] = hc_swap32_S (k1); ukey[2] = hc_swap32_S (k2); ukey[3] = hc_swap32_S (k3); if (twofish_key_len > 128) { ukey[4] = hc_swap32_S (k4); ukey[5] = hc_swap32_S (k5); if (twofish_key_len > 192) { ukey[6] = hc_swap32_S (k6); ukey[7] = hc_swap32_S (k7); } } // IV const u32 iv[4] = { salt_bufs[SALT_POS_HOST].salt_buf[0], salt_bufs[SALT_POS_HOST].salt_buf[1], salt_bufs[SALT_POS_HOST].salt_buf[2], salt_bufs[SALT_POS_HOST].salt_buf[3] }; // CT u32 CT[4] = { 0 }; // twofish u32 sk1[4] = { 0 }; u32 lk1[40] = { 0 }; if (twofish_key_len == 128) { twofish128_set_key (sk1, lk1, ukey); twofish128_encrypt (sk1, lk1, iv, CT); } else if (twofish_key_len == 192) { twofish192_set_key (sk1, lk1, ukey); twofish192_encrypt (sk1, lk1, iv, CT); } else { twofish256_set_key (sk1, lk1, ukey); twofish256_encrypt (sk1, lk1, iv, CT); } const u32 r0 = hc_swap32_S (CT[0]); const u32 r1 = hc_swap32_S (CT[1]); const u32 r2 = hc_swap32_S (CT[2]); const u32 r3 = hc_swap32_S (CT[3]); COMPARE_S_SCALAR (r0, r1, r2, r3); } }