mirror of
https://github.com/hashcat/hashcat.git
synced 2025-07-03 21:32:35 +00:00

Updated kernel declarations from "KERNEL_FQ void HC_ATTR_SEQ" to "KERNEL_FQ KERNEL_FA void". Please update your custom plugin kernels accordingly. Added spilling size as a factor in calculating usable memory per device. This is based on undocumented variables and may not be 100% accurate, but it works well in practice. Added a compiler hint to scrypt-based kernels indicating the guaranteed maximum thread count per kernel invocation. Removed redundant kernel code 29800, as it is identical to 27700, and updated the plugin.
1763 lines
46 KiB
Common Lisp
1763 lines
46 KiB
Common Lisp
/**
|
|
* Author......: See docs/credits.txt
|
|
* License.....: MIT
|
|
*/
|
|
|
|
#ifdef KERNEL_STATIC
|
|
#include M2S(INCLUDE_PATH/inc_vendor.h)
|
|
#include M2S(INCLUDE_PATH/inc_types.h)
|
|
#include M2S(INCLUDE_PATH/inc_platform.cl)
|
|
#include M2S(INCLUDE_PATH/inc_common.cl)
|
|
#include M2S(INCLUDE_PATH/inc_hash_sha256.cl)
|
|
#endif
|
|
|
|
#define COMPARE_S M2S(INCLUDE_PATH/inc_comp_single.cl)
|
|
#define COMPARE_M M2S(INCLUDE_PATH/inc_comp_multi.cl)
|
|
|
|
#define MIN(a,b) (((a) < (b)) ? (a) : (b))
|
|
|
|
typedef struct sha256crypt_tmp
|
|
{
|
|
// pure version
|
|
|
|
u32 alt_result[8];
|
|
u32 p_bytes[64];
|
|
u32 s_bytes[64];
|
|
|
|
} sha256crypt_tmp_t;
|
|
|
|
DECLSPEC void init_ctx (PRIVATE_AS u32 *digest)
|
|
{
|
|
digest[0] = SHA256M_A;
|
|
digest[1] = SHA256M_B;
|
|
digest[2] = SHA256M_C;
|
|
digest[3] = SHA256M_D;
|
|
digest[4] = SHA256M_E;
|
|
digest[5] = SHA256M_F;
|
|
digest[6] = SHA256M_G;
|
|
digest[7] = SHA256M_H;
|
|
}
|
|
|
|
DECLSPEC u32 memcat16 (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be (in3, 0, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (0, in3, selector);
|
|
#endif
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
break;
|
|
case 4: block[ 4] |= tmp0;
|
|
block[ 5] = tmp1;
|
|
block[ 6] = tmp2;
|
|
block[ 7] = tmp3;
|
|
block[ 8] = tmp4;
|
|
break;
|
|
case 5: block[ 5] |= tmp0;
|
|
block[ 6] = tmp1;
|
|
block[ 7] = tmp2;
|
|
block[ 8] = tmp3;
|
|
block[ 9] = tmp4;
|
|
break;
|
|
case 6: block[ 6] |= tmp0;
|
|
block[ 7] = tmp1;
|
|
block[ 8] = tmp2;
|
|
block[ 9] = tmp3;
|
|
block[10] = tmp4;
|
|
break;
|
|
case 7: block[ 7] |= tmp0;
|
|
block[ 8] = tmp1;
|
|
block[ 9] = tmp2;
|
|
block[10] = tmp3;
|
|
block[11] = tmp4;
|
|
break;
|
|
case 8: block[ 8] |= tmp0;
|
|
block[ 9] = tmp1;
|
|
block[10] = tmp2;
|
|
block[11] = tmp3;
|
|
block[12] = tmp4;
|
|
break;
|
|
case 9: block[ 9] |= tmp0;
|
|
block[10] = tmp1;
|
|
block[11] = tmp2;
|
|
block[12] = tmp3;
|
|
block[13] = tmp4;
|
|
break;
|
|
case 10: block[10] |= tmp0;
|
|
block[11] = tmp1;
|
|
block[12] = tmp2;
|
|
block[13] = tmp3;
|
|
block[14] = tmp4;
|
|
break;
|
|
case 11: block[11] |= tmp0;
|
|
block[12] = tmp1;
|
|
block[13] = tmp2;
|
|
block[14] = tmp3;
|
|
block[15] = tmp4;
|
|
break;
|
|
case 12: block[12] |= tmp0;
|
|
block[13] = tmp1;
|
|
block[14] = tmp2;
|
|
block[15] = tmp3;
|
|
break;
|
|
case 13: block[13] |= tmp0;
|
|
block[14] = tmp1;
|
|
block[15] = tmp2;
|
|
break;
|
|
case 14: block[14] |= tmp0;
|
|
block[15] = tmp1;
|
|
break;
|
|
case 15: block[15] |= tmp0;
|
|
break;
|
|
}
|
|
|
|
u32 new_len = offset + append_len;
|
|
|
|
return new_len;
|
|
}
|
|
|
|
DECLSPEC u32 memcat16c (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len, PRIVATE_AS u32 *digest)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be (in3, 0, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (0, in3, selector);
|
|
#endif
|
|
|
|
u32 carry[4] = { 0 };
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
break;
|
|
case 4: block[ 4] |= tmp0;
|
|
block[ 5] = tmp1;
|
|
block[ 6] = tmp2;
|
|
block[ 7] = tmp3;
|
|
block[ 8] = tmp4;
|
|
break;
|
|
case 5: block[ 5] |= tmp0;
|
|
block[ 6] = tmp1;
|
|
block[ 7] = tmp2;
|
|
block[ 8] = tmp3;
|
|
block[ 9] = tmp4;
|
|
break;
|
|
case 6: block[ 6] |= tmp0;
|
|
block[ 7] = tmp1;
|
|
block[ 8] = tmp2;
|
|
block[ 9] = tmp3;
|
|
block[10] = tmp4;
|
|
break;
|
|
case 7: block[ 7] |= tmp0;
|
|
block[ 8] = tmp1;
|
|
block[ 9] = tmp2;
|
|
block[10] = tmp3;
|
|
block[11] = tmp4;
|
|
break;
|
|
case 8: block[ 8] |= tmp0;
|
|
block[ 9] = tmp1;
|
|
block[10] = tmp2;
|
|
block[11] = tmp3;
|
|
block[12] = tmp4;
|
|
break;
|
|
case 9: block[ 9] |= tmp0;
|
|
block[10] = tmp1;
|
|
block[11] = tmp2;
|
|
block[12] = tmp3;
|
|
block[13] = tmp4;
|
|
break;
|
|
case 10: block[10] |= tmp0;
|
|
block[11] = tmp1;
|
|
block[12] = tmp2;
|
|
block[13] = tmp3;
|
|
block[14] = tmp4;
|
|
break;
|
|
case 11: block[11] |= tmp0;
|
|
block[12] = tmp1;
|
|
block[13] = tmp2;
|
|
block[14] = tmp3;
|
|
block[15] = tmp4;
|
|
break;
|
|
case 12: block[12] |= tmp0;
|
|
block[13] = tmp1;
|
|
block[14] = tmp2;
|
|
block[15] = tmp3;
|
|
carry[ 0] = tmp4;
|
|
break;
|
|
case 13: block[13] |= tmp0;
|
|
block[14] = tmp1;
|
|
block[15] = tmp2;
|
|
carry[ 0] = tmp3;
|
|
carry[ 1] = tmp4;
|
|
break;
|
|
case 14: block[14] |= tmp0;
|
|
block[15] = tmp1;
|
|
carry[ 0] = tmp2;
|
|
carry[ 1] = tmp3;
|
|
carry[ 2] = tmp4;
|
|
break;
|
|
case 15: block[15] |= tmp0;
|
|
carry[ 0] = tmp1;
|
|
carry[ 1] = tmp2;
|
|
carry[ 2] = tmp3;
|
|
carry[ 3] = tmp4;
|
|
break;
|
|
}
|
|
|
|
u32 new_len = offset + append_len;
|
|
|
|
if (new_len >= 64)
|
|
{
|
|
new_len -= 64;
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, digest);
|
|
|
|
block[ 0] = carry[0];
|
|
block[ 1] = carry[1];
|
|
block[ 2] = carry[2];
|
|
block[ 3] = carry[3];
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
}
|
|
|
|
return new_len;
|
|
}
|
|
|
|
DECLSPEC u32 memcat16s (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
u32 in4 = append[4];
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be (in3, in4, offset);
|
|
const u32 tmp5 = hc_bytealign_be (in4, 0, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (in4, in3, selector);
|
|
const u32 tmp5 = hc_byte_perm_S (0, in4, selector);
|
|
#endif
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
block[ 5] = tmp5;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
block[ 6] = tmp5;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
block[ 7] = tmp5;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
block[ 8] = tmp5;
|
|
break;
|
|
case 4: block[ 4] |= tmp0;
|
|
block[ 5] = tmp1;
|
|
block[ 6] = tmp2;
|
|
block[ 7] = tmp3;
|
|
block[ 8] = tmp4;
|
|
block[ 9] = tmp5;
|
|
break;
|
|
case 5: block[ 5] |= tmp0;
|
|
block[ 6] = tmp1;
|
|
block[ 7] = tmp2;
|
|
block[ 8] = tmp3;
|
|
block[ 9] = tmp4;
|
|
block[10] = tmp5;
|
|
break;
|
|
case 6: block[ 6] |= tmp0;
|
|
block[ 7] = tmp1;
|
|
block[ 8] = tmp2;
|
|
block[ 9] = tmp3;
|
|
block[10] = tmp4;
|
|
block[11] = tmp5;
|
|
break;
|
|
case 7: block[ 7] |= tmp0;
|
|
block[ 8] = tmp1;
|
|
block[ 9] = tmp2;
|
|
block[10] = tmp3;
|
|
block[11] = tmp4;
|
|
block[12] = tmp5;
|
|
break;
|
|
case 8: block[ 8] |= tmp0;
|
|
block[ 9] = tmp1;
|
|
block[10] = tmp2;
|
|
block[11] = tmp3;
|
|
block[12] = tmp4;
|
|
block[13] = tmp5;
|
|
break;
|
|
case 9: block[ 9] |= tmp0;
|
|
block[10] = tmp1;
|
|
block[11] = tmp2;
|
|
block[12] = tmp3;
|
|
block[13] = tmp4;
|
|
block[14] = tmp5;
|
|
break;
|
|
case 10: block[10] |= tmp0;
|
|
block[11] = tmp1;
|
|
block[12] = tmp2;
|
|
block[13] = tmp3;
|
|
block[14] = tmp4;
|
|
block[15] = tmp5;
|
|
break;
|
|
case 11: block[11] |= tmp0;
|
|
block[12] = tmp1;
|
|
block[13] = tmp2;
|
|
block[14] = tmp3;
|
|
block[15] = tmp4;
|
|
break;
|
|
case 12: block[12] |= tmp0;
|
|
block[13] = tmp1;
|
|
block[14] = tmp2;
|
|
block[15] = tmp3;
|
|
break;
|
|
case 13: block[13] |= tmp0;
|
|
block[14] = tmp1;
|
|
block[15] = tmp2;
|
|
break;
|
|
case 14: block[14] |= tmp0;
|
|
block[15] = tmp1;
|
|
break;
|
|
case 15: block[15] |= tmp0;
|
|
break;
|
|
}
|
|
|
|
u32 new_len = offset + append_len;
|
|
|
|
return new_len;
|
|
}
|
|
|
|
DECLSPEC u32 memcat16sc (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len, PRIVATE_AS u32 *digest)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
u32 in4 = append[4];
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be (in3, in4, offset);
|
|
const u32 tmp5 = hc_bytealign_be (in4, 0, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (in4, in3, selector);
|
|
const u32 tmp5 = hc_byte_perm_S (0, in4, selector);
|
|
#endif
|
|
|
|
u32 carry[5] = { 0 };
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
block[ 5] = tmp5;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
block[ 6] = tmp5;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
block[ 7] = tmp5;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
block[ 8] = tmp5;
|
|
break;
|
|
case 4: block[ 4] |= tmp0;
|
|
block[ 5] = tmp1;
|
|
block[ 6] = tmp2;
|
|
block[ 7] = tmp3;
|
|
block[ 8] = tmp4;
|
|
block[ 9] = tmp5;
|
|
break;
|
|
case 5: block[ 5] |= tmp0;
|
|
block[ 6] = tmp1;
|
|
block[ 7] = tmp2;
|
|
block[ 8] = tmp3;
|
|
block[ 9] = tmp4;
|
|
block[10] = tmp5;
|
|
break;
|
|
case 6: block[ 6] |= tmp0;
|
|
block[ 7] = tmp1;
|
|
block[ 8] = tmp2;
|
|
block[ 9] = tmp3;
|
|
block[10] = tmp4;
|
|
block[11] = tmp5;
|
|
break;
|
|
case 7: block[ 7] |= tmp0;
|
|
block[ 8] = tmp1;
|
|
block[ 9] = tmp2;
|
|
block[10] = tmp3;
|
|
block[11] = tmp4;
|
|
block[12] = tmp5;
|
|
break;
|
|
case 8: block[ 8] |= tmp0;
|
|
block[ 9] = tmp1;
|
|
block[10] = tmp2;
|
|
block[11] = tmp3;
|
|
block[12] = tmp4;
|
|
block[13] = tmp5;
|
|
break;
|
|
case 9: block[ 9] |= tmp0;
|
|
block[10] = tmp1;
|
|
block[11] = tmp2;
|
|
block[12] = tmp3;
|
|
block[13] = tmp4;
|
|
block[14] = tmp5;
|
|
break;
|
|
case 10: block[10] |= tmp0;
|
|
block[11] = tmp1;
|
|
block[12] = tmp2;
|
|
block[13] = tmp3;
|
|
block[14] = tmp4;
|
|
block[15] = tmp5;
|
|
break;
|
|
case 11: block[11] |= tmp0;
|
|
block[12] = tmp1;
|
|
block[13] = tmp2;
|
|
block[14] = tmp3;
|
|
block[15] = tmp4;
|
|
carry[ 0] = tmp5;
|
|
break;
|
|
case 12: block[12] |= tmp0;
|
|
block[13] = tmp1;
|
|
block[14] = tmp2;
|
|
block[15] = tmp3;
|
|
carry[ 0] = tmp4;
|
|
carry[ 1] = tmp5;
|
|
break;
|
|
case 13: block[13] |= tmp0;
|
|
block[14] = tmp1;
|
|
block[15] = tmp2;
|
|
carry[ 0] = tmp3;
|
|
carry[ 1] = tmp4;
|
|
carry[ 2] = tmp5;
|
|
break;
|
|
case 14: block[14] |= tmp0;
|
|
block[15] = tmp1;
|
|
carry[ 0] = tmp2;
|
|
carry[ 1] = tmp3;
|
|
carry[ 2] = tmp4;
|
|
carry[ 3] = tmp5;
|
|
break;
|
|
case 15: block[15] |= tmp0;
|
|
carry[ 0] = tmp1;
|
|
carry[ 1] = tmp2;
|
|
carry[ 2] = tmp3;
|
|
carry[ 3] = tmp4;
|
|
carry[ 4] = tmp5;
|
|
break;
|
|
}
|
|
|
|
u32 new_len = offset + append_len;
|
|
|
|
if (new_len >= 64)
|
|
{
|
|
new_len -= 64;
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, digest);
|
|
|
|
block[ 0] = carry[0];
|
|
block[ 1] = carry[1];
|
|
block[ 2] = carry[2];
|
|
block[ 3] = carry[3];
|
|
block[ 4] = carry[4];
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
}
|
|
|
|
return new_len;
|
|
}
|
|
|
|
DECLSPEC void truncate_block_5x4_be_S (PRIVATE_AS u32 *w0, const u32 len)
|
|
{
|
|
switch (len)
|
|
{
|
|
case 0:
|
|
w0[0] = 0;
|
|
w0[1] = 0;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 1:
|
|
w0[0] &= 0xff000000;
|
|
w0[1] = 0;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 2:
|
|
w0[0] &= 0xffff0000;
|
|
w0[1] = 0;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 3:
|
|
w0[0] &= 0xffffff00;
|
|
w0[1] = 0;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 4:
|
|
w0[1] = 0;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 5:
|
|
w0[1] &= 0xff000000;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 6:
|
|
w0[1] &= 0xffff0000;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 7:
|
|
w0[1] &= 0xffffff00;
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 8:
|
|
w0[2] = 0;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 9:
|
|
w0[2] &= 0xff000000;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 10:
|
|
w0[2] &= 0xffff0000;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 11:
|
|
w0[2] &= 0xffffff00;
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 12:
|
|
w0[3] = 0;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 13:
|
|
w0[3] &= 0xff000000;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 14:
|
|
w0[3] &= 0xffff0000;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 15:
|
|
w0[3] &= 0xffffff00;
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 16:
|
|
w0[4] = 0;
|
|
break;
|
|
|
|
case 17:
|
|
w0[4] &= 0xff000000;
|
|
break;
|
|
|
|
case 18:
|
|
w0[4] &= 0xffff0000;
|
|
break;
|
|
|
|
case 19:
|
|
w0[4] &= 0xffffff00;
|
|
break;
|
|
}
|
|
}
|
|
|
|
DECLSPEC u32 memcat20 (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be_S ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be_S (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be_S (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be_S (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be_S (in3, 0, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (0, in3, selector);
|
|
#endif
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
break;
|
|
case 4: block[ 4] |= tmp0;
|
|
block[ 5] = tmp1;
|
|
block[ 6] = tmp2;
|
|
block[ 7] = tmp3;
|
|
block[ 8] = tmp4;
|
|
break;
|
|
case 5: block[ 5] |= tmp0;
|
|
block[ 6] = tmp1;
|
|
block[ 7] = tmp2;
|
|
block[ 8] = tmp3;
|
|
block[ 9] = tmp4;
|
|
break;
|
|
case 6: block[ 6] |= tmp0;
|
|
block[ 7] = tmp1;
|
|
block[ 8] = tmp2;
|
|
block[ 9] = tmp3;
|
|
block[10] = tmp4;
|
|
break;
|
|
case 7: block[ 7] |= tmp0;
|
|
block[ 8] = tmp1;
|
|
block[ 9] = tmp2;
|
|
block[10] = tmp3;
|
|
block[11] = tmp4;
|
|
break;
|
|
case 8: block[ 8] |= tmp0;
|
|
block[ 9] = tmp1;
|
|
block[10] = tmp2;
|
|
block[11] = tmp3;
|
|
block[12] = tmp4;
|
|
break;
|
|
case 9: block[ 9] |= tmp0;
|
|
block[10] = tmp1;
|
|
block[11] = tmp2;
|
|
block[12] = tmp3;
|
|
block[13] = tmp4;
|
|
break;
|
|
case 10: block[10] |= tmp0;
|
|
block[11] = tmp1;
|
|
block[12] = tmp2;
|
|
block[13] = tmp3;
|
|
block[14] = tmp4;
|
|
break;
|
|
case 11: block[11] |= tmp0;
|
|
block[12] = tmp1;
|
|
block[13] = tmp2;
|
|
block[14] = tmp3;
|
|
block[15] = tmp4;
|
|
break;
|
|
case 12: block[12] |= tmp0;
|
|
block[13] = tmp1;
|
|
block[14] = tmp2;
|
|
block[15] = tmp3;
|
|
block[16] = tmp4;
|
|
break;
|
|
case 13: block[13] |= tmp0;
|
|
block[14] = tmp1;
|
|
block[15] = tmp2;
|
|
block[16] = tmp3;
|
|
block[17] = tmp4;
|
|
break;
|
|
case 14: block[14] |= tmp0;
|
|
block[15] = tmp1;
|
|
block[16] = tmp2;
|
|
block[17] = tmp3;
|
|
block[18] = tmp4;
|
|
break;
|
|
case 15: block[15] |= tmp0;
|
|
block[16] = tmp1;
|
|
block[17] = tmp2;
|
|
block[18] = tmp3;
|
|
block[19] = tmp4;
|
|
break;
|
|
case 16: block[16] |= tmp0;
|
|
block[17] = tmp1;
|
|
block[18] = tmp2;
|
|
block[19] = tmp3;
|
|
block[20] = tmp4;
|
|
break;
|
|
case 17: block[17] |= tmp0;
|
|
block[18] = tmp1;
|
|
block[19] = tmp2;
|
|
block[20] = tmp3;
|
|
block[21] = tmp4;
|
|
break;
|
|
case 18: block[18] |= tmp0;
|
|
block[19] = tmp1;
|
|
block[20] = tmp2;
|
|
block[21] = tmp3;
|
|
block[22] = tmp4;
|
|
break;
|
|
case 19: block[19] |= tmp0;
|
|
block[20] = tmp1;
|
|
block[21] = tmp2;
|
|
block[22] = tmp3;
|
|
block[23] = tmp4;
|
|
break;
|
|
case 20: block[20] |= tmp0;
|
|
block[21] = tmp1;
|
|
block[22] = tmp2;
|
|
block[23] = tmp3;
|
|
block[24] = tmp4;
|
|
break;
|
|
}
|
|
|
|
return offset + append_len;
|
|
}
|
|
|
|
DECLSPEC u32 memcat20_x80 (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
u32 in4 = 0x80000000;
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be_S ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be_S (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be_S (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be_S (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be_S (in3, in4, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (in4, in3, selector);
|
|
#endif
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
break;
|
|
case 4: block[ 4] |= tmp0;
|
|
block[ 5] = tmp1;
|
|
block[ 6] = tmp2;
|
|
block[ 7] = tmp3;
|
|
block[ 8] = tmp4;
|
|
break;
|
|
case 5: block[ 5] |= tmp0;
|
|
block[ 6] = tmp1;
|
|
block[ 7] = tmp2;
|
|
block[ 8] = tmp3;
|
|
block[ 9] = tmp4;
|
|
break;
|
|
case 6: block[ 6] |= tmp0;
|
|
block[ 7] = tmp1;
|
|
block[ 8] = tmp2;
|
|
block[ 9] = tmp3;
|
|
block[10] = tmp4;
|
|
break;
|
|
case 7: block[ 7] |= tmp0;
|
|
block[ 8] = tmp1;
|
|
block[ 9] = tmp2;
|
|
block[10] = tmp3;
|
|
block[11] = tmp4;
|
|
break;
|
|
case 8: block[ 8] |= tmp0;
|
|
block[ 9] = tmp1;
|
|
block[10] = tmp2;
|
|
block[11] = tmp3;
|
|
block[12] = tmp4;
|
|
break;
|
|
case 9: block[ 9] |= tmp0;
|
|
block[10] = tmp1;
|
|
block[11] = tmp2;
|
|
block[12] = tmp3;
|
|
block[13] = tmp4;
|
|
break;
|
|
case 10: block[10] |= tmp0;
|
|
block[11] = tmp1;
|
|
block[12] = tmp2;
|
|
block[13] = tmp3;
|
|
block[14] = tmp4;
|
|
break;
|
|
case 11: block[11] |= tmp0;
|
|
block[12] = tmp1;
|
|
block[13] = tmp2;
|
|
block[14] = tmp3;
|
|
block[15] = tmp4;
|
|
break;
|
|
case 12: block[12] |= tmp0;
|
|
block[13] = tmp1;
|
|
block[14] = tmp2;
|
|
block[15] = tmp3;
|
|
block[16] = tmp4;
|
|
break;
|
|
case 13: block[13] |= tmp0;
|
|
block[14] = tmp1;
|
|
block[15] = tmp2;
|
|
block[16] = tmp3;
|
|
block[17] = tmp4;
|
|
break;
|
|
case 14: block[14] |= tmp0;
|
|
block[15] = tmp1;
|
|
block[16] = tmp2;
|
|
block[17] = tmp3;
|
|
block[18] = tmp4;
|
|
break;
|
|
case 15: block[15] |= tmp0;
|
|
block[16] = tmp1;
|
|
block[17] = tmp2;
|
|
block[18] = tmp3;
|
|
block[19] = tmp4;
|
|
break;
|
|
case 16: block[16] |= tmp0;
|
|
block[17] = tmp1;
|
|
block[18] = tmp2;
|
|
block[19] = tmp3;
|
|
block[20] = tmp4;
|
|
break;
|
|
case 17: block[17] |= tmp0;
|
|
block[18] = tmp1;
|
|
block[19] = tmp2;
|
|
block[20] = tmp3;
|
|
block[21] = tmp4;
|
|
break;
|
|
case 18: block[18] |= tmp0;
|
|
block[19] = tmp1;
|
|
block[20] = tmp2;
|
|
block[21] = tmp3;
|
|
block[22] = tmp4;
|
|
break;
|
|
case 19: block[19] |= tmp0;
|
|
block[20] = tmp1;
|
|
block[21] = tmp2;
|
|
block[22] = tmp3;
|
|
block[23] = tmp4;
|
|
break;
|
|
case 20: block[20] |= tmp0;
|
|
block[21] = tmp1;
|
|
block[22] = tmp2;
|
|
block[23] = tmp3;
|
|
block[24] = tmp4;
|
|
break;
|
|
}
|
|
|
|
return offset + append_len;
|
|
}
|
|
|
|
DECLSPEC u32 memcat24 (PRIVATE_AS u32 *block, const u32 offset, PRIVATE_AS const u32 *append, const u32 append_len)
|
|
{
|
|
u32 in0 = append[0];
|
|
u32 in1 = append[1];
|
|
u32 in2 = append[2];
|
|
u32 in3 = append[3];
|
|
u32 in4 = append[4];
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 0) || defined IS_GENERIC
|
|
const u32 tmp0 = hc_bytealign_be_S ( 0, in0, offset);
|
|
const u32 tmp1 = hc_bytealign_be_S (in0, in1, offset);
|
|
const u32 tmp2 = hc_bytealign_be_S (in1, in2, offset);
|
|
const u32 tmp3 = hc_bytealign_be_S (in2, in3, offset);
|
|
const u32 tmp4 = hc_bytealign_be_S (in3, in4, offset);
|
|
const u32 tmp5 = hc_bytealign_be_S (in4, 0, offset);
|
|
#endif
|
|
|
|
#if ((defined IS_AMD || defined IS_HIP) && HAS_VPERM == 1) || defined IS_NV
|
|
|
|
#if defined IS_NV
|
|
const int selector = (0x76543210 >> ((offset & 3) * 4)) & 0xffff;
|
|
#endif
|
|
|
|
#if (defined IS_AMD || defined IS_HIP)
|
|
const int selector = l32_from_64_S (0x0706050403020100UL >> ((offset & 3) * 8));
|
|
#endif
|
|
|
|
const u32 tmp0 = hc_byte_perm_S (in0, 0, selector);
|
|
const u32 tmp1 = hc_byte_perm_S (in1, in0, selector);
|
|
const u32 tmp2 = hc_byte_perm_S (in2, in1, selector);
|
|
const u32 tmp3 = hc_byte_perm_S (in3, in2, selector);
|
|
const u32 tmp4 = hc_byte_perm_S (in4, in3, selector);
|
|
const u32 tmp5 = hc_byte_perm_S (0, in4, selector);
|
|
#endif
|
|
|
|
switch (offset / 4)
|
|
{
|
|
case 0: block[ 0] |= tmp0;
|
|
block[ 1] = tmp1;
|
|
block[ 2] = tmp2;
|
|
block[ 3] = tmp3;
|
|
block[ 4] = tmp4;
|
|
block[ 5] = tmp5;
|
|
break;
|
|
case 1: block[ 1] |= tmp0;
|
|
block[ 2] = tmp1;
|
|
block[ 3] = tmp2;
|
|
block[ 4] = tmp3;
|
|
block[ 5] = tmp4;
|
|
block[ 6] = tmp5;
|
|
break;
|
|
case 2: block[ 2] |= tmp0;
|
|
block[ 3] = tmp1;
|
|
block[ 4] = tmp2;
|
|
block[ 5] = tmp3;
|
|
block[ 6] = tmp4;
|
|
block[ 7] = tmp5;
|
|
break;
|
|
case 3: block[ 3] |= tmp0;
|
|
block[ 4] = tmp1;
|
|
block[ 5] = tmp2;
|
|
block[ 6] = tmp3;
|
|
block[ 7] = tmp4;
|
|
block[ 8] = tmp5;
|
|
break;
|
|
}
|
|
|
|
return offset + append_len;
|
|
}
|
|
|
|
KERNEL_FQ KERNEL_FA void m07400_init (KERN_ATTR_TMPS (sha256crypt_tmp_t))
|
|
{
|
|
/**
|
|
* base
|
|
*/
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
if (gid >= GID_CNT) return;
|
|
|
|
u32 w0[4];
|
|
|
|
w0[0] = hc_swap32_S (pws[gid].i[0]);
|
|
w0[1] = hc_swap32_S (pws[gid].i[1]);
|
|
w0[2] = hc_swap32_S (pws[gid].i[2]);
|
|
w0[3] = hc_swap32_S (pws[gid].i[3]);
|
|
|
|
const u32 pw_len = MIN (pws[gid].pw_len, 15);
|
|
|
|
/**
|
|
* salt
|
|
*/
|
|
|
|
u32 salt_buf[5];
|
|
|
|
salt_buf[0] = hc_swap32_S (salt_bufs[SALT_POS_HOST].salt_buf[0]);
|
|
salt_buf[1] = hc_swap32_S (salt_bufs[SALT_POS_HOST].salt_buf[1]);
|
|
salt_buf[2] = hc_swap32_S (salt_bufs[SALT_POS_HOST].salt_buf[2]);
|
|
salt_buf[3] = hc_swap32_S (salt_bufs[SALT_POS_HOST].salt_buf[3]);
|
|
salt_buf[4] = hc_swap32_S (salt_bufs[SALT_POS_HOST].salt_buf[4]);
|
|
|
|
const u32 salt_len = MIN (salt_bufs[SALT_POS_HOST].salt_len, 20);
|
|
|
|
/**
|
|
* buffers
|
|
*/
|
|
|
|
u32 block_len; // never reaches > 64
|
|
u32 transform_len; // required for w[15] = len * 8
|
|
|
|
u32 block[16];
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
|
|
u32 alt_result[8];
|
|
u32 p_bytes[8];
|
|
u32 s_bytes[8];
|
|
|
|
/* Prepare for the real work. */
|
|
|
|
block_len = 0;
|
|
|
|
/* Add key. */
|
|
|
|
block_len = memcat16 (block, block_len, w0, pw_len);
|
|
|
|
/* Add salt. */
|
|
|
|
block_len = memcat16s (block, block_len, salt_buf, salt_len);
|
|
|
|
/* Add key again. */
|
|
|
|
block_len = memcat16 (block, block_len, w0, pw_len);
|
|
|
|
append_0x80_1x16 (block, block_len ^ 3);
|
|
|
|
block[15] = block_len * 8;
|
|
|
|
init_ctx (alt_result);
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, alt_result);
|
|
|
|
u32 alt_result_tmp[8];
|
|
|
|
alt_result_tmp[0] = alt_result[0];
|
|
alt_result_tmp[1] = alt_result[1];
|
|
alt_result_tmp[2] = alt_result[2];
|
|
alt_result_tmp[3] = alt_result[3];
|
|
alt_result_tmp[4] = 0;
|
|
alt_result_tmp[5] = 0;
|
|
alt_result_tmp[6] = 0;
|
|
alt_result_tmp[7] = 0;
|
|
|
|
truncate_block_4x4_be_S (alt_result_tmp, pw_len);
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
|
|
block_len = 0;
|
|
|
|
/* Add the key string. */
|
|
|
|
block_len = memcat16 (block, block_len, w0, pw_len);
|
|
|
|
/* The last part is the salt string. This must be at most 8
|
|
characters and it ends at the first `$' character (for
|
|
compatibility with existing implementations). */
|
|
|
|
block_len = memcat16s (block, block_len, salt_buf, salt_len);
|
|
|
|
/* Now get result of this (32 bytes) and add it to the other
|
|
context. */
|
|
|
|
block_len = memcat16 (block, block_len, alt_result_tmp, pw_len);
|
|
|
|
transform_len = block_len;
|
|
|
|
/* Take the binary representation of the length of the key and for every
|
|
1 add the alternate sum, for every 0 the key. */
|
|
|
|
alt_result_tmp[0] = alt_result[0];
|
|
alt_result_tmp[1] = alt_result[1];
|
|
alt_result_tmp[2] = alt_result[2];
|
|
alt_result_tmp[3] = alt_result[3];
|
|
alt_result_tmp[4] = alt_result[4];
|
|
alt_result_tmp[5] = alt_result[5];
|
|
alt_result_tmp[6] = alt_result[6];
|
|
alt_result_tmp[7] = alt_result[7];
|
|
|
|
init_ctx (alt_result);
|
|
|
|
for (u32 j = pw_len; j; j >>= 1)
|
|
{
|
|
if (j & 1)
|
|
{
|
|
block_len = memcat16c (block, block_len, &alt_result_tmp[0], 16, alt_result);
|
|
block_len = memcat16c (block, block_len, &alt_result_tmp[4], 16, alt_result);
|
|
|
|
transform_len += 32;
|
|
}
|
|
else
|
|
{
|
|
block_len = memcat16c (block, block_len, w0, pw_len, alt_result);
|
|
|
|
transform_len += pw_len;
|
|
}
|
|
}
|
|
|
|
append_0x80_1x16 (block, block_len ^ 3);
|
|
|
|
if (block_len >= 56)
|
|
{
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, alt_result);
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
}
|
|
|
|
block[15] = transform_len * 8;
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, alt_result);
|
|
|
|
tmps[gid].alt_result[0] = alt_result[0];
|
|
tmps[gid].alt_result[1] = alt_result[1];
|
|
tmps[gid].alt_result[2] = alt_result[2];
|
|
tmps[gid].alt_result[3] = alt_result[3];
|
|
tmps[gid].alt_result[4] = alt_result[4];
|
|
tmps[gid].alt_result[5] = alt_result[5];
|
|
tmps[gid].alt_result[6] = alt_result[6];
|
|
tmps[gid].alt_result[7] = alt_result[7];
|
|
|
|
/* Start computation of P byte sequence. */
|
|
|
|
transform_len = 0;
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
|
|
block_len = 0;
|
|
|
|
/* For every character in the password add the entire password. */
|
|
|
|
init_ctx (p_bytes);
|
|
|
|
for (u32 j = 0; j < pw_len; j++)
|
|
{
|
|
block_len = memcat16c (block, block_len, w0, pw_len, p_bytes);
|
|
|
|
transform_len += pw_len;
|
|
}
|
|
|
|
/* Finish the digest. */
|
|
|
|
append_0x80_1x16 (block, block_len ^ 3);
|
|
|
|
if (block_len >= 56)
|
|
{
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, p_bytes);
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
}
|
|
|
|
block[15] = transform_len * 8;
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, p_bytes);
|
|
|
|
truncate_block_4x4_be_S (p_bytes, pw_len);
|
|
|
|
tmps[gid].p_bytes[0] = p_bytes[0];
|
|
tmps[gid].p_bytes[1] = p_bytes[1];
|
|
tmps[gid].p_bytes[2] = p_bytes[2];
|
|
tmps[gid].p_bytes[3] = p_bytes[3];
|
|
|
|
/* Start computation of S byte sequence. */
|
|
|
|
transform_len = 0;
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
|
|
block_len = 0;
|
|
|
|
/* For every character in the password add the entire password. */
|
|
|
|
init_ctx (s_bytes);
|
|
|
|
for (u32 j = 0; j < 16 + (alt_result[0] >> 24); j++)
|
|
{
|
|
block_len = memcat16sc (block, block_len, salt_buf, salt_len, s_bytes);
|
|
|
|
transform_len += salt_len;
|
|
}
|
|
|
|
/* Finish the digest. */
|
|
|
|
append_0x80_1x16 (block, block_len ^ 3);
|
|
|
|
if (block_len >= 56)
|
|
{
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, s_bytes);
|
|
|
|
block[ 0] = 0;
|
|
block[ 1] = 0;
|
|
block[ 2] = 0;
|
|
block[ 3] = 0;
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
}
|
|
|
|
block[15] = transform_len * 8;
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, s_bytes);
|
|
|
|
truncate_block_5x4_be_S (s_bytes, salt_len);
|
|
|
|
tmps[gid].s_bytes[0] = s_bytes[0];
|
|
tmps[gid].s_bytes[1] = s_bytes[1];
|
|
tmps[gid].s_bytes[2] = s_bytes[2];
|
|
tmps[gid].s_bytes[3] = s_bytes[3];
|
|
tmps[gid].s_bytes[4] = s_bytes[4];
|
|
}
|
|
|
|
KERNEL_FQ KERNEL_FA void m07400_loop (KERN_ATTR_TMPS (sha256crypt_tmp_t))
|
|
{
|
|
/**
|
|
* base
|
|
*/
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
if (gid >= GID_CNT) return;
|
|
|
|
const u32 pw_len = MIN (pws[gid].pw_len, 15);
|
|
|
|
/**
|
|
* base
|
|
*/
|
|
|
|
u32 p_bytes[4];
|
|
|
|
p_bytes[0] = tmps[gid].p_bytes[0];
|
|
p_bytes[1] = tmps[gid].p_bytes[1];
|
|
p_bytes[2] = tmps[gid].p_bytes[2];
|
|
p_bytes[3] = tmps[gid].p_bytes[3];
|
|
|
|
u32 s_bytes[5];
|
|
|
|
s_bytes[0] = tmps[gid].s_bytes[0];
|
|
s_bytes[1] = tmps[gid].s_bytes[1];
|
|
s_bytes[2] = tmps[gid].s_bytes[2];
|
|
s_bytes[3] = tmps[gid].s_bytes[3];
|
|
s_bytes[4] = tmps[gid].s_bytes[4]; // 4 extra bytes for MySQL 7.5+ hashes
|
|
|
|
u32 alt_result[8];
|
|
|
|
alt_result[0] = tmps[gid].alt_result[0];
|
|
alt_result[1] = tmps[gid].alt_result[1];
|
|
alt_result[2] = tmps[gid].alt_result[2];
|
|
alt_result[3] = tmps[gid].alt_result[3];
|
|
alt_result[4] = tmps[gid].alt_result[4];
|
|
alt_result[5] = tmps[gid].alt_result[5];
|
|
alt_result[6] = tmps[gid].alt_result[6];
|
|
alt_result[7] = tmps[gid].alt_result[7];
|
|
|
|
const u32 salt_len = MIN (salt_bufs[SALT_POS_HOST].salt_len, 20);
|
|
|
|
// just an optimization
|
|
|
|
u32 p_bytes_x80[4];
|
|
|
|
p_bytes_x80[0] = p_bytes[0];
|
|
p_bytes_x80[1] = p_bytes[1];
|
|
p_bytes_x80[2] = p_bytes[2];
|
|
p_bytes_x80[3] = p_bytes[3];
|
|
|
|
append_0x80_1x4_S (p_bytes_x80, pw_len ^ 3);
|
|
|
|
/* Repeatedly run the collected hash value through SHA256 to burn
|
|
CPU cycles. */
|
|
|
|
for (u32 i = 0, j = LOOP_POS; i < LOOP_CNT; i++, j++)
|
|
{
|
|
u32 tmp[8];
|
|
|
|
init_ctx (tmp);
|
|
|
|
u32 block[25];
|
|
|
|
u32 block_len = 0;
|
|
|
|
const u32 j1 = (j & 1) ? 1 : 0;
|
|
const u32 j3 = (j % 3) ? 1 : 0;
|
|
const u32 j7 = (j % 7) ? 1 : 0;
|
|
|
|
if (j1)
|
|
{
|
|
block[ 0] = p_bytes[0];
|
|
block[ 1] = p_bytes[1];
|
|
block[ 2] = p_bytes[2];
|
|
block[ 3] = p_bytes[3];
|
|
block[ 4] = 0;
|
|
block[ 5] = 0;
|
|
block[ 6] = 0;
|
|
block[ 7] = 0;
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
block[16] = 0;
|
|
block[17] = 0;
|
|
block[18] = 0;
|
|
block[19] = 0;
|
|
block[20] = 0;
|
|
block[21] = 0;
|
|
block[22] = 0;
|
|
block[23] = 0;
|
|
block[24] = 0;
|
|
|
|
block_len = pw_len;
|
|
|
|
if (j3)
|
|
{
|
|
block_len = memcat24 (block, block_len, s_bytes, salt_len);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
block[ 0] = alt_result[0];
|
|
block[ 1] = alt_result[1];
|
|
block[ 2] = alt_result[2];
|
|
block[ 3] = alt_result[3];
|
|
block[ 4] = alt_result[4];
|
|
block[ 5] = alt_result[5];
|
|
block[ 6] = alt_result[6];
|
|
block[ 7] = alt_result[7];
|
|
block[ 8] = 0;
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
block[16] = 0;
|
|
block[17] = 0;
|
|
block[18] = 0;
|
|
block[19] = 0;
|
|
block[20] = 0;
|
|
block[21] = 0;
|
|
block[22] = 0;
|
|
block[23] = 0;
|
|
block[24] = 0;
|
|
|
|
block_len = 32;
|
|
|
|
if (j3)
|
|
{
|
|
block[ 8] = s_bytes[0];
|
|
block[ 9] = s_bytes[1];
|
|
block[10] = s_bytes[2];
|
|
block[11] = s_bytes[3];
|
|
block[12] = s_bytes[4];
|
|
|
|
block_len += salt_len;
|
|
}
|
|
}
|
|
|
|
if (j7)
|
|
{
|
|
block_len = memcat20 (block, block_len, p_bytes, pw_len);
|
|
}
|
|
|
|
if (j1)
|
|
{
|
|
block_len = memcat20 (block, block_len, &alt_result[0], 16);
|
|
block_len = memcat20_x80 (block, block_len, &alt_result[4], 16);
|
|
}
|
|
else
|
|
{
|
|
block_len = memcat20 (block, block_len, p_bytes_x80, pw_len);
|
|
}
|
|
|
|
if (block_len >= 56)
|
|
{
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, tmp);
|
|
|
|
block[ 0] = block[16];
|
|
block[ 1] = block[17];
|
|
block[ 2] = block[18];
|
|
block[ 3] = block[19];
|
|
block[ 4] = block[20];
|
|
block[ 5] = block[21];
|
|
block[ 6] = block[22];
|
|
block[ 7] = block[23];
|
|
block[ 8] = block[24];
|
|
block[ 9] = 0;
|
|
block[10] = 0;
|
|
block[11] = 0;
|
|
block[12] = 0;
|
|
block[13] = 0;
|
|
block[14] = 0;
|
|
block[15] = 0;
|
|
}
|
|
|
|
block[14] = 0;
|
|
block[15] = block_len * 8;
|
|
|
|
sha256_transform (block + 0, block + 4, block + 8, block + 12, tmp);
|
|
|
|
alt_result[0] = tmp[0];
|
|
alt_result[1] = tmp[1];
|
|
alt_result[2] = tmp[2];
|
|
alt_result[3] = tmp[3];
|
|
alt_result[4] = tmp[4];
|
|
alt_result[5] = tmp[5];
|
|
alt_result[6] = tmp[6];
|
|
alt_result[7] = tmp[7];
|
|
}
|
|
|
|
tmps[gid].alt_result[0] = alt_result[0];
|
|
tmps[gid].alt_result[1] = alt_result[1];
|
|
tmps[gid].alt_result[2] = alt_result[2];
|
|
tmps[gid].alt_result[3] = alt_result[3];
|
|
tmps[gid].alt_result[4] = alt_result[4];
|
|
tmps[gid].alt_result[5] = alt_result[5];
|
|
tmps[gid].alt_result[6] = alt_result[6];
|
|
tmps[gid].alt_result[7] = alt_result[7];
|
|
}
|
|
|
|
KERNEL_FQ KERNEL_FA void m07400_comp (KERN_ATTR_TMPS (sha256crypt_tmp_t))
|
|
{
|
|
/**
|
|
* base
|
|
*/
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
if (gid >= GID_CNT) return;
|
|
|
|
const u64 lid = get_local_id (0);
|
|
|
|
const u32 r0 = hc_swap32_S (tmps[gid].alt_result[0]);
|
|
const u32 r1 = hc_swap32_S (tmps[gid].alt_result[1]);
|
|
const u32 r2 = hc_swap32_S (tmps[gid].alt_result[2]);
|
|
const u32 r3 = hc_swap32_S (tmps[gid].alt_result[3]);
|
|
|
|
#define il_pos 0
|
|
|
|
#ifdef KERNEL_STATIC
|
|
#include COMPARE_M
|
|
#endif
|
|
}
|