2020-02-01 08:00:48 +00:00
|
|
|
/**
|
|
|
|
* Author......: See docs/credits.txt
|
|
|
|
* License.....: MIT
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifdef KERNEL_STATIC
|
|
|
|
#include "inc_vendor.h"
|
|
|
|
#include "inc_types.h"
|
|
|
|
#include "inc_platform.cl"
|
|
|
|
#include "inc_common.cl"
|
|
|
|
#endif
|
|
|
|
|
2020-03-04 12:30:09 +00:00
|
|
|
DECLSPEC void gpu_decompress_entry (GLOBAL_AS pw_idx_t *pws_idx, GLOBAL_AS u32 *pws_comp, pw_t *buf, const u64 gid)
|
2020-02-01 08:00:48 +00:00
|
|
|
{
|
|
|
|
const u32 off = pws_idx[gid].off;
|
|
|
|
const u32 cnt = pws_idx[gid].cnt;
|
|
|
|
const u32 len = pws_idx[gid].len;
|
|
|
|
|
2020-03-04 12:30:09 +00:00
|
|
|
pw_t pw;
|
|
|
|
|
|
|
|
pw.i[ 0] = 0;
|
|
|
|
pw.i[ 1] = 0;
|
|
|
|
pw.i[ 2] = 0;
|
|
|
|
pw.i[ 3] = 0;
|
|
|
|
pw.i[ 4] = 0;
|
|
|
|
pw.i[ 5] = 0;
|
|
|
|
pw.i[ 6] = 0;
|
|
|
|
pw.i[ 7] = 0;
|
|
|
|
pw.i[ 8] = 0;
|
|
|
|
pw.i[ 9] = 0;
|
|
|
|
pw.i[10] = 0;
|
|
|
|
pw.i[11] = 0;
|
|
|
|
pw.i[12] = 0;
|
|
|
|
pw.i[13] = 0;
|
|
|
|
pw.i[14] = 0;
|
|
|
|
pw.i[15] = 0;
|
|
|
|
pw.i[16] = 0;
|
|
|
|
pw.i[17] = 0;
|
|
|
|
pw.i[18] = 0;
|
|
|
|
pw.i[19] = 0;
|
|
|
|
pw.i[20] = 0;
|
|
|
|
pw.i[21] = 0;
|
|
|
|
pw.i[22] = 0;
|
|
|
|
pw.i[23] = 0;
|
|
|
|
pw.i[24] = 0;
|
|
|
|
pw.i[25] = 0;
|
|
|
|
pw.i[26] = 0;
|
|
|
|
pw.i[27] = 0;
|
|
|
|
pw.i[28] = 0;
|
|
|
|
pw.i[29] = 0;
|
|
|
|
pw.i[30] = 0;
|
|
|
|
pw.i[31] = 0;
|
|
|
|
pw.i[32] = 0;
|
|
|
|
pw.i[33] = 0;
|
|
|
|
pw.i[34] = 0;
|
|
|
|
pw.i[35] = 0;
|
|
|
|
pw.i[36] = 0;
|
|
|
|
pw.i[37] = 0;
|
|
|
|
pw.i[38] = 0;
|
|
|
|
pw.i[39] = 0;
|
|
|
|
pw.i[40] = 0;
|
|
|
|
pw.i[41] = 0;
|
|
|
|
pw.i[42] = 0;
|
|
|
|
pw.i[43] = 0;
|
|
|
|
pw.i[44] = 0;
|
|
|
|
pw.i[45] = 0;
|
|
|
|
pw.i[46] = 0;
|
|
|
|
pw.i[47] = 0;
|
|
|
|
pw.i[48] = 0;
|
|
|
|
pw.i[49] = 0;
|
|
|
|
pw.i[50] = 0;
|
|
|
|
pw.i[51] = 0;
|
|
|
|
pw.i[52] = 0;
|
|
|
|
pw.i[53] = 0;
|
|
|
|
pw.i[54] = 0;
|
|
|
|
pw.i[55] = 0;
|
|
|
|
pw.i[56] = 0;
|
|
|
|
pw.i[57] = 0;
|
|
|
|
pw.i[58] = 0;
|
|
|
|
pw.i[59] = 0;
|
|
|
|
pw.i[60] = 0;
|
|
|
|
pw.i[61] = 0;
|
|
|
|
pw.i[62] = 0;
|
|
|
|
pw.i[63] = 0;
|
|
|
|
|
|
|
|
pw.pw_len = len;
|
2020-02-01 08:00:48 +00:00
|
|
|
|
|
|
|
for (u32 i = 0, j = off; i < cnt; i++, j++)
|
|
|
|
{
|
2020-03-04 12:30:09 +00:00
|
|
|
pw.i[i] = pws_comp[j];
|
2020-02-01 08:00:48 +00:00
|
|
|
}
|
|
|
|
|
2020-03-04 12:30:09 +00:00
|
|
|
*buf = pw;
|
2020-02-01 08:00:48 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
KERNEL_FQ void gpu_decompress (GLOBAL_AS pw_idx_t *pws_idx, GLOBAL_AS u32 *pws_comp, GLOBAL_AS pw_t *pws_buf, const u64 gid_max)
|
|
|
|
{
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
|
|
|
|
if (gid >= gid_max) return;
|
|
|
|
|
|
|
|
pw_t pw;
|
|
|
|
|
|
|
|
gpu_decompress_entry (pws_idx, pws_comp, &pw, gid);
|
|
|
|
|
|
|
|
pws_buf[gid] = pw;
|
|
|
|
}
|
|
|
|
|
2021-07-28 16:49:02 +00:00
|
|
|
KERNEL_FQ void gpu_memset (GLOBAL_AS uint4 *buf, const u32 value, const u64 gid_max)
|
|
|
|
{
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
|
|
|
|
if (gid >= gid_max) return;
|
|
|
|
|
|
|
|
uint4 r;
|
|
|
|
|
|
|
|
#if defined IS_NATIVE
|
|
|
|
r = value;
|
|
|
|
#elif defined IS_OPENCL
|
|
|
|
r = (uint4) (value);
|
|
|
|
#elif defined IS_CUDA
|
|
|
|
r.x = value;
|
|
|
|
r.y = value;
|
|
|
|
r.z = value;
|
|
|
|
r.w = value;
|
|
|
|
#elif defined IS_HIP
|
|
|
|
r.x = value;
|
|
|
|
r.y = value;
|
|
|
|
r.z = value;
|
|
|
|
r.w = value;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
buf[gid] = r;
|
|
|
|
}
|
|
|
|
|
2021-07-17 16:00:10 +00:00
|
|
|
KERNEL_FQ void gpu_bzero(GLOBAL_AS uint4* buf, const u64 gid_max)
|
|
|
|
{
|
|
|
|
const u64 gid = get_global_id(0);
|
|
|
|
|
|
|
|
if (gid >= gid_max) return;
|
|
|
|
|
|
|
|
uint4 r;
|
|
|
|
|
|
|
|
#if defined IS_NATIVE
|
|
|
|
r = 0;
|
|
|
|
#elif defined IS_OPENCL
|
|
|
|
r = (uint4) (0);
|
|
|
|
#elif defined IS_CUDA
|
|
|
|
r.x = 0;
|
|
|
|
r.y = 0;
|
|
|
|
r.z = 0;
|
|
|
|
r.w = 0;
|
|
|
|
#elif defined IS_HIP
|
|
|
|
r.x = 0;
|
|
|
|
r.y = 0;
|
|
|
|
r.z = 0;
|
|
|
|
r.w = 0;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
buf[gid] = r;
|
|
|
|
}
|
|
|
|
|
2020-02-01 08:00:48 +00:00
|
|
|
KERNEL_FQ void gpu_atinit (GLOBAL_AS pw_t *buf, const u64 gid_max)
|
|
|
|
{
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
|
|
|
|
if (gid >= gid_max) return;
|
|
|
|
|
|
|
|
const u32 l32 = l32_from_64_S (gid);
|
|
|
|
const u32 h32 = h32_from_64_S (gid);
|
|
|
|
|
|
|
|
pw_t pw;
|
|
|
|
|
|
|
|
pw.i[ 0] = 0x5c5c5c5c ^ l32;
|
|
|
|
pw.i[ 1] = 0x36363636 ^ h32;
|
|
|
|
pw.i[ 2] = 0;
|
|
|
|
pw.i[ 3] = 0;
|
|
|
|
pw.i[ 4] = 0;
|
|
|
|
pw.i[ 5] = 0;
|
|
|
|
pw.i[ 6] = 0;
|
|
|
|
pw.i[ 7] = 0;
|
|
|
|
pw.i[ 8] = 0;
|
|
|
|
pw.i[ 9] = 0;
|
|
|
|
pw.i[10] = 0;
|
|
|
|
pw.i[11] = 0;
|
|
|
|
pw.i[12] = 0;
|
|
|
|
pw.i[13] = 0;
|
|
|
|
pw.i[14] = 0;
|
|
|
|
pw.i[15] = 0;
|
|
|
|
pw.i[16] = 0;
|
|
|
|
pw.i[17] = 0;
|
|
|
|
pw.i[18] = 0;
|
|
|
|
pw.i[19] = 0;
|
|
|
|
pw.i[20] = 0;
|
|
|
|
pw.i[21] = 0;
|
|
|
|
pw.i[22] = 0;
|
|
|
|
pw.i[23] = 0;
|
|
|
|
pw.i[24] = 0;
|
|
|
|
pw.i[25] = 0;
|
|
|
|
pw.i[26] = 0;
|
|
|
|
pw.i[27] = 0;
|
|
|
|
pw.i[28] = 0;
|
|
|
|
pw.i[29] = 0;
|
|
|
|
pw.i[30] = 0;
|
|
|
|
pw.i[31] = 0;
|
|
|
|
pw.i[32] = 0;
|
|
|
|
pw.i[33] = 0;
|
|
|
|
pw.i[34] = 0;
|
|
|
|
pw.i[35] = 0;
|
|
|
|
pw.i[36] = 0;
|
|
|
|
pw.i[37] = 0;
|
|
|
|
pw.i[38] = 0;
|
|
|
|
pw.i[39] = 0;
|
|
|
|
pw.i[40] = 0;
|
|
|
|
pw.i[41] = 0;
|
|
|
|
pw.i[42] = 0;
|
|
|
|
pw.i[43] = 0;
|
|
|
|
pw.i[44] = 0;
|
|
|
|
pw.i[45] = 0;
|
|
|
|
pw.i[46] = 0;
|
|
|
|
pw.i[47] = 0;
|
|
|
|
pw.i[48] = 0;
|
|
|
|
pw.i[49] = 0;
|
|
|
|
pw.i[50] = 0;
|
|
|
|
pw.i[51] = 0;
|
|
|
|
pw.i[52] = 0;
|
|
|
|
pw.i[53] = 0;
|
|
|
|
pw.i[54] = 0;
|
|
|
|
pw.i[55] = 0;
|
|
|
|
pw.i[56] = 0;
|
|
|
|
pw.i[57] = 0;
|
|
|
|
pw.i[58] = 0;
|
|
|
|
pw.i[59] = 0;
|
|
|
|
pw.i[60] = 0;
|
|
|
|
pw.i[61] = 0;
|
|
|
|
pw.i[62] = 0;
|
|
|
|
pw.i[63] = 0; // yep that's faster
|
|
|
|
|
|
|
|
//pw.pw_len = 1 + (l32 & 15);
|
|
|
|
pw.pw_len = 7; // some algorithms are very sensible on this (example: 12500)
|
|
|
|
|
|
|
|
buf[gid] = pw;
|
|
|
|
}
|
2021-05-20 12:34:24 +00:00
|
|
|
|
|
|
|
KERNEL_FQ void gpu_utf8_to_utf16 (GLOBAL_AS pw_t *pws_buf, const u64 gid_max)
|
|
|
|
{
|
|
|
|
const u64 gid = get_global_id (0);
|
|
|
|
|
|
|
|
if (gid >= gid_max) return;
|
|
|
|
|
|
|
|
pw_t pw_in = pws_buf[gid];
|
|
|
|
|
|
|
|
pw_t pw_out;
|
|
|
|
|
|
|
|
for (int i = 0; i < 64; i++) pw_out.i[i] = 0;
|
|
|
|
|
|
|
|
hc_enc_t hc_enc;
|
|
|
|
|
|
|
|
hc_enc_init (&hc_enc);
|
|
|
|
|
2021-05-21 20:04:24 +00:00
|
|
|
pw_out.pw_len = hc_enc_next (&hc_enc, pw_in.i, pw_in.pw_len, 256, pw_out.i, 256);
|
2021-05-20 12:34:24 +00:00
|
|
|
|
|
|
|
pws_buf[gid] = pw_out;
|
|
|
|
}
|