|
|
|
@ -2214,7 +2214,7 @@ void m01500m (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global co
|
|
|
|
|
|
|
|
|
|
if (tmpResult == 0xffffffff) continue;
|
|
|
|
|
|
|
|
|
|
const u32 slice = 31 - clz (~tmpResult);
|
|
|
|
|
const u32 slice = ffz (tmpResult);
|
|
|
|
|
|
|
|
|
|
const u32 r0 = search[0];
|
|
|
|
|
const u32 r1 = search[1];
|
|
|
|
@ -2234,8 +2234,8 @@ void m01500m (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global co
|
|
|
|
|
#endif
|
|
|
|
|
for (int i = 0; i < 32; i++)
|
|
|
|
|
{
|
|
|
|
|
out0[i] = out[ 0 + 31 - i];
|
|
|
|
|
out1[i] = out[32 + 31 - i];
|
|
|
|
|
out0[i] = out[ 0 + i];
|
|
|
|
|
out1[i] = out[32 + i];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
transpose32c (out0);
|
|
|
|
@ -2246,8 +2246,8 @@ void m01500m (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global co
|
|
|
|
|
#endif
|
|
|
|
|
for (int slice = 0; slice < 32; slice++)
|
|
|
|
|
{
|
|
|
|
|
const u32 r0 = out0[31 - slice];
|
|
|
|
|
const u32 r1 = out1[31 - slice];
|
|
|
|
|
const u32 r0 = out0[slice];
|
|
|
|
|
const u32 r1 = out1[slice];
|
|
|
|
|
const u32 r2 = 0;
|
|
|
|
|
const u32 r3 = 0;
|
|
|
|
|
|
|
|
|
@ -2640,7 +2640,7 @@ void m01500s (__global pw_t *pws, __global kernel_rule_t *rules_buf, __global co
|
|
|
|
|
|
|
|
|
|
if (tmpResult == 0xffffffff) return;
|
|
|
|
|
|
|
|
|
|
const u32 slice = 31 - clz (~tmpResult);
|
|
|
|
|
const u32 slice = ffz (tmpResult);
|
|
|
|
|
|
|
|
|
|
#include COMPARE_S
|
|
|
|
|
}
|
|
|
|
|