|
|
|
@ -1282,17 +1282,11 @@ DECLSPEC void append_0x80_1x16 (u32x w[16], const u32 offset)
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_le (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
w0[0] = swap32 (w0[0]);
|
|
|
|
@ -1991,17 +1985,11 @@ DECLSPEC void switch_buffer_by_offset_le (u32x w0[4], u32x w1[4], u32x w2[4], u3
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_carry_le (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], u32x c0[4], u32x c1[4], u32x c2[4], u32x c3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if defined IS_AMD || defined IS_GENERIC
|
|
|
|
|
w0[0] = swap32 (w0[0]);
|
|
|
|
@ -3315,13 +3303,7 @@ DECLSPEC void switch_buffer_by_offset_carry_le (u32x w0[4], u32x w1[4], u32x w2[
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_be (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
|
|
|
|
@ -3988,13 +3970,7 @@ DECLSPEC void switch_buffer_by_offset_be (u32x w0[4], u32x w1[4], u32x w2[4], u3
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_carry_be (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], u32x c0[4], u32x c1[4], u32x c2[4], u32x c3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -4930,17 +4906,11 @@ DECLSPEC void switch_buffer_by_offset_carry_be (u32x w0[4], u32x w1[4], u32x w2[
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_8x4_le (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], u32x w4[4], u32x w5[4], u32x w6[4], u32x w7[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
w0[0] = swap32 (w0[0]);
|
|
|
|
@ -6742,13 +6712,7 @@ DECLSPEC void switch_buffer_by_offset_8x4_le (u32x w0[4], u32x w1[4], u32x w2[4]
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_8x4_be (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], u32x w4[4], u32x w5[4], u32x w6[4], u32x w7[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -9076,13 +9040,7 @@ DECLSPEC void switch_buffer_by_offset_8x4_be (u32x w0[4], u32x w1[4], u32x w2[4]
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_8x4_carry_be (u32x w0[4], u32x w1[4], u32x w2[4], u32x w3[4], u32x w4[4], u32x w5[4], u32x w6[4], u32x w7[4], u32x c0[4], u32x c1[4], u32x c2[4], u32x c3[4], u32x c4[4], u32x c5[4], u32x c6[4], u32x c7[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -12466,17 +12424,11 @@ DECLSPEC void switch_buffer_by_offset_8x4_carry_be (u32x w0[4], u32x w1[4], u32x
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_1x64_le (u32x w[64], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
|
|
|
|
@ -21212,13 +21164,7 @@ DECLSPEC void switch_buffer_by_offset_1x64_le (u32x w[64], const u32 offset)
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_1x64_be (u32x w[64], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -32504,17 +32450,11 @@ DECLSPEC void undo_utf16le_S (const u32 in1[4], const u32 in2[4], u32 out[4])
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_le_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
w0[0] = swap32_S (w0[0]);
|
|
|
|
@ -33212,17 +33152,11 @@ DECLSPEC void switch_buffer_by_offset_le_S (u32 w0[4], u32 w1[4], u32 w2[4], u32
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_carry_le_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], u32 c0[4], u32 c1[4], u32 c2[4], u32 c3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if defined IS_AMD || defined IS_GENERIC
|
|
|
|
|
w0[0] = swap32_S (w0[0]);
|
|
|
|
@ -34536,13 +34470,7 @@ DECLSPEC void switch_buffer_by_offset_carry_le_S (u32 w0[4], u32 w1[4], u32 w2[4
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_be_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -35206,13 +35134,7 @@ DECLSPEC void switch_buffer_by_offset_be_S (u32 w0[4], u32 w1[4], u32 w2[4], u32
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_carry_be_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], u32 c0[4], u32 c1[4], u32 c2[4], u32 c3[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -36148,17 +36070,11 @@ DECLSPEC void switch_buffer_by_offset_carry_be_S (u32 w0[4], u32 w1[4], u32 w2[4
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_8x4_le_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], u32 w4[4], u32 w5[4], u32 w6[4], u32 w7[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
w0[0] = swap32_S (w0[0]);
|
|
|
|
@ -37960,13 +37876,7 @@ DECLSPEC void switch_buffer_by_offset_8x4_le_S (u32 w0[4], u32 w1[4], u32 w2[4],
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_8x4_be_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], u32 w4[4], u32 w5[4], u32 w6[4], u32 w7[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -40294,13 +40204,7 @@ DECLSPEC void switch_buffer_by_offset_8x4_be_S (u32 w0[4], u32 w1[4], u32 w2[4],
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_8x4_carry_be_S (u32 w0[4], u32 w1[4], u32 w2[4], u32 w3[4], u32 w4[4], u32 w5[4], u32 w6[4], u32 w7[4], u32 c0[4], u32 c1[4], u32 c2[4], u32 c3[4], u32 c4[4], u32 c5[4], u32 c6[4], u32 c7[4], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
@ -43684,17 +43588,11 @@ DECLSPEC void switch_buffer_by_offset_8x4_carry_be_S (u32 w0[4], u32 w1[4], u32
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_1x64_le_S (u32 w[64], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
const int offset_mod_4 = offset & 3;
|
|
|
|
|
|
|
|
|
|
const int offset_minus_4 = 4 - offset_mod_4;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
|
|
|
|
@ -52430,13 +52328,7 @@ DECLSPEC void switch_buffer_by_offset_1x64_le_S (u32 w[64], const u32 offset)
|
|
|
|
|
|
|
|
|
|
DECLSPEC void switch_buffer_by_offset_1x64_be_S (u32 w[64], const u32 offset)
|
|
|
|
|
{
|
|
|
|
|
if (offset == 0) return;
|
|
|
|
|
|
|
|
|
|
#ifdef IS_AMD
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#else
|
|
|
|
|
const int offset_switch = offset / 4;
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
|
#if (defined IS_AMD && AMD_GCN < 3) || defined IS_GENERIC
|
|
|
|
|
switch (offset_switch)
|
|
|
|
|