Remove some #pragma unroll directives to reduce register pressure

pull/330/head
jsteube 8 years ago
parent 303cfcae15
commit bd1f555c9c

@ -116,12 +116,7 @@ void sha512_transform (const u64x w0[4], const u64x w1[4], const u64x w2[4], con
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64x w0[4], const u64x w1[4], const u64x w2[4], con
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64x w0[4], const u64x w1[4], const u64x w2[4], con
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -116,12 +116,7 @@ void sha512_transform (const u64x w0[4], const u64x w1[4], const u64x w2[4], con
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64x w0[4], const u64x w1[4], const u64x w2[4], con
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64x w0[4], const u64x w1[4], const u64x w2[4], con
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -23,7 +23,8 @@
// Buggy drivers...
#ifdef IS_AMD
#define STATE_DECL volatile
//#define STATE_DECL volatile
#define STATE_DECL
#else
#define STATE_DECL
#endif
@ -133,7 +134,7 @@ void sha512_transform (const u64 w[16], u64 digest[8])
ROUND_STEP (0);
#pragma unroll
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -115,12 +115,7 @@ void sha512_transform (const u64 w[16], u64 dgst[8])
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -115,12 +115,7 @@ void sha512_transform (const u64 w[16], u64 dgst[8])
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -115,12 +115,7 @@ void sha512_transform (const u64 w[16], u64 dgst[8])
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64 w0[4], const u64 w1[4], const u64 w2[4], const
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64 w[16], u64 dgst[8])
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

@ -321,12 +321,7 @@ void sha512_transform (const u64 w[16], u64 dgst[8])
ROUND512_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND512_EXPAND (); ROUND512_STEP (i);

@ -242,7 +242,7 @@ void sha384_transform (const u64 w0[4], const u64 w1[4], const u64 w2[4], const
ROUND384_STEP (0);
#pragma unroll
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND384_EXPAND (); ROUND384_STEP (i);
@ -352,7 +352,7 @@ void sha512_transform (const u64 w0[4], const u64 w1[4], const u64 w2[4], const
ROUND512_STEP (0);
#pragma unroll
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND512_EXPAND (); ROUND512_STEP (i);

@ -114,12 +114,7 @@ void sha512_transform (const u64 w[16], u64 dgst[8])
ROUND_STEP (0);
#ifdef IS_AMD
// #pragma unroll
// breaks compiler
#else
#pragma unroll
#endif
//#pragma unroll
for (int i = 16; i < 80; i += 16)
{
ROUND_EXPAND (); ROUND_STEP (i);

Loading…
Cancel
Save