Browse Source

unified code for generating nonce in kernel and moved addition of base to the end -> faster

nfactor-troky
Philip Kaufmann 13 years ago
parent
commit
d7d0797969
  1. 10
      diakgcn120223.cl

10
diakgcn120223.cl

@ -53,14 +53,10 @@ __kernel
u V[8]; u V[8];
u W[16]; u W[16];
#ifdef VECTORS8 #if defined(VECTORS2) || defined(VECTORS4) || defined(VECTORS8)
const u nonce = base + (uint)(get_local_id(0)) * 8u + (uint)(get_group_id(0)) * (WORKVEC); const u nonce = (uint)(get_local_id(0)) * (uint)(vec_step(u)) + (uint)(get_group_id(0)) * (uint)(WORKVEC) + base;
#elif VECTORS4
const u nonce = base + (uint)(get_local_id(0)) * 4u + (uint)(get_group_id(0)) * (WORKVEC);
#elif defined VECTORS2
const u nonce = base + (uint)(get_local_id(0)) * 2u + (uint)(get_group_id(0)) * (WORKVEC);
#else #else
const u nonce = base + get_local_id(0) + get_group_id(0) * (WORKSIZE); const u nonce = (uint)(get_local_id(0)) + (uint)(get_group_id(0)) * (uint)(WORKSIZE) + base;
#endif #endif
V[0] = PreVal0 + nonce; V[0] = PreVal0 + nonce;

Loading…
Cancel
Save