x11/qubit: remove some extra MyStreamSynchronize
only one per loop is required to prevent 100% cpu usage
This commit is contained in:
parent
163430daae
commit
e7ae27137e
@ -235,8 +235,8 @@ __global__ void quark_blake512_gpu_hash_80(uint32_t threads, uint32_t startNounc
|
|||||||
|
|
||||||
// ---------------------------- END CUDA quark_blake512 functions ------------------------------------
|
// ---------------------------- END CUDA quark_blake512 functions ------------------------------------
|
||||||
|
|
||||||
// Setup-Funktionen
|
__host__
|
||||||
__host__ void quark_blake512_cpu_init(int thr_id, uint32_t threads)
|
void quark_blake512_cpu_init(int thr_id, uint32_t threads)
|
||||||
{
|
{
|
||||||
// Kopiere die Hash-Tabellen in den GPU-Speicher
|
// Kopiere die Hash-Tabellen in den GPU-Speicher
|
||||||
CUDA_CALL_OR_RET( cudaMemcpyToSymbol(c_sigma,
|
CUDA_CALL_OR_RET( cudaMemcpyToSymbol(c_sigma,
|
||||||
@ -246,7 +246,8 @@ __host__ void quark_blake512_cpu_init(int thr_id, uint32_t threads)
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Blake512 für 80 Byte grosse Eingangsdaten
|
// Blake512 für 80 Byte grosse Eingangsdaten
|
||||||
__host__ void quark_blake512_cpu_setBlock_80(void *pdata)
|
__host__
|
||||||
|
void quark_blake512_cpu_setBlock_80(void *pdata)
|
||||||
{
|
{
|
||||||
// Message mit Padding bereitstellen
|
// Message mit Padding bereitstellen
|
||||||
// lediglich die korrekte Nonce ist noch ab Byte 76 einzusetzen.
|
// lediglich die korrekte Nonce ist noch ab Byte 76 einzusetzen.
|
||||||
@ -263,7 +264,8 @@ __host__ void quark_blake512_cpu_setBlock_80(void *pdata)
|
|||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
__host__ void quark_blake512_cpu_hash_64(int thr_id, uint32_t threads, uint32_t startNounce, uint32_t *d_nonceVector, uint32_t *d_outputHash, int order)
|
__host__
|
||||||
|
void quark_blake512_cpu_hash_64(int thr_id, uint32_t threads, uint32_t startNounce, uint32_t *d_nonceVector, uint32_t *d_outputHash, int order)
|
||||||
{
|
{
|
||||||
const uint32_t threadsperblock = 256;
|
const uint32_t threadsperblock = 256;
|
||||||
|
|
||||||
@ -271,28 +273,19 @@ __host__ void quark_blake512_cpu_hash_64(int thr_id, uint32_t threads, uint32_t
|
|||||||
dim3 grid((threads + threadsperblock-1)/threadsperblock);
|
dim3 grid((threads + threadsperblock-1)/threadsperblock);
|
||||||
dim3 block(threadsperblock);
|
dim3 block(threadsperblock);
|
||||||
|
|
||||||
// Größe des dynamischen Shared Memory Bereichs
|
quark_blake512_gpu_hash_64<<<grid, block>>>(threads, startNounce, d_nonceVector, (uint64_t*)d_outputHash);
|
||||||
size_t shared_size = 0;
|
|
||||||
|
|
||||||
quark_blake512_gpu_hash_64<<<grid, block, shared_size>>>(threads, startNounce, d_nonceVector, (uint64_t*)d_outputHash);
|
|
||||||
|
|
||||||
// Strategisches Sleep Kommando zur Senkung der CPU Last
|
// Strategisches Sleep Kommando zur Senkung der CPU Last
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
//MyStreamSynchronize(NULL, order, thr_id);
|
||||||
}
|
}
|
||||||
|
|
||||||
__host__ void quark_blake512_cpu_hash_80(int thr_id, uint32_t threads, uint32_t startNounce, uint32_t *d_outputHash, int order)
|
__host__
|
||||||
|
void quark_blake512_cpu_hash_80(int thr_id, uint32_t threads, uint32_t startNounce, uint32_t *d_outputHash, int order)
|
||||||
{
|
{
|
||||||
const uint32_t threadsperblock = 256;
|
const uint32_t threadsperblock = 256;
|
||||||
|
|
||||||
// berechne wie viele Thread Blocks wir brauchen
|
|
||||||
dim3 grid((threads + threadsperblock-1)/threadsperblock);
|
dim3 grid((threads + threadsperblock-1)/threadsperblock);
|
||||||
dim3 block(threadsperblock);
|
dim3 block(threadsperblock);
|
||||||
|
|
||||||
// Größe des dynamischen Shared Memory Bereichs
|
quark_blake512_gpu_hash_80<<<grid, block>>>(threads, startNounce, d_outputHash);
|
||||||
size_t shared_size = 0;
|
|
||||||
|
|
||||||
quark_blake512_gpu_hash_80<<<grid, block, shared_size>>>(threads, startNounce, d_outputHash);
|
|
||||||
|
|
||||||
// Strategisches Sleep Kommando zur Senkung der CPU Last
|
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
|
||||||
}
|
}
|
||||||
|
@ -487,7 +487,6 @@ void qubit_luffa512_cpu_hash_80(int thr_id, uint32_t threads, uint32_t startNoun
|
|||||||
size_t shared_size = 0;
|
size_t shared_size = 0;
|
||||||
|
|
||||||
qubit_luffa512_gpu_hash_80 <<<grid, block, shared_size>>> (threads, startNounce, d_outputHash);
|
qubit_luffa512_gpu_hash_80 <<<grid, block, shared_size>>> (threads, startNounce, d_outputHash);
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
__host__
|
__host__
|
||||||
|
@ -306,6 +306,6 @@ void x11_cubehash512_cpu_hash_64(int thr_id, uint32_t threads, uint32_t startNou
|
|||||||
size_t shared_size = 0;
|
size_t shared_size = 0;
|
||||||
|
|
||||||
x11_cubehash512_gpu_hash_64<<<grid, block, shared_size>>>(threads, startNounce, (uint64_t*)d_hash, d_nonceVector);
|
x11_cubehash512_gpu_hash_64<<<grid, block, shared_size>>>(threads, startNounce, (uint64_t*)d_hash, d_nonceVector);
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
//MyStreamSynchronize(NULL, order, thr_id);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -1442,7 +1442,7 @@ void x11_shavite512_cpu_hash_64(int thr_id, uint32_t threads, uint32_t startNoun
|
|||||||
dim3 block(threadsperblock);
|
dim3 block(threadsperblock);
|
||||||
|
|
||||||
x11_shavite512_gpu_hash_64<<<grid, block>>>(threads, startNounce, (uint64_t*)d_hash, d_nonceVector);
|
x11_shavite512_gpu_hash_64<<<grid, block>>>(threads, startNounce, (uint64_t*)d_hash, d_nonceVector);
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
//MyStreamSynchronize(NULL, order, thr_id);
|
||||||
}
|
}
|
||||||
|
|
||||||
__host__
|
__host__
|
||||||
@ -1454,7 +1454,6 @@ void x11_shavite512_cpu_hash_80(int thr_id, uint32_t threads, uint32_t startNoun
|
|||||||
dim3 block(threadsperblock);
|
dim3 block(threadsperblock);
|
||||||
|
|
||||||
x11_shavite512_gpu_hash_80<<<grid, block>>>(threads, startNounce, d_outputHash);
|
x11_shavite512_gpu_hash_80<<<grid, block>>>(threads, startNounce, d_outputHash);
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
__host__
|
__host__
|
||||||
|
@ -697,5 +697,5 @@ void x11_simd512_cpu_hash_64(int thr_id, uint32_t threads, uint32_t startNounce,
|
|||||||
|
|
||||||
x11_simd512_gpu_final_64 <<<grid, block>>> (threads, d_hash, d_temp4[thr_id], d_state[thr_id]);
|
x11_simd512_gpu_final_64 <<<grid, block>>> (threads, d_hash, d_temp4[thr_id], d_state[thr_id]);
|
||||||
|
|
||||||
MyStreamSynchronize(NULL, order, thr_id);
|
//MyStreamSynchronize(NULL, order, thr_id);
|
||||||
}
|
}
|
||||||
|
Loading…
Reference in New Issue
Block a user