49a73971c4
seems to resolve solo mining lock on share. export also computed solo work diff in api (not perfect) In high rate algos, throughput should be unsigned... This fixes keccak, blake and doom problems And change terminal color of debug lines, to be selectable in putty, color code is not supported in windows but selection is ok there.
98 lines
2.5 KiB
Plaintext
98 lines
2.5 KiB
Plaintext
/*
|
|
* qubit algorithm
|
|
*
|
|
*/
|
|
extern "C" {
|
|
#include "sph/sph_luffa.h"
|
|
}
|
|
|
|
#include "miner.h"
|
|
|
|
#include "cuda_helper.h"
|
|
|
|
static uint32_t *d_hash[8];
|
|
|
|
extern void qubit_luffa512_cpu_init(int thr_id, int threads);
|
|
extern void qubit_luffa512_cpu_setBlock_80(void *pdata);
|
|
extern void qubit_luffa512_cpu_hash_80(int thr_id, int threads, uint32_t startNounce, uint32_t *d_hash, int order);
|
|
extern void qubit_luffa512_cpufinal_setBlock_80(void *pdata, const void *ptarget);
|
|
extern uint32_t qubit_luffa512_cpu_finalhash_80(int thr_id, int threads, uint32_t startNounce, uint32_t *d_hash, int order);
|
|
|
|
extern void doomhash(void *state, const void *input)
|
|
{
|
|
// luffa512
|
|
sph_luffa512_context ctx_luffa;
|
|
|
|
uint8_t hash[64];
|
|
|
|
sph_luffa512_init(&ctx_luffa);
|
|
sph_luffa512 (&ctx_luffa, input, 80);
|
|
sph_luffa512_close(&ctx_luffa, (void*) hash);
|
|
|
|
memcpy(state, hash, 32);
|
|
}
|
|
|
|
static bool init[8] = { 0 };
|
|
|
|
extern "C" int scanhash_doom(int thr_id, uint32_t *pdata,
|
|
const uint32_t *ptarget, uint32_t max_nonce,
|
|
unsigned long *hashes_done)
|
|
{
|
|
const uint32_t first_nonce = pdata[19];
|
|
uint32_t endiandata[20];
|
|
uint32_t throughput = opt_work_size ? opt_work_size : (1 << 22); // 256*256*8*8
|
|
throughput = min(throughput, (max_nonce - first_nonce));
|
|
|
|
if (opt_benchmark)
|
|
((uint32_t*)ptarget)[7] = 0x0000f;
|
|
|
|
if (!init[thr_id])
|
|
{
|
|
cudaSetDevice(device_map[thr_id]);
|
|
|
|
CUDA_SAFE_CALL(cudaMalloc(&d_hash[thr_id], 16 * sizeof(uint32_t) * throughput));
|
|
|
|
qubit_luffa512_cpu_init(thr_id, (int) throughput);
|
|
|
|
init[thr_id] = true;
|
|
}
|
|
|
|
for (int k=0; k < 20; k++)
|
|
be32enc(&endiandata[k], ((uint32_t*)pdata)[k]);
|
|
|
|
qubit_luffa512_cpufinal_setBlock_80((void*)endiandata,ptarget);
|
|
|
|
do {
|
|
int order = 0;
|
|
|
|
uint32_t foundNonce = qubit_luffa512_cpu_finalhash_80(thr_id, (int) throughput, pdata[19], d_hash[thr_id], order++);
|
|
if (foundNonce != UINT32_MAX)
|
|
{
|
|
const uint32_t Htarg = ptarget[7];
|
|
uint32_t vhash64[8];
|
|
be32enc(&endiandata[19], foundNonce);
|
|
doomhash(vhash64, endiandata);
|
|
|
|
if (vhash64[7] <= Htarg && fulltest(vhash64, ptarget)) {
|
|
*hashes_done = min(max_nonce - first_nonce, (uint64_t) pdata[19] - first_nonce + throughput);
|
|
pdata[19] = foundNonce;
|
|
return 1;
|
|
}
|
|
else {
|
|
applog(LOG_INFO, "GPU #%d: result for nonce $%08X does not validate on CPU!", thr_id, foundNonce);
|
|
}
|
|
}
|
|
|
|
if ((uint64_t) pdata[19] + throughput > max_nonce) {
|
|
// pdata[19] = max_nonce;
|
|
break;
|
|
}
|
|
|
|
pdata[19] += throughput;
|
|
|
|
} while (!work_restart[thr_id].restart);
|
|
|
|
*hashes_done = pdata[19] - first_nonce + 1;
|
|
return 0;
|
|
}
|