mirror of
https://github.com/GOSTSec/ccminer
synced 2025-01-24 13:34:19 +00:00
intensity: do not reduce throughput before init
Else the memory allocated could be less than required later btw, use the new "cuda" function to apply intensity/throughput
This commit is contained in:
parent
c6dcc5e5cf
commit
d195f2e8a2
@ -389,7 +389,7 @@ extern "C" int scanhash_blake256(int thr_id, struct work* work, uint32_t max_non
|
|||||||
uint64_t targetHigh = ((uint64_t*)ptarget)[3];
|
uint64_t targetHigh = ((uint64_t*)ptarget)[3];
|
||||||
int intensity = (device_sm[device_map[thr_id]] > 500) ? 22 : 20;
|
int intensity = (device_sm[device_map[thr_id]] > 500) ? 22 : 20;
|
||||||
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
int rc = 0;
|
int rc = 0;
|
||||||
|
|
||||||
|
@ -45,8 +45,8 @@ extern "C" int scanhash_bmw(int thr_id, struct work* work, uint32_t max_nonce, u
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
bool swapnonce = true;
|
bool swapnonce = true;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 21);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 21);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x0005;
|
ptarget[7] = 0x0005;
|
||||||
|
@ -42,8 +42,8 @@ extern "C" int scanhash_keccak256(int thr_id, struct work* work, uint32_t max_no
|
|||||||
uint32_t *pdata = work->data;
|
uint32_t *pdata = work->data;
|
||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 21); // 256*256*8*4
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 21); // 256*256*8*4
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x00ff;
|
ptarget[7] = 0x00ff;
|
||||||
|
@ -96,8 +96,8 @@ extern "C" int scanhash_jackpot(int thr_id, struct work *work, uint32_t max_nonc
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 20);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 20);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x000f;
|
((uint32_t*)ptarget)[7] = 0x000f;
|
||||||
|
@ -29,6 +29,10 @@ void bench_init(int threads)
|
|||||||
applog(LOG_BLUE, "Starting benchmark mode with %s", algo_names[opt_algo]);
|
applog(LOG_BLUE, "Starting benchmark mode with %s", algo_names[opt_algo]);
|
||||||
pthread_barrier_init(&miner_barr, NULL, threads);
|
pthread_barrier_init(&miner_barr, NULL, threads);
|
||||||
pthread_barrier_init(&algo_barr, NULL, threads);
|
pthread_barrier_init(&algo_barr, NULL, threads);
|
||||||
|
// required for usage of first algo.
|
||||||
|
for (int n=0; n < opt_n_threads; n++) {
|
||||||
|
device_mem_free[n] = cuda_available_memory(n);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
void bench_free()
|
void bench_free()
|
||||||
|
@ -75,8 +75,8 @@ extern "C" int scanhash_nist5(int thr_id, struct work *work, uint32_t max_nonce,
|
|||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int res = 0;
|
int res = 0;
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << 20); // 256*256*16
|
uint32_t throughput = cuda_default_throughput(thr_id, 1 << 20); // 256*256*16
|
||||||
throughput = min(throughput, (max_nonce - first_nonce));
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x00FF;
|
((uint32_t*)ptarget)[7] = 0x00FF;
|
||||||
|
@ -38,8 +38,8 @@ int scanhash_fugue256(int thr_id, struct work* work, uint32_t max_nonce, unsigne
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
uint32_t start_nonce = pdata[19]++;
|
uint32_t start_nonce = pdata[19]++;
|
||||||
int intensity = (device_sm[device_map[thr_id]] > 500) ? 22 : 19;
|
int intensity = (device_sm[device_map[thr_id]] > 500) ? 22 : 19;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << intensity); // 256*256*8
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity); // 256*256*8
|
||||||
throughput = min(throughput, max_nonce - start_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - start_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0xf;
|
((uint32_t*)ptarget)[7] = 0xf;
|
||||||
@ -113,4 +113,4 @@ void free_fugue256(int thr_id)
|
|||||||
init[thr_id] = false;
|
init[thr_id] = false;
|
||||||
|
|
||||||
cudaDeviceSynchronize();
|
cudaDeviceSynchronize();
|
||||||
}
|
}
|
||||||
|
@ -33,8 +33,8 @@ int scanhash_groestlcoin(int thr_id, struct work *work, uint32_t max_nonce, unsi
|
|||||||
uint32_t *pdata = work->data;
|
uint32_t *pdata = work->data;
|
||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
uint32_t start_nonce = pdata[19];
|
uint32_t start_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << 19); // 256*256*8
|
uint32_t throughput = cuda_default_throughput(thr_id, 1 << 19); // 256*256*8
|
||||||
throughput = min(throughput, max_nonce - start_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - start_nonce);
|
||||||
|
|
||||||
uint32_t *outputHash = (uint32_t*)malloc(throughput * 64);
|
uint32_t *outputHash = (uint32_t*)malloc(throughput * 64);
|
||||||
|
|
||||||
@ -103,4 +103,4 @@ void free_groestlcoin(int thr_id)
|
|||||||
init[thr_id] = false;
|
init[thr_id] = false;
|
||||||
|
|
||||||
cudaDeviceSynchronize();
|
cudaDeviceSynchronize();
|
||||||
}
|
}
|
||||||
|
@ -136,8 +136,8 @@ int scanhash_heavy(int thr_id, struct work *work, uint32_t max_nonce, unsigned l
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
// CUDA will process thousands of threads.
|
// CUDA will process thousands of threads.
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, (1U << 19) - 256);
|
uint32_t throughput = cuda_default_throughput(thr_id, (1U << 19) - 256);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
int rc = 0;
|
int rc = 0;
|
||||||
uint32_t *hash = NULL;
|
uint32_t *hash = NULL;
|
||||||
|
@ -85,8 +85,8 @@ extern "C" int scanhash_lyra2(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int intensity = (device_sm[device_map[thr_id]] >= 500 && !is_windows()) ? 18 : 17;
|
int intensity = (device_sm[device_map[thr_id]] >= 500 && !is_windows()) ? 18 : 17;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << intensity); // 18=256*256*4;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity); // 18=256*256*4;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x00ff;
|
ptarget[7] = 0x00ff;
|
||||||
|
@ -82,8 +82,8 @@ extern "C" int scanhash_lyra2v2(int thr_id, struct work* work, uint32_t max_nonc
|
|||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int dev_id = device_map[thr_id];
|
int dev_id = device_map[thr_id];
|
||||||
int intensity = (device_sm[dev_id] > 500 && !is_windows()) ? 20 : 18;
|
int intensity = (device_sm[dev_id] > 500 && !is_windows()) ? 20 : 18;
|
||||||
unsigned int defthr = 1U << intensity;
|
uint32_t throughput = cuda_default_throughput(dev_id, 1U << intensity);
|
||||||
uint32_t throughput = device_intensity(dev_id, __func__, defthr);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x00ff;
|
ptarget[7] = 0x00ff;
|
||||||
|
@ -37,8 +37,8 @@ int scanhash_myriad(int thr_id, struct work *work, uint32_t max_nonce, unsigned
|
|||||||
uint32_t *pdata = work->data;
|
uint32_t *pdata = work->data;
|
||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
uint32_t start_nonce = pdata[19];
|
uint32_t start_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << 17);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 17);
|
||||||
throughput = min(throughput, max_nonce - start_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - start_nonce);
|
||||||
|
|
||||||
uint32_t *outputHash = (uint32_t*)malloc(throughput * 64);
|
uint32_t *outputHash = (uint32_t*)malloc(throughput * 64);
|
||||||
|
|
||||||
@ -108,4 +108,4 @@ void free_myriad(int thr_id)
|
|||||||
init[thr_id] = false;
|
init[thr_id] = false;
|
||||||
|
|
||||||
cudaDeviceSynchronize();
|
cudaDeviceSynchronize();
|
||||||
}
|
}
|
||||||
|
@ -18,9 +18,9 @@ int scanhash_neoscrypt(int thr_id, struct work* work, uint32_t max_nonce, unsign
|
|||||||
|
|
||||||
int dev_id = device_map[thr_id];
|
int dev_id = device_map[thr_id];
|
||||||
int intensity = is_windows() ? 18 : 19;
|
int intensity = is_windows() ? 18 : 19;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << intensity);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity);
|
||||||
throughput = throughput / 32; /* set for max intensity ~= 20 */
|
throughput = throughput / 32; /* set for max intensity ~= 20 */
|
||||||
throughput = min(throughput, max_nonce - first_nonce + 1);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce + 1);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x00ff;
|
ptarget[7] = 0x00ff;
|
||||||
|
@ -371,8 +371,8 @@ extern "C" int scanhash_pentablake(int thr_id, struct work *work, uint32_t max_n
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int rc = 0;
|
int rc = 0;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 128U * 2560); // 18.5
|
uint32_t throughput = cuda_default_throughput(thr_id, 128U * 2560); // 18.5
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x000F;
|
((uint32_t*)ptarget)[7] = 0x000F;
|
||||||
|
@ -141,8 +141,8 @@ extern "C" int scanhash_quark(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << 20); // 256*4096
|
uint32_t throughput = cuda_default_throughput(thr_id, 1 << 20); // 256*4096
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x00F;
|
((uint32_t*)ptarget)[7] = 0x00F;
|
||||||
|
@ -58,8 +58,8 @@ extern "C" int scanhash_deep(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
uint32_t *pdata = work->data;
|
uint32_t *pdata = work->data;
|
||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 19); // 256*256*8
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 256*256*8
|
||||||
throughput = min(throughput, (max_nonce - first_nonce));
|
if (init[thr_id]) throughput = min(throughput, (max_nonce - first_nonce));
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x0000f;
|
((uint32_t*)ptarget)[7] = 0x0000f;
|
||||||
@ -143,4 +143,4 @@ extern "C" void free_deep(int thr_id)
|
|||||||
init[thr_id] = false;
|
init[thr_id] = false;
|
||||||
|
|
||||||
cudaDeviceSynchronize();
|
cudaDeviceSynchronize();
|
||||||
}
|
}
|
||||||
|
@ -36,8 +36,8 @@ extern "C" int scanhash_luffa(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
uint32_t *pdata = work->data;
|
uint32_t *pdata = work->data;
|
||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 22); // 256*256*8*8
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 22); // 256*256*8*8
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x0000f;
|
((uint32_t*)ptarget)[7] = 0x0000f;
|
||||||
|
@ -77,8 +77,8 @@ extern "C" int scanhash_qubit(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
uint32_t *pdata = work->data;
|
uint32_t *pdata = work->data;
|
||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 19); // 256*256*8
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 256*256*8
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x0000ff;
|
((uint32_t*)ptarget)[7] = 0x0000ff;
|
||||||
|
4
skein.cu
4
skein.cu
@ -360,8 +360,8 @@ extern "C" int scanhash_skeincoin(int thr_id, struct work* work, uint32_t max_no
|
|||||||
sm5 = (device_sm[device_map[thr_id]] >= 500);
|
sm5 = (device_sm[device_map[thr_id]] >= 500);
|
||||||
bool checkSecnonce = (have_stratum || have_longpoll) && !sm5;
|
bool checkSecnonce = (have_stratum || have_longpoll) && !sm5;
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 20);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 20);
|
||||||
throughput = min(throughput, (max_nonce - first_nonce));
|
if (init[thr_id]) throughput = min(throughput, (max_nonce - first_nonce));
|
||||||
|
|
||||||
uint32_t foundNonce, secNonce = 0;
|
uint32_t foundNonce, secNonce = 0;
|
||||||
uint64_t target64 = 0;
|
uint64_t target64 = 0;
|
||||||
|
@ -44,8 +44,8 @@ int scanhash_skein2(int thr_id, struct work* work, uint32_t max_nonce, unsigned
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << 19); // 256*256*8
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 256*256*8
|
||||||
throughput = min(throughput, (max_nonce - first_nonce));
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0;
|
((uint32_t*)ptarget)[7] = 0;
|
||||||
|
@ -147,8 +147,8 @@ extern "C" int scanhash_c11(int thr_id, struct work* work, uint32_t max_nonce, u
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int intensity = (device_sm[device_map[thr_id]] >= 500 && !is_windows()) ? 20 : 19;
|
int intensity = (device_sm[device_map[thr_id]] >= 500 && !is_windows()) ? 20 : 19;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << intensity); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x5;
|
((uint32_t*)ptarget)[7] = 0x5;
|
||||||
|
@ -74,8 +74,8 @@ extern "C" int scanhash_fresh(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t endiandata[20];
|
uint32_t endiandata[20];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << 19);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1 << 19);
|
||||||
throughput = min(throughput, (max_nonce - first_nonce));
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x00ff;
|
((uint32_t*)ptarget)[7] = 0x00ff;
|
||||||
@ -170,4 +170,4 @@ extern "C" void free_fresh(int thr_id)
|
|||||||
init[thr_id] = false;
|
init[thr_id] = false;
|
||||||
|
|
||||||
cudaDeviceSynchronize();
|
cudaDeviceSynchronize();
|
||||||
}
|
}
|
||||||
|
@ -63,8 +63,8 @@ extern "C" int scanhash_s3(int thr_id, struct work* work, uint32_t max_nonce, un
|
|||||||
// reduce by one the intensity on windows
|
// reduce by one the intensity on windows
|
||||||
intensity--;
|
intensity--;
|
||||||
#endif
|
#endif
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << intensity);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1 << intensity);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0xF;
|
((uint32_t*)ptarget)[7] = 0xF;
|
||||||
|
@ -146,8 +146,8 @@ extern "C" int scanhash_x11(int thr_id, struct work* work, uint32_t max_nonce, u
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int intensity = (device_sm[device_map[thr_id]] >= 500 && !is_windows()) ? 20 : 19;
|
int intensity = (device_sm[device_map[thr_id]] >= 500 && !is_windows()) ? 20 : 19;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << intensity); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x5;
|
((uint32_t*)ptarget)[7] = 0x5;
|
||||||
|
@ -150,8 +150,8 @@ extern "C" int scanhash_x13(int thr_id, struct work* work, uint32_t max_nonce, u
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
int intensity = 19; // (device_sm[device_map[thr_id]] > 500 && !is_windows()) ? 20 : 19;
|
int intensity = 19; // (device_sm[device_map[thr_id]] > 500 && !is_windows()) ? 20 : 19;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1 << intensity); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1 << intensity); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x000f;
|
((uint32_t*)ptarget)[7] = 0x000f;
|
||||||
|
@ -58,8 +58,8 @@ extern "C" int scanhash_whirl(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
uint32_t* ptarget = work->target;
|
uint32_t* ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 19); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x0000ff;
|
((uint32_t*)ptarget)[7] = 0x0000ff;
|
||||||
|
@ -45,8 +45,8 @@ extern "C" int scanhash_whirlx(int thr_id, struct work* work, uint32_t max_nonc
|
|||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t endiandata[20];
|
uint32_t endiandata[20];
|
||||||
int intensity = is_windows() ? 20 : 22;
|
int intensity = is_windows() ? 20 : 22;
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << intensity);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << intensity);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x0000ff;
|
((uint32_t*)ptarget)[7] = 0x0000ff;
|
||||||
|
@ -164,8 +164,8 @@ extern "C" int scanhash_x14(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t endiandata[20];
|
uint32_t endiandata[20];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 19); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x000f;
|
ptarget[7] = 0x000f;
|
||||||
|
@ -174,8 +174,8 @@ extern "C" int scanhash_x15(int thr_id, struct work* work, uint32_t max_nonce,
|
|||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t endiandata[20];
|
uint32_t endiandata[20];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 19); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x00FF;
|
ptarget[7] = 0x00FF;
|
||||||
|
@ -191,8 +191,8 @@ extern "C" int scanhash_x17(int thr_id, struct work* work, uint32_t max_nonce, u
|
|||||||
uint32_t *ptarget = work->target;
|
uint32_t *ptarget = work->target;
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
|
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 19); // 19=256*256*8;
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 19); // 19=256*256*8;
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
((uint32_t*)ptarget)[7] = 0x00ff;
|
((uint32_t*)ptarget)[7] = 0x00ff;
|
||||||
|
4
zr5.cu
4
zr5.cu
@ -338,9 +338,9 @@ extern "C" int scanhash_zr5(int thr_id, struct work *work,
|
|||||||
const uint32_t oldp0 = pdata[0];
|
const uint32_t oldp0 = pdata[0];
|
||||||
const uint32_t version = (oldp0 & (~POK_DATA_MASK)) | (use_pok ? POK_BOOL_MASK : 0);
|
const uint32_t version = (oldp0 & (~POK_DATA_MASK)) | (use_pok ? POK_BOOL_MASK : 0);
|
||||||
const uint32_t first_nonce = pdata[19];
|
const uint32_t first_nonce = pdata[19];
|
||||||
uint32_t throughput = device_intensity(thr_id, __func__, 1U << 18);
|
uint32_t throughput = cuda_default_throughput(thr_id, 1U << 18);
|
||||||
throughput = min(throughput, (1U << 20)-1024);
|
throughput = min(throughput, (1U << 20)-1024);
|
||||||
throughput = min(throughput, max_nonce - first_nonce);
|
if (init[thr_id]) throughput = min(throughput, max_nonce - first_nonce);
|
||||||
|
|
||||||
if (opt_benchmark)
|
if (opt_benchmark)
|
||||||
ptarget[7] = 0x0000ff;
|
ptarget[7] = 0x0000ff;
|
||||||
|
Loading…
x
Reference in New Issue
Block a user