Browse Source

reset: take care of multi-threaded gpus (-d 0,0)

to be tested... could create problems when reset in a chain like x11...
2upstream
Tanguy Pruvot 10 years ago
parent
commit
1ad34dc13d
  1. 4
      ccminer.cpp
  2. 18
      cuda.cpp
  3. 1
      cuda_helper.h
  4. 1
      skein.cu
  5. 7
      skein2.cu
  6. 3
      zr5.cu

4
ccminer.cpp

@ -58,7 +58,7 @@ BOOL WINAPI ConsoleHandler(DWORD); @@ -58,7 +58,7 @@ BOOL WINAPI ConsoleHandler(DWORD);
// from cuda.cpp
int cuda_num_devices();
void cuda_devicenames();
void cuda_devicereset();
void cuda_shutdown();
int cuda_finddevice(char *name);
void cuda_print_devices();
@ -485,7 +485,7 @@ void proper_exit(int reason) @@ -485,7 +485,7 @@ void proper_exit(int reason)
{
abort_flag = true;
usleep(200 * 1000);
cuda_devicereset();
cuda_shutdown();
if (reason == EXIT_CODE_OK && app_exit_code != EXIT_CODE_OK) {
reason = app_exit_code;

18
cuda.cpp

@ -82,9 +82,9 @@ void cuda_print_devices() @@ -82,9 +82,9 @@ void cuda_print_devices()
}
}
// Can't be called directly in cpu-miner.c
void cuda_devicereset()
void cuda_shutdown()
{
cudaDeviceSynchronize();
cudaDeviceReset();
}
@ -173,6 +173,20 @@ int cuda_gpu_clocks(struct cgpu_info *gpu) @@ -173,6 +173,20 @@ int cuda_gpu_clocks(struct cgpu_info *gpu)
return -1;
}
// if we use 2 threads on the same gpu, we need to reinit the threads
void cuda_reset_device(int thr_id, bool *init)
{
int dev_id = device_map[thr_id];
for (int i=0; i < MAX_GPUS; i++) {
if (device_map[i] == dev_id) {
init[i] = false;
}
}
restart_threads();
cudaDeviceSynchronize();
cudaDeviceReset();
}
void cudaReportHardwareFailure(int thr_id, cudaError_t err, const char* func)
{
struct cgpu_info *gpu = &thr_info[thr_id].gpu;

1
cuda_helper.h

@ -24,6 +24,7 @@ extern int cuda_arch[MAX_GPUS]; @@ -24,6 +24,7 @@ extern int cuda_arch[MAX_GPUS];
// common functions
extern int cuda_get_arch(int thr_id);
extern void cuda_reset_device(int thr_id, bool *init);
extern void cuda_check_cpu_init(int thr_id, uint32_t threads);
extern void cuda_check_cpu_setTarget(const void *ptarget);
extern uint32_t cuda_check_hash(int thr_id, uint32_t threads, uint32_t startNounce, uint32_t *d_inputHash);

1
skein.cu

@ -359,7 +359,6 @@ extern "C" int scanhash_skeincoin(int thr_id, uint32_t *pdata, const uint32_t *p @@ -359,7 +359,6 @@ extern "C" int scanhash_skeincoin(int thr_id, uint32_t *pdata, const uint32_t *p
if (!init[thr_id])
{
cudaDeviceReset();
cudaSetDevice(device_map[thr_id]);
cudaMalloc(&d_hash[thr_id], throughput * 64U);

7
skein2.cu

@ -48,15 +48,14 @@ extern "C" int scanhash_skein2(int thr_id, uint32_t *pdata, const uint32_t *ptar @@ -48,15 +48,14 @@ extern "C" int scanhash_skein2(int thr_id, uint32_t *pdata, const uint32_t *ptar
if (!init[thr_id])
{
cudaDeviceReset();
cudaSetDevice(device_map[thr_id]);
cudaMalloc(&d_hash[thr_id], throughput * 64U);
quark_skein512_cpu_init(thr_id, throughput);
cuda_check_cpu_init(thr_id, throughput);
quark_skein512_cpu_init(thr_id, throughput);
cuda_check_cpu_init(thr_id, throughput);
CUDA_SAFE_CALL(cudaDeviceSynchronize());
CUDA_SAFE_CALL(cudaDeviceSynchronize());
init[thr_id] = true;
}

3
zr5.cu

@ -302,7 +302,6 @@ extern "C" int scanhash_zr5(int thr_id, uint32_t *pdata, const uint32_t *ptarget @@ -302,7 +302,6 @@ extern "C" int scanhash_zr5(int thr_id, uint32_t *pdata, const uint32_t *ptarget
if (!init[thr_id])
{
cudaDeviceReset();
cudaSetDevice(device_map[thr_id]);
// constants
@ -408,7 +407,7 @@ extern "C" int scanhash_zr5(int thr_id, uint32_t *pdata, const uint32_t *ptarget @@ -408,7 +407,7 @@ extern "C" int scanhash_zr5(int thr_id, uint32_t *pdata, const uint32_t *ptarget
applog(LOG_WARNING, "GPU #%d: result for %08x does not validate on CPU!", device_map[thr_id], foundNonce);
// reinit the card..
init[thr_id] = false;
cuda_reset_device(thr_id, init);
pdata[19]++;
pdata[0] = oldp0;

Loading…
Cancel
Save