/* * Copyright 2011-2012 Con Kolivas * Copyright 2011-2012 Luke Dashjr * Copyright 2010 Jeff Garzik * * This program is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License as published by the Free * Software Foundation; either version 2 of the License, or (at your option) * any later version. See COPYING for more details. */ #include "config.h" #include #include #include #include #include #include #include #include #include #ifndef WIN32 #include #endif #include #include "compat.h" #include "miner.h" #include "bench_block.h" #include "device-cpu.h" #if defined(unix) #include #include #endif #ifdef __linux /* Linux specific policy and affinity management */ #include static inline void drop_policy(void) { struct sched_param param; #ifdef SCHED_BATCH #ifdef SCHED_IDLE if (unlikely(sched_setscheduler(0, SCHED_IDLE, ¶m) == -1)) #endif sched_setscheduler(0, SCHED_BATCH, ¶m); #endif } static inline void affine_to_cpu(int id, int cpu) { cpu_set_t set; CPU_ZERO(&set); CPU_SET(cpu, &set); sched_setaffinity(0, sizeof(&set), &set); applog(LOG_INFO, "Binding cpu mining thread %d to cpu %d", id, cpu); } #else static inline void drop_policy(void) { } static inline void affine_to_cpu(int id, int cpu) { } #endif /* TODO: resolve externals */ extern bool submit_work_sync(struct thr_info *thr, const struct work *work_in); extern char *set_int_range(const char *arg, int *i, int min, int max); extern int dev_from_id(int thr_id); #ifdef WANT_CPUMINE static size_t max_name_len = 0; static char *name_spaces_pad = NULL; const char *algo_names[] = { [ALGO_C] = "c", #ifdef WANT_SSE2_4WAY [ALGO_4WAY] = "4way", #endif #ifdef WANT_VIA_PADLOCK [ALGO_VIA] = "via", #endif [ALGO_CRYPTOPP] = "cryptopp", #ifdef WANT_CRYPTOPP_ASM32 [ALGO_CRYPTOPP_ASM32] = "cryptopp_asm32", #endif #ifdef WANT_X8632_SSE2 [ALGO_SSE2_32] = "sse2_32", #endif #ifdef WANT_X8664_SSE2 [ALGO_SSE2_64] = "sse2_64", #endif #ifdef WANT_X8664_SSE4 [ALGO_SSE4_64] = "sse4_64", #endif #ifdef WANT_ALTIVEC_4WAY [ALGO_ALTIVEC_4WAY] = "altivec_4way", #endif }; static const sha256_func sha256_funcs[] = { [ALGO_C] = (sha256_func)scanhash_c, #ifdef WANT_SSE2_4WAY [ALGO_4WAY] = (sha256_func)ScanHash_4WaySSE2, #endif #ifdef WANT_ALTIVEC_4WAY [ALGO_ALTIVEC_4WAY] = (sha256_func) ScanHash_altivec_4way, #endif #ifdef WANT_VIA_PADLOCK [ALGO_VIA] = (sha256_func)scanhash_via, #endif [ALGO_CRYPTOPP] = (sha256_func)scanhash_cryptopp, #ifdef WANT_CRYPTOPP_ASM32 [ALGO_CRYPTOPP_ASM32] = (sha256_func)scanhash_asm32, #endif #ifdef WANT_X8632_SSE2 [ALGO_SSE2_32] = (sha256_func)scanhash_sse2_32, #endif #ifdef WANT_X8664_SSE2 [ALGO_SSE2_64] = (sha256_func)scanhash_sse2_64, #endif #ifdef WANT_X8664_SSE4 [ALGO_SSE4_64] = (sha256_func)scanhash_sse4_64 #endif }; #endif #ifdef WANT_CPUMINE #if defined(WANT_X8664_SSE2) && defined(__SSE2__) enum sha256_algos opt_algo = ALGO_SSE2_64; #elif defined(WANT_X8632_SSE2) && defined(__SSE2__) enum sha256_algos opt_algo = ALGO_SSE2_32; #else enum sha256_algos opt_algo = ALGO_C; #endif bool opt_usecpu = false; static int cpur_thr_id; static bool forced_n_threads; #endif #ifdef WANT_CPUMINE // Algo benchmark, crash-prone, system independent stage double bench_algo_stage3( enum sha256_algos algo ) { // Use a random work block pulled from a pool static uint8_t bench_block[] = { CGMINER_BENCHMARK_BLOCK }; struct work work __attribute__((aligned(128))); size_t bench_size = sizeof(work); size_t work_size = sizeof(bench_block); size_t min_size = (work_size < bench_size ? work_size : bench_size); memset(&work, 0, sizeof(work)); memcpy(&work, &bench_block, min_size); struct work_restart dummy; work_restart = &dummy; struct timeval end; struct timeval start; uint32_t max_nonce = (1<<22); uint32_t last_nonce = 0; gettimeofday(&start, 0); { sha256_func func = sha256_funcs[algo]; (*func)( 0, work.midstate, work.data, work.hash1, work.hash, work.target, max_nonce, &last_nonce, work.blk.nonce ); } gettimeofday(&end, 0); work_restart = NULL; uint64_t usec_end = ((uint64_t)end.tv_sec)*1000*1000 + end.tv_usec; uint64_t usec_start = ((uint64_t)start.tv_sec)*1000*1000 + start.tv_usec; uint64_t usec_elapsed = usec_end - usec_start; double rate = -1.0; if (0 MAX_DEVICES) opt_n_threads = MAX_DEVICES - total_devices; cpus = calloc(opt_n_threads, sizeof(struct cgpu_info)); if (unlikely(!cpus)) quit(1, "Failed to calloc cpus"); for (i = 0; i < opt_n_threads; ++i) { struct cgpu_info *cgpu; cgpu = devices[total_devices + i] = &cpus[i]; cgpu->api = &cpu_api; cgpu->enabled = true; cgpu->device_id = i; cgpu->threads = 1; } total_devices += opt_n_threads; } static void reinit_cpu_device(struct cgpu_info *cpu) { tq_push(thr_info[cpur_thr_id].q, cpu); } static bool cpu_thread_prepare(struct thr_info *thr) { thread_reportin(thr); return true; } static uint64_t cpu_can_limit_work(struct thr_info *thr) { return 0xfffff; } static bool cpu_thread_init(struct thr_info *thr) { const int thr_id = thr->id; /* Set worker threads to nice 19 and then preferentially to SCHED_IDLE * and if that fails, then SCHED_BATCH. No need for this to be an * error if it fails */ setpriority(PRIO_PROCESS, 0, 19); drop_policy(); /* Cpu affinity only makes sense if the number of threads is a multiple * of the number of CPUs */ if (!(opt_n_threads % num_processors)) affine_to_cpu(dev_from_id(thr_id), dev_from_id(thr_id) % num_processors); return true; } static uint64_t cpu_scanhash(struct thr_info *thr, struct work *work, uint64_t max_nonce) { const int thr_id = thr->id; uint32_t first_nonce = work->blk.nonce; uint32_t last_nonce; bool rc; CPUSearch: last_nonce = first_nonce; rc = false; /* scan nonces for a proof-of-work hash */ { sha256_func func = sha256_funcs[opt_algo]; rc = (*func)( thr_id, work->midstate, work->data, work->hash1, work->hash, work->target, max_nonce, &last_nonce, work->blk.nonce ); } /* if nonce found, submit work */ if (unlikely(rc)) { if (opt_debug) applog(LOG_DEBUG, "CPU %d found something?", dev_from_id(thr_id)); if (unlikely(!submit_work_sync(thr, work))) { applog(LOG_ERR, "Failed to submit_work_sync in miner_thread %d", thr_id); } work->blk.nonce = last_nonce + 1; goto CPUSearch; } else if (unlikely(last_nonce == first_nonce)) return 0; work->blk.nonce = last_nonce + 1; return last_nonce - first_nonce + 1; } struct device_api cpu_api = { .name = "CPU", .api_detect = cpu_detect, .reinit_device = reinit_cpu_device, .thread_prepare = cpu_thread_prepare, .can_limit_work = cpu_can_limit_work, .thread_init = cpu_thread_init, .scanhash = cpu_scanhash, }; #endif