/* * Copyright 2013 Andrew Smith * Copyright 2013 Con Kolivas * Copyright 2013 Chris Savery * * This program is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License as published by the Free * Software Foundation; either version 3 of the License, or (at your option) * any later version. See COPYING for more details. */ #include #include #include #include #include #include #include #include #include #include "config.h" #ifdef WIN32 #include #endif #include "compat.h" #include "miner.h" #include "usbutils.h" #define K1 "K1" #define K16 "K16" #define K64 "K64" static const char *msg_detect_send = "DSend"; static const char *msg_detect_reply = "DReply"; static const char *msg_send = "Send"; static const char *msg_reply = "Reply"; #define KLN_CMD_ABORT 'A' #define KLN_CMD_CONFIG 'C' #define KLN_CMD_ENABLE 'E' #define KLN_CMD_IDENT 'I' #define KLN_CMD_NONCE '=' #define KLN_CMD_STATUS 'S' #define KLN_CMD_WORK 'W' #define KLN_CMD_ENABLE_OFF '0' #define KLN_CMD_ENABLE_ON '1' #define MIDSTATE_BYTES 32 #define MERKLE_OFFSET 64 #define MERKLE_BYTES 12 #define REPLY_SIZE 15 // adequate for all types of replies #define MAX_KLINES 1024 // unhandled reply limit #define REPLY_WAIT_TIME 100 // poll interval for a cmd waiting it's reply #define CMD_REPLY_RETRIES 8 // how many retries for cmds #define MAX_WORK_COUNT 4 // for now, must be binary multiple and match firmware #define TACH_FACTOR 87890 // fan rpm divisor #define KLN_KILLWORK_TEMP 53.5 #define KLN_COOLED_DOWN 45.5 /* * Work older than 5s will already be completed * FYI it must not be possible to complete 256 work * items this quickly on a single device - * thus limited to 219.9GH/s per device */ #define OLD_WORK_MS ((int)(5 * 1000)) /* * How many incorrect slave counts to ignore in a row * 2 means it allows random grabage returned twice * Until slaves are implemented, this should never occur * so allowing 2 in a row should ignore random errros */ #define KLN_ISS_IGNORE 2 /* * If the queue status hasn't been updated for this long then do it now * 5GH/s = 859ms per full nonce range */ #define LATE_UPDATE_MS ((int)(2.5 * 1000)) // If 5 late updates in a row, try to reset the device #define LATE_UPDATE_LIMIT 5 // If the reset fails sleep for 1s #define LATE_UPDATE_SLEEP_MS 1000 // However give up after 8s #define LATE_UPDATE_NODEV_MS ((int)(8.0 * 1000)) struct device_drv klondike_drv; typedef struct klondike_header { uint8_t cmd; uint8_t dev; uint8_t buf[REPLY_SIZE-2]; } HEADER; #define K_2(_bytes) ((int)(_bytes[0]) + \ ((int)(_bytes[1]) << 8)) #define K_4(_bytes) ((uint64_t)(_bytes[0]) + \ ((uint64_t)(_bytes[1]) << 8) + \ ((uint64_t)(_bytes[2]) << 16) + \ ((uint64_t)(_bytes[3]) << 24)) #define K_SERIAL(_serial) K_4(_serial) #define K_HASHCOUNT(_hashcount) K_2(_hashcount) #define K_MAXCOUNT(_maxcount) K_2(_maxcount) #define K_NONCE(_nonce) K_4(_nonce) #define K_HASHCLOCK(_hashclock) K_2(_hashclock) #define SET_HASHCLOCK(_hashclock, _value) do { \ (_hashclock)[0] = (uint8_t)((_value) & 0xff); \ (_hashclock)[1] = (uint8_t)(((_value) >> 8) & 0xff); \ } while(0) #define KSENDHD(_add) (sizeof(uint8_t) + sizeof(uint8_t) + _add) typedef struct klondike_id { uint8_t cmd; uint8_t dev; uint8_t version; uint8_t product[7]; uint8_t serial[4]; } IDENTITY; typedef struct klondike_status { uint8_t cmd; uint8_t dev; uint8_t state; uint8_t chipcount; uint8_t slavecount; uint8_t workqc; uint8_t workid; uint8_t temp; uint8_t fanspeed; uint8_t errorcount; uint8_t hashcount[2]; uint8_t maxcount[2]; uint8_t noise; } WORKSTATUS; typedef struct _worktask { uint8_t cmd; uint8_t dev; uint8_t workid; uint8_t midstate[32]; uint8_t merkle[12]; } WORKTASK; typedef struct _workresult { uint8_t cmd; uint8_t dev; uint8_t workid; uint8_t nonce[4]; } WORKRESULT; typedef struct klondike_cfg { uint8_t cmd; uint8_t dev; uint8_t hashclock[2]; uint8_t temptarget; uint8_t tempcritical; uint8_t fantarget; uint8_t pad2; } WORKCFG; typedef struct kline { union { HEADER hd; IDENTITY id; WORKSTATUS ws; WORKTASK wt; WORKRESULT wr; WORKCFG cfg; }; } KLINE; #define zero_kline(_kline) memset((void *)(_kline), 0, sizeof(KLINE)); typedef struct device_info { uint32_t noncecount; uint32_t nextworkid; uint16_t lasthashcount; uint64_t totalhashcount; uint32_t rangesize; uint32_t *chipstats; } DEVINFO; typedef struct klist { struct klist *prev; struct klist *next; KLINE kline; struct timeval tv_when; int block_seq; bool ready; bool working; } KLIST; typedef struct jobque { int workqc; struct timeval last_update; bool overheat; int late_update_count; int late_update_sequential; } JOBQUE; struct klondike_info { pthread_rwlock_t stat_lock; struct thr_info replies_thr; cglock_t klist_lock; KLIST *used; KLIST *free; int kline_count; int used_count; int block_seq; KLIST *status; DEVINFO *devinfo; KLIST *cfg; JOBQUE *jobque; int noncecount; uint64_t hashcount; uint64_t errorcount; uint64_t noisecount; int incorrect_slave_sequential; // us Delay from USB reply to being processed double delay_count; double delay_total; double delay_min; double delay_max; struct timeval tv_last_nonce_received; // Time from recieving one nonce to the next double nonce_count; double nonce_total; double nonce_min; double nonce_max; int wque_size; int wque_cleared; bool initialised; }; static KLIST *new_klist_set(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *klist = NULL; int i; klist = calloc(MAX_KLINES, sizeof(*klist)); if (!klist) quit(1, "Failed to calloc klist - when old count=%d", klninfo->kline_count); klninfo->kline_count += MAX_KLINES; klist[0].prev = NULL; klist[0].next = &(klist[1]); for (i = 1; i < MAX_KLINES-1; i++) { klist[i].prev = &klist[i-1]; klist[i].next = &klist[i+1]; } klist[MAX_KLINES-1].prev = &(klist[MAX_KLINES-2]); klist[MAX_KLINES-1].next = NULL; return klist; } static KLIST *allocate_kitem(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *kitem = NULL; int ran_out = 0; char errbuf[1024]; cg_wlock(&klninfo->klist_lock); if (klninfo->free == NULL) { ran_out = klninfo->kline_count; klninfo->free = new_klist_set(klncgpu); snprintf(errbuf, sizeof(errbuf), "%s%i: KLINE count exceeded %d, now %d", klncgpu->drv->name, klncgpu->device_id, ran_out, klninfo->kline_count); } kitem = klninfo->free; klninfo->free = klninfo->free->next; if (klninfo->free) klninfo->free->prev = NULL; kitem->next = klninfo->used; kitem->prev = NULL; if (kitem->next) kitem->next->prev = kitem; klninfo->used = kitem; kitem->ready = false; kitem->working = false; memset((void *)&(kitem->kline), 0, sizeof(kitem->kline)); klninfo->used_count++; cg_wunlock(&klninfo->klist_lock); if (ran_out > 0) applog(LOG_ERR, "%s", errbuf); return kitem; } static KLIST *release_kitem(struct cgpu_info *klncgpu, KLIST *kitem) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); cg_wlock(&klninfo->klist_lock); if (kitem == klninfo->used) klninfo->used = kitem->next; if (kitem->next) kitem->next->prev = kitem->prev; if (kitem->prev) kitem->prev->next = kitem->next; kitem->next = klninfo->free; if (klninfo->free) klninfo->free->prev = kitem; kitem->prev = NULL; klninfo->free = kitem; klninfo->used_count--; cg_wunlock(&klninfo->klist_lock); return NULL; } static double cvtKlnToC(uint8_t temp) { double Rt, stein, celsius; if (temp == 0) return 0.0; Rt = 1000.0 * 255.0 / (double)temp - 1000.0; stein = log(Rt / 2200.0) / 3987.0; stein += 1.0 / (double)(25.0 + 273.15); celsius = (1.0 / stein) - 273.15; // For display of bad data if (celsius < 0.0) celsius = 0.0; if (celsius > 200.0) celsius = 200.0; return celsius; } static int cvtCToKln(double deg) { double Rt, stein, temp; if (deg < 0.0) deg = 0.0; stein = 1.0 / (deg + 273.15); stein -= 1.0 / (double)(25.0 + 273.15); Rt = exp(stein * 3987.0) * 2200.0; if (Rt == -1000.0) Rt++; temp = 1000.0 * 256.0 / (Rt + 1000.0); if (temp > 255) temp = 255; if (temp < 0) temp = 0; return (int)temp; } // Change this to LOG_WARNING if you wish to always see the replies #define READ_DEBUG LOG_DEBUG static void display_kline(struct cgpu_info *klncgpu, KLINE *kline, const char *msg) { char *hexdata; switch (kline->hd.cmd) { case KLN_CMD_NONCE: applog(READ_DEBUG, "%s%i:%d %s work [%c] dev=%d workid=%d" " nonce=0x%08x", klncgpu->drv->name, klncgpu->device_id, (int)(kline->wr.dev), msg, kline->wr.cmd, (int)(kline->wr.dev), (int)(kline->wr.workid), (unsigned int)K_NONCE(kline->wr.nonce) - 0xC0); break; case KLN_CMD_STATUS: case KLN_CMD_WORK: case KLN_CMD_ENABLE: case KLN_CMD_ABORT: applog(READ_DEBUG, "%s%i:%d %s status [%c] dev=%d chips=%d" " slaves=%d workcq=%d workid=%d temp=%d fan=%d" " errors=%d hashes=%d max=%d noise=%d", klncgpu->drv->name, klncgpu->device_id, (int)(kline->ws.dev), msg, kline->ws.cmd, (int)(kline->ws.dev), (int)(kline->ws.chipcount), (int)(kline->ws.slavecount), (int)(kline->ws.workqc), (int)(kline->ws.workid), (int)(kline->ws.temp), (int)(kline->ws.fanspeed), (int)(kline->ws.errorcount), K_HASHCOUNT(kline->ws.hashcount), K_MAXCOUNT(kline->ws.maxcount), (int)(kline->ws.noise)); break; case KLN_CMD_CONFIG: applog(READ_DEBUG, "%s%i:%d %s config [%c] dev=%d clock=%d" " temptarget=%d tempcrit=%d fan=%d", klncgpu->drv->name, klncgpu->device_id, (int)(kline->cfg.dev), msg, kline->cfg.cmd, (int)(kline->cfg.dev), K_HASHCLOCK(kline->cfg.hashclock), (int)(kline->cfg.temptarget), (int)(kline->cfg.tempcritical), (int)(kline->cfg.fantarget)); break; case KLN_CMD_IDENT: applog(READ_DEBUG, "%s%i:%d %s info [%c] version=0x%02x prod=%.7s" " serial=0x%08x", klncgpu->drv->name, klncgpu->device_id, (int)(kline->hd.dev), msg, kline->hd.cmd, (int)(kline->id.version), kline->id.product, (unsigned int)K_SERIAL(kline->id.serial)); break; default: hexdata = bin2hex((unsigned char *)&(kline->hd.dev), REPLY_SIZE - 1); applog(LOG_ERR, "%s%i:%d %s [%c:%s] unknown and ignored", klncgpu->drv->name, klncgpu->device_id, (int)(kline->hd.dev), msg, kline->hd.cmd, hexdata); free(hexdata); break; } } static void display_send_kline(struct cgpu_info *klncgpu, KLINE *kline, const char *msg) { char *hexdata; switch (kline->hd.cmd) { case KLN_CMD_WORK: applog(READ_DEBUG, "%s%i:%d %s work [%c] dev=%d workid=0x%02x ...", klncgpu->drv->name, klncgpu->device_id, (int)(kline->wt.dev), msg, kline->ws.cmd, (int)(kline->wt.dev), (int)(kline->wt.workid)); break; case KLN_CMD_CONFIG: applog(READ_DEBUG, "%s%i:%d %s config [%c] dev=%d clock=%d" " temptarget=%d tempcrit=%d fan=%d", klncgpu->drv->name, klncgpu->device_id, (int)(kline->cfg.dev), msg, kline->cfg.cmd, (int)(kline->cfg.dev), K_HASHCLOCK(kline->cfg.hashclock), (int)(kline->cfg.temptarget), (int)(kline->cfg.tempcritical), (int)(kline->cfg.fantarget)); break; case KLN_CMD_IDENT: case KLN_CMD_STATUS: case KLN_CMD_ABORT: applog(READ_DEBUG, "%s%i:%d %s cmd [%c]", klncgpu->drv->name, klncgpu->device_id, (int)(kline->hd.dev), msg, kline->hd.cmd); break; case KLN_CMD_ENABLE: applog(READ_DEBUG, "%s%i:%d %s enable [%c] enable=%c", klncgpu->drv->name, klncgpu->device_id, (int)(kline->hd.dev), msg, kline->hd.cmd, (char)(kline->hd.buf[0])); break; case KLN_CMD_NONCE: default: hexdata = bin2hex((unsigned char *)&(kline->hd.dev), REPLY_SIZE - 1); applog(LOG_ERR, "%s%i:%d %s [%c:%s] unknown/unexpected and ignored", klncgpu->drv->name, klncgpu->device_id, (int)(kline->hd.dev), msg, kline->hd.cmd, hexdata); free(hexdata); break; } } static bool SendCmd(struct cgpu_info *klncgpu, KLINE *kline, int datalen) { int err, amt, writ; if (klncgpu->usbinfo.nodev) return false; display_send_kline(klncgpu, kline, msg_send); writ = KSENDHD(datalen); err = usb_write(klncgpu, (char *)kline, writ, &amt, C_REQUESTRESULTS); if (err < 0 || amt != writ) { applog(LOG_ERR, "%s%i:%d Cmd:%c Dev:%d, write failed (%d:%d:%d)", klncgpu->drv->name, klncgpu->device_id, (int)(kline->hd.dev), kline->hd.cmd, (int)(kline->hd.dev), writ, amt, err); return false; } return true; } static KLIST *GetReply(struct cgpu_info *klncgpu, uint8_t cmd, uint8_t dev) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *kitem; int retries = CMD_REPLY_RETRIES; while (retries-- > 0 && klncgpu->shutdown == false) { cgsleep_ms(REPLY_WAIT_TIME); cg_rlock(&klninfo->klist_lock); kitem = klninfo->used; while (kitem) { if (kitem->kline.hd.cmd == cmd && kitem->kline.hd.dev == dev && kitem->ready == true && kitem->working == false) { kitem->working = true; cg_runlock(&klninfo->klist_lock); return kitem; } kitem = kitem->next; } cg_runlock(&klninfo->klist_lock); } return NULL; } static KLIST *SendCmdGetReply(struct cgpu_info *klncgpu, KLINE *kline, int datalen) { if (!SendCmd(klncgpu, kline, datalen)) return NULL; return GetReply(klncgpu, kline->hd.cmd, kline->hd.dev); } static bool klondike_get_stats(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *kitem; KLINE kline; int slaves, dev; if (klncgpu->usbinfo.nodev || klninfo->status == NULL) return false; applog(LOG_DEBUG, "%s%i: getting status", klncgpu->drv->name, klncgpu->device_id); rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; rd_unlock(&(klninfo->stat_lock)); // loop thru devices and get status for each for (dev = 0; dev <= slaves; dev++) { zero_kline(&kline); kline.hd.cmd = KLN_CMD_STATUS; kline.hd.dev = dev; kitem = SendCmdGetReply(klncgpu, &kline, 0); if (kitem != NULL) { wr_lock(&(klninfo->stat_lock)); memcpy((void *)(&(klninfo->status[dev])), (void *)kitem, sizeof(klninfo->status[dev])); wr_unlock(&(klninfo->stat_lock)); kitem = release_kitem(klncgpu, kitem); } else { applog(LOG_ERR, "%s%i:%d failed to update stats", klncgpu->drv->name, klncgpu->device_id, dev); } } return true; } // TODO: this only enables the master (no slaves) static bool kln_enable(struct cgpu_info *klncgpu) { KLIST *kitem; KLINE kline; int tries = 2; bool ok = false; zero_kline(&kline); kline.hd.cmd = KLN_CMD_ENABLE; kline.hd.dev = 0; kline.hd.buf[0] = KLN_CMD_ENABLE_ON; while (tries-- > 0) { kitem = SendCmdGetReply(klncgpu, &kline, 1); if (kitem) { kitem = release_kitem(klncgpu, kitem); ok = true; break; } cgsleep_ms(50); } if (ok) cgsleep_ms(50); return ok; } static void kln_disable(struct cgpu_info *klncgpu, int dev, bool all) { KLINE kline; int i; zero_kline(&kline); kline.hd.cmd = KLN_CMD_ENABLE; kline.hd.buf[0] = KLN_CMD_ENABLE_OFF; for (i = (all ? 0 : dev); i <= dev; i++) { kline.hd.dev = i; SendCmd(klncgpu, &kline, KSENDHD(1)); } } static bool klondike_init(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *kitem; KLINE kline; int slaves, dev; klninfo->initialised = false; zero_kline(&kline); kline.hd.cmd = KLN_CMD_STATUS; kline.hd.dev = 0; kitem = SendCmdGetReply(klncgpu, &kline, 0); if (kitem == NULL) return false; slaves = kitem->kline.ws.slavecount; if (klninfo->status == NULL) { applog(LOG_DEBUG, "%s%i: initializing data", klncgpu->drv->name, klncgpu->device_id); // alloc space for status, devinfo, cfg and jobque for master and slaves klninfo->status = calloc(slaves+1, sizeof(*(klninfo->status))); if (unlikely(!klninfo->status)) quit(1, "Failed to calloc status array in klondke_get_stats"); klninfo->devinfo = calloc(slaves+1, sizeof(*(klninfo->devinfo))); if (unlikely(!klninfo->devinfo)) quit(1, "Failed to calloc devinfo array in klondke_get_stats"); klninfo->cfg = calloc(slaves+1, sizeof(*(klninfo->cfg))); if (unlikely(!klninfo->cfg)) quit(1, "Failed to calloc cfg array in klondke_get_stats"); klninfo->jobque = calloc(slaves+1, sizeof(*(klninfo->jobque))); if (unlikely(!klninfo->jobque)) quit(1, "Failed to calloc jobque array in klondke_get_stats"); } memcpy((void *)(&(klninfo->status[0])), (void *)kitem, sizeof(klninfo->status[0])); kitem = release_kitem(klncgpu, kitem); // zero init triggers read back only zero_kline(&kline); kline.cfg.cmd = KLN_CMD_CONFIG; int size = 2; // boundaries are checked by device, with valid values returned if (opt_klondike_options != NULL) { int hashclock, fantarget; double temp1, temp2; sscanf(opt_klondike_options, "%d:%lf:%lf:%d", &hashclock, &temp1, &temp2, &fantarget); SET_HASHCLOCK(kline.cfg.hashclock, hashclock); kline.cfg.temptarget = cvtCToKln(temp1); kline.cfg.tempcritical = cvtCToKln(temp2); if (fantarget < 0) { applog(LOG_WARNING, "%s%i: %s options invalid fantarget < 0 using 0", klncgpu->drv->name, klncgpu->device_id, klncgpu->drv->dname); fantarget = 0; } else if (fantarget > 100) { applog(LOG_WARNING, "%s%i: %s options invalid fantarget > 100 using 100", klncgpu->drv->name, klncgpu->device_id, klncgpu->drv->dname); fantarget = 100; } kline.cfg.fantarget = (int)(255 * fantarget / 100); size = sizeof(kline.cfg) - 2; } for (dev = 0; dev <= slaves; dev++) { kline.cfg.dev = dev; kitem = SendCmdGetReply(klncgpu, &kline, size); if (kitem != NULL) { memcpy((void *)&(klninfo->cfg[dev]), kitem, sizeof(klninfo->cfg[dev])); applog(LOG_WARNING, "%s%i:%d config (%d: Clk: %d, T:%.0lf, C:%.0lf, F:%d)", klncgpu->drv->name, klncgpu->device_id, dev, dev, K_HASHCLOCK(klninfo->cfg[dev].kline.cfg.hashclock), cvtKlnToC(klninfo->cfg[dev].kline.cfg.temptarget), cvtKlnToC(klninfo->cfg[dev].kline.cfg.tempcritical), (int)100*klninfo->cfg[dev].kline.cfg.fantarget/256); kitem = release_kitem(klncgpu, kitem); } } klondike_get_stats(klncgpu); klninfo->initialised = true; for (dev = 0; dev <= slaves; dev++) { klninfo->devinfo[dev].rangesize = ((uint64_t)1<<32) / klninfo->status[dev].kline.ws.chipcount; klninfo->devinfo[dev].chipstats = calloc(klninfo->status[dev].kline.ws.chipcount*2 , sizeof(uint32_t)); } bool ok = kln_enable(klncgpu); if (!ok) applog(LOG_ERR, "%s%i: failed to enable", klncgpu->drv->name, klncgpu->device_id); return ok; } static void control_init(struct cgpu_info *klncgpu) { int err, interface; if (klncgpu->usbinfo.nodev) return; interface = usb_interface(klncgpu); err = usb_transfer(klncgpu, 0, 9, 1, interface, C_RESET); applog(LOG_DEBUG, "%s%i: reset got err %d", klncgpu->drv->name, klncgpu->device_id, err); } static bool klondike_detect_one(struct libusb_device *dev, struct usb_find_devices *found) { struct cgpu_info *klncgpu = usb_alloc_cgpu(&klondike_drv, 1); struct klondike_info *klninfo = NULL; KLINE kline; if (unlikely(!klncgpu)) quit(1, "Failed to calloc klncgpu in klondike_detect_one"); klninfo = calloc(1, sizeof(*klninfo)); if (unlikely(!klninfo)) quit(1, "Failed to calloc klninfo in klondke_detect_one"); klncgpu->device_data = (void *)klninfo; klninfo->free = new_klist_set(klncgpu); if (usb_init(klncgpu, dev, found)) { int sent, recd, err; KLIST kitem; int attempts = 0; control_init(klncgpu); while (attempts++ < 3) { kline.hd.cmd = KLN_CMD_IDENT; kline.hd.dev = 0; display_send_kline(klncgpu, &kline, msg_detect_send); err = usb_write(klncgpu, (char *)&(kline.hd), 2, &sent, C_REQUESTRESULTS); if (err < 0 || sent != 2) { applog(LOG_ERR, "%s (%s) detect write failed (%d:%d)", klncgpu->drv->dname, klncgpu->device_path, sent, err); } cgsleep_ms(REPLY_WAIT_TIME*10); err = usb_read(klncgpu, (char *)&(kitem.kline), REPLY_SIZE, &recd, C_GETRESULTS); if (err < 0) { applog(LOG_ERR, "%s (%s) detect read failed (%d:%d)", klncgpu->drv->dname, klncgpu->device_path, recd, err); } else if (recd < 1) { applog(LOG_ERR, "%s (%s) detect empty reply (%d)", klncgpu->drv->dname, klncgpu->device_path, recd); } else if (kitem.kline.hd.cmd == KLN_CMD_IDENT && kitem.kline.hd.dev == 0) { display_kline(klncgpu, &kitem.kline, msg_detect_reply); applog(LOG_DEBUG, "%s (%s) detect successful (%d attempt%s)", klncgpu->drv->dname, klncgpu->device_path, attempts, attempts == 1 ? "" : "s"); if (!add_cgpu(klncgpu)) break; update_usb_stats(klncgpu); applog(LOG_DEBUG, "Klondike cgpu added"); cglock_init(&klninfo->klist_lock); return true; } } usb_uninit(klncgpu); } free(klninfo->free); free(klninfo); free(klncgpu); return false; } static void klondike_detect(bool __maybe_unused hotplug) { usb_detect(&klondike_drv, klondike_detect_one); } static void klondike_identify(__maybe_unused struct cgpu_info *klncgpu) { /* KLINE kline; zero_kline(&kline); kline.hd.cmd = KLN_CMD_IDENT; kline.hd.dev = 0; SendCmdGetReply(klncgpu, &kline, KSENDHD(0)); */ } static void klondike_check_nonce(struct cgpu_info *klncgpu, KLIST *kitem) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); struct work *work, *look, *tmp; KLINE *kline = &(kitem->kline); struct timeval tv_now; double us_diff; uint32_t nonce = K_NONCE(kline->wr.nonce) - 0xC0; applog(LOG_DEBUG, "%s%i:%d FOUND NONCE (%02x:%08x)", klncgpu->drv->name, klncgpu->device_id, (int)(kline->wr.dev), kline->wr.workid, (unsigned int)nonce); work = NULL; cgtime(&tv_now); rd_lock(&(klncgpu->qlock)); HASH_ITER(hh, klncgpu->queued_work, look, tmp) { if (ms_tdiff(&tv_now, &(look->tv_stamp)) < OLD_WORK_MS && (look->subid == (kline->wr.dev*256 + kline->wr.workid))) { work = look; break; } } rd_unlock(&(klncgpu->qlock)); if (work) { wr_lock(&(klninfo->stat_lock)); klninfo->devinfo[kline->wr.dev].noncecount++; klninfo->noncecount++; wr_unlock(&(klninfo->stat_lock)); applog(LOG_DEBUG, "%s%i:%d SUBMIT NONCE (%02x:%08x)", klncgpu->drv->name, klncgpu->device_id, (int)(kline->wr.dev), kline->wr.workid, (unsigned int)nonce); cgtime(&tv_now); bool ok = submit_nonce(klncgpu->thr[0], work, nonce); applog(LOG_DEBUG, "%s%i:%d chip stats %d, %08x, %d, %d", klncgpu->drv->name, klncgpu->device_id, (int)(kline->wr.dev), kline->wr.dev, (unsigned int)nonce, klninfo->devinfo[kline->wr.dev].rangesize, klninfo->status[kline->wr.dev].kline.ws.chipcount); klninfo->devinfo[kline->wr.dev].chipstats[(nonce / klninfo->devinfo[kline->wr.dev].rangesize) + (ok ? 0 : klninfo->status[kline->wr.dev].kline.ws.chipcount)]++; us_diff = us_tdiff(&tv_now, &(kitem->tv_when)); if (klninfo->delay_count == 0) { klninfo->delay_min = us_diff; klninfo->delay_max = us_diff; } else { if (klninfo->delay_min > us_diff) klninfo->delay_min = us_diff; if (klninfo->delay_max < us_diff) klninfo->delay_max = us_diff; } klninfo->delay_count++; klninfo->delay_total += us_diff; if (klninfo->nonce_count > 0) { us_diff = us_tdiff(&(kitem->tv_when), &(klninfo->tv_last_nonce_received)); if (klninfo->nonce_count == 1) { klninfo->nonce_min = us_diff; klninfo->nonce_max = us_diff; } else { if (klninfo->nonce_min > us_diff) klninfo->nonce_min = us_diff; if (klninfo->nonce_max < us_diff) klninfo->nonce_max = us_diff; } klninfo->nonce_total += us_diff; } klninfo->nonce_count++; memcpy(&(klninfo->tv_last_nonce_received), &(kitem->tv_when), sizeof(klninfo->tv_last_nonce_received)); return; } applog(LOG_ERR, "%s%i:%d unknown work (%02x:%08x) - ignored", klncgpu->drv->name, klncgpu->device_id, (int)(kline->wr.dev), kline->wr.workid, (unsigned int)nonce); //inc_hw_errors(klncgpu->thr[0]); } // thread to keep looking for replies static void *klondike_get_replies(void *userdata) { struct cgpu_info *klncgpu = (struct cgpu_info *)userdata; struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *kitem = NULL; char *hexdata; int err, recd, slaves, dev, isc; bool overheat, sent; applog(LOG_DEBUG, "%s%i: listening for replies", klncgpu->drv->name, klncgpu->device_id); while (klncgpu->shutdown == false) { if (klncgpu->usbinfo.nodev) return NULL; if (kitem == NULL) kitem = allocate_kitem(klncgpu); else memset((void *)&(kitem->kline), 0, sizeof(kitem->kline)); err = usb_read(klncgpu, (char *)&(kitem->kline), REPLY_SIZE, &recd, C_GETRESULTS); if (err || recd != REPLY_SIZE) { if (err != -7) applog(LOG_ERR, "%s%i: reply err=%d amt=%d", klncgpu->drv->name, klncgpu->device_id, err, recd); } if (!err && recd == REPLY_SIZE) { cgtime(&(kitem->tv_when)); kitem->block_seq = klninfo->block_seq; if (opt_log_level <= READ_DEBUG) { hexdata = bin2hex((unsigned char *)&(kitem->kline.hd.dev), recd-1); applog(READ_DEBUG, "%s%i:%d reply [%c:%s]", klncgpu->drv->name, klncgpu->device_id, (int)(kitem->kline.hd.dev), kitem->kline.hd.cmd, hexdata); free(hexdata); } // We can't check this until it's initialised if (klninfo->initialised) { rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; rd_unlock(&(klninfo->stat_lock)); if (kitem->kline.hd.dev > slaves) { applog(LOG_ERR, "%s%i: reply [%c] has invalid dev=%d (max=%d) using 0", klncgpu->drv->name, klncgpu->device_id, (char)(kitem->kline.hd.cmd), (int)(kitem->kline.hd.dev), slaves); /* TODO: this is rather problematic if there are slaves * however without slaves - it should always be zero */ kitem->kline.hd.dev = 0; } else { wr_lock(&(klninfo->stat_lock)); klninfo->jobque[kitem->kline.hd.dev].late_update_sequential = 0; wr_unlock(&(klninfo->stat_lock)); } } switch (kitem->kline.hd.cmd) { case KLN_CMD_NONCE: klondike_check_nonce(klncgpu, kitem); display_kline(klncgpu, &kitem->kline, msg_reply); break; case KLN_CMD_STATUS: case KLN_CMD_WORK: case KLN_CMD_ABORT: // We can't do/check this until it's initialised if (klninfo->initialised) { dev = kitem->kline.ws.dev; wr_lock(&(klninfo->stat_lock)); klninfo->jobque[dev].workqc = (int)(kitem->kline.ws.workqc); cgtime(&(klninfo->jobque[dev].last_update)); slaves = klninfo->status[0].kline.ws.slavecount; overheat = klninfo->jobque[dev].overheat; if (dev == 0) { if (kitem->kline.ws.slavecount != slaves) isc = ++klninfo->incorrect_slave_sequential; else isc = klninfo->incorrect_slave_sequential = 0; } wr_unlock(&(klninfo->stat_lock)); if (isc) { applog(LOG_ERR, "%s%i:%d reply [%c] has a diff" " # of slaves=%d (curr=%d)%s", klncgpu->drv->name, klncgpu->device_id, dev, (char)(kitem->kline.ws.cmd), (int)(kitem->kline.ws.slavecount), slaves, isc <= KLN_ISS_IGNORE ? "" : " disabling device"); if (isc > KLN_ISS_IGNORE) usb_nodev(klncgpu); break; } if (!overheat) { double temp = cvtKlnToC(kitem->kline.ws.temp); if (temp >= KLN_KILLWORK_TEMP) { KLINE kline; wr_lock(&(klninfo->stat_lock)); klninfo->jobque[dev].overheat = true; wr_unlock(&(klninfo->stat_lock)); applog(LOG_ERR, "%s%i:%d Critical overheat (%.0fC)", klncgpu->drv->name, klncgpu->device_id, dev, temp); zero_kline(&kline); kline.hd.cmd = KLN_CMD_ABORT; kline.hd.dev = dev; sent = SendCmd(klncgpu, &kline, KSENDHD(0)); kln_disable(klncgpu, dev, false); if (!sent) { applog(LOG_ERR, "%s%i:%d overheat failed to" " abort work - disabling device", klncgpu->drv->name, klncgpu->device_id, dev); usb_nodev(klncgpu); } } } } case KLN_CMD_ENABLE: wr_lock(&(klninfo->stat_lock)); klninfo->errorcount += kitem->kline.ws.errorcount; klninfo->noisecount += kitem->kline.ws.noise; wr_unlock(&(klninfo->stat_lock)); display_kline(klncgpu, &kitem->kline, msg_reply); kitem->ready = true; kitem = NULL; break; case KLN_CMD_CONFIG: display_kline(klncgpu, &kitem->kline, msg_reply); kitem->ready = true; kitem = NULL; break; case KLN_CMD_IDENT: display_kline(klncgpu, &kitem->kline, msg_reply); kitem->ready = true; kitem = NULL; break; default: display_kline(klncgpu, &kitem->kline, msg_reply); break; } } } return NULL; } static void klondike_flush_work(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); KLIST *kitem; KLINE kline; int slaves, dev; klninfo->block_seq++; applog(LOG_DEBUG, "%s%i: flushing work", klncgpu->drv->name, klncgpu->device_id); rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; rd_unlock(&(klninfo->stat_lock)); zero_kline(&kline); kline.hd.cmd = KLN_CMD_ABORT; for (dev = 0; dev <= slaves; dev++) { kline.hd.dev = dev; kitem = SendCmdGetReply(klncgpu, &kline, KSENDHD(0)); if (kitem != NULL) { wr_lock(&(klninfo->stat_lock)); memcpy((void *)&(klninfo->status[dev]), kitem, sizeof(klninfo->status[dev])); wr_unlock(&(klninfo->stat_lock)); kitem = release_kitem(klncgpu, kitem); } } } static bool klondike_thread_prepare(struct thr_info *thr) { struct cgpu_info *klncgpu = thr->cgpu; struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); if (thr_info_create(&(klninfo->replies_thr), NULL, klondike_get_replies, (void *)klncgpu)) { applog(LOG_ERR, "%s%i: thread create failed", klncgpu->drv->name, klncgpu->device_id); return false; } pthread_detach(klninfo->replies_thr.pth); // let the listening get started cgsleep_ms(100); return klondike_init(klncgpu); } static bool klondike_thread_init(struct thr_info *thr) { struct cgpu_info *klncgpu = thr->cgpu; if (klncgpu->usbinfo.nodev) return false; klondike_flush_work(klncgpu); return true; } static void klondike_shutdown(struct thr_info *thr) { struct cgpu_info *klncgpu = thr->cgpu; struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); applog(LOG_DEBUG, "%s%i: shutting down work", klncgpu->drv->name, klncgpu->device_id); kln_disable(klncgpu, klninfo->status[0].kline.ws.slavecount, true); klncgpu->shutdown = true; } static void klondike_thread_enable(struct thr_info *thr) { struct cgpu_info *klncgpu = thr->cgpu; if (klncgpu->usbinfo.nodev) return; /* KLINE kline; zero_kline(&kline); kline.hd.cmd = KLN_CMD_ENABLE; kline.hd.dev = dev; kline.hd.buf[0] = KLN_CMD_ENABLE_OFF; kitem = SendCmdGetReply(klncgpu, &kline, KSENDHD(1)); */ } static bool klondike_send_work(struct cgpu_info *klncgpu, int dev, struct work *work) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); struct work *look, *tmp; KLINE kline; struct timeval tv_old; int wque_size, wque_cleared; if (klncgpu->usbinfo.nodev) return false; zero_kline(&kline); kline.wt.cmd = KLN_CMD_WORK; kline.wt.dev = dev; memcpy(kline.wt.midstate, work->midstate, MIDSTATE_BYTES); memcpy(kline.wt.merkle, work->data + MERKLE_OFFSET, MERKLE_BYTES); kline.wt.workid = (uint8_t)(klninfo->devinfo[dev].nextworkid++ & 0xFF); work->subid = dev*256 + kline.wt.workid; cgtime(&work->tv_stamp); if (opt_log_level <= LOG_DEBUG) { char *hexdata = bin2hex((void *)&kline.wt, sizeof(kline.wt)); applog(LOG_DEBUG, "WORKDATA: %s", hexdata); free(hexdata); } applog(LOG_DEBUG, "%s%i:%d sending work (%d:%02x)", klncgpu->drv->name, klncgpu->device_id, dev, dev, kline.wt.workid); KLIST *kitem = SendCmdGetReply(klncgpu, &kline, sizeof(kline.wt)); if (kitem != NULL) { wr_lock(&(klninfo->stat_lock)); memcpy((void *)&(klninfo->status[dev]), kitem, sizeof(klninfo->status[dev])); wr_unlock(&(klninfo->stat_lock)); kitem = release_kitem(klncgpu, kitem); // remove old work wque_size = 0; wque_cleared = 0; cgtime(&tv_old); wr_lock(&klncgpu->qlock); HASH_ITER(hh, klncgpu->queued_work, look, tmp) { if (ms_tdiff(&tv_old, &(look->tv_stamp)) > OLD_WORK_MS) { __work_completed(klncgpu, look); free_work(look); wque_cleared++; } else wque_size++; } wr_unlock(&klncgpu->qlock); wr_lock(&(klninfo->stat_lock)); klninfo->wque_size = wque_size; klninfo->wque_cleared = wque_cleared; wr_unlock(&(klninfo->stat_lock)); return true; } return false; } static bool klondike_queue_full(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); struct work *work = NULL; int dev, queued, slaves, seq, howlong; struct timeval now; bool nowork; if (klncgpu->shutdown == true) return true; cgtime(&now); rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; for (dev = 0; dev <= slaves; dev++) if (ms_tdiff(&now, &(klninfo->jobque[dev].last_update)) > LATE_UPDATE_MS) { klninfo->jobque[dev].late_update_count++; seq = ++klninfo->jobque[dev].late_update_sequential; rd_unlock(&(klninfo->stat_lock)); if (seq < LATE_UPDATE_LIMIT) { applog(LOG_ERR, "%s%i:%d late update", klncgpu->drv->name, klncgpu->device_id, dev); klondike_get_stats(klncgpu); goto que; } else { applog(LOG_ERR, "%s%i:%d late update (%d) reached - attempting reset", klncgpu->drv->name, klncgpu->device_id, dev, LATE_UPDATE_LIMIT); control_init(klncgpu); kln_enable(klncgpu); klondike_get_stats(klncgpu); rd_lock(&(klninfo->stat_lock)); howlong = ms_tdiff(&now, &(klninfo->jobque[dev].last_update)); if (howlong > LATE_UPDATE_MS) { rd_unlock(&(klninfo->stat_lock)); if (howlong > LATE_UPDATE_NODEV_MS) { applog(LOG_ERR, "%s%i:%d reset failed - dropping device", klncgpu->drv->name, klncgpu->device_id, dev); usb_nodev(klncgpu); } else cgsleep_ms(LATE_UPDATE_SLEEP_MS); return true; } break; } } rd_unlock(&(klninfo->stat_lock)); que: nowork = true; for (queued = 0; queued < MAX_WORK_COUNT-1; queued++) for (dev = 0; dev <= slaves; dev++) { tryagain: rd_lock(&(klninfo->stat_lock)); if (klninfo->jobque[dev].overheat) { double temp = cvtKlnToC(klninfo->status[0].kline.ws.temp); if ((queued == MAX_WORK_COUNT-2) && ms_tdiff(&now, &(klninfo->jobque[dev].last_update)) > (LATE_UPDATE_MS/2)) { rd_unlock(&(klninfo->stat_lock)); klondike_get_stats(klncgpu); goto tryagain; } if (temp <= KLN_COOLED_DOWN) { klninfo->jobque[dev].overheat = false; rd_unlock(&(klninfo->stat_lock)); applog(LOG_ERR, "%s%i:%d Overheat recovered (%.0fC)", klncgpu->drv->name, klncgpu->device_id, dev, temp); kln_enable(klncgpu); goto tryagain; } else { rd_unlock(&(klninfo->stat_lock)); continue; } } if (klninfo->jobque[dev].workqc <= queued) { rd_unlock(&(klninfo->stat_lock)); if (!work) work = get_queued(klncgpu); if (unlikely(!work)) return false; nowork = false; if (klondike_send_work(klncgpu, dev, work)) return false; } else rd_unlock(&(klninfo->stat_lock)); } if (nowork) cgsleep_ms(10); // avoid a hard loop in case we have nothing to do return true; } static int64_t klondike_scanwork(struct thr_info *thr) { struct cgpu_info *klncgpu = thr->cgpu; struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); int64_t newhashcount = 0; int dev, slaves; if (klncgpu->usbinfo.nodev) return -1; restart_wait(thr, 200); if (klninfo->status != NULL) { rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; for (dev = 0; dev <= slaves; dev++) { uint64_t newhashdev = 0, hashcount; int maxcount; hashcount = K_HASHCOUNT(klninfo->status[dev].kline.ws.hashcount); maxcount = K_MAXCOUNT(klninfo->status[dev].kline.ws.maxcount); // todo: chg this to check workid for wrapped instead if (klninfo->devinfo[dev].lasthashcount > hashcount) newhashdev += maxcount; // hash counter wrapped newhashdev += hashcount - klninfo->devinfo[dev].lasthashcount; klninfo->devinfo[dev].lasthashcount = hashcount; if (maxcount != 0) klninfo->hashcount += (newhashdev << 32) / maxcount; } newhashcount += 0xffffffffull * (uint64_t)klninfo->noncecount; klninfo->noncecount = 0; rd_unlock(&(klninfo->stat_lock)); } return newhashcount; } static void get_klondike_statline_before(char *buf, size_t siz, struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); uint8_t temp = 0xFF; uint16_t fan = 0; uint16_t clock = 0; int dev, slaves; char tmp[16]; if (klninfo->status == NULL) { blank_get_statline_before(buf, siz, klncgpu); return; } rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; for (dev = 0; dev <= slaves; dev++) { if (klninfo->status[dev].kline.ws.temp < temp) temp = klninfo->status[dev].kline.ws.temp; fan += klninfo->cfg[dev].kline.cfg.fantarget; clock += (uint16_t)K_HASHCLOCK(klninfo->cfg[dev].kline.cfg.hashclock); } rd_unlock(&(klninfo->stat_lock)); fan /= slaves + 1; fan *= 100/255; if (fan > 99) // short on screen space fan = 99; clock /= slaves + 1; if (clock > 999) // error - so truncate it clock = 999; snprintf(tmp, sizeof(tmp), "%2.0fC", cvtKlnToC(temp)); if (strlen(tmp) < 4) strcat(tmp, " "); tailsprintf(buf, siz, "%3dMHz %2d%% %s| ", (int)clock, fan, tmp); } static struct api_data *klondike_api_stats(struct cgpu_info *klncgpu) { struct klondike_info *klninfo = (struct klondike_info *)(klncgpu->device_data); struct api_data *root = NULL; char buf[32]; int dev, slaves; if (klninfo->status == NULL) return NULL; rd_lock(&(klninfo->stat_lock)); slaves = klninfo->status[0].kline.ws.slavecount; for (dev = 0; dev <= slaves; dev++) { float fTemp = cvtKlnToC(klninfo->status[dev].kline.ws.temp); sprintf(buf, "Temp %d", dev); root = api_add_temp(root, buf, &fTemp, true); double dClk = (double)K_HASHCLOCK(klninfo->cfg[dev].kline.cfg.hashclock); sprintf(buf, "Clock %d", dev); root = api_add_freq(root, buf, &dClk, true); unsigned int iFan = (unsigned int)100 * klninfo->cfg[dev].kline.cfg.fantarget / 255; sprintf(buf, "Fan Percent %d", dev); root = api_add_int(root, buf, (int *)(&iFan), true); iFan = 0; if (klninfo->status[dev].kline.ws.fanspeed > 0) iFan = (unsigned int)TACH_FACTOR / klninfo->status[dev].kline.ws.fanspeed; sprintf(buf, "Fan RPM %d", dev); root = api_add_int(root, buf, (int *)(&iFan), true); if (klninfo->devinfo[dev].chipstats != NULL) { char data[2048]; char one[32]; int n; sprintf(buf, "Nonces / Chip %d", dev); data[0] = '\0'; for (n = 0; n < klninfo->status[dev].kline.ws.chipcount; n++) { snprintf(one, sizeof(one), "%07d ", klninfo->devinfo[dev].chipstats[n]); strcat(data, one); } root = api_add_string(root, buf, data, true); sprintf(buf, "Errors / Chip %d", dev); data[0] = '\0'; for (n = 0; n < klninfo->status[dev].kline.ws.chipcount; n++) { snprintf(one, sizeof(one), "%07d ", klninfo->devinfo[dev].chipstats[n + klninfo->status[dev].kline.ws.chipcount]); strcat(data, one); } root = api_add_string(root, buf, data, true); } } root = api_add_uint64(root, "Hash Count", &(klninfo->hashcount), true); root = api_add_uint64(root, "Error Count", &(klninfo->errorcount), true); root = api_add_uint64(root, "Noise Count", &(klninfo->noisecount), true); root = api_add_int(root, "KLine Limit", &(klninfo->kline_count), true); root = api_add_int(root, "KLine Used", &(klninfo->used_count), true); root = api_add_elapsed(root, "KQue Delay Count", &(klninfo->delay_count), true); root = api_add_elapsed(root, "KQue Delay Total", &(klninfo->delay_total), true); root = api_add_elapsed(root, "KQue Delay Min", &(klninfo->delay_min), true); root = api_add_elapsed(root, "KQue Delay Max", &(klninfo->delay_max), true); double avg; if (klninfo->delay_count == 0) avg = 0; else avg = klninfo->delay_total / klninfo->delay_count; root = api_add_diff(root, "KQue Delay Avg", &avg, true); root = api_add_elapsed(root, "KQue Nonce Count", &(klninfo->nonce_count), true); root = api_add_elapsed(root, "KQue Nonce Total", &(klninfo->nonce_total), true); root = api_add_elapsed(root, "KQue Nonce Min", &(klninfo->nonce_min), true); root = api_add_elapsed(root, "KQue Nonce Max", &(klninfo->nonce_max), true); if (klninfo->nonce_count == 0) avg = 0; else avg = klninfo->nonce_total / klninfo->nonce_count; root = api_add_diff(root, "KQue Nonce Avg", &avg, true); root = api_add_int(root, "WQue Size", &(klninfo->wque_size), true); root = api_add_int(root, "WQue Cleared", &(klninfo->wque_cleared), true); rd_unlock(&(klninfo->stat_lock)); return root; } struct device_drv klondike_drv = { .drv_id = DRIVER_klondike, .dname = "Klondike", .name = "KLN", .drv_detect = klondike_detect, .get_api_stats = klondike_api_stats, .get_statline_before = get_klondike_statline_before, .get_stats = klondike_get_stats, .identify_device = klondike_identify, .thread_prepare = klondike_thread_prepare, .thread_init = klondike_thread_init, .hash_work = hash_queued_work, .scanwork = klondike_scanwork, .queue_full = klondike_queue_full, .flush_work = klondike_flush_work, .thread_shutdown = klondike_shutdown, .thread_enable = klondike_thread_enable };