// ccminer/myriadgroestl.cpp

#include <string.h>
#include <stdint.h>
#include <cuda_runtime.h>
#include <openssl/sha.h>

#include "sph/sph_groestl.h"

#include "miner.h"

// Forward declarations of the myriad-groestl helpers used below. They are not
// defined in this file (presumably implemented in the matching CUDA source —
// TODO confirm). All of them take the miner thread index as first argument.
void myriadgroestl_cpu_init(int thr_id, uint32_t threads);
void myriadgroestl_cpu_free(int thr_id);
void myriadgroestl_cpu_setBlock(int thr_id, void *data, void *pTargetIn);
void myriadgroestl_cpu_hash(int thr_id, uint32_t threads, uint32_t startNounce, void *outputHashes, uint32_t *nounce);

void myriadhash(void *state, const void *input)
{
	uint32_t _ALIGN(64) hash[16];
	sph_groestl512_context ctx_groestl;
	SHA256_CTX sha256;

	sph_groestl512_init(&ctx_groestl);
	sph_groestl512(&ctx_groestl, input, 80);
	sph_groestl512_close(&ctx_groestl, hash);

	SHA256_Init(&sha256);
	SHA256_Update(&sha256,(unsigned char *)hash, 64);
	SHA256_Final((unsigned char *)hash, &sha256);

	memcpy(state, hash, 32);
}

// Per-thread initialisation flag, indexed by thr_id: set to true by
// scanhash_myriad() after myriadgroestl_cpu_init() has run, and reset to
// false by free_myriad() after myriadgroestl_cpu_free().
static bool init[MAX_GPUS] = { 0 };

/*
 * Scan a range of nonces for a myriad-groestl result that meets the work target.
 *
 * thr_id:      miner thread index (selects the init flag, device and restart flag)
 * work:        work item; work->data[19] is the starting nonce and is updated
 *              in place, work->target is the target to meet
 * max_nonce:   upper bound of the nonce range to scan
 * hashes_done: receives the number of nonces processed by this call
 *
 * Returns 1 when a nonce reported by the GPU also validates on the CPU
 * (work->data[19] then holds that nonce), 0 otherwise (range exhausted,
 * work restart requested, or the host result buffer could not be allocated).
 */
int scanhash_myriad(int thr_id, struct work *work, uint32_t max_nonce, unsigned long *hashes_done)
{
	uint32_t _ALIGN(64) endiandata[32];
	uint32_t *pdata = work->data;
	uint32_t *ptarget = work->target;
	uint32_t start_nonce = pdata[19];
	uint32_t throughput = cuda_default_throughput(thr_id, 1U << 17);
	// Only shrink the batch once initialised: the first call hands the full
	// throughput to myriadgroestl_cpu_init() (presumably sizing its buffers).
	if (init[thr_id]) throughput = min(throughput, max_nonce - start_nonce);

	// 64 bytes per hash. The size is computed in size_t (with an explicit
	// guard for narrow size_t) so a large throughput cannot wrap around in
	// 32-bit arithmetic and silently yield an undersized buffer.
	const size_t bytesPerHash = 64;
	uint32_t *outputHash = NULL;
	bool sizeFits = ((size_t) throughput <= SIZE_MAX / bytesPerHash);
	if (sizeFits)
		outputHash = (uint32_t*) malloc((size_t) throughput * bytesPerHash);

	// malloc(0) may legitimately return NULL, so only a non-empty request counts as a failure
	if (!sizeFits || (outputHash == NULL && throughput != 0)) {
		gpulog(LOG_WARNING, thr_id, "unable to allocate host buffer for %u hashes", throughput);
		*hashes_done = 0;
		return 0;
	}

	if (opt_benchmark)
		((uint32_t*)ptarget)[7] = 0x0000ff;

	// init
	if(!init[thr_id])
	{
		cudaSetDevice(device_map[thr_id]);
		myriadgroestl_cpu_init(thr_id, throughput);
		init[thr_id] = true;
	}

	// big-endian encode the 20 header words (80 bytes) for hashing
	for (int k=0; k < 20; k++)
		be32enc(&endiandata[k], pdata[k]);

	// Prepare the context with the endian-swapped block header (the nonce is replaced later)
	myriadgroestl_cpu_setBlock(thr_id, endiandata, (void*)ptarget);

	do {
		// GPU
		// UINT32_MAX is the "nothing found" sentinel checked below
		uint32_t foundNounce = UINT32_MAX;

		*hashes_done = pdata[19] - start_nonce + throughput;

		myriadgroestl_cpu_hash(thr_id, throughput, pdata[19], outputHash, &foundNounce);

		if (foundNounce < UINT32_MAX)
		{
			// re-hash the candidate on the CPU before reporting it
			uint32_t _ALIGN(64) vhash[8];
			endiandata[19] = swab32(foundNounce);
			myriadhash(vhash, endiandata);
			if (vhash[7] <= ptarget[7] && fulltest(vhash, ptarget)) {
				work_set_target_ratio(work, vhash);
				pdata[19] = foundNounce;
				free(outputHash);
				return 1;
			} else {
				gpulog(LOG_WARNING, thr_id, "result for %08x does not validate on CPU!", foundNounce);
			}
		}

		// 64-bit sum so the range check itself cannot wrap around
		if ((uint64_t) pdata[19] + throughput > max_nonce) {
			*hashes_done = pdata[19] - start_nonce;
			pdata[19] = max_nonce;
			break;
		}
		pdata[19] += throughput;

	} while (!work_restart[thr_id].restart);

	free(outputHash);
	return 0;
}

// cleanup
/*
 * Release the myriad-groestl resources of one miner thread.
 *
 * Does nothing when the thread was never initialised. Otherwise it
 * synchronises the device, calls myriadgroestl_cpu_free(), clears the
 * thread's init flag and synchronises once more.
 *
 * thr_id: miner thread index
 */
void free_myriad(int thr_id)
{
	if (!init[thr_id])
		return;

	// cudaThreadSynchronize() is deprecated; cudaDeviceSynchronize() is its
	// documented, functionally identical replacement.
	cudaDeviceSynchronize();

	myriadgroestl_cpu_free(thr_id);
	init[thr_id] = false;

	cudaDeviceSynchronize();
}
-												min() and max(a,b) are not defined on linux,

in fact max exists in jansson includes (in tree only)

Add them to miner.h

											
										
										
											10 years ago
+								#include <string.h>
 								#include <stdint.h>
-												Various algos cleanup + lyra2 sec nonce fix

											
										
										
											10 years ago
+								#include <cuda_runtime.h>
-												min() and max(a,b) are not defined on linux,

in fact max exists in jansson includes (in tree only)

Add them to miner.h

											
										
										
											10 years ago
+								#include <openssl/sha.h>
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+								#include "sph/sph_groestl.h"
 								#include "miner.h"
-												cleanup: use unsigned throughput parameters

Yes, its a big commit, was waiting 1.6 to do that...
Sorry for your possible merge issues ;)

											
										
										
											10 years ago
+								void myriadgroestl_cpu_init(int thr_id, uint32_t threads);
-												algos: add functions to free allocated resources

Will be used later for algo switching

not really tested yet...

											
										
										
											9 years ago
+								void myriadgroestl_cpu_free(int thr_id);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+								void myriadgroestl_cpu_setBlock(int thr_id, void *data, void *pTargetIn);
-												cleanup: use unsigned throughput parameters

Yes, its a big commit, was waiting 1.6 to do that...
Sorry for your possible merge issues ;)

											
										
										
											10 years ago
+								void myriadgroestl_cpu_hash(int thr_id, uint32_t threads, uint32_t startNounce, void *outputHashes, uint32_t *nounce);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+								void myriadhash(void *state, const void *input)
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+								{
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+									uint32_t _ALIGN(64) hash[16];
-												myr-gr: clean up

											
										
										
											10 years ago
+									sph_groestl512_context ctx_groestl;
 									SHA256_CTX sha256;
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												myr-gr: clean up

											
										
										
											10 years ago
+									sph_groestl512_init(&ctx_groestl);
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+									sph_groestl512(&ctx_groestl, input, 80);
 									sph_groestl512_close(&ctx_groestl, hash);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												myr-gr: clean up

											
										
										
											10 years ago
+									SHA256_Init(&sha256);
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+									SHA256_Update(&sha256,(unsigned char *)hash, 64);
 									SHA256_Final((unsigned char *)hash, &sha256);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+									memcpy(state, hash, 32);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+								}
-												Handle a maximum of 16 gpus (vs 8 before)

Some cards have 2 gpus on board...

											
										
										
											10 years ago
+								static bool init[MAX_GPUS] = { 0 };
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												start v1.7, apply new prototypes to all algos

											
										
										
											9 years ago
+								int scanhash_myriad(int thr_id, struct work *work, uint32_t max_nonce, unsigned long *hashes_done)
-												Allow different intensity per device

and clean the old variables, no more required

											
										
										
											10 years ago
+								{
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+									uint32_t _ALIGN(64) endiandata[32];
-												start v1.7, apply new prototypes to all algos

											
										
										
											9 years ago
+									uint32_t *pdata = work->data;
 									uint32_t *ptarget = work->target;
-												rename skein2 to c++, no cuda kernel code

and some other changes...

											
										
										
											10 years ago
+									uint32_t start_nonce = pdata[19];
-												intensity: do not reduce throughput before init

Else the memory allocated could be less than required later

btw, use the new "cuda" function to apply intensity/throughput

											
										
										
											9 years ago
+									uint32_t throughput = cuda_default_throughput(thr_id, 1U << 17);
 									if (init[thr_id]) throughput = min(throughput, max_nonce - start_nonce);
-												bump to revision V1.1 with Killer Groestl

											
										
										
											11 years ago
-												Various algos cleanup + lyra2 sec nonce fix

											
										
										
											10 years ago
+									uint32_t *outputHash = (uint32_t*)malloc(throughput * 64);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
 									if (opt_benchmark)
 										((uint32_t*)ptarget)[7] = 0x0000ff;
 									// init
 									if(!init[thr_id])
 									{
-												Various algos cleanup + lyra2 sec nonce fix

											
										
										
											10 years ago
+										cudaSetDevice(device_map[thr_id]);
-												api: report throughput  when default

											
										
										
											10 years ago
+										myriadgroestl_cpu_init(thr_id, throughput);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+										init[thr_id] = true;
 									}
-												Allow different intensity per device

and clean the old variables, no more required

											
										
										
											10 years ago
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+									for (int k=0; k < 20; k++)
 										be32enc(&endiandata[k], pdata[k]);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
 									// Context mit dem Endian gedrehten Blockheader vorbereiten (Nonce wird später ersetzt)
 									myriadgroestl_cpu_setBlock(thr_id, endiandata, (void*)ptarget);
-												Allow different intensity per device

and clean the old variables, no more required

											
										
										
											10 years ago
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+									do {
 										// GPU
-												Add skein algo (Skeincoin, Myriad, Unat...)

SKEIN512 + SHA256

Signed-off-by: Tanguy Pruvot <tanguy.pruvot@gmail.com>

											
										
										
											10 years ago
+										uint32_t foundNounce = UINT32_MAX;
-												Various algos cleanup + lyra2 sec nonce fix

											
										
										
											10 years ago
 										*hashes_done = pdata[19] - start_nonce + throughput;
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												api: report throughput  when default

											
										
										
											10 years ago
+										myriadgroestl_cpu_hash(thr_id, throughput, pdata[19], outputHash, &foundNounce);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												Add skein algo (Skeincoin, Myriad, Unat...)

SKEIN512 + SHA256

Signed-off-by: Tanguy Pruvot <tanguy.pruvot@gmail.com>

											
										
										
											10 years ago
+										if (foundNounce < UINT32_MAX)
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+										{
-												start v1.7, apply new prototypes to all algos

											
										
										
											9 years ago
+											uint32_t _ALIGN(64) vhash[8];
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+											endiandata[19] = swab32(foundNounce);
-												start v1.7, apply new prototypes to all algos

											
										
										
											9 years ago
+											myriadhash(vhash, endiandata);
 											if (vhash[7] <= ptarget[7] && fulltest(vhash, ptarget)) {
-												diff: use the new function in all algos

											
										
										
											9 years ago
+												work_set_target_ratio(work, vhash);
-												Various algos cleanup + lyra2 sec nonce fix

											
										
										
											10 years ago
+												pdata[19] = foundNounce;
 												free(outputHash);
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+												return 1;
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+											} else {
-												benchmark: enhance the mem leak detection

reduce "false" warnings, and ignore unrelated/small ones <= 1 MB

On windows the gpu memory can be allocated by other processes

+ some cleanup in algos... (free/gpulog)

											
										
										
											9 years ago
+												gpulog(LOG_WARNING, thr_id, "result for %08x does not validate on CPU!", foundNounce);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+											}
 										}
-												myriad/groestl: some more cleanup + tabs...

											
										
										
											10 years ago
+										if ((uint64_t) pdata[19] + throughput > max_nonce) {
-												rename skein2 to c++, no cuda kernel code

and some other changes...

											
										
										
											10 years ago
+											*hashes_done = pdata[19] - start_nonce;
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+											pdata[19] = max_nonce;
-												Add intensity to last algos and fix quark speed

											
										
										
											10 years ago
+											break;
 										}
-												api: report throughput  when default

											
										
										
											10 years ago
+										pdata[19] += throughput;
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
-												Add intensity to last algos and fix quark speed

											
										
										
											10 years ago
+									} while (!work_restart[thr_id].restart);
-												Revision 0.6 with myriad-groestl and jackpot coin

											
										
										
											11 years ago
+									free(outputHash);
 									return 0;
 								}
-												algos: add functions to free allocated resources

Will be used later for algo switching

not really tested yet...

											
										
										
											9 years ago
+								// cleanup
 								void free_myriad(int thr_id)
 								{
 									if (!init[thr_id])
 										return;
-												benchmark: enhance the mem leak detection

reduce "false" warnings, and ignore unrelated/small ones <= 1 MB

On windows the gpu memory can be allocated by other processes

+ some cleanup in algos... (free/gpulog)

											
										
										
											9 years ago
+									cudaThreadSynchronize();
-												algos: add functions to free allocated resources

Will be used later for algo switching

not really tested yet...

											
										
										
											9 years ago
 									myriadgroestl_cpu_free(thr_id);
 									init[thr_id] = false;
 									cudaDeviceSynchronize();
-												intensity: do not reduce throughput before init

Else the memory allocated could be less than required later

btw, use the new "cuda" function to apply intensity/throughput

											
										
										
											9 years ago
+								}