mirror of https://github.com/GOSTSec/sgminer
You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
226 lines
7.0 KiB
226 lines
7.0 KiB
#include "build_kernel.h" |
|
#include "patch_kernel.h" |
|
|
|
static char *file_contents(const char *filename, int *length) |
|
{ |
|
char *fullpath = (char *)alloca(PATH_MAX); |
|
void *buffer; |
|
FILE *f; |
|
|
|
/* Try in the optional kernel path first, defaults to PREFIX */ |
|
strcpy(fullpath, opt_kernel_path); |
|
strcat(fullpath, filename); |
|
f = fopen(fullpath, "rb"); |
|
if (!f) { |
|
/* Then try from the path sgminer was called */ |
|
strcpy(fullpath, sgminer_path); |
|
strcat(fullpath, filename); |
|
f = fopen(fullpath, "rb"); |
|
} |
|
if (!f) { |
|
/* Then from `pwd`/kernel/ */ |
|
strcpy(fullpath, sgminer_path); |
|
strcat(fullpath, "/kernel/"); |
|
strcat(fullpath, filename); |
|
f = fopen(fullpath, "rb"); |
|
} |
|
/* Finally try opening it directly */ |
|
if (!f) |
|
f = fopen(filename, "rb"); |
|
|
|
if (!f) { |
|
applog(LOG_ERR, "Unable to open %s or %s for reading", |
|
filename, fullpath); |
|
return NULL; |
|
} |
|
|
|
fseek(f, 0, SEEK_END); |
|
*length = ftell(f); |
|
fseek(f, 0, SEEK_SET); |
|
|
|
buffer = malloc(*length+1); |
|
*length = fread(buffer, 1, *length, f); |
|
fclose(f); |
|
((char*)buffer)[*length] = '\0'; |
|
|
|
return (char*)buffer; |
|
} |
|
|
|
void set_base_compiler_options(build_kernel_data *data) |
|
{ |
|
char buf[255]; |
|
sprintf(data->compiler_options, "-I \"%s\" -I \"%s/kernel\" -I \".\" -D WORKSIZE=%d", |
|
data->sgminer_path, data->sgminer_path, (int)data->work_size); |
|
applog(LOG_DEBUG, "Setting worksize to %d", (int)(data->work_size)); |
|
|
|
sprintf(buf, "w%dl%d", (int)data->work_size, (int)sizeof(long)); |
|
strcat(data->binary_filename, buf); |
|
|
|
if (data->has_bit_align) { |
|
strcat(data->compiler_options, " -D BITALIGN"); |
|
applog(LOG_DEBUG, "cl_amd_media_ops found, setting BITALIGN"); |
|
} else |
|
applog(LOG_DEBUG, "cl_amd_media_ops not found, will not set BITALIGN"); |
|
|
|
if (data->kernel_path) { |
|
strcat(data->compiler_options, " -I \""); |
|
strcat(data->compiler_options, data->kernel_path); |
|
strcat(data->compiler_options, "\""); |
|
} |
|
|
|
if (data->patch_bfi) { |
|
strcat(data->compiler_options, " -D BFI_INT"); |
|
applog(LOG_DEBUG, "BFI_INT patch requiring device found, patched source with BFI_INT"); |
|
} else |
|
applog(LOG_DEBUG, "BFI_INT patch requiring device not found, will not BFI_INT patch"); |
|
|
|
if (data->opencl_version < 1.1) |
|
strcat(data->compiler_options, " -D OCL1"); |
|
} |
|
|
|
bool needs_bfi_patch(build_kernel_data *data) |
|
{ |
|
if (data->has_bit_align && |
|
(data->opencl_version < 1.2) && |
|
(strstr(data->platform, "Cedar") || |
|
strstr(data->platform, "Redwood") || |
|
strstr(data->platform, "Juniper") || |
|
strstr(data->platform, "Cypress" ) || |
|
strstr(data->platform, "Hemlock" ) || |
|
strstr(data->platform, "Caicos" ) || |
|
strstr(data->platform, "Turks" ) || |
|
strstr(data->platform, "Barts" ) || |
|
strstr(data->platform, "Cayman" ) || |
|
strstr(data->platform, "Antilles" ) || |
|
strstr(data->platform, "Wrestler" ) || |
|
strstr(data->platform, "Zacate" ) || |
|
strstr(data->platform, "WinterPark" ))) |
|
return true; |
|
else |
|
return false; |
|
} |
|
|
|
cl_program build_opencl_kernel(build_kernel_data *data, const char *filename) |
|
{ |
|
int pl; |
|
char *source = file_contents(data->source_filename, &pl); |
|
size_t sourceSize[] = {(size_t)pl}; |
|
cl_int status; |
|
cl_program program = NULL; |
|
cl_program ret = NULL; |
|
|
|
if (!source) |
|
goto out; |
|
|
|
program = clCreateProgramWithSource(data->context, 1, (const char **)&source, sourceSize, &status); |
|
if (status != CL_SUCCESS) { |
|
applog(LOG_ERR, "Error %d: Loading Binary into cl_program (clCreateProgramWithSource)", status); |
|
goto out; |
|
} |
|
|
|
applog(LOG_DEBUG, "CompilerOptions: %s", data->compiler_options); |
|
status = clBuildProgram(program, 1, data->device, data->compiler_options, NULL, NULL); |
|
|
|
if (status != CL_SUCCESS) { |
|
size_t log_size; |
|
applog(LOG_ERR, "Error %d: Building Program (clBuildProgram)", status); |
|
status = clGetProgramBuildInfo(program, *data->device, CL_PROGRAM_BUILD_LOG, 0, NULL, &log_size); |
|
|
|
char *sz_log = (char *)malloc(log_size + 1); |
|
status = clGetProgramBuildInfo(program, *data->device, CL_PROGRAM_BUILD_LOG, log_size, sz_log, NULL); |
|
sz_log[log_size] = '\0'; |
|
applogsiz(LOG_ERR, log_size, "%s", sz_log); |
|
free(sz_log); |
|
goto out; |
|
} |
|
|
|
ret = program; |
|
out: |
|
if (source) free(source); |
|
return ret; |
|
} |
|
|
|
bool save_opencl_kernel(build_kernel_data *data, cl_program program) |
|
{ |
|
cl_uint slot, cpnd = 0; |
|
size_t *binary_sizes = (size_t *)calloc(MAX_GPUDEVICES * 4, sizeof(size_t)); |
|
char **binaries = NULL; |
|
cl_int status; |
|
FILE *binaryfile; |
|
bool ret = false; |
|
|
|
#ifdef __APPLE__ |
|
/* OSX OpenCL breaks reading off binaries with >1 GPU so always build |
|
* from source. */ |
|
goto out; |
|
#endif |
|
|
|
status = clGetProgramInfo(program, CL_PROGRAM_NUM_DEVICES, sizeof(cl_uint), &cpnd, NULL); |
|
if (unlikely(status != CL_SUCCESS)) { |
|
applog(LOG_ERR, "Error %d: Getting program info CL_PROGRAM_NUM_DEVICES. (clGetProgramInfo)", status); |
|
goto out; |
|
} |
|
|
|
status = clGetProgramInfo(program, CL_PROGRAM_BINARY_SIZES, sizeof(size_t)*cpnd, binary_sizes, NULL); |
|
if (unlikely(status != CL_SUCCESS)) { |
|
applog(LOG_ERR, "Error %d: Getting program info CL_PROGRAM_BINARY_SIZES. (clGetProgramInfo)", status); |
|
goto out; |
|
} |
|
|
|
binaries = (char **)calloc(MAX_GPUDEVICES * 4, sizeof(char *)); |
|
for (slot = 0; slot < cpnd; slot++) |
|
if (binary_sizes[slot]) |
|
binaries[slot] = (char *)calloc(binary_sizes[slot], 1); |
|
|
|
status = clGetProgramInfo(program, CL_PROGRAM_BINARIES, sizeof(char *) * cpnd, binaries, NULL ); |
|
if (unlikely(status != CL_SUCCESS)) { |
|
applog(LOG_ERR, "Error %d: Getting program info. CL_PROGRAM_BINARIES (clGetProgramInfo)", status); |
|
goto out; |
|
} |
|
|
|
/* The actual compiled binary ends up in a RANDOM slot! Grr, so we have |
|
* to iterate over all the binary slots and find where the real program |
|
* is. What the heck is this!? */ |
|
for (slot = 0; slot < cpnd; slot++) |
|
if (binary_sizes[slot]) |
|
break; |
|
|
|
/* copy over all of the generated binaries. */ |
|
applog(LOG_DEBUG, "Binary size found in binary slot %d: %d", slot, (int)(binary_sizes[slot])); |
|
if (!binary_sizes[slot]) { |
|
applog(LOG_ERR, "OpenCL compiler generated a zero sized binary!"); |
|
goto out; |
|
} |
|
|
|
/* Patch the kernel if the hardware supports BFI_INT but it needs to |
|
* be hacked in */ |
|
if (data->patch_bfi) { |
|
if (kernel_bfi_patch(binaries[slot], binary_sizes[slot]) != 0) { |
|
quit(1, "Could not patch BFI_INT, please report this issue."); |
|
} |
|
} |
|
|
|
/* Save the binary to be loaded next time */ |
|
binaryfile = fopen(data->binary_filename, "wb"); |
|
if (!binaryfile) { |
|
/* Not fatal, just means we build it again next time, unless BFI patch is needed */ |
|
applog(LOG_DEBUG, "Unable to create file %s", data->binary_filename); |
|
goto out; |
|
} else { |
|
if (unlikely(fwrite(binaries[slot], 1, binary_sizes[slot], binaryfile) != binary_sizes[slot])) { |
|
applog(LOG_ERR, "Unable to fwrite to binaryfile"); |
|
goto out; |
|
} |
|
fclose(binaryfile); |
|
} |
|
|
|
ret = true; |
|
out: |
|
for (slot = 0; slot < cpnd; slot++) |
|
if (binary_sizes[slot]) |
|
free(binaries[slot]); |
|
if (binaries) free(binaries); |
|
free(binary_sizes); |
|
|
|
return ret; |
|
}
|
|
|