libgpusolver_2libclwrapper_8cpp_source.html

 #define _CRT_SECURE_NO_WARNINGS

 #include <cstdio>
 #include <cstdlib>
 //#include <chrono>
 #include <fstream>
 #include <streambuf>
 #include <iostream>
 #include <queue>
 #include <vector>
 #include <random>
 //#include <atomic>
 #include "libclwrapper.h"
 #include "kernels/silentarmy.h" // Created from CMake
 #include "../primitives/block.h"

 // Fallbacks for OpenCL headers older than 1.2: the two 1.2-only flags are
 // mapped onto values that already exist (plain CL_MAP_WRITE, and 0 for the
 // host-access flag).
 #if !CL_VERSION_1_2
 #define CL_MAP_WRITE_INVALIDATE_REGION CL_MAP_WRITE
 #define CL_MEM_HOST_READ_ONLY 0
 #endif

 // Remove any min/max macros (presumably leaked by platform headers) so the
 // min<unsigned>(...) calls further down are not macro-expanded.
 #undef min
 #undef max

 // When DEBUG is defined, init() reads the kernel source from
 // ./libgpuminer/kernels/silentarmy.cl instead of the embedded byte array.
 //#define DEBUG

 using namespace std;

 // Definitions of cl_gpuminer's static data members.

 // Default local work size (workgroup size).
 unsigned const cl_gpuminer::c_defaultLocalWorkSize = 32;
 // Default global work size, expressed as a multiplier of the local work size.
 unsigned const cl_gpuminer::c_defaultGlobalWorkSizeMultiplier = 4096; // * CL_DEFAULT_LOCAL_WORK_SIZE
 // Default target milliseconds per batch.
 unsigned const cl_gpuminer::c_defaultMSPerBatch = 0;
 // Whether CPU devices may be selected; getDevices() queries CL_DEVICE_TYPE_ALL when true.
 bool cl_gpuminer::s_allowCPU = false;
 // No initializer here, so this static starts out zero-initialized.
 unsigned cl_gpuminer::s_extraRequiredGPUMem;
 // Current settings, seeded from the defaults above; configureGPU() overwrites
 // the workgroup size and the initial global work size.
 unsigned cl_gpuminer::s_msPerBatch = cl_gpuminer::c_defaultMSPerBatch;
 unsigned cl_gpuminer::s_workgroupSize = cl_gpuminer::c_defaultLocalWorkSize;
 unsigned cl_gpuminer::s_initialGlobalWorkSize = cl_gpuminer::c_defaultGlobalWorkSizeMultiplier * cl_gpuminer::c_defaultLocalWorkSize;

 // CL_LOG(_contents): logging helper; _contents is a chain of values joined with <<.
 //
 // Windows build: the message is formatted into a local stringstream, then a
 // spin lock on s_logSpin is taken while the text is sent to
 // OutputDebugStringA and to cerr (followed by a newline and a flush).
 // No "[OPENCL]:" prefix is added in this variant.
 // NOTE(review): this branch uses std::atomic_flag and std::stringstream, yet
 // the <atomic> include at the top of the file is commented out and <sstream>
 // is not included directly - confirm they arrive through another header.
 //
 // Other platforms: the message is written to cout with an "[OPENCL]:" prefix
 // and a trailing endl; no locking is done.
 #if defined(_WIN32)
 extern "C" __declspec(dllimport) void __stdcall OutputDebugStringA(const char* lpOutputString);
 static std::atomic_flag s_logSpin = ATOMIC_FLAG_INIT;
 #define CL_LOG(_contents) \
         do \
         { \
                 std::stringstream ss; \
                 ss << _contents; \
                 while (s_logSpin.test_and_set(std::memory_order_acquire)) {} \
                 OutputDebugStringA(ss.str().c_str()); \
                 cerr << ss.str() << endl << flush; \
                 s_logSpin.clear(std::memory_order_release); \
         } while (false)
 #else
 #define CL_LOG(_contents) cout << "[OPENCL]:" << _contents << endl
 #endif

 // Types of OpenCL devices we are interested in: GPUs and accelerators.
 // getDevices() uses this mask unless s_allowCPU is set, in which case it
 // asks for CL_DEVICE_TYPE_ALL instead.
 #define CL_QUERIED_DEVICE_TYPES (CL_DEVICE_TYPE_GPU | CL_DEVICE_TYPE_ACCELERATOR)

 // Constructs a miner without touching OpenCL: only the host-side
 // dst_solutions array is allocated. An allocation failure is reported on
 // stdout and leaves dst_solutions null.
 cl_gpuminer::cl_gpuminer()
 :       m_openclOnePointOne()
 {
         // Room for 10 * NUM_INDICES 32-bit values.
         size_t const byteCount = 10*NUM_INDICES*sizeof(uint32_t);
         dst_solutions = (uint32_t *) malloc(byteCount);
         if (!dst_solutions)
         {
                 std::cout << "Error allocating dst_solutions array!" << std::endl;
         }
 }

 // Waits for outstanding queue work, then releases the host-side solution
 // array. An exception escaping a destructor terminates the program, so a
 // cl::Error raised while draining the queue is logged here instead of
 // being allowed to propagate.
 cl_gpuminer::~cl_gpuminer()
 {
         try
         {
                 finish();
         }
         catch (cl::Error const& err)
         {
                 CL_LOG("CL ERROR:" << get_error_string(err.err()));
         }

         // free() accepts a null pointer, so no separate null check is needed.
         free(dst_solutions);
         dst_solutions = NULL;
 }

 // Returns every OpenCL platform reported by cl::Platform::get().
 //
 // When the headers define CL_PLATFORM_NOT_FOUND_KHR and the query fails
 // with that code, the failure is logged and an empty vector is returned.
 // Any other cl::Error is rethrown to the caller.
 std::vector<cl::Platform> cl_gpuminer::getPlatforms()
 {
         vector<cl::Platform> platforms;
         try
         {
                 cl::Platform::get(&platforms);
         }
         catch(cl::Error const& err)
         {
 #if defined(CL_PLATFORM_NOT_FOUND_KHR)
                 if (err.err() == CL_PLATFORM_NOT_FOUND_KHR)
                         CL_LOG("No OpenCL platforms found");
                 else
 #endif
                         // Rethrow the in-flight exception itself rather than a copy of it.
                         throw;
         }
         return platforms;
 }

 // Describes the selected platform/device pair as a small JSON-style string
 // with the keys "platform", "device" and "version".
 // Ids beyond the end of the respective list select the last entry.
 // Returns an empty string when there are no platforms or no devices.
 string cl_gpuminer::platform_info(unsigned _platformId, unsigned _deviceId)
 {
         vector<cl::Platform> available = getPlatforms();
         if (available.empty())
                 return string();

         unsigned const platformIdx = min<unsigned>(_platformId, available.size() - 1);

         // getDevices() applies the same clamping to the platform id itself.
         vector<cl::Device> found = getDevices(available, _platformId);
         if (found.empty())
         {
                 CL_LOG("No OpenCL devices found.");
                 return string();
         }

         unsigned const deviceIdx = min<unsigned>(_deviceId, found.size() - 1);
         cl::Device& chosen = found[deviceIdx];
         string const version = chosen.getInfo<CL_DEVICE_VERSION>();

         string json = "{ \"platform\": \"";
         json += available[platformIdx].getInfo<CL_PLATFORM_NAME>();
         json += "\", \"device\": \"";
         json += chosen.getInfo<CL_DEVICE_NAME>();
         json += "\", \"version\": \"";
         json += version;
         json += "\" }";
         return json;
 }

 // Lists the devices of one platform.
 //
 // _platforms   platforms to choose from
 // _platformId  index into _platforms; values past the end select the last platform
 //
 // Only GPU/accelerator devices are requested unless s_allowCPU is set.
 // Returns an empty vector when _platforms is empty or the platform reports
 // CL_DEVICE_NOT_FOUND; any other cl::Error is rethrown.
 std::vector<cl::Device> cl_gpuminer::getDevices(std::vector<cl::Platform> const& _platforms, unsigned _platformId)
 {
         vector<cl::Device> devices;

         // Without this guard size() - 1 would wrap around and the clamp below
         // would hand back an out-of-range index.
         if (_platforms.empty())
                 return devices;

         unsigned platform_num = min<unsigned>(_platformId, _platforms.size() - 1);
         try
         {
                 _platforms[platform_num].getDevices(
                         s_allowCPU ? CL_DEVICE_TYPE_ALL : CL_QUERIED_DEVICE_TYPES,
                         &devices
                 );
         }
         catch (cl::Error const& err)
         {
                 // if simply no devices found return empty vector
                 if (err.err() != CL_DEVICE_NOT_FOUND)
                         throw;
         }
         return devices;
 }

 // Number of OpenCL platforms reported by getPlatforms(); 0 when there are none.
 unsigned cl_gpuminer::getNumPlatforms()
 {
         // An empty list already has size zero, so no special case is required.
         return getPlatforms().size();
 }

 unsigned cl_gpuminer::getNumDevices(unsigned _platformId)
 {
         vector<cl::Platform> platforms = getPlatforms();
         if (platforms.empty())
                 return 0;

         vector<cl::Device> devices = getDevices(platforms, _platformId);
         if (devices.empty())
         {
                 CL_LOG("No OpenCL devices found.");
                 return 0;
         }
         return devices.size();
 }

 // This needs customizing apon completion of the kernel - Checks memory requirements - May not be applicable
 bool cl_gpuminer::configureGPU(
         unsigned _platformId,
         unsigned _localWorkSize,
         unsigned _globalWorkSize
 )
 {
         // Set the local/global work sizes
         s_workgroupSize = _localWorkSize;
         s_initialGlobalWorkSize = _globalWorkSize;

         return searchForAllDevices(_platformId, [](cl::Device const& _device) -> bool
                 {
                         cl_ulong result;
                         _device.getInfo(CL_DEVICE_GLOBAL_MEM_SIZE, &result);

                                 CL_LOG(
                                         "Found suitable OpenCL device [" << _device.getInfo<CL_DEVICE_NAME>()
                                         << "] with " << result << " bytes of GPU memory"
                                 );
                                 return true;
                 }
         );
 }

 // Offers the devices of every platform, in platform order, to _callback and
 // stops at the first one it accepts.
 // Returns true if some device was accepted, false otherwise (including when
 // there are no platforms).
 bool cl_gpuminer::searchForAllDevices(function<bool(cl::Device const&)> _callback)
 {
         vector<cl::Platform> available = getPlatforms();

         // With an empty list the loop body never runs.
         unsigned idx = 0;
         while (idx < available.size())
         {
                 if (searchForAllDevices(idx, _callback))
                         return true;
                 ++idx;
         }
         return false;
 }

 bool cl_gpuminer::searchForAllDevices(unsigned _platformId, function<bool(cl::Device const&)> _callback)
 {
         vector<cl::Platform> platforms = getPlatforms();
         if (platforms.empty())
                 return false;
         if (_platformId >= platforms.size())
                 return false;

         vector<cl::Device> devices = getDevices(platforms, _platformId);
         for (cl::Device const& device: devices)
                 if (_callback(device))
                         return true;

         return false;
 }

 // Invokes _callback for every device of every platform, in platform order.
 // Does nothing when no platform is available.
 void cl_gpuminer::doForAllDevices(function<void(cl::Device const&)> _callback)
 {
         vector<cl::Platform> available = getPlatforms();

         // An empty list simply means zero iterations.
         unsigned idx = 0;
         while (idx < available.size())
         {
                 doForAllDevices(idx, _callback);
                 ++idx;
         }
 }

 void cl_gpuminer::doForAllDevices(unsigned _platformId, function<void(cl::Device const&)> _callback)
 {
         vector<cl::Platform> platforms = getPlatforms();
         if (platforms.empty())
                 return;
         if (_platformId >= platforms.size())
                 return;

         vector<cl::Device> devices = getDevices(platforms, _platformId);
         for (cl::Device const& device: devices)
                 _callback(device);
 }

 // Logs one report covering every device of every platform: name, device
 // type, global memory size, maximum single allocation size and maximum
 // work-group size.
 // The bracketed id is a running counter across all platforms.
 // NOTE(review): init() and platform_info() take a device id that indexes
 // the devices of a single platform - confirm the ids printed here are meant
 // to line up with those when more than one platform is present.
 void cl_gpuminer::listDevices()
 {
         string outString ="\nListing OpenCL devices.\nFORMAT: [deviceID] deviceName\n";
         unsigned int i = 0;
         // The device is taken by const reference so that no copy of the
         // cl::Device wrapper is made for each visited device.
         doForAllDevices([&outString, &i](cl::Device const& _device)
                 {
                         outString += "[" + to_string(i) + "] " + _device.getInfo<CL_DEVICE_NAME>() + "\n";
                         outString += "\tCL_DEVICE_TYPE: ";
                         switch (_device.getInfo<CL_DEVICE_TYPE>())
                         {
                         case CL_DEVICE_TYPE_CPU:
                                 outString += "CPU\n";
                                 break;
                         case CL_DEVICE_TYPE_GPU:
                                 outString += "GPU\n";
                                 break;
                         case CL_DEVICE_TYPE_ACCELERATOR:
                                 outString += "ACCELERATOR\n";
                                 break;
                         default:
                                 outString += "DEFAULT\n";
                                 break;
                         }
                         outString += "\tCL_DEVICE_GLOBAL_MEM_SIZE: " + to_string(_device.getInfo<CL_DEVICE_GLOBAL_MEM_SIZE>()) + "\n";
                         outString += "\tCL_DEVICE_MAX_MEM_ALLOC_SIZE: " + to_string(_device.getInfo<CL_DEVICE_MAX_MEM_ALLOC_SIZE>()) + "\n";
                         outString += "\tCL_DEVICE_MAX_WORK_GROUP_SIZE: " + to_string(_device.getInfo<CL_DEVICE_MAX_WORK_GROUP_SIZE>()) + "\n";
                         ++i;
                 }
         );
         CL_LOG(outString);
 }

 // Blocks until the command queue has finished its work.
 // Does nothing while m_queue() evaluates to false (presumably the null
 // handle of a queue that init() has not created yet).
 void cl_gpuminer::finish()
 {
         if (!m_queue())
                 return;

         m_queue.finish();
 }

 // Customise given kernel - This builds the kernel and creates memory buffers
 bool cl_gpuminer::init(
         unsigned _platformId,
         unsigned _deviceId,
         const std::vector<std::string> _kernels
 )
 {
         // get all platforms
         try
         {
                 vector<cl::Platform> platforms = getPlatforms();
                 if (platforms.empty())
                         return false;

                 // use selected platform
                 _platformId = min<unsigned>(_platformId, platforms.size() - 1);
                 CL_LOG("Using platform: " << platforms[_platformId].getInfo<CL_PLATFORM_NAME>().c_str());

                 // get GPU device of the default platform
                 vector<cl::Device> devices = getDevices(platforms, _platformId);
                 if (devices.empty())
                 {
                         CL_LOG("No OpenCL devices found.");
                         return false;
                 }

                 // use selected device
                 cl::Device& device = devices[min<unsigned>(_deviceId, devices.size() - 1)];
                 string device_version = device.getInfo<CL_DEVICE_VERSION>();
                 CL_LOG("Using device: " << device.getInfo<CL_DEVICE_NAME>().c_str() << "(" << device_version.c_str() << ")");

                 if (strncmp("OpenCL 1.0", device_version.c_str(), 10) == 0)
                 {
                         CL_LOG("OpenCL 1.0 is not supported.");
                         return false;
                 }
                 if (strncmp("OpenCL 1.1", device_version.c_str(), 10) == 0)
                         m_openclOnePointOne = true;

                 // create context
                 m_context = cl::Context(vector<cl::Device>(&device, &device + 1));
                 m_queue = cl::CommandQueue(m_context, device);

                 // make sure that global work size is evenly divisible by the local workgroup size
                 m_globalWorkSize = s_initialGlobalWorkSize;
                 if (m_globalWorkSize % s_workgroupSize != 0)
                         m_globalWorkSize = ((m_globalWorkSize / s_workgroupSize) + 1) * s_workgroupSize;
                 // remember the device's address bits
                 m_deviceBits = device.getInfo<CL_DEVICE_ADDRESS_BITS>();
                 // make sure first step of global work size adjustment is large enough
                 m_stepWorkSizeAdjust = pow(2, m_deviceBits / 2 + 1);

                 // patch source code
                 // note: CL_MINER_KERNEL is simply cl_gpuminer_kernel.cl compiled
                 // into a byte array by bin2h.cmake. There is no need to load the file by hand in runtime

                 // Uncomment for loading kernel from compiled cl file.
 #ifdef DEBUG
                 ifstream kernel_file("./libgpuminer/kernels/silentarmy.cl");
                 string code((istreambuf_iterator<char>(kernel_file)), istreambuf_iterator<char>());
                 kernel_file.close();
 #else
                 string code(CL_MINER_KERNEL, CL_MINER_KERNEL + CL_MINER_KERNEL_SIZE);
 #endif
                 // create miner OpenCL program
                 cl::Program::Sources sources;
                 sources.push_back({ code.c_str(), code.size() });

                 cl::Program program(m_context, sources);
                 try
                 {
                         program.build({ device });
                         CL_LOG("Printing program log");
                         CL_LOG(program.getBuildInfo<CL_PROGRAM_BUILD_LOG>(device).c_str());
                 }
                 catch (cl::Error const&)
                 {
                         CL_LOG(program.getBuildInfo<CL_PROGRAM_BUILD_LOG>(device).c_str());
                         return false;
                 }

                 try
                 {
                         for (auto & _kernel : _kernels)
                                 m_gpuKernels.push_back(cl::Kernel(program, _kernel.c_str()));
                 }
                 catch (cl::Error const& err)
                 {
                         CL_LOG("gpuKERNEL Creation failed: " << err.what() << "(" << err.err() << "). Bailing.");
                         return false;
                 }

                 buf_dbg = cl::Buffer(m_context, CL_MEM_READ_WRITE, dbg_size, NULL, NULL);

         m_queue.enqueueFillBuffer(buf_dbg, &zero, 1, 0, dbg_size, 0);
                 buf_ht[0] = cl::Buffer(m_context, CL_MEM_READ_WRITE, HT_SIZE, NULL, NULL);
                 buf_ht[1] = cl::Buffer(m_context, CL_MEM_READ_WRITE, HT_SIZE, NULL, NULL);
                 buf_sols = cl::Buffer(m_context, CL_MEM_READ_WRITE, sizeof (sols_t), NULL, NULL);
         rowCounters[0] = cl::Buffer(m_context, CL_MEM_READ_WRITE, NR_ROWS, NULL,NULL);
         rowCounters[1] = cl::Buffer(m_context, CL_MEM_READ_WRITE, NR_ROWS, NULL, NULL);

                 m_queue.finish();

         }
         catch (cl::Error const& err)
         {
                 CL_LOG("CL ERROR:" << get_error_string(err.err()));
                 return false;
         }
         return true;
 }


 void cl_gpuminer::run(uint8_t *header, size_t header_len, uint256 nonce, sols_t * indices, uint32_t * n_sol, uint256 * ptr)
 {
         try
         {
                 blake2b_state_t blake;
         cl::Buffer      buf_blake_st;
         cl::Buffer      databuf;
                 uint32_t                sol_found = 0;
                 size_t          local_ws = 64;
                 size_t              global_ws;
         unsigned char   buf[136] = {0};

         assert(header_len == CBlockHeader::HEADER_SIZE || header_len == CBlockHeader::HEADER_NEWSIZE);
         *ptr = *(uint256 *)(header + header_len - FABCOIN_NONCE_LEN);

                 zcash_blake2b_init(&blake, FABCOIN_HASH_LEN, PARAM_N, PARAM_K);

         zcash_blake2b_update(&blake, header, 128, 0);

         memcpy( buf + 8, header + 128, header_len - 128);
         buf[0] = (header_len - 128)/8+1;

                 buf_blake_st = cl::Buffer(m_context, CL_MEM_READ_ONLY, sizeof (blake.h), NULL, NULL);
                 m_queue.enqueueWriteBuffer(buf_blake_st, true, 0, sizeof(blake.h), blake.h);

         databuf = cl::Buffer(m_context, CL_MEM_READ_ONLY, 136, NULL, NULL);
         m_queue.enqueueWriteBuffer(databuf, true, 0, 136, buf);
         m_queue.finish();

                 for (unsigned round = 0; round < PARAM_K; round++)
         {
                         m_gpuKernels[0].setArg(0, buf_ht[round % 2]);
             m_gpuKernels[0].setArg(1, rowCounters[round % 2]);
                         m_queue.enqueueNDRangeKernel(m_gpuKernels[0], cl::NullRange, cl::NDRange(NR_ROWS / ROWS_PER_UINT), cl::NDRange(256));

                         if (!round)
             {
                                 m_gpuKernels[1+round].setArg(0, buf_blake_st);
                                 m_gpuKernels[1+round].setArg(1, buf_ht[round % 2]);
                 m_gpuKernels[1+round].setArg(2, databuf);
                 m_gpuKernels[1+round].setArg(3, rowCounters[round % 2]);
                                 global_ws = select_work_size_blake();
                         }
             else
             {
                                 m_gpuKernels[1+round].setArg(0, buf_ht[(round - 1) % 2]);
                                 m_gpuKernels[1+round].setArg(1, buf_ht[round % 2]);
                 m_gpuKernels[1+round].setArg(2, rowCounters[(round - 1) % 2]);
                 m_gpuKernels[1+round].setArg(3, rowCounters[round % 2]);
                                 global_ws = NR_ROWS;
                         }
             m_gpuKernels[1+round].setArg(4, buf_dbg);

             if (round == PARAM_K - 1)
             {
                 m_gpuKernels[1+round].setArg(5, buf_sols);
             }

                         m_queue.enqueueNDRangeKernel(m_gpuKernels[1+round], cl::NullRange, cl::NDRange(global_ws), cl::NDRange(local_ws));
                 }

                 m_gpuKernels[10].setArg(0, buf_ht[0]);
                 m_gpuKernels[10].setArg(1, buf_ht[1]);
                 m_gpuKernels[10].setArg(2, buf_sols);
         m_gpuKernels[10].setArg(3, rowCounters[0]);
         m_gpuKernels[10].setArg(4, rowCounters[1]);
                 global_ws = NR_ROWS;
                 m_queue.enqueueNDRangeKernel(m_gpuKernels[10], cl::NullRange, cl::NDRange(global_ws), cl::NDRange(local_ws));

                 sols_t  * sols;
         size_t sz = sizeof(sols_t)*1;

                 sols = (sols_t *)malloc(sz);
                 m_queue.enqueueReadBuffer(buf_sols, true, 0, sz, sols);
                 m_queue.finish();

                 if (sols->nr > MAX_SOLS)
         {
                         sols->nr = MAX_SOLS;
                 }

                 for (unsigned sol_i = 0; sol_i < sols->nr; sol_i++)
                         sol_found += verify_sol(sols, sol_i);

                 *n_sol = sol_found;
                 memcpy(indices, sols, sizeof(sols_t));
                 free(sols);
         }
         catch (cl::Error const& err)
         {
                 CL_LOG("CL ERROR:" << get_error_string(err.err()));
         }
 }
cl_gpuminer::platform_info
static std::string platform_info(unsigned _platformId=0, unsigned _deviceId=0)
Definition: libclwrapper.cpp:104

libclwrapper.h

cl_gpuminer::m_stepWorkSizeAdjust
unsigned int m_stepWorkSizeAdjust
The step used in the work size adjustment.
Definition: libclwrapper.h:232

cl_gpuminer::~cl_gpuminer
~cl_gpuminer()
Definition: libclwrapper.cpp:78

cl_gpuminer::zero
const cl_int zero
Definition: libclwrapper.h:223

CL_MINER_KERNEL
const unsigned char CL_MINER_KERNEL[]
Definition: silentarmy.h:1

CL_QUERIED_DEVICE_TYPES
#define CL_QUERIED_DEVICE_TYPES
Definition: libclwrapper.cpp:58

cl_gpuminer::m_queue
cl::CommandQueue m_queue
Definition: libclwrapper.h:212

cl::Program::getBuildInfo
cl_int getBuildInfo(const Device &device, cl_program_build_info name, T *param) const
Definition: cl.hpp:2506

NUM_INDICES
#define NUM_INDICES
Definition: libclwrapper.h:40

cl_gpuminer::c_defaultMSPerBatch
static unsigned const c_defaultMSPerBatch
Default value of the milliseconds per global work size (per batch)
Definition: libclwrapper.h:110

cl_gpuminer::m_globalWorkSize
unsigned m_globalWorkSize
Definition: libclwrapper.h:227

zcash_blake2b_init
void zcash_blake2b_init(blake2b_state_t *st, uint8_t hash_len, uint32_t n, uint32_t k)
Definition: blake.cpp:34

cl_gpuminer::s_msPerBatch
static unsigned s_msPerBatch
The target milliseconds per batch for the search. If 0, then no adjustment will happen.
Definition: libclwrapper.h:241

cl_gpuminer::run
void run(uint8_t *header, size_t header_len, uint256 nonce, sols_t *indices, uint32_t *n_sol, uint256 *ptr)
Definition: libclwrapper.cpp:413

cl_gpuminer::HT_SIZE
unsigned long HT_SIZE()
Definition: libclwrapper.h:298

cl_gpuminer::FABCOIN_HASH_LEN
unsigned int FABCOIN_HASH_LEN()
Definition: libclwrapper.h:305

cl::CommandQueue::enqueueWriteBuffer
cl_int enqueueWriteBuffer(const Buffer &buffer, cl_bool blocking,::size_t offset,::size_t size, const void *ptr, const VECTOR_CLASS< Event > *events=NULL, Event *event=NULL) const
Definition: cl.hpp:2638

std
std::hash for asio::address
Definition: Common.h:323

assert
assert(len-trim+(2 *lenIndices)<=WIDTH)

cl_gpuminer::s_extraRequiredGPUMem
static unsigned s_extraRequiredGPUMem
GPU memory required for other things, like window rendering, etc.
Definition: libclwrapper.h:246

cl_gpuminer::getPlatforms
static std::vector< cl::Platform > getPlatforms()
Definition: libclwrapper.cpp:85

code
bytes code
Definition: SmartVM.cpp:45

cl_gpuminer::c_defaultLocalWorkSize
static unsigned const c_defaultLocalWorkSize
Default value of the local work size. Also known as workgroup size.
Definition: libclwrapper.h:106

FABCOIN_NONCE_LEN
#define FABCOIN_NONCE_LEN
Definition: libclwrapper.h:8

cl_gpuminer::searchForAllDevices
static bool searchForAllDevices(unsigned _platformId, std::function< bool(cl::Device const &)> _callback)

cl::CommandQueue::finish
cl_int finish() const
Definition: cl.hpp:3135

cl_gpuminer::NR_ROWS
unsigned long NR_ROWS()
Definition: libclwrapper.h:288

cl_gpuminer::dbg_size
size_t dbg_size
Definition: libclwrapper.h:221

cl_gpuminer::getNumDevices
static unsigned getNumDevices(unsigned _platformId=0)
Definition: libclwrapper.cpp:154

cl_gpuminer::s_allowCPU
static bool s_allowCPU
Allow CPU to appear as an OpenCL device or not. Default is false.
Definition: libclwrapper.h:243

cl_gpuminer::init
bool init(unsigned _platformId, unsigned _deviceId, std::vector< std::string > _kernels)
Definition: libclwrapper.cpp:284

cl::CommandQueue::enqueueFillBuffer
cl_int enqueueFillBuffer(const Buffer &buffer, const void *ptr,::size_t pattern_size,::size_t offset,::size_t size, const VECTOR_CLASS< Event > *events=NULL, Event *event=NULL) const
Definition: cl.hpp:2657

cl_gpuminer::m_gpuKernels
std::vector< cl::Kernel > m_gpuKernels
Definition: libclwrapper.h:213

cl_gpuminer::dst_solutions
uint32_t * dst_solutions
Definition: libclwrapper.h:225

cl_gpuminer::get_error_string
const char * get_error_string(cl_int error)
Definition: libclwrapper.h:318

cl::CommandQueue::enqueueNDRangeKernel
cl_int enqueueNDRangeKernel(const Kernel &kernel, const NDRange &offset, const NDRange &global, const NDRange &local, const VECTOR_CLASS< Event > *events=NULL, Event *event=NULL) const
Definition: cl.hpp:2961

cl_gpuminer::buf_sols
cl::Buffer buf_sols
Definition: libclwrapper.h:215

sols_s
Definition: libclwrapper.h:13

cl::Program::Sources
VECTOR_CLASS< std::pair< const char *,::size_t > > Sources
Definition: cl.hpp:2397

cl_gpuminer::nonce
uint64_t nonce
Definition: libclwrapper.h:219

zcash_blake2b_update
void zcash_blake2b_update(blake2b_state_t *st, const uint8_t *_msg, uint32_t msg_len, uint32_t is_final)
Definition: blake.cpp:78

cl_gpuminer::listDevices
static void listDevices()
Definition: libclwrapper.cpp:244

cl_gpuminer::m_context
cl::Context m_context
Definition: libclwrapper.h:211

cl_gpuminer::ROWS_PER_UINT
unsigned int ROWS_PER_UINT()
Definition: libclwrapper.h:310

cl_gpuminer::m_deviceBits
unsigned m_deviceBits
Definition: libclwrapper.h:229

blake2b_state_s::h
uint64_t h[8]
Definition: blake.h:3

MAX_SOLS
#define MAX_SOLS
Definition: libclwrapper.h:10

cl_gpuminer::buf_dbg
cl::Buffer buf_dbg
Definition: libclwrapper.h:216

uint256
256-bit opaque blob.
Definition: uint256.h:132

cl::CommandQueue
CommandQueue interface for cl_command_queue.
Definition: cl.hpp:2566

sols_s::nr
uint nr
Definition: libclwrapper.h:15

CBlockHeader::HEADER_SIZE
static const size_t HEADER_SIZE
Definition: block.h:39

CL_MINER_KERNEL_SIZE
const size_t CL_MINER_KERNEL_SIZE
Definition: silentarmy.h:709

memcpy
void * memcpy(void *a, const void *b, size_t c)
Definition: glibc_compat.cpp:17

cl_gpuminer::m_openclOnePointOne
bool m_openclOnePointOne
Definition: libclwrapper.h:228

cl::Program::build
cl_int build(const VECTOR_CLASS< Device > &devices, const char *options=NULL, void(CL_CALLBACK *notifyFptr)(cl_program, void *)=NULL, void *data=NULL) const
Definition: cl.hpp:2466

round
#define round(a, b, c, x, mul)

cl::Device::getInfo
cl_int getInfo(cl_device_info name, T *param) const
Definition: cl.hpp:1208

cl::Platform::get
static cl_int get(VECTOR_CLASS< Platform > *platforms)
Definition: cl.hpp:1397

cl_gpuminer::PARAM_K
unsigned int PARAM_K
Definition: libclwrapper.h:250

cl::Buffer
Memory buffer interface.
Definition: cl.hpp:1748

cl::NDRange
NDRange interface.
Definition: cl.hpp:2218

cl::CommandQueue::enqueueReadBuffer
cl_int enqueueReadBuffer(const Buffer &buffer, cl_bool blocking,::size_t offset,::size_t size, void *ptr, const VECTOR_CLASS< Event > *events=NULL, Event *event=NULL) const
Definition: cl.hpp:2619

cl_gpuminer::select_work_size_blake
size_t select_work_size_blake(void)
Definition: libclwrapper.h:152

cl_gpuminer::verify_sol
uint32_t verify_sol(sols_t *sols, unsigned sol_i)
Definition: libclwrapper.h:183

cl::Kernel
Kernel interface that implements cl_kernel.
Definition: cl.hpp:2296

cl_gpuminer::doForAllDevices
static void doForAllDevices(unsigned _platformId, std::function< void(cl::Device const &)> _callback)

cl_gpuminer::getNumPlatforms
static unsigned getNumPlatforms()
Definition: libclwrapper.cpp:146

cl_gpuminer::finish
void finish()
Definition: libclwrapper.cpp:276

cl_gpuminer::s_workgroupSize
static unsigned s_workgroupSize
The local work size for the search.
Definition: libclwrapper.h:237

cl_gpuminer::rowCounters
cl::Buffer rowCounters[2]
Definition: libclwrapper.h:217

cl::Device
Device interface for cl_device_id.
Definition: cl.hpp:1190

cl_gpuminer::buf_ht
cl::Buffer buf_ht[2]
Definition: libclwrapper.h:214

blake2b_state_s
Definition: blake.h:1

__declspec
__declspec(dllimport)
Definition: util_win32.c:26

CBlockHeader::HEADER_NEWSIZE
static const size_t HEADER_NEWSIZE
Definition: block.h:40

cl::Program
Program interface that implements cl_program.
Definition: cl.hpp:2393

cl_gpuminer::getDevices
static std::vector< cl::Device > getDevices(std::vector< cl::Platform > const &_platforms, unsigned _platformId)
Definition: libclwrapper.cpp:126

cl_gpuminer::c_defaultGlobalWorkSizeMultiplier
static unsigned const c_defaultGlobalWorkSizeMultiplier
Default value of the global work size as a multiplier of the local work size.
Definition: libclwrapper.h:108

cl::Context
Definition: cl.hpp:1424

cl_gpuminer::cl_gpuminer
cl_gpuminer()
Definition: libclwrapper.cpp:60

sols_t
struct sols_s sols_t

CL_LOG
#define CL_LOG(_contents)
Definition: libclwrapper.cpp:54

cl_gpuminer::configureGPU
static bool configureGPU(unsigned _platformId, unsigned _localWorkSize, unsigned _globalWorkSize)
Definition: libclwrapper.cpp:170

cl_gpuminer::s_initialGlobalWorkSize
static unsigned s_initialGlobalWorkSize
The initial global work size for the searches.
Definition: libclwrapper.h:239

cl_gpuminer::PARAM_N
unsigned int PARAM_N
Definition: libclwrapper.h:249