REDACTED-rig/src/backend/opencl/runners/tools/OclCnR.cpp
2021-08-25 18:45:15 +07:00

301 lines
7.9 KiB
C++

/* XMRig
* Copyright (c) 2018-2021 SChernykh <https://github.com/SChernykh>
* Copyright (c) 2016-2021 XMRig <https://github.com/xmrig>, <support@xmrig.com>
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#include "backend/opencl/runners/tools/OclCnR.h"
#include "backend/opencl/cl/cn/cryptonight_r_cl.h"
#include "backend/opencl/interfaces/IOclRunner.h"
#include "backend/opencl/OclCache.h"
#include "backend/opencl/OclLaunchData.h"
#include "backend/opencl/OclThread.h"
#include "backend/opencl/wrappers/OclError.h"
#include "backend/opencl/wrappers/OclLib.h"
#include "base/io/log/Log.h"
#include "base/tools/Baton.h"
#include "base/tools/Chrono.h"
#include "crypto/cn/CryptoNight_monero.h"
#include <cstring>
#include <mutex>
#include <regex>
#include <sstream>
#include <string>
#include <thread>
#include <uv.h>
namespace xmrig {
class CnrCacheEntry
{
public:
inline CnrCacheEntry(const Algorithm &algo, uint64_t offset, uint32_t index, cl_program program) :
program(program),
m_algo(algo),
m_index(index),
m_offset(offset)
{}
inline bool isExpired(uint64_t offset) const { return m_offset + OclCnR::kHeightChunkSize < offset; }
inline bool match(const Algorithm &algo, uint64_t offset, uint32_t index) const { return m_algo == algo && m_offset == offset && m_index == index; }
inline bool match(const IOclRunner &runner, uint64_t offset) const { return match(runner.algorithm(), offset, runner.deviceIndex()); }
inline void release() const { OclLib::release(program); }
cl_program program;
private:
Algorithm m_algo;
uint32_t m_index;
uint64_t m_offset;
};
class CnrCache
{
public:
CnrCache() = default;
inline cl_program search(const IOclRunner &runner, uint64_t offset) { return search(runner.algorithm(), offset, runner.deviceIndex()); }
inline cl_program search(const Algorithm &algo, uint64_t offset, uint32_t index)
{
std::lock_guard<std::mutex> lock(m_mutex);
for (const auto &entry : m_data) {
if (entry.match(algo, offset, index)) {
return entry.program;
}
}
return nullptr;
}
void add(const Algorithm &algo, uint64_t offset, uint32_t index, cl_program program)
{
if (search(algo, offset, index)) {
OclLib::release(program);
return;
}
std::lock_guard<std::mutex> lock(m_mutex);
gc(offset);
m_data.emplace_back(algo, offset, index, program);
}
void clear()
{
std::lock_guard<std::mutex> lock(m_mutex);
for (auto &entry : m_data) {
entry.release();
}
m_data.clear();
}
private:
void gc(uint64_t offset)
{
for (size_t i = 0; i < m_data.size();) {
auto &entry = m_data[i];
if (entry.isExpired(offset)) {
entry.release();
entry = m_data.back();
m_data.pop_back();
}
else {
++i;
}
}
}
std::mutex m_mutex;
std::vector<CnrCacheEntry> m_data;
};
static CnrCache cache;
class CnrBuilder
{
public:
CnrBuilder() = default;
cl_program build(const IOclRunner &runner, uint64_t offset)
{
# ifdef APP_DEBUG
const uint64_t ts = Chrono::steadyMSecs();
# endif
std::lock_guard<std::mutex> lock(m_mutex);
cl_program program = cache.search(runner, offset);
if (program) {
return program;
}
cl_int ret = 0;
const std::string source = getSource(offset);
cl_device_id device = runner.data().device.id();
const char *s = source.c_str();
program = OclLib::createProgramWithSource(runner.ctx(), 1, &s, nullptr, &ret);
if (ret != CL_SUCCESS) {
return nullptr;
}
if (OclLib::buildProgram(program, 1, &device, runner.buildOptions()) != CL_SUCCESS) {
printf("BUILD LOG:\n%s\n", OclLib::getProgramBuildLog(program, device).data());
OclLib::release(program);
return nullptr;
}
LOG_DEBUG(GREEN_BOLD("[ocl]") " programs for heights %" PRIu64 " - %" PRIu64 " compiled. (%" PRIu64 "ms)", offset, offset + OclCnR::kHeightChunkSize - 1, Chrono::steadyMSecs() - ts);
cache.add(runner.algorithm(), offset, runner.deviceIndex(), program);
return program;
}
private:
static std::string getCode(const V4_Instruction *code, int code_size)
{
std::stringstream s;
for (int i = 0; i < code_size; ++i) {
const V4_Instruction inst = code[i];
const uint32_t a = inst.dst_index;
const uint32_t b = inst.src_index;
switch (inst.opcode)
{
case MUL:
s << 'r' << a << "*=r" << b << ';';
break;
case ADD:
s << 'r' << a << "+=r" << b << '+' << inst.C << "U;";
break;
case SUB:
s << 'r' << a << "-=r" << b << ';';
break;
case ROR:
case ROL:
s << 'r' << a << "=rotate(r" << a << ((inst.opcode == ROR) ? ",ROT_BITS-r" : ",r") << b << ");";
break;
case XOR:
s << 'r' << a << "^=r" << b << ';';
break;
}
s << '\n';
}
return s.str();
}
static std::string getSource(uint64_t offset)
{
std::string source(cryptonight_r_defines_cl);
for (size_t i = 0; i < OclCnR::kHeightChunkSize; ++i) {
V4_Instruction code[256];
const int code_size = v4_random_math_init<Algorithm::CN_R>(code, offset + i);
const std::string kernel = std::regex_replace(std::string(cryptonight_r_cl), std::regex("XMRIG_INCLUDE_RANDOM_MATH"), getCode(code, code_size));
source += std::regex_replace(kernel, std::regex("KERNEL_NAME"), "cn1_" + std::to_string(offset + i));
}
return source;
}
std::mutex m_mutex;
};
class CnrBaton : public Baton<uv_work_t>
{
public:
inline CnrBaton(const IOclRunner &runner, uint64_t offset) :
runner(runner),
offset(offset)
{}
const IOclRunner &runner;
const uint64_t offset;
};
static CnrBuilder builder;
static std::mutex bg_mutex;
} // namespace xmrig
cl_program xmrig::OclCnR::get(const IOclRunner &runner, uint64_t height)
{
const uint64_t offset = (height / kHeightChunkSize) * kHeightChunkSize;
if (offset + kHeightChunkSize - height == 1) {
auto baton = new CnrBaton(runner, offset + kHeightChunkSize);
uv_queue_work(uv_default_loop(), &baton->req,
[](uv_work_t *req) {
auto baton = static_cast<CnrBaton*>(req->data);
std::lock_guard<std::mutex> lock(bg_mutex);
builder.build(baton->runner, baton->offset);
},
[](uv_work_t *req, int) { delete static_cast<CnrBaton*>(req->data); }
);
}
cl_program program = cache.search(runner, offset);
if (program) {
return program;
}
return builder.build(runner, offset);;
}
void xmrig::OclCnR::clear()
{
std::lock_guard<std::mutex> lock(bg_mutex);
cache.clear();
}