Implemented OpenCL JIT mode.
This commit is contained in:
parent
db79911c4b
commit
04a4a6cadc
10 changed files with 322 additions and 60 deletions
|
@ -24,10 +24,15 @@
|
|||
|
||||
#include "backend/opencl/runners/OclRxJitRunner.h"
|
||||
|
||||
#include "backend/opencl/wrappers/OclLib.h"
|
||||
#include "backend/opencl/OclLaunchData.h"
|
||||
#include "backend/opencl/kernels/rx/HashAesKernel.h"
|
||||
#include "backend/opencl/cl/rx/randomx_run_gfx803.h"
|
||||
#include "backend/opencl/cl/rx/randomx_run_gfx900.h"
|
||||
#include "backend/opencl/kernels/rx/Blake2bHashRegistersKernel.h"
|
||||
#include "backend/opencl/kernels/rx/HashAesKernel.h"
|
||||
#include "backend/opencl/kernels/rx/RxJitKernel.h"
|
||||
#include "backend/opencl/kernels/rx/RxRunKernel.h"
|
||||
#include "backend/opencl/OclLaunchData.h"
|
||||
#include "backend/opencl/wrappers/OclLib.h"
|
||||
#include "backend/opencl/wrappers/OclError.h"
|
||||
|
||||
|
||||
xmrig::OclRxJitRunner::OclRxJitRunner(size_t index, const OclLaunchData &data) : OclRxBaseRunner(index, data)
|
||||
|
@ -37,6 +42,10 @@ xmrig::OclRxJitRunner::OclRxJitRunner(size_t index, const OclLaunchData &data) :
|
|||
|
||||
xmrig::OclRxJitRunner::~OclRxJitRunner()
|
||||
{
|
||||
delete m_randomx_jit;
|
||||
delete m_randomx_run;
|
||||
|
||||
OclLib::release(m_asmProgram);
|
||||
OclLib::release(m_intermediate_programs);
|
||||
OclLib::release(m_programs);
|
||||
OclLib::release(m_registers);
|
||||
|
@ -52,11 +61,28 @@ void xmrig::OclRxJitRunner::build()
|
|||
m_hashAes1Rx4->setArgs(m_scratchpads, m_registers, 256, batch_size);
|
||||
m_blake2b_hash_registers_32->setArgs(m_hashes, m_registers, 256);
|
||||
m_blake2b_hash_registers_64->setArgs(m_hashes, m_registers, 256);
|
||||
|
||||
m_randomx_jit = new RxJitKernel(m_program);
|
||||
m_randomx_jit->setArgs(m_entropy, m_registers, m_intermediate_programs, m_programs, batch_size, m_rounding);
|
||||
|
||||
if (!loadAsmProgram()) {
|
||||
throw std::runtime_error(OclError::toString(CL_INVALID_PROGRAM));
|
||||
}
|
||||
|
||||
m_randomx_run = new RxRunKernel(m_asmProgram);
|
||||
m_randomx_run->setArgs(data().dataset->get(), m_scratchpads, m_registers, m_rounding, m_programs, batch_size, m_algorithm);
|
||||
}
|
||||
|
||||
|
||||
void xmrig::OclRxJitRunner::execute(uint32_t iteration)
|
||||
{
|
||||
const uint32_t g_intensity = data().thread.intensity();
|
||||
|
||||
m_randomx_jit->enqueue(m_queue, g_intensity, iteration);
|
||||
|
||||
OclLib::finish(m_queue);
|
||||
|
||||
m_randomx_run->enqueue(m_queue, g_intensity);
|
||||
}
|
||||
|
||||
|
||||
|
@ -70,3 +96,46 @@ void xmrig::OclRxJitRunner::init()
|
|||
m_intermediate_programs = OclLib::createBuffer(m_ctx, CL_MEM_READ_WRITE, 5120 * g_thd, nullptr);
|
||||
m_programs = OclLib::createBuffer(m_ctx, CL_MEM_READ_WRITE, 10048 * g_thd, nullptr);
|
||||
}
|
||||
|
||||
|
||||
bool xmrig::OclRxJitRunner::loadAsmProgram()
|
||||
{
|
||||
// Adrenaline drivers on Windows and amdgpu-pro drivers on Linux use ELF header's flags (offset 0x30) to store internal device ID
|
||||
// Read it from compiled OpenCL code and substitute this ID into pre-compiled binary to make sure the driver accepts it
|
||||
uint32_t elf_header_flags = 0;
|
||||
const uint32_t elf_header_flags_offset = 0x30;
|
||||
|
||||
size_t bin_size;
|
||||
if (OclLib::getProgramInfo(m_program, CL_PROGRAM_BINARY_SIZES, sizeof(bin_size), &bin_size) != CL_SUCCESS) {
|
||||
return false;
|
||||
}
|
||||
|
||||
std::vector<char> binary_data(bin_size);
|
||||
char* tmp[1] = { binary_data.data() };
|
||||
if (OclLib::getProgramInfo(m_program, CL_PROGRAM_BINARIES, sizeof(char*), tmp) != CL_SUCCESS) {
|
||||
return false;
|
||||
}
|
||||
|
||||
if (bin_size >= elf_header_flags_offset + sizeof(uint32_t)) {
|
||||
elf_header_flags = *reinterpret_cast<uint32_t*>((binary_data.data() + elf_header_flags_offset));
|
||||
}
|
||||
|
||||
const size_t len = (m_gcn_version == 14) ? randomx_run_gfx900_bin_size : randomx_run_gfx803_bin_size;
|
||||
unsigned char *binary = (m_gcn_version == 14) ? randomx_run_gfx900_bin : randomx_run_gfx803_bin;
|
||||
|
||||
// Set correct internal device ID in the pre-compiled binary
|
||||
if (elf_header_flags) {
|
||||
*reinterpret_cast<uint32_t*>(binary + elf_header_flags_offset) = elf_header_flags;
|
||||
}
|
||||
|
||||
cl_int status;
|
||||
cl_int ret;
|
||||
cl_device_id device = data().device.id();
|
||||
|
||||
m_asmProgram = OclLib::createProgramWithBinary(ctx(), 1, &device, &len, (const unsigned char**) &binary, &status, &ret);
|
||||
if (ret != CL_SUCCESS) {
|
||||
return false;
|
||||
}
|
||||
|
||||
return OclLib::buildProgram(m_asmProgram, 1, &device) == CL_SUCCESS;
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue