/* This file is part of ethash. ethash is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. ethash is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with cpp-ethereum. If not, see . */ /** @file internal.c * @author Tim Hughes * @author Matthew Wampler-Doty * @date 2015 */ #include #include #include #include #include #include #include "ethash.h" #include "fnv.h" #include "endian.h" #include "ethash_internal.h" #include "data_sizes.h" #include "base/crypto/sha3.h" #if defined(_M_X64) || defined(__x86_64__) || defined(__SSE2__) #ifdef __GNUC__ #include #else #include #endif #define kp_prefetch(x) _mm_prefetch((x), _MM_HINT_T0); #else #define kp_prefetch(x) #endif #define SHA3_256(a, b, c) sha3_HashBuffer(256, SHA3_FLAGS_KECCAK, b, c, a, 32) #define SHA3_512(a, b, c) sha3_HashBuffer(512, SHA3_FLAGS_KECCAK, b, c, a, 64) uint64_t ethash_get_datasize(uint64_t const block_number) { assert(block_number / ETHASH_EPOCH_LENGTH < 2048); return dag_sizes[block_number / ETHASH_EPOCH_LENGTH]; } uint64_t ethash_get_cachesize(uint64_t const block_number) { assert(block_number / ETHASH_EPOCH_LENGTH < 2048); return cache_sizes[block_number / ETHASH_EPOCH_LENGTH]; } // Follows Sergio's "STRICT MEMORY HARD HASHING FUNCTIONS" (2014) // https://bitslog.files.wordpress.com/2013/12/memohash-v0-3.pdf // SeqMemoHash(s, R, N) bool ethash_compute_cache_nodes( void* nodes_ptr, uint64_t cache_size, ethash_h256_t const* seed ) { if (cache_size % sizeof(node) != 0) { return false; } uint32_t const num_nodes = (uint32_t) (cache_size / sizeof(node)); node* nodes = (node*)nodes_ptr; SHA3_512(nodes[0].bytes, (uint8_t*)seed, 32); for (uint32_t i = 1; i != num_nodes; ++i) { SHA3_512(nodes[i].bytes, nodes[i - 1].bytes, 64); } for (uint32_t j = 0; j != ETHASH_CACHE_ROUNDS; j++) { for (uint32_t i = 0; i != num_nodes; i++) { uint32_t const idx = nodes[i].words[0] % num_nodes; node data; data = nodes[(num_nodes - 1 + i) % num_nodes]; for (uint32_t w = 0; w != NODE_WORDS; ++w) { data.words[w] ^= nodes[idx].words[w]; } SHA3_512(nodes[i].bytes, data.bytes, sizeof(data)); } } // now perform endian conversion fix_endian_arr32(nodes->words, num_nodes * NODE_WORDS); return true; } void ethash_calculate_dag_item( node* const ret, uint32_t node_index, uint32_t num_parents, ethash_light_t const light ) { uint32_t num_parent_nodes = (uint32_t) (light->cache_size / sizeof(node)); node const* cache_nodes = (node const *) light->cache; node const* init = &cache_nodes[node_index % num_parent_nodes]; memcpy(ret, init, sizeof(node)); ret->words[0] ^= node_index; SHA3_512(ret->bytes, ret->bytes, sizeof(node)); #if defined(_M_X64) && ENABLE_SSE __m128i const fnv_prime = _mm_set1_epi32(FNV_PRIME); __m128i xmm0 = ret->xmm[0]; __m128i xmm1 = ret->xmm[1]; __m128i xmm2 = ret->xmm[2]; __m128i xmm3 = ret->xmm[3]; #endif for (uint32_t i = 0; i != num_parents; ++i) { uint32_t parent_index = fnv_hash(node_index ^ i, ret->words[i % NODE_WORDS]) % num_parent_nodes; node const *parent = &cache_nodes[parent_index]; #if defined(_M_X64) && ENABLE_SSE { xmm0 = _mm_mullo_epi32(xmm0, fnv_prime); xmm1 = _mm_mullo_epi32(xmm1, fnv_prime); xmm2 = _mm_mullo_epi32(xmm2, fnv_prime); xmm3 = _mm_mullo_epi32(xmm3, fnv_prime); xmm0 = _mm_xor_si128(xmm0, parent->xmm[0]); xmm1 = _mm_xor_si128(xmm1, parent->xmm[1]); xmm2 = _mm_xor_si128(xmm2, parent->xmm[2]); xmm3 = _mm_xor_si128(xmm3, parent->xmm[3]); // have to write to ret as values are used to compute index ret->xmm[0] = xmm0; ret->xmm[1] = xmm1; ret->xmm[2] = xmm2; ret->xmm[3] = xmm3; } #else { for (unsigned w = 0; w != NODE_WORDS; ++w) { ret->words[w] = fnv_hash(ret->words[w], parent->words[w]); } } #endif } SHA3_512(ret->bytes, ret->bytes, sizeof(node)); } static inline uint32_t fast_mod(uint64_t a, uint64_t d, uint64_t r, uint64_t i, uint64_t s) { const uint32_t q = ((a + i) * r) >> s; return a - q * d; } void ethash_calculate_dag_item_opt( node* const ret, uint32_t node_index, uint32_t num_parents, ethash_light_t const light ) { node const* cache_nodes = (node const*)light->cache; node const* init = &cache_nodes[fast_mod(node_index, light->num_parent_nodes, light->reciprocal, light->increment, light->shift)]; memcpy(ret, init, sizeof(node)); ret->words[0] ^= node_index; SHA3_512(ret->bytes, ret->bytes, sizeof(node)); for (uint32_t i = 0; i != num_parents; ++i) { uint32_t parent_index = fast_mod(fnv_hash(node_index ^ i, ret->words[i % NODE_WORDS]), light->num_parent_nodes, light->reciprocal, light->increment, light->shift); node const* parent = &cache_nodes[parent_index]; for (unsigned w = 0; w != NODE_WORDS; ++w) { ret->words[w] = fnv_hash(ret->words[w], parent->words[w]); } } SHA3_512(ret->bytes, ret->bytes, sizeof(node)); } void ethash_calculate_dag_item4_opt( node* ret, uint32_t node_index, uint32_t num_parents, ethash_light_t const light ) { node const* cache_nodes = (node const*)light->cache; for (size_t i = 0; i < 4; ++i) { node const* init = &cache_nodes[fast_mod(node_index + i, light->num_parent_nodes, light->reciprocal, light->increment, light->shift)]; memcpy(ret + i, init, sizeof(node)); ret[i].words[0] ^= node_index + i; SHA3_512(ret[i].bytes, ret[i].bytes, sizeof(node)); } for (uint32_t i = 0; i != num_parents; ++i) { node* parent[4]; for (uint32_t j = 0; j < 4; ++j) { const uint32_t parent_index = fast_mod(fnv_hash((node_index + j) ^ i, ret[j].words[i % NODE_WORDS]), light->num_parent_nodes, light->reciprocal, light->increment, light->shift); parent[j] = &cache_nodes[parent_index]; kp_prefetch(parent[j]); } for (unsigned w = 0; w != NODE_WORDS; ++w) ret[0].words[w] = fnv_hash(ret[0].words[w], parent[0]->words[w]); for (unsigned w = 0; w != NODE_WORDS; ++w) ret[1].words[w] = fnv_hash(ret[1].words[w], parent[1]->words[w]); for (unsigned w = 0; w != NODE_WORDS; ++w) ret[2].words[w] = fnv_hash(ret[2].words[w], parent[2]->words[w]); for (unsigned w = 0; w != NODE_WORDS; ++w) ret[3].words[w] = fnv_hash(ret[3].words[w], parent[3]->words[w]); } for (size_t i = 0; i < 4; ++i) { SHA3_512(ret[i].bytes, ret[i].bytes, sizeof(node)); } } bool ethash_compute_full_data( void* mem, uint64_t full_size, ethash_light_t const light, ethash_callback_t callback ) { if (full_size % (sizeof(uint32_t) * MIX_WORDS) != 0 || (full_size % sizeof(node)) != 0) { return false; } uint32_t const max_n = (uint32_t)(full_size / sizeof(node)); node* full_nodes = (node*) mem; double const progress_change = 1.0f / max_n; double progress = 0.0f; // now compute full nodes for (uint32_t n = 0; n != max_n; ++n) { if (callback && n % (max_n / 100) == 0 && callback((unsigned int)(ceil(progress * 100.0f))) != 0) { return false; } progress += progress_change; ethash_calculate_dag_item(&(full_nodes[n]), n, ETHASH_DATASET_PARENTS, light); } return true; } static bool ethash_hash( ethash_return_value_t* ret, node const* full_nodes, ethash_light_t const light, uint64_t full_size, ethash_h256_t const header_hash, uint64_t const nonce ) { if (full_size % MIX_WORDS != 0) { return false; } // pack hash and nonce together into first 40 bytes of s_mix assert(sizeof(node) * 8 == 512); node s_mix[MIX_NODES + 1]; memcpy(s_mix[0].bytes, &header_hash, 32); fix_endian64(s_mix[0].double_words[4], nonce); // compute sha3-512 hash and replicate across mix SHA3_512(s_mix->bytes, s_mix->bytes, 40); fix_endian_arr32(s_mix[0].words, 16); node* const mix = s_mix + 1; for (uint32_t w = 0; w != MIX_WORDS; ++w) { mix->words[w] = s_mix[0].words[w % NODE_WORDS]; } unsigned const page_size = sizeof(uint32_t) * MIX_WORDS; unsigned const num_full_pages = (unsigned) (full_size / page_size); for (unsigned i = 0; i != ETHASH_ACCESSES; ++i) { uint32_t const index = fnv_hash(s_mix->words[0] ^ i, mix->words[i % MIX_WORDS]) % num_full_pages; for (unsigned n = 0; n != MIX_NODES; ++n) { node const* dag_node; node tmp_node; if (full_nodes) { dag_node = &full_nodes[MIX_NODES * index + n]; } else { ethash_calculate_dag_item(&tmp_node, index * MIX_NODES + n, ETHASH_DATASET_PARENTS, light); dag_node = &tmp_node; } #if defined(_M_X64) && ENABLE_SSE { __m128i fnv_prime = _mm_set1_epi32(FNV_PRIME); __m128i xmm0 = _mm_mullo_epi32(fnv_prime, mix[n].xmm[0]); __m128i xmm1 = _mm_mullo_epi32(fnv_prime, mix[n].xmm[1]); __m128i xmm2 = _mm_mullo_epi32(fnv_prime, mix[n].xmm[2]); __m128i xmm3 = _mm_mullo_epi32(fnv_prime, mix[n].xmm[3]); mix[n].xmm[0] = _mm_xor_si128(xmm0, dag_node->xmm[0]); mix[n].xmm[1] = _mm_xor_si128(xmm1, dag_node->xmm[1]); mix[n].xmm[2] = _mm_xor_si128(xmm2, dag_node->xmm[2]); mix[n].xmm[3] = _mm_xor_si128(xmm3, dag_node->xmm[3]); } #else { for (unsigned w = 0; w != NODE_WORDS; ++w) { mix[n].words[w] = fnv_hash(mix[n].words[w], dag_node->words[w]); } } #endif } } // compress mix for (uint32_t w = 0; w != MIX_WORDS; w += 4) { uint32_t reduction = mix->words[w + 0]; reduction = reduction * FNV_PRIME ^ mix->words[w + 1]; reduction = reduction * FNV_PRIME ^ mix->words[w + 2]; reduction = reduction * FNV_PRIME ^ mix->words[w + 3]; mix->words[w / 4] = reduction; } fix_endian_arr32(mix->words, MIX_WORDS / 4); memcpy(&ret->mix_hash, mix->bytes, 32); // final Keccak hash SHA3_256(&ret->result, s_mix->bytes, 64 + 32); // Keccak-256(s + compressed_mix) return true; } void ethash_quick_hash( ethash_h256_t* return_hash, ethash_h256_t const* header_hash, uint64_t nonce, ethash_h256_t const* mix_hash ) { uint8_t buf[64 + 32]; memcpy(buf, header_hash, 32); fix_endian64_same(nonce); memcpy(&(buf[32]), &nonce, 8); SHA3_512(buf, buf, 40); memcpy(&(buf[64]), mix_hash, 32); SHA3_256(return_hash, buf, 64 + 32); } ethash_h256_t ethash_get_seedhash(uint64_t epoch) { ethash_h256_t ret; ethash_h256_reset(&ret); for (uint32_t i = 0; i < epoch; ++i) SHA3_256(&ret, (uint8_t*)&ret, 32); return ret; } bool ethash_quick_check_difficulty( ethash_h256_t const* header_hash, uint64_t const nonce, ethash_h256_t const* mix_hash, ethash_h256_t const* boundary ) { ethash_h256_t return_hash; ethash_quick_hash(&return_hash, header_hash, nonce, mix_hash); return ethash_check_difficulty(&return_hash, boundary); } ethash_light_t ethash_light_new_internal(uint64_t cache_size, ethash_h256_t const* seed) { struct ethash_light *ret; ret = (struct ethash_light*)calloc(sizeof(*ret), 1); if (!ret) { return NULL; } ret->cache = malloc((size_t)cache_size); if (!ret->cache) { goto fail_free_light; } node* nodes = (node*)ret->cache; if (!ethash_compute_cache_nodes(nodes, cache_size, seed)) { goto fail_free_cache_mem; } ret->cache_size = cache_size; return ret; fail_free_cache_mem: free(ret->cache); fail_free_light: free(ret); return NULL; } ethash_light_t ethash_light_new(uint64_t block_number) { ethash_h256_t seedhash = ethash_get_seedhash(block_number / ETHASH_EPOCH_LENGTH); ethash_light_t ret; ret = ethash_light_new_internal(ethash_get_cachesize(block_number), &seedhash); ret->block_number = block_number; return ret; } void ethash_light_delete(ethash_light_t light) { if (light->cache) { free(light->cache); } free(light); } ethash_return_value_t ethash_light_compute_internal( ethash_light_t light, uint64_t full_size, ethash_h256_t const header_hash, uint64_t nonce ) { ethash_return_value_t ret; ret.success = true; if (!ethash_hash(&ret, NULL, light, full_size, header_hash, nonce)) { ret.success = false; } return ret; } ethash_return_value_t ethash_light_compute( ethash_light_t light, ethash_h256_t const header_hash, uint64_t nonce ) { uint64_t full_size = ethash_get_datasize(light->block_number); return ethash_light_compute_internal(light, full_size, header_hash, nonce); } ethash_return_value_t ethash_full_compute( ethash_full_t full, ethash_h256_t const header_hash, uint64_t nonce ) { ethash_return_value_t ret; ret.success = true; if (!ethash_hash( &ret, (node const*)full->data, NULL, full->file_size, header_hash, nonce)) { ret.success = false; } return ret; } void const* ethash_full_dag(ethash_full_t full) { return full->data; } uint64_t ethash_full_dag_size(ethash_full_t full) { return full->file_size; }