From 27e9f33ed36c10b1a4e34c0ebc86d87ab2cfb5ff Mon Sep 17 00:00:00 2001 From: David Phillips Date: Sun, 19 Nov 2017 23:12:13 +1300 Subject: Initial dump of SHA CL port --- sand-leek-cl.c | 201 +++++++++++++++++++++++++++++++++++++++++++++------------ 1 file changed, 161 insertions(+), 40 deletions(-) (limited to 'sand-leek-cl.c') diff --git a/sand-leek-cl.c b/sand-leek-cl.c index a21829d..67157a0 100644 --- a/sand-leek-cl.c +++ b/sand-leek-cl.c @@ -2,19 +2,78 @@ #include #include #include +#include +#include -//#include +#include #include +#include +#include "key_update.h" #include "onion_base32.h" #include "trampoline.h" //#include "sha1.h" +/* hangover code from sand-leek.c */ +/* bitmasks to be used to compare remainder bits */ +unsigned char bitmasks[] = { + [0] = 0x00, + [1] = 0xF8, /* 5 MSB */ + [2] = 0xC0, /* 2 MSB */ + [3] = 0xFE, /* 7 MSB */ + [4] = 0xF0, /* 4 MSB */ + [5] = 0x80, /* 1 MSB */ + [6] = 0xFC, /* 6 MSB */ + [7] = 0xE0 /* 3 MSB */ +}; + +int truffle_valid(unsigned char *search_raw, int raw_len, char bitmask, struct sha_data sha, unsigned char e[4]) { + unsigned char digest[20] = {}; + sha_update(&sha, e, 4); + sha_final(&digest, &sha); + fprintf(stderr, "Need %x%x%x%x%x%x%x%x%x%x (%d)\n", + search_raw[0], + search_raw[1], + search_raw[2], + search_raw[3], + search_raw[4], + search_raw[5], + search_raw[6], + search_raw[7], + search_raw[8], + search_raw[9], + raw_len + ); + fprintf(stderr, "GPU got %x%x%x%x%x%x%x%x%x%x\n", + digest[0], + digest[1], + digest[2], + digest[3], + digest[4], + digest[5], + digest[6], + digest[7], + digest[8], + digest[9] + ); + return memcmp(digest, search_raw, raw_len) == 0 && + (search_raw[raw_len] & bitmask) == (digest[raw_len] & bitmask); +} + +double tv_delta(struct timespec *start, struct timespec *end) { + double s_delta = end->tv_sec - start->tv_sec; + long ns_delta = end->tv_nsec - start->tv_nsec; + return s_delta + (double)ns_delta/1e9; +} /* FIXME make loop internal to run(), rather than rebuilding kernel etc * each new key */ -int run(const char *preferred_platform, unsigned char *search_raw, size_t raw_len, struct sha_data *sha) +unsigned long run(const char *preferred_platform, unsigned char *search_raw, size_t raw_len, size_t search_len, struct sha_data *sha) { + struct timespec tv_start = {}; + struct timespec tv_end = {}; + int bitmask = bitmasks[search_len % 8]; + fprintf(stderr, "Building CL trampoline... "); if (tramp_init(preferred_platform)) { fprintf(stderr, "Failed.\n"); @@ -37,7 +96,7 @@ int run(const char *preferred_platform, unsigned char *search_raw, size_t raw_le fprintf(stderr, "Compiled.\n"); fprintf(stderr, "Setting kernel arguments... "); - if (tramp_set_kernel_args(raw_len)) { + if (tramp_set_kernel_args(raw_len, bitmask)) { fprintf(stderr, "Failed.\n"); return 1; } @@ -58,29 +117,66 @@ int run(const char *preferred_platform, unsigned char *search_raw, size_t raw_le fprintf(stderr, "Done.\n"); fprintf(stderr, "Running kernel... "); + clock_gettime(CLOCK_MONOTONIC, &tv_start); +/* FIXME magic */ +/* 65536 kernels doing 32767 each, except if it's 00xxxxxx */ +#define HASH_PER_RUN ((65536UL*32767UL) - (1<<24)) if (tramp_run_kernel()) { fprintf(stderr, "Failed.\n"); return 1; } - fprintf(stderr, "Done.\n"); + clock_gettime(CLOCK_MONOTONIC, &tv_end); + /*FIXME*/double clock_delta = tv_delta(&tv_start, &tv_end); + fprintf(stderr, "Done in %.2f seconds (%.3f MH/s).\n", clock_delta, (HASH_PER_RUN/clock_delta/1e6)); -/* char *buffer = malloc(size*size); + /* FIXME */cl_int *buffer = malloc(4*65536); if (!buffer) { perror("host data buffer malloc"); return 1; } fprintf(stderr, "Reading data from device... "); - if (tramp_copy_data((void*)&buffer, size*size)) { + if (tramp_copy_data((void*)&buffer, 4*65536)) { fprintf(stderr, "Failed.\n"); return 1; } fprintf(stderr, "Done.\n"); -*/ + + fprintf(stderr, "Analysing batch results. Successful nonces: \n"); + + /* FIXME */ int i = 0; + /* FIXME */ int count = 0; + for (i = 0; i < 65536; i++) { + if (buffer[i] != 0) { + count++; + fprintf(stderr, "%d \n", buffer[i]); + /* FIXME */unsigned char e[4] = {}; + /* FIXME */unsigned int smalls = (unsigned int)buffer[i]; + /* FIXME */unsigned int biggies = (unsigned int)i; + e[0] = (biggies >> 8) & 0xFF; + e[1] = biggies & 0xFF; + e[2] = (smalls >> 8) & 0xFF; + e[3] = smalls & 0xFF; + if (truffle_valid(search_raw, raw_len, bitmask, *sha, e)) { + fprintf(stderr, "«%x %x %x %x»\n", e[0], e[1], e[2], e[3]); + /* FIXME */unsigned long eLE = e[0] << 24 | e[1] << 16 | e[2] << 8 | e[3]; + fprintf(stderr, "Got eem: %xul!\n", eLE); + return eLE; + } else { + fprintf(stderr, "GPU doesn't agree with CPU: bug or hardware fault?\n"); + } + break; + } + } + if (count == 0) { + fprintf(stderr, "None. "); + } + fprintf(stderr, "Done.\n"); + fprintf(stderr, "Destroying CL trampoline... "); tramp_destroy(); fprintf(stderr, "Blown to smitherines.\n"); -/* free(buffer);*/ + free(buffer); return 0; } @@ -123,24 +219,11 @@ int main(int argc, char **argv) /* decode desired base32 */ onion_base32_dec(search_raw, search_pad); - /* hangover code from sand-leek.c */ - /* bitmasks to be used to compare remainder bits */ - unsigned char bitmasks[] = { - [1] = 0xF8, /* 5 MSB */ - [2] = 0xC0, /* 2 MSB */ - [3] = 0xFE, /* 7 MSB */ - [4] = 0xF0, /* 4 MSB */ - [5] = 0x80, /* 1 MSB */ - [6] = 0xFC, /* 6 MSB */ - [7] = 0xE0 /* 3 MSB */ - }; - /* number of whole bytes of raw hash to compare: * 10 is the size of the data a full onion address covers * 16 is the size of the base32-encoded onion address */ size_t search_len = strlen(search); int raw_len = (search_len*10)/16; - int bitmask = bitmasks[search_len % 8]; /* end hangover code from sand-leek.c */ RSA* rsa_key = NULL; @@ -161,7 +244,6 @@ int main(int argc, char **argv) struct sha_data sha_c; BIGNUM *bignum_e = NULL; - bignum_e = BN_new(); if (!bignum_e) { fprintf(stderr, "Failed to allocate bignum for exponent\n"); @@ -170,31 +252,70 @@ int main(int argc, char **argv) e = EXPONENT_MIN; BN_set_word(bignum_e, e); - if (!RSA_generate_key_ex(rsa_key, RSA_KEY_BITS, bignum_e, NULL)) { - fprintf(stderr, "Failed to generate RSA key\n"); - return 1; - } - der_length = i2d_RSAPublicKey(rsa_key, NULL); - if (der_length <= 0) { - fprintf(stderr, "i2d failed\n"); + + do { + if (!RSA_generate_key_ex(rsa_key, RSA_KEY_BITS, bignum_e, NULL)) { + fprintf(stderr, "Failed to generate RSA key\n"); + return 1; + } + der_length = i2d_RSAPublicKey(rsa_key, NULL); + if (der_length <= 0) { + fprintf(stderr, "i2d failed\n"); + return 1; + } + der_data = malloc(der_length); + if (!der_data) { + fprintf(stderr, "DER data malloc failed\n"); + return 1; + } + tmp_data = der_data; + if (i2d_RSAPublicKey(rsa_key, &tmp_data) != der_length) { + fprintf(stderr, "DER formatting failed\n"); + return 1; + } + + sha_init(&sha_c); + sha_update(&sha_c, der_data, der_length - EXPONENT_SIZE_BYTES); + free(der_data); + + e = run(preferred_platform, search_raw, raw_len, search_len, &sha_c); + } while (e == 0); + + BN_set_word(bignum_e, e); +fprintf(stderr, "exponent is %lx\n", e); + +#if OPENSSL_VERSION_NUMBER >= 0x10100000L + if (BN_set_word(bignum_e, e) != 1) { + fprintf(stderr, "BN_set_word failed\n"); return 1; } - der_data = malloc(der_length); - if (!der_data) { - fprintf(stderr, "DER data malloc failed\n"); + RSA_set0_key(rsa_key, NULL, bignum_e, NULL); + /* allocate what was freed by above function call */ + bignum_e = BN_new(); +#else + /* much tidier to be honest */ + BN_set_word(rsa_key->e, e); +#endif + if (key_update_d(rsa_key)) { + printf("Error updating d component of RSA key, stop.\n"); return 1; } - tmp_data = der_data; - if (i2d_RSAPublicKey(rsa_key, &tmp_data) != der_length) { - fprintf(stderr, "DER formatting failed\n"); + + if (RSA_check_key(rsa_key) == 1) { + fprintf(stderr, "Key valid\n"); + EVP_PKEY *evp_key = EVP_PKEY_new(); + if (!EVP_PKEY_assign_RSA(evp_key, rsa_key)) { + fprintf(stderr, "EVP_PKEY assignment failed\n"); + return 1; + } + PEM_write_PrivateKey(stdout, evp_key, NULL, NULL, 0, NULL, NULL); + EVP_PKEY_free(evp_key); return 1; + } else { + fprintf(stderr, "Key invalid:"); + ERR_print_errors_fp(stderr); } - sha_init(&sha_c); - sha_update(&sha_c, der_data, der_length - EXPONENT_SIZE_BYTES); - free(der_data); - - run(preferred_platform, search_raw, raw_len, &sha_c); return 0; } -- cgit v1.1