{ "metadata": { "name": "", "signature": "sha256:cc6dff0452db60e1c4a9d63bbb9703d17fca8a2ef1f02c5fb11910d6de322b73" }, "nbformat": 3, "nbformat_minor": 0, "worksheets": [ { "cells": [ { "cell_type": "code", "collapsed": false, "input": [ "%qtconsole --colors=linux" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 1 }, { "cell_type": "code", "collapsed": false, "input": [ "from __future__ import division\n", "import numpy as np\n", "import pyopencl as cl\n", "import pyopencl.array\n", "import pyopencl.tools" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 2 }, { "cell_type": "code", "collapsed": false, "input": [ "%load_ext pyopencl.ipython_ext" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 3 }, { "cell_type": "code", "collapsed": false, "input": [ "ctx = cl.create_some_context()\n", "queue = cl.CommandQueue(ctx)" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 4 }, { "cell_type": "code", "collapsed": false, "input": [ "device=ctx.devices[0]\n", "print device.max_mem_alloc_size\n", "print device.max_work_group_size" ], "language": "python", "metadata": {}, "outputs": [ { "output_type": "stream", "stream": "stdout", "text": [ "1073741824\n", "256\n" ] } ], "prompt_number": 5 }, { "cell_type": "code", "collapsed": false, "input": [ "from hashlib import sha512\n", "sha512('').hexdigest()" ], "language": "python", "metadata": {}, "outputs": [ { "metadata": {}, "output_type": "pyout", "prompt_number": 24, "text": [ "'cf83e1357eefb8bdf1542850d66d8007d620e4050b5715dc83f4a921d36ce9ce47d0d13c5d85f2b0ff8318d2877eec2f63b931bd47417a81a538327af927da3e'" ] } ], "prompt_number": 24 }, { "cell_type": "code", "collapsed": false, "input": [ "%%cl_kernel -o \"-I .\"\n", "#define _OPENCL_COMPILER\n", "#define DEVICE_INFO 2|64|1024\n", "#include \"opencl_cryptsha512.h\"\n", "\n", "__constant uint64_t k[] = {\n", " 0x428a2f98d728ae22UL, 0x7137449123ef65cdUL, 0xb5c0fbcfec4d3b2fUL, 
0xe9b5dba58189dbbcUL,\n", " 0x3956c25bf348b538UL, 0x59f111f1b605d019UL, 0x923f82a4af194f9bUL, 0xab1c5ed5da6d8118UL,\n", " 0xd807aa98a3030242UL, 0x12835b0145706fbeUL, 0x243185be4ee4b28cUL, 0x550c7dc3d5ffb4e2UL,\n", " 0x72be5d74f27b896fUL, 0x80deb1fe3b1696b1UL, 0x9bdc06a725c71235UL, 0xc19bf174cf692694UL,\n", " 0xe49b69c19ef14ad2UL, 0xefbe4786384f25e3UL, 0x0fc19dc68b8cd5b5UL, 0x240ca1cc77ac9c65UL,\n", " 0x2de92c6f592b0275UL, 0x4a7484aa6ea6e483UL, 0x5cb0a9dcbd41fbd4UL, 0x76f988da831153b5UL,\n", " 0x983e5152ee66dfabUL, 0xa831c66d2db43210UL, 0xb00327c898fb213fUL, 0xbf597fc7beef0ee4UL,\n", " 0xc6e00bf33da88fc2UL, 0xd5a79147930aa725UL, 0x06ca6351e003826fUL, 0x142929670a0e6e70UL,\n", " 0x27b70a8546d22ffcUL, 0x2e1b21385c26c926UL, 0x4d2c6dfc5ac42aedUL, 0x53380d139d95b3dfUL,\n", " 0x650a73548baf63deUL, 0x766a0abb3c77b2a8UL, 0x81c2c92e47edaee6UL, 0x92722c851482353bUL,\n", " 0xa2bfe8a14cf10364UL, 0xa81a664bbc423001UL, 0xc24b8b70d0f89791UL, 0xc76c51a30654be30UL,\n", " 0xd192e819d6ef5218UL, 0xd69906245565a910UL, 0xf40e35855771202aUL, 0x106aa07032bbd1b8UL,\n", " 0x19a4c116b8d2d0c8UL, 0x1e376c085141ab53UL, 0x2748774cdf8eeb99UL, 0x34b0bcb5e19b48a8UL,\n", " 0x391c0cb3c5c95a63UL, 0x4ed8aa4ae3418acbUL, 0x5b9cca4f7763e373UL, 0x682e6ff3d6b2b8a3UL,\n", " 0x748f82ee5defb2fcUL, 0x78a5636f43172f60UL, 0x84c87814a1f0ab72UL, 0x8cc702081a6439ecUL,\n", " 0x90befffa23631e28UL, 0xa4506cebde82bde9UL, 0xbef9a3f7b2c67915UL, 0xc67178f2e372532bUL,\n", " 0xca273eceea26619cUL, 0xd186b8c721c0c207UL, 0xeada7dd6cde0eb1eUL, 0xf57d4f7fee6ed178UL,\n", " 0x06f067aa72176fbaUL, 0x0a637dc5a2c898a6UL, 0x113f9804bef90daeUL, 0x1b710b35131c471bUL,\n", " 0x28db77f523047d84UL, 0x32caab7b40c72493UL, 0x3c9ebe0a15c9bebcUL, 0x431d67c49c100d4cUL,\n", " 0x4cc5d4becb3e42b6UL, 0x597f299cfc657e2aUL, 0x5fcb6fab3ad6faecUL, 0x6c44198c4a475817UL,\n", "};\n", "\n", "\n", "/* Reset ctx for a new message: load the SHA-512 initial hash values into\n", "   ctx->H and clear the byte counter and the buffer fill level. */\n", "inline void init_ctx(__local sha512_ctx * ctx) {\n", " ctx->H[0] = 0x6a09e667f3bcc908UL;\n", " ctx->H[1] = 0xbb67ae8584caa73bUL;\n", " ctx->H[2] = 
0x3c6ef372fe94f82bUL;\n", " ctx->H[3] = 0xa54ff53a5f1d36f1UL;\n", " ctx->H[4] = 0x510e527fade682d1UL;\n", " ctx->H[5] = 0x9b05688c2b3e6c1fUL;\n", " ctx->H[6] = 0x1f83d9abfb41bd6bUL;\n", " ctx->H[7] = 0x5be0cd19137e2179UL;\n", " ctx->total = 0;\n", " ctx->buflen = 0;\n", "}\n", "\n", "/* Compress the 128-byte block held in ctx->buffer into the running hash\n", "   ctx->H. The buffer itself is not modified. */\n", "inline void sha512_block(__local sha512_ctx * ctx) {\n", " uint64_t a = ctx->H[0];\n", " uint64_t b = ctx->H[1];\n", " uint64_t c = ctx->H[2];\n", " uint64_t d = ctx->H[3];\n", " uint64_t e = ctx->H[4];\n", " uint64_t f = ctx->H[5];\n", " uint64_t g = ctx->H[6];\n", " uint64_t h = ctx->H[7];\n", " uint64_t t1, t2;\n", " /* 16-word rolling window of the message schedule, indexed modulo 16. */\n", " uint64_t w[16];\n", "\n", " /* Load the block as 16 words through SWAP64 / SWAP64_V. Both come from the\n", "    included header and are presumably byte swaps - TODO confirm. */\n", "#ifdef VECTOR_USAGE\n", " ulong16 w_vector;\n", " w_vector = vload16(0, ctx->buffer->mem_64);\n", " w_vector = SWAP64_V(w_vector);\n", " vstore16(w_vector, 0, w);\n", "#else\n", " #pragma unroll\n", " for (int i = 0; i < 16; i++)\n", " w[i] = SWAP64(ctx->buffer->mem_64[i]);\n", "#endif\n", "\n", " /* 80 rounds; k[i] is the constant added in round i. */\n", " #pragma unroll\n", " for (int i = 0; i < 80; i++) {\n", "\n", " /* From round 16 on, the next schedule word is computed from earlier ones\n", "    and overwrites the oldest slot of the window. */\n", " if (i > 15) {\n", " w[i & 15] = sigma1(w[(i - 2) & 15]) + sigma0(w[(i - 15) & 15]) + w[(i - 16) & 15] + w[(i - 7) & 15];\n", " }\n", " t1 = k[i] + w[i & 15] + h + Sigma1(e) + Ch(e, f, g);\n", " t2 = Maj(a, b, c) + Sigma0(a);\n", " h = g;\n", " g = f;\n", " f = e;\n", " e = d + t1;\n", " d = c;\n", " c = b;\n", " b = a;\n", " a = t1 + t2;\n", " }\n", " /* Put checksum in context given as argument. 
*/\n", " ctx->H[0] += a;\n", " ctx->H[1] += b;\n", " ctx->H[2] += c;\n", " ctx->H[3] += d;\n", " ctx->H[4] += e;\n", " ctx->H[5] += f;\n", " ctx->H[6] += g;\n", " ctx->H[7] += h;\n", "}\n", "\n", "/* Copy len bytes from string into the block buffer at offset ctx->buflen and\n", "   advance buflen by len. There is no bounds check here; ctx_update limits len\n", "   to the free space left in the 128-byte buffer. */\n", "inline void insert_to_buffer(__local sha512_ctx * ctx,\n", " const uint8_t * string,\n", " const uint32_t len) {\n", " __local uint8_t * dest;\n", " dest = ctx->buffer->mem_08 + ctx->buflen;\n", "\n", " for (int i = 0; i < len; i++)\n", " PUTCHAR(dest, i, GETCHAR(string, i));\n", " ctx->buflen += len; \n", "}\n", "\n", "/* Feed len bytes of string into the hash: add them to ctx->total, copy them\n", "   into the buffer, and run sha512_block every time the buffer reaches 128\n", "   bytes. Bytes that do not fill a block stay buffered (buflen below 128). */\n", "inline void ctx_update(__local sha512_ctx * ctx,\n", " uint8_t * string, uint32_t len) {\n", "\n", " ctx->total += len;\n", " uint32_t startpos = ctx->buflen;\n", " uint32_t offset = 0;\n", "\n", " while(1){\n", " /* Copy the smaller of: remaining input, free space in the buffer. */\n", " insert_to_buffer(ctx, string+offset, (len -offset <= 128 - startpos ? len-offset : 128 - startpos));\n", " if(ctx->buflen<128) break;\n", " mem_fence(CLK_LOCAL_MEM_FENCE);\n", " sha512_block(ctx); \n", " /* The block just processed consumed 128 - startpos input bytes. */\n", " offset = offset +128 - startpos;\n", " ctx->buflen = 0;\n", " startpos=0;\n", " }\n", "\n", "}\n", "\n", "/* Write the 0x80 padding marker at offset ctx->buflen and zero the rest of\n", "   the 128-byte buffer: single bytes up to a 4-byte boundary, one 32-bit word\n", "   if that is not yet an 8-byte boundary, then 64-bit words. ctx->buflen is\n", "   left unchanged. */\n", "inline void ctx_append_1(__local sha512_ctx * ctx) {\n", "\n", " uint32_t length = ctx->buflen;\n", " PUTCHAR(ctx->buffer->mem_08, length, 0x80);\n", "\n", " while (++length & 3)\n", " PUTCHAR(ctx->buffer->mem_08, length, 0);\n", "\n", " if (length & 7) {\n", " __local uint32_t * l = (__local uint32_t *) (ctx->buffer->mem_08 + length);\n", " *l = 0;\n", " length += 4;\n", " }\n", " __local uint64_t * l = (__local uint64_t *) (ctx->buffer->mem_08 + length);\n", "\n", " while (length < 128) {\n", " *l++ = 0;\n", " length += 8;\n", " }\n", "}\n", "\n", "/* Store the message length in bits (ctx->total * 8), passed through SWAP64,\n", "   in the last 64-bit word of the buffer. */\n", "inline void ctx_add_length(__local sha512_ctx * ctx) {\n", "\n", " ctx->buffer->mem_64[15] = SWAP64((uint64_t) (ctx->total * 8));\n", "}\n", "\n", "/* Pad the buffer, append the bit length and reset the fill level. */\n", "inline void finish_ctx(__local sha512_ctx * ctx) {\n", " ctx_append_1(ctx);\n", " ctx_add_length(ctx);\n", " ctx->buflen = 0;\n", "}\n", "\n", "/* Zero all 16 words of the block buffer and reset the fill level. */\n", "inline void clear_ctx_buffer(__local sha512_ctx * ctx) {\n", "\n", "#ifdef VECTOR_USAGE\n", " ulong16 
w_vector = 0;\n", " vstore16(w_vector, 0, ctx->buffer->mem_64);\n", "#else\n", " #pragma unroll\n", " for (int i = 0; i < 16; i++)\n", " ctx->buffer->mem_64[i] = 0;\n", "#endif\n", "\n", " ctx->buflen = 0;\n", "}\n", "\n", "/* Finish the hash: pad and process the buffered tail, then write the eight\n", "   words of ctx->H to result through SWAP64. A second block is needed when\n", "   the padding marker and the length field do not fit after the data\n", "   (buflen above 111). */\n", "inline void sha512_digest(__local sha512_ctx * ctx,\n", " __global uint64_t * result) {\n", "\n", " if (ctx->buflen <= 111) { //data+0x80+datasize fits in one 1024bit block\n", " finish_ctx(ctx);\n", "\n", " } else {\n", " bool moved = true;\n", "\n", " if (ctx->buflen < 128) { //data and 0x80 fits in one block\n", " ctx_append_1(ctx);\n", " moved = false;\n", " }\n", " sha512_block(ctx);\n", " clear_ctx_buffer(ctx);\n", "\n", " if (moved) //append 1,the rest is already clean\n", " PUTCHAR(ctx->buffer->mem_08, 0, 0x80);\n", " ctx_add_length(ctx);\n", " }\n", " sha512_block(ctx);\n", "\n", " #pragma unroll\n", " for (int i = 0; i < 8; i++)\n", " result[i] = SWAP64(ctx->H[i]);\n", "\n", "}\n", "\n", "/* Hash a test message of passlen bytes, every byte being 97 (the letter a),\n", "   and store the digest in output->v. The message is fed to ctx_update in\n", "   chunks of at most NN bytes, which is the size of the pass array. */\n", "inline void sha512crypt(__local sha512_ctx * ctx,\n", " __global sha512_hash * output, int passlen) {\n", " uint8_t pass[128];\n", " #pragma unroll\n", " for(int i=0;i<128;i++)\n", " pass[i]=97;\n", "\n", " init_ctx(ctx);\n", " #define NN 128\n", " /* Full chunks of NN bytes, then one shorter chunk for the remainder. With\n", "    passlen 0 the loop does not run and the empty message is hashed. */\n", " for(int i=0;i<passlen;i+=NN)\n", " ctx_update(ctx, pass, i+NN > passlen ? 
passlen-i : NN);\n", " sha512_digest(ctx, output->v);\n", "}\n", "\n", "/* One digest per work-item: work-item gid hashes a message of gid % 1024\n", "   bytes, using ctx_memory[lid] as its private context slot in local memory,\n", "   and writes the result to out_buffer[gid]. */\n", "__kernel\n", "void kernel_sha512(__global sha512_hash * out_buffer,\n", " __local sha512_ctx * ctx_memory) {\n", " size_t gid = get_global_id(0);\n", " size_t lid = get_local_id(0);\n", " int j=gid%1024; \n", " sha512crypt(&ctx_memory[lid], &out_buffer[gid], j);\n", "}\n" ], "language": "python", "metadata": {}, "outputs": [ { "output_type": "stream", "stream": "stderr", "text": [ "/usr/local/lib/python2.7/dist-packages/pyopencl-2014.1-py2.7-linux-x86_64.egg/pyopencl/__init__.py:59: CompilerWarning: From-source build succeeded, but resulted in non-empty logs:\n", "Build on succeeded, but said:\n", "\n", "LOOP UNROLL: pragma unroll (line 66)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 61)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 162)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 192)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 201)\n", " Unrolled as requested!\n", "\n", "Warning: kernel_sha512 kernel has register spilling. 
Lower performance is expected.\n", "\n", " warn(text, CompilerWarning)\n" ] } ], "prompt_number": 471 }, { "cell_type": "code", "collapsed": false, "input": [ "N=1024\n", "output=cl.array.zeros(queue, 8*8*N, dtype=np.uint8)\n", "working = cl.LocalMemory(32768)\n", "kernel_sha512(queue, (N,), (128,), output.data, working).wait()" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 472 }, { "cell_type": "code", "collapsed": false, "input": [ "result = output.get()\n", "p = \"abcdefghijklmnopqrstuvwxyz\"\n", "p=\"a\"*1024\n", "for i in range(N):\n", " r = \"\".join(map(lambda x:\"%02x\"%x, result[i*64:i*64+64]))\n", " if r!=sha512(p[:i]).hexdigest():\n", " print i\n", "print \"done\"" ], "language": "python", "metadata": {}, "outputs": [ { "output_type": "stream", "stream": "stdout", "text": [ "done\n" ] } ], "prompt_number": 473 }, { "cell_type": "code", "collapsed": false, "input": [ "%%cl_kernel -o \"-I .\"\n", "#define _OPENCL_COMPILER\n", "#define DEVICE_INFO 2|64|1024\n", "#include \"opencl_cryptsha512.h\"\n", "\n", "__constant uint64_t k[] = {\n", " 0x428a2f98d728ae22UL, 0x7137449123ef65cdUL, 0xb5c0fbcfec4d3b2fUL, 0xe9b5dba58189dbbcUL,\n", " 0x3956c25bf348b538UL, 0x59f111f1b605d019UL, 0x923f82a4af194f9bUL, 0xab1c5ed5da6d8118UL,\n", " 0xd807aa98a3030242UL, 0x12835b0145706fbeUL, 0x243185be4ee4b28cUL, 0x550c7dc3d5ffb4e2UL,\n", " 0x72be5d74f27b896fUL, 0x80deb1fe3b1696b1UL, 0x9bdc06a725c71235UL, 0xc19bf174cf692694UL,\n", " 0xe49b69c19ef14ad2UL, 0xefbe4786384f25e3UL, 0x0fc19dc68b8cd5b5UL, 0x240ca1cc77ac9c65UL,\n", " 0x2de92c6f592b0275UL, 0x4a7484aa6ea6e483UL, 0x5cb0a9dcbd41fbd4UL, 0x76f988da831153b5UL,\n", " 0x983e5152ee66dfabUL, 0xa831c66d2db43210UL, 0xb00327c898fb213fUL, 0xbf597fc7beef0ee4UL,\n", " 0xc6e00bf33da88fc2UL, 0xd5a79147930aa725UL, 0x06ca6351e003826fUL, 0x142929670a0e6e70UL,\n", " 0x27b70a8546d22ffcUL, 0x2e1b21385c26c926UL, 0x4d2c6dfc5ac42aedUL, 0x53380d139d95b3dfUL,\n", " 0x650a73548baf63deUL, 0x766a0abb3c77b2a8UL, 
0x81c2c92e47edaee6UL, 0x92722c851482353bUL,\n", " 0xa2bfe8a14cf10364UL, 0xa81a664bbc423001UL, 0xc24b8b70d0f89791UL, 0xc76c51a30654be30UL,\n", " 0xd192e819d6ef5218UL, 0xd69906245565a910UL, 0xf40e35855771202aUL, 0x106aa07032bbd1b8UL,\n", " 0x19a4c116b8d2d0c8UL, 0x1e376c085141ab53UL, 0x2748774cdf8eeb99UL, 0x34b0bcb5e19b48a8UL,\n", " 0x391c0cb3c5c95a63UL, 0x4ed8aa4ae3418acbUL, 0x5b9cca4f7763e373UL, 0x682e6ff3d6b2b8a3UL,\n", " 0x748f82ee5defb2fcUL, 0x78a5636f43172f60UL, 0x84c87814a1f0ab72UL, 0x8cc702081a6439ecUL,\n", " 0x90befffa23631e28UL, 0xa4506cebde82bde9UL, 0xbef9a3f7b2c67915UL, 0xc67178f2e372532bUL,\n", " 0xca273eceea26619cUL, 0xd186b8c721c0c207UL, 0xeada7dd6cde0eb1eUL, 0xf57d4f7fee6ed178UL,\n", " 0x06f067aa72176fbaUL, 0x0a637dc5a2c898a6UL, 0x113f9804bef90daeUL, 0x1b710b35131c471bUL,\n", " 0x28db77f523047d84UL, 0x32caab7b40c72493UL, 0x3c9ebe0a15c9bebcUL, 0x431d67c49c100d4cUL,\n", " 0x4cc5d4becb3e42b6UL, 0x597f299cfc657e2aUL, 0x5fcb6fab3ad6faecUL, 0x6c44198c4a475817UL,\n", "};\n", "\n", "\n", "/* Reset ctx for a new message: load the SHA-384 initial hash values into\n", "   ctx->H and clear the byte counter and the buffer fill level. */\n", "inline void init_ctx384(__local sha512_ctx * ctx) {\n", " ctx->H[0] = 0xcbbb9d5dc1059ed8UL;\n", " ctx->H[1] = 0x629a292a367cd507UL;\n", " ctx->H[2] = 0x9159015a3070dd17UL;\n", " ctx->H[3] = 0x152fecd8f70e5939UL;\n", " ctx->H[4] = 0x67332667ffc00b31UL;\n", " ctx->H[5] = 0x8eb44a8768581511UL;\n", " ctx->H[6] = 0xdb0c2e0d64f98fa7UL;\n", " ctx->H[7] = 0x47b5481dbefa4fa4UL;\n", " ctx->total = 0;\n", " ctx->buflen = 0;\n", "}\n", "\n", "/* Compress the 128-byte block held in ctx->buffer into the running hash\n", "   ctx->H. The buffer itself is not modified. */\n", "inline void sha512_block(__local sha512_ctx * ctx) {\n", " uint64_t a = ctx->H[0];\n", " uint64_t b = ctx->H[1];\n", " uint64_t c = ctx->H[2];\n", " uint64_t d = ctx->H[3];\n", " uint64_t e = ctx->H[4];\n", " uint64_t f = ctx->H[5];\n", " uint64_t g = ctx->H[6];\n", " uint64_t h = ctx->H[7];\n", " uint64_t t1, t2;\n", " /* 16-word rolling window of the message schedule, indexed modulo 16. */\n", " uint64_t w[16];\n", "\n", " /* Load the block as 16 words through SWAP64 / SWAP64_V. Both come from the\n", "    included header and are presumably byte swaps - TODO confirm. */\n", "#ifdef VECTOR_USAGE\n", " ulong16 w_vector;\n", " w_vector = vload16(0, ctx->buffer->mem_64);\n", " w_vector = SWAP64_V(w_vector);\n", " vstore16(w_vector, 0, w);\n", "#else\n", " #pragma unroll\n", " for 
(int i = 0; i < 16; i++)\n", " w[i] = SWAP64(ctx->buffer->mem_64[i]);\n", "#endif\n", "\n", " /* 80 rounds; k[i] is the constant added in round i. */\n", " #pragma unroll\n", " for (int i = 0; i < 80; i++) {\n", "\n", " /* From round 16 on, the next schedule word is computed from earlier ones\n", "    and overwrites the oldest slot of the 16-word window w. */\n", " if (i > 15) {\n", " w[i & 15] = sigma1(w[(i - 2) & 15]) + sigma0(w[(i - 15) & 15]) + w[(i - 16) & 15] + w[(i - 7) & 15];\n", " }\n", " t1 = k[i] + w[i & 15] + h + Sigma1(e) + Ch(e, f, g);\n", " t2 = Maj(a, b, c) + Sigma0(a);\n", " h = g;\n", " g = f;\n", " f = e;\n", " e = d + t1;\n", " d = c;\n", " c = b;\n", " b = a;\n", " a = t1 + t2;\n", " }\n", " /* Put checksum in context given as argument. */\n", " ctx->H[0] += a;\n", " ctx->H[1] += b;\n", " ctx->H[2] += c;\n", " ctx->H[3] += d;\n", " ctx->H[4] += e;\n", " ctx->H[5] += f;\n", " ctx->H[6] += g;\n", " ctx->H[7] += h;\n", "}\n", "\n", "/* Copy len bytes from string into the block buffer at offset ctx->buflen and\n", "   advance buflen by len. There is no bounds check here; ctx_update limits len\n", "   to the free space left in the 128-byte buffer. */\n", "inline void insert_to_buffer(__local sha512_ctx * ctx,\n", " const uint8_t * string,\n", " const uint32_t len) {\n", " __local uint8_t * dest;\n", " dest = ctx->buffer->mem_08 + ctx->buflen;\n", "\n", " for (int i = 0; i < len; i++)\n", " PUTCHAR(dest, i, GETCHAR(string, i));\n", " ctx->buflen += len; \n", "}\n", "\n", "/* Feed len bytes of string into the hash: add them to ctx->total, copy them\n", "   into the buffer, and run sha512_block every time the buffer reaches 128\n", "   bytes. Bytes that do not fill a block stay buffered (buflen below 128). */\n", "inline void ctx_update(__local sha512_ctx * ctx,\n", " uint8_t * string, uint32_t len) {\n", "\n", " ctx->total += len;\n", " uint32_t startpos = ctx->buflen;\n", " uint32_t offset = 0;\n", "\n", " while(1){\n", " /* Copy the smaller of: remaining input, free space in the buffer. */\n", " insert_to_buffer(ctx, string+offset, (len -offset <= 128 - startpos ? 
len-offset : 128 - startpos));\n", " if(ctx->buflen<128) break;\n", " mem_fence(CLK_LOCAL_MEM_FENCE);\n", " sha512_block(ctx); \n", " /* The block just processed consumed 128 - startpos input bytes. */\n", " offset = offset +128 - startpos;\n", " ctx->buflen = 0;\n", " startpos=0;\n", " }\n", "\n", "}\n", "\n", "/* Write the 0x80 padding marker at offset ctx->buflen and zero the rest of\n", "   the 128-byte buffer: single bytes up to a 4-byte boundary, one 32-bit word\n", "   if that is not yet an 8-byte boundary, then 64-bit words. ctx->buflen is\n", "   left unchanged. */\n", "inline void ctx_append_1(__local sha512_ctx * ctx) {\n", "\n", " uint32_t length = ctx->buflen;\n", " PUTCHAR(ctx->buffer->mem_08, length, 0x80);\n", "\n", " while (++length & 3)\n", " PUTCHAR(ctx->buffer->mem_08, length, 0);\n", "\n", " if (length & 7) {\n", " __local uint32_t * l = (__local uint32_t *) (ctx->buffer->mem_08 + length);\n", " *l = 0;\n", " length += 4;\n", " }\n", " __local uint64_t * l = (__local uint64_t *) (ctx->buffer->mem_08 + length);\n", "\n", " while (length < 128) {\n", " *l++ = 0;\n", " length += 8;\n", " }\n", "}\n", "\n", "/* Store the message length in bits (ctx->total * 8), passed through SWAP64,\n", "   in the last 64-bit word of the buffer. */\n", "inline void ctx_add_length(__local sha512_ctx * ctx) {\n", "\n", " ctx->buffer->mem_64[15] = SWAP64((uint64_t) (ctx->total * 8));\n", "}\n", "\n", "/* Pad the buffer, append the bit length and reset the fill level. */\n", "inline void finish_ctx(__local sha512_ctx * ctx) {\n", " ctx_append_1(ctx);\n", " ctx_add_length(ctx);\n", " ctx->buflen = 0;\n", "}\n", "\n", "/* Zero all 16 words of the block buffer and reset the fill level. */\n", "inline void clear_ctx_buffer(__local sha512_ctx * ctx) {\n", "\n", "#ifdef VECTOR_USAGE\n", " ulong16 w_vector = 0;\n", " vstore16(w_vector, 0, ctx->buffer->mem_64);\n", "#else\n", " #pragma unroll\n", " for (int i = 0; i < 16; i++)\n", " ctx->buffer->mem_64[i] = 0;\n", "#endif\n", "\n", " ctx->buflen = 0;\n", "}\n", "\n", "/* Finish the hash: pad and process the buffered tail, then write the first\n", "   six words of ctx->H to result through SWAP64. A second block is needed\n", "   when the padding marker and the length field do not fit after the data\n", "   (buflen above 111). */\n", "inline void sha384_digest(__local sha512_ctx * ctx,\n", " __global uint64_t * result) {\n", "\n", " if (ctx->buflen <= 111) { //data+0x80+datasize fits in one 1024bit block\n", " finish_ctx(ctx);\n", "\n", " } else {\n", " bool moved = true;\n", "\n", " if (ctx->buflen < 128) { //data and 0x80 fits in one block\n", " ctx_append_1(ctx);\n", " moved = false;\n", " }\n", " sha512_block(ctx);\n", " clear_ctx_buffer(ctx);\n", "\n", " if (moved) //append 1,the rest is already clean\n", " PUTCHAR(ctx->buffer->mem_08, 0, 0x80);\n", " ctx_add_length(ctx);\n", " }\n", " 
sha512_block(ctx);\n", "\n", " /* SHA-384 output is the first six of the eight hash words. */\n", " #pragma unroll\n", " for (int i = 0; i < 6; i++)\n", " result[i] = SWAP64(ctx->H[i]);\n", "\n", "}\n", "\n", "/* Hash a test message of passlen bytes, every byte being 97 (the letter a),\n", "   and store the digest in output->v. The message is fed to ctx_update in\n", "   chunks of at most NN bytes, which is the size of the pass array. */\n", "inline void sha384crypt(__local sha512_ctx * ctx,\n", " __global sha384_hash * output, int passlen) {\n", " uint8_t pass[128];\n", " #pragma unroll\n", " for(int i=0;i<128;i++)\n", " pass[i]=97;\n", "\n", " init_ctx384(ctx);\n", " #define NN 128\n", " /* Full chunks of NN bytes, then one shorter chunk for the remainder. With\n", "    passlen 0 the loop does not run and the empty message is hashed. */\n", " for(int i=0;i<passlen;i+=NN)\n", " ctx_update(ctx, pass, i+NN > passlen ? passlen-i : NN);\n", " sha384_digest(ctx, output->v);\n", "}\n", "\n", "/* One digest per work-item: work-item gid hashes a message of gid % 1024\n", "   bytes, using ctx_memory[lid] as its private context slot in local memory,\n", "   and writes the result to out_buffer[gid]. */\n", "__kernel\n", "void kernel_sha384(__global sha384_hash * out_buffer,\n", " __local sha512_ctx * ctx_memory) {\n", " size_t gid = get_global_id(0);\n", " size_t lid = get_local_id(0);\n", " int j=gid%1024; \n", " sha384crypt(&ctx_memory[lid], &out_buffer[gid], j);\n", "}\n" ], "language": "python", "metadata": {}, "outputs": [ { "output_type": "stream", "stream": "stderr", "text": [ "/usr/local/lib/python2.7/dist-packages/pyopencl-2014.1-py2.7-linux-x86_64.egg/pyopencl/__init__.py:59: CompilerWarning: From-source build succeeded, but resulted in non-empty logs:\n", "Build on succeeded, but said:\n", "\n", "LOOP UNROLL: pragma unroll (line 66)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 61)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 162)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 192)\n", " Unrolled as requested!\n", "LOOP UNROLL: pragma unroll (line 201)\n", " Unrolled as requested!\n", "\n", "Warning: kernel_sha384 kernel has register spilling. 
Lower performance is expected.\n", "\n", " warn(text, CompilerWarning)\n" ] } ], "prompt_number": 475 }, { "cell_type": "code", "collapsed": false, "input": [ "N=1024\n", "output=cl.array.zeros(queue, 8*8*N, dtype=np.uint8)\n", "working = cl.LocalMemory(200*128)\n", "kernel_sha384(queue, (N,), (128,), output.data, working).wait()" ], "language": "python", "metadata": {}, "outputs": [], "prompt_number": 493 }, { "cell_type": "code", "collapsed": false, "input": [ "from hashlib import sha384\n", "result = output.get()\n", "p = \"abcdefghijklmnopqrstuvwxyz\"\n", "p=\"a\"*1024\n", "for i in range(N):\n", " r = \"\".join(map(lambda x:\"%02x\"%x, result[i*48:i*48+48]))\n", " if r!=sha384(p[:i]).hexdigest():\n", " print i\n", "print \"done\"" ], "language": "python", "metadata": {}, "outputs": [ { "output_type": "stream", "stream": "stdout", "text": [ "done\n" ] } ], "prompt_number": 494 }, { "cell_type": "code", "collapsed": false, "input": [ "res" ], "language": "python", "metadata": {}, "outputs": [] } ], "metadata": {} } ] }