PyBitmessage-2021-04-27/src/workprover/gpusolver.py

import hashlib
import os.path
import struct

import utils

# Placeholders for the optional GPU dependencies. GPUSolver.__init__ declares
# both names global and imports the real modules on first use, so this module
# can be imported even when numpy or pyopencl is not installed.
pyopencl = None
numpy = None

class GPUSolverError(Exception):
    """Raised by GPUSolver when the GPU cannot be set up or yields a bad proof."""

class GPUSolver(object):
    """Proof-of-work solver that runs the ``search`` OpenCL kernel on a GPU.

    Host/device buffer layout used by this class:

    * input  (10 x uint64): [0] starting nonce of the current batch,
      [1..8] the 64-byte initial hash as big-endian words, [9] the target.
    * output (1 + batchSize x uint32): [0] is read back as the number of
      solutions, [1..] as the thread numbers that found them.

    NOTE(review): the kernel source ("gpusolver.cl") is not part of this file;
    the output layout above is inferred from how the host code reads it.
    """

    # Nonces are packed with ">Q", i.e. as unsigned 64-bit integers.
    _NONCE_MASK = 0xFFFFFFFFFFFFFFFF

    def __init__(self, codePath, vendors = None):
        """Pick a GPU device, build the kernel and allocate the buffers.

        codePath -- directory that contains "gpusolver.cl".
        vendors  -- optional container of acceptable platform vendor strings;
                    None accepts every platform.

        Raises GPUSolverError if numpy or pyopencl cannot be imported, or if
        no accepted platform exposes a GPU device.
        """

        global pyopencl, numpy

        try:
            import numpy
            import pyopencl
        except ImportError:
            raise GPUSolverError("numpy and pyopencl are required for the GPU solver")

        device = None

        # Use the first GPU of the first accepted platform that has one
        for platform in pyopencl.get_platforms():
            if vendors is not None and platform.vendor not in vendors:
                continue

            devices = platform.get_devices(device_type = pyopencl.device_type.GPU)

            if len(devices) != 0:
                device = devices[0]

                break

        if device is None:
            raise GPUSolverError("no suitable OpenCL GPU device found")

        context = pyopencl.Context(devices = [device])

        computeUnitsCount = device.get_info(pyopencl.device_info.MAX_COMPUTE_UNITS)
        workGroupSize = device.get_info(pyopencl.device_info.MAX_WORK_GROUP_SIZE)

        self.parallelism = workGroupSize * computeUnitsCount

        # Number of work items launched per kernel invocation
        self.batchSize = self.parallelism * 256

        self.queue = pyopencl.CommandQueue(context, device)

        # "sourceFile" rather than "file", which would shadow the Python 2 builtin
        with open(os.path.join(codePath, "gpusolver.cl")) as sourceFile:
            source = sourceFile.read()

        program = pyopencl.Program(context, source).build()

        self.hostOutput = numpy.zeros(1 + self.batchSize, numpy.uint32)
        self.hostInput = numpy.zeros(1 + 8 + 1, numpy.uint64)

        # Device buffers sized to match the host arrays (4-byte and 8-byte items)
        self.output = pyopencl.Buffer(context, pyopencl.mem_flags.READ_WRITE, 4 * (1 + self.batchSize))
        self.input = pyopencl.Buffer(context, pyopencl.mem_flags.READ_ONLY, 8 * (1 + 8 + 1))

        self.kernel = program.search
        self.kernel.set_args(self.output, self.input)

    @staticmethod
    def _makeNonce(base, offset):
        """Return base + offset, reduced modulo 2**64, packed as 8 big-endian bytes.

        Both operands are converted to Python integers first, so the result
        does not depend on NumPy's scalar promotion rules, and the sum is
        masked so that it always fits the ">Q" format.
        """

        return struct.pack(">Q", (int(base) + int(offset)) & GPUSolver._NONCE_MASK)

    def search(self, initialHash, target, seed, timeout):
        """Search for a nonce, one kernel batch at a time.

        initialHash -- byte string; its first 64 bytes are sent to the kernel.
        target      -- value stored in the last input slot and passed to
                       utils.checkProof.
        seed        -- byte string mixed into SHA-512 to derive the starting
                       nonce of every batch.
        timeout     -- maximum duration, in the units of utils.getTimePoint()
                       (presumably seconds -- TODO confirm); it is checked
                       after each batch, so at least one batch always runs.

        Returns (nonce, count): nonce is an 8-byte string, or None if the
        timeout expired; count is batchSize times the number of batches run.

        Raises GPUSolverError if the nonce reported by the kernel does not
        pass utils.checkProof.
        """

        startTime = utils.getTimePoint()

        self.hostOutput[0] = 0

        for word in range(8):
            self.hostInput[1 + word], = struct.unpack(">Q", initialHash[8 * word: 8 * (word + 1)])

        self.hostInput[9] = target

        # Zero the solutions counter on the device
        pyopencl.enqueue_copy(self.queue, self.output, self.hostOutput[: 1])

        batchesCount = 0

        while True:
            randomness = hashlib.sha512(seed + struct.pack(">Q", batchesCount)).digest()
            batchesCount += 1

            # The first 8 bytes of the digest are the starting nonce of this batch
            self.hostInput[0], = struct.unpack(">Q", randomness[: 8])

            pyopencl.enqueue_copy(self.queue, self.input, self.hostInput)
            pyopencl.enqueue_nd_range_kernel(self.queue, self.kernel, (self.batchSize, ), None)
            self.queue.finish()
            pyopencl.enqueue_copy(self.queue, self.hostOutput[: 1], self.output)

            solutionsCount = int(self.hostOutput[0])

            if solutionsCount != 0:
                pyopencl.enqueue_copy(self.queue, self.hostOutput[0: 1 + solutionsCount], self.output)

                # The next 8 bytes of the digest choose one of the reported solutions
                index, = struct.unpack(">Q", randomness[8: 16])
                threadNumber = self.hostOutput[1 + index % solutionsCount]

                # NOTE(review): assumes the kernel also adds the thread number
                # to the starting nonce modulo 2**64; the check below rejects
                # the nonce if it does not.
                nonce = self._makeNonce(self.hostInput[0], threadNumber)

                if not utils.checkProof(nonce, initialHash, target):
                    raise GPUSolverError("GPU returned a nonce that fails verification")

                return nonce, self.batchSize * batchesCount

            if utils.getTimePoint() - startTime >= timeout:
                return None, self.batchSize * batchesCount

    def setParallelism(self, parallelism):
        """Accept a parallelism setting and ignore it; this method does nothing."""

        pass
New POW calculation module 2018-06-23 08:57:34 +00:00			`import hashlib`
			`import os.path`
Sorted imports 2018-06-23 11:00:24 +00:00			`import struct`
New POW calculation module 2018-06-23 08:57:34 +00:00
			`import utils`

			`pyopencl = None`
			`numpy = None`

			`class GPUSolverError(Exception):`
			`pass`

			`class GPUSolver(object):`
			`def __init__(self, codePath, vendors = None):`
			`global pyopencl, numpy`

More precise exceptions 2018-06-23 10:32:05 +00:00			`try:`
			`import numpy`
Sorted imports 2018-06-23 11:00:24 +00:00			`import pyopencl`
More precise exceptions 2018-06-23 10:32:05 +00:00			`except ImportError:`
			`raise GPUSolverError()`
New POW calculation module 2018-06-23 08:57:34 +00:00
			`device = None`

			`for i in pyopencl.get_platforms():`
			`if vendors is not None and i.vendor not in vendors:`
			`continue`

			`devices = i.get_devices(device_type = pyopencl.device_type.GPU)`

			`if len(devices) != 0:`
			`device = devices[0]`

			`break`
			`else:`
More precise exceptions 2018-06-23 10:32:05 +00:00			`raise GPUSolverError()`
New POW calculation module 2018-06-23 08:57:34 +00:00
			`context = pyopencl.Context(devices = [device])`

			`computeUnitsCount = device.get_info(pyopencl.device_info.MAX_COMPUTE_UNITS)`
			`workGroupSize = device.get_info(pyopencl.device_info.MAX_WORK_GROUP_SIZE)`

			`self.parallelism = workGroupSize * computeUnitsCount`
			`self.batchSize = self.parallelism * 256`

			`self.queue = pyopencl.CommandQueue(context, device)`

			`with open(os.path.join(codePath, "gpusolver.cl")) as file:`
			`source = file.read()`

			`program = pyopencl.Program(context, source).build()`

			`self.hostOutput = numpy.zeros(1 + self.batchSize, numpy.uint32)`
			`self.hostInput = numpy.zeros(1 + 8 + 1, numpy.uint64)`

			`self.output = pyopencl.Buffer(context, pyopencl.mem_flags.READ_WRITE, 4 * (1 + self.batchSize))`
			`self.input = pyopencl.Buffer(context, pyopencl.mem_flags.READ_ONLY, 8 * (1 + 8 + 1))`

			`self.kernel = program.search`
			`self.kernel.set_args(self.output, self.input)`

			`def search(self, initialHash, target, seed, timeout):`
			`startTime = utils.getTimePoint()`

			`self.hostOutput[0] = 0`

			`for i in xrange(8):`
			`self.hostInput[1 + i], = struct.unpack(">Q", initialHash[8 * i: 8 * (i + 1)])`

			`self.hostInput[9] = target`

			`pyopencl.enqueue_copy(self.queue, self.output, self.hostOutput[: 1])`

			`i = 0`

			`while True:`
			`randomness = hashlib.sha512(seed + struct.pack(">Q", i)).digest()`
			`i += 1`

			`self.hostInput[0], = struct.unpack(">Q", randomness[: 8])`

			`pyopencl.enqueue_copy(self.queue, self.input, self.hostInput)`
			`pyopencl.enqueue_nd_range_kernel(self.queue, self.kernel, (self.batchSize, ), None)`
			`self.queue.finish()`
			`pyopencl.enqueue_copy(self.queue, self.hostOutput[: 1], self.output)`

			`solutionsCount = long(self.hostOutput[0])`

			`if solutionsCount != 0:`
			`pyopencl.enqueue_copy(self.queue, self.hostOutput[0: 1 + solutionsCount], self.output)`

			`index, = struct.unpack(">Q", randomness[8: 16])`
			`threadNumber = self.hostOutput[1 + index % solutionsCount]`

			`nonce = struct.pack(">Q", long(self.hostInput[0]) + threadNumber)`

			`if not utils.checkProof(nonce, initialHash, target):`
			`raise GPUSolverError()`

			`return nonce, self.batchSize * i`

			`if utils.getTimePoint() - startTime >= timeout:`
			`return None, self.batchSize * i`

			`def setParallelism(self, parallelism):`
			`pass`