PyBitmessage-2021-04-27/src/randomtrackingdict.py

import random
from threading import RLock
from time import time

class RandomTrackingDict(object):
    maxPending = 10
    pendingTimeout = 60
    def __init__(self): # O(1)
        self.dictionary = {}
        self.indexDict = []
        self.len = 0
        self.pendingLen = 0
        self.lastPoll = 0
        self.lock = RLock()

    def __len__(self):
        return self.len

    def __contains__(self, key):
        return key in self.dictionary

    def __getitem__(self, key):
        return self.dictionary[key][1]

    def __setitem__(self, key, value):
        with self.lock:
            if key in self.dictionary:
                self.dictionary[key][1] = value
            else:
                self.indexDict.append(key)
                self.dictionary[key] = [self.len, value]
                self.len += 1

    def __delitem__(self, key):
        if not key in self.dictionary:
            raise KeyError
        with self.lock:
            index = self.dictionary[key][0]
            self.indexDict[index] = self.indexDict[self.len - 1]
            self.dictionary[self.indexDict[index]][0] = index
            # if the following del is batched, performance of this single
            # operation can improve 4x, but it's already very fast so we'll
            # ignore it for the time being
            del self.indexDict[-1]
            del self.dictionary[key]
            self.len -= 1
            if index >= self.len - self.pendingLen:
                self.pendingLen -= 1

    def setMaxPending(self, maxPending):
        self.maxPending = maxPending

    def setPendingTimeout(self, pendingTimeout):
        self.pendingTimeout = pendingTimeout

    def randomKeys(self, count=1):
        if self.lastPoll + self.pendingTimeout < time():
            with self.lock:
                self.pendingLen = 0
        if self.len == 0 or self.pendingLen >= self.maxPending:
            raise KeyError
        with self.lock:
            available = self.len - self.pendingLen
            if count > available:
                count = available
            retval = random.sample(self.indexDict[:self.len - self.pendingLen], count)
            for i in retval[::-1]:
                # swap with one below lowest pending
                self.pendingLen += 1
                swapKey = self.indexDict[-self.pendingLen]
                curIndex = self.dictionary[i][0]
                self.indexDict[-self.pendingLen] = i
                self.indexDict[curIndex] = swapKey
                self.dictionary[i][0] = self.len - self.pendingLen
                self.dictionary[swapKey][0] = curIndex
            self.lastPoll = time()
            return retval

if __name__ == '__main__':
    def randString():
        retval = b''
        for _ in range(32):
            retval += chr(random.randint(0,255))
        return retval

    a = []
    k = RandomTrackingDict()
    d = {}
    
#    print "populating normal dict"
#    a.append(time())
#    for i in range(50000):
#        d[randString()] = True
#    a.append(time())
    print "populating random tracking dict"
    a.append(time())
    for i in range(50000):
        k[randString()] = True
    a.append(time())
    print "done"
    while len(k) > 0:
        retval = k.randomKeys(1000)
        if not retval:
            print "error getting random keys"
        #a.append(time())
        try:
            k.randomKeys(100)
            print "bad"
        except KeyError:
            pass
        #a.append(time())
        for i in retval:
            del k[i]
        #a.append(time())
    a.append(time())

    for x in range(len(a) - 1):
        print "%i: %.3f" % (x, a[x+1] - a[x])
Download optimisation - new data structure to handle download tracking, uses less CPU 2018-02-01 12:19:39 +01:00			`import random`
			`from threading import RLock`
			`from time import time`

			`class RandomTrackingDict(object):`
			`maxPending = 10`
			`pendingTimeout = 60`
			`def __init__(self): # O(1)`
			`self.dictionary = {}`
			`self.indexDict = []`
			`self.len = 0`
			`self.pendingLen = 0`
			`self.lastPoll = 0`
			`self.lock = RLock()`

			`def __len__(self):`
			`return self.len`

			`def __contains__(self, key):`
			`return key in self.dictionary`

			`def __getitem__(self, key):`
			`return self.dictionary[key][1]`

			`def __setitem__(self, key, value):`
			`with self.lock:`
			`if key in self.dictionary:`
			`self.dictionary[key][1] = value`
			`else:`
			`self.indexDict.append(key)`
			`self.dictionary[key] = [self.len, value]`
			`self.len += 1`

			`def __delitem__(self, key):`
			`if not key in self.dictionary:`
			`raise KeyError`
			`with self.lock:`
			`index = self.dictionary[key][0]`
			`self.indexDict[index] = self.indexDict[self.len - 1]`
			`self.dictionary[self.indexDict[index]][0] = index`
			`# if the following del is batched, performance of this single`
			`# operation can improve 4x, but it's already very fast so we'll`
			`# ignore it for the time being`
			`del self.indexDict[-1]`
			`del self.dictionary[key]`
			`self.len -= 1`
			`if index >= self.len - self.pendingLen:`
			`self.pendingLen -= 1`

			`def setMaxPending(self, maxPending):`
			`self.maxPending = maxPending`

			`def setPendingTimeout(self, pendingTimeout):`
			`self.pendingTimeout = pendingTimeout`

			`def randomKeys(self, count=1):`
			`if self.lastPoll + self.pendingTimeout < time():`
			`with self.lock:`
			`self.pendingLen = 0`
			`if self.len == 0 or self.pendingLen >= self.maxPending:`
			`raise KeyError`
			`with self.lock:`
			`available = self.len - self.pendingLen`
			`if count > available:`
			`count = available`
			`retval = random.sample(self.indexDict[:self.len - self.pendingLen], count)`
			`for i in retval[::-1]:`
			`# swap with one below lowest pending`
			`self.pendingLen += 1`
			`swapKey = self.indexDict[-self.pendingLen]`
			`curIndex = self.dictionary[i][0]`
			`self.indexDict[-self.pendingLen] = i`
			`self.indexDict[curIndex] = swapKey`
			`self.dictionary[i][0] = self.len - self.pendingLen`
			`self.dictionary[swapKey][0] = curIndex`
			`self.lastPoll = time()`
			`return retval`

			`if __name__ == '__main__':`
			`def randString():`
			`retval = b''`
			`for _ in range(32):`
			`retval += chr(random.randint(0,255))`
			`return retval`

			`a = []`
			`k = RandomTrackingDict()`
			`d = {}`

			`# print "populating normal dict"`
			`# a.append(time())`
			`# for i in range(50000):`
			`# d[randString()] = True`
			`# a.append(time())`
			`print "populating random tracking dict"`
			`a.append(time())`
			`for i in range(50000):`
			`k[randString()] = True`
			`a.append(time())`
			`print "done"`
			`while len(k) > 0:`
			`retval = k.randomKeys(1000)`
			`if not retval:`
			`print "error getting random keys"`
			`#a.append(time())`
			`try:`
			`k.randomKeys(100)`
			`print "bad"`
			`except KeyError:`
			`pass`
			`#a.append(time())`
			`for i in retval:`
			`del k[i]`
			`#a.append(time())`
			`a.append(time())`

			`for x in range(len(a) - 1):`
			`print "%i: %.3f" % (x, a[x+1] - a[x])`