Source code for synapse.lib.hashset

import hashlib

[docs]class HashSet: def __init__(self): self.size = 0 # BEWARE ORDER MATTERS FOR guid() self.hashes = ( ('md5', hashlib.md5(usedforsecurity=False)), ('sha1', hashlib.sha1(usedforsecurity=False)), ('sha256', hashlib.sha256()), ('sha512', hashlib.sha512()) )
[docs] def guid(self): ''' Use elements from this hash set to create a unique (re)identifier. ''' iden = hashlib.md5(usedforsecurity=False) props = {'size': self.size} for name, item in self.hashes: iden.update(item.digest()) props[name] = item.hexdigest() return iden.hexdigest(), props
[docs] def eatfd(self, fd): ''' Consume all the bytes from a file like object. Example: hset = HashSet() hset.eatfd(fd) ''' fd.seek(0) byts = fd.read(10000000) while byts: self.update(byts) byts = fd.read(10000000) return self.guid()
[docs] def update(self, byts): ''' Update all the hashes in the set with the given bytes. ''' self.size += len(byts) [h[1].update(byts) for h in self.hashes]
[docs] def digests(self): ''' Get a list of (name, bytes) tuples for the hashes in the hashset. ''' return [(name, item.digest()) for (name, item) in self.hashes]