go-ethereum/trie.py

225 lines
8.4 KiB
Python
Raw Normal View History

2013-12-21 20:20:30 -06:00
import leveldb
import rlp
import hashlib
def sha256(x):
    """Return the raw (binary) SHA-256 digest of the byte string ``x``."""
    hasher = hashlib.sha256()
    hasher.update(x)
    return hasher.digest()
class DB(object):
    """Thin key/value wrapper around a ``leveldb.LevelDB`` handle.

    The only behavioural difference from the raw handle is that reading a
    missing key yields the empty string instead of raising.
    """

    def __init__(self, dbfile):
        """Open the LevelDB database located at ``dbfile``."""
        self.db = leveldb.LevelDB(dbfile)

    def get(self, key):
        """Return the value stored under ``key``, or '' when it is absent."""
        try:
            return self.db.Get(key)
        except KeyError:
            # Only a missing key maps to ''.  Any other failure (bad key
            # type, storage error, interrupt) is a real error and must not
            # be silently reported as "not found".
            return ''

    def put(self, key, value):
        """Store ``value`` under ``key``; returns whatever the handle returns."""
        return self.db.Put(key, value)

    def delete(self, key):
        """Remove ``key``; returns whatever the handle returns."""
        return self.db.Delete(key)
2013-12-29 19:10:58 -06:00
def hexarraykey_to_bin(key):
    """Pack a sequence of hex nibbles into a compact binary string.

    ``key`` is a sequence of ints in 0..15, optionally followed by the
    terminator nibble 16.  The terminator is not stored as a nibble; it is
    folded into a leading flag nibble together with the length parity:

        flags = 2 * has_terminator + is_odd_length

    An odd-length key is prefixed with ``[flags]`` and an even-length key
    with ``[flags, 0]``, so the nibble count is always even and each pair
    packs into one character.  ``bin_to_hexarraykey`` is the inverse.

    The argument is never mutated.  An empty key packs to ``'\\x00'``.
    """
    nibbles = list(key)  # private copy; also accepts tuples
    term = 1 if nibbles and nibbles[-1] == 16 else 0
    if term:
        nibbles.pop()
    oddlen = len(nibbles) % 2
    flags = 2 * term + oddlen
    prefix = [flags] if oddlen else [flags, 0]
    nibbles = prefix + nibbles
    # The length is even by construction, so pair up (high, low) nibbles.
    return ''.join(chr(16 * hi + lo)
                   for hi, lo in zip(nibbles[::2], nibbles[1::2]))
def bin_to_hexarraykey(bindata):
    """Unpack a binary string into its list of hex nibbles.

    Each character of ``bindata`` is split into a high and a low nibble.
    The first nibble is a flag: a value >= 2 means the key carries the
    terminator nibble 16 (appended to the result), and an odd value means
    only the flag nibble itself is padding; otherwise the flag and the
    following nibble are both dropped.

    Empty input yields an empty list rather than raising ``IndexError``.
    """
    nibbles = []
    for ch in bindata:
        # Characters are converted with ord(); items that are already ints
        # (as when iterating a bytes object) are used directly.
        byte = ch if isinstance(ch, int) else ord(ch)
        nibbles.append(byte // 16)
        nibbles.append(byte % 16)
    if not nibbles:
        return []
    flags = nibbles[0]
    if flags >= 2:
        nibbles.append(16)
    return nibbles[1:] if flags % 2 == 1 else nibbles[2:]
# Module-level cache of DB wrappers keyed by the dbfile argument: Trie.__init__
# creates an entry the first time a dbfile is seen and reuses it afterwards.
databases = {}
2013-12-21 20:20:30 -06:00
class Trie(object):
    """Hash-addressed radix trie over hex nibbles, persisted through a ``DB``.

    Public keys are strings; internally each key becomes the list of its
    hex nibbles followed by the terminator nibble 16.  A node is a list,
    RLP-encoded and stored in the database under the SHA-256 of that
    encoding.  Two node shapes are handled:

    * 2 items ``[packed_key, target]``: ``packed_key`` is a nibble run
      packed with ``hexarraykey_to_bin``.  If the run ends with the
      terminator, ``target`` is the stored value; otherwise ``target`` is
      the hash of the next node.
    * 17 items: slots 0-15 hold the hash of the child for that nibble (or
      ''), and slot 16 holds the value of a key ending at this node (or '').

    ``root`` is the hash of the root node; '' denotes an empty trie.
    """

    def __init__(self, dbfile, root='', debug=False):
        """Attach to the database at ``dbfile`` with the given root hash.

        ``debug`` enables trace output on stdout during lookups and updates.
        """
        self.root = root
        self.debug = debug
        # Reuse one DB wrapper per dbfile across every Trie instance.
        if dbfile not in databases:
            databases[dbfile] = DB(dbfile)
        self.db = databases[dbfile]

    @staticmethod
    def __key_to_nibbles(key):
        """Expand ``key`` into its hex nibbles plus the terminator nibble 16."""
        return [int(c, 16) for c in str(key).encode('hex')] + [16]

    def __get_state(self, node, key):
        """Follow nibble list ``key`` from ``node``; return the value or ''."""
        if self.debug:
            print('nk %s %s' % (node.encode('hex'), key))
        if len(key) == 0 or not node:
            return node
        curnode = rlp.decode(self.db.get(node))
        if self.debug:
            print('cn %s' % (curnode,))
        if not curnode:
            raise Exception("node not found in database")
        if len(curnode) == 2:
            (k2, v2) = curnode
            k2 = bin_to_hexarraykey(k2)
            if len(key) >= len(k2) and k2 == key[:len(k2)]:
                return self.__get_state(v2, key[len(k2):])
            return ''
        if len(curnode) == 17:
            return self.__get_state(curnode[key[0]], key[1:])
        # Previously fell through and returned None for an unknown shape.
        raise Exception("bad curnode! " + repr(curnode))

    def __put(self, node):
        """RLP-encode ``node``, store it under its SHA-256, return the hash."""
        rlpnode = rlp.encode(node)
        h = sha256(rlpnode)
        self.db.put(h, rlpnode)
        return h

    def __update_state(self, node, key, value):
        """Insert ``value`` at ``key``, or delete ``key`` when value is ''."""
        if value != '':
            return self.__insert_state(node, key, value)
        return self.__delete_state(node, key)

    def __insert_state(self, node, key, value):
        """Return the hash of ``node``'s subtree with ``key`` set to ``value``.

        With an empty ``key`` the value itself is returned, so the caller
        stores it directly in its slot.
        """
        if self.debug:
            print('ins %s %s' % (node.encode('hex'), key))
        if len(key) == 0:
            return value
        if not node:
            # Empty subtree: a single key/value node holds the whole key.
            return self.__put([hexarraykey_to_bin(key), value])
        curnode = rlp.decode(self.db.get(node))
        if self.debug:
            print('icn %s' % (curnode,))
        if not curnode:
            raise Exception("node not found in database")
        if len(curnode) != 2:
            # 17-slot node: rewrite only the slot selected by the first nibble.
            newnode = [curnode[i] for i in range(17)]
            newnode[key[0]] = self.__insert_state(curnode[key[0]],
                                                  key[1:], value)
            return self.__put(newnode)
        (k2, v2) = curnode
        k2 = bin_to_hexarraykey(k2)
        if key == k2:
            # Same key: replace the target in place.
            return self.__put([hexarraykey_to_bin(key), value])
        # i = length of the common prefix of key and k2.
        i = 0
        limit = min(len(key), len(k2))
        while i < limit and key[i] == k2[i]:
            i += 1
        if i == len(k2):
            # The node's whole key is a prefix of ours: descend through it.
            newhash3 = self.__insert_state(v2, key[i:], value)
        else:
            # Keys diverge at nibble i: split into a 17-slot node there.
            newnode3 = [''] * 17
            newnode3[key[i]] = self.__insert_state('', key[i + 1:], value)
            newnode3[k2[i]] = self.__insert_state('', k2[i + 1:], v2)
            newhash3 = self.__put(newnode3)
        if i == 0:
            return newhash3
        # Keep the shared prefix as a key node in front of the new subtree.
        return self.__put([hexarraykey_to_bin(key[:i]), newhash3])

    def __delete_state(self, node, key):
        """Return the hash of ``node``'s subtree with ``key`` removed.

        Returns '' when nothing is left, and ``node`` unchanged when a
        key/value node does not match ``key``.
        """
        if self.debug:
            print('dnk %s %s' % (node.encode('hex'), key))
        if len(key) == 0 or not node:
            return ''
        curnode = rlp.decode(self.db.get(node))
        if not curnode:
            raise Exception("node not found in database")
        if self.debug:
            print('dcn %s' % (curnode,))
        if len(curnode) == 2:
            (k2, v2) = curnode
            k2 = bin_to_hexarraykey(k2)
            if key == k2:
                return ''
            if key[:len(k2)] != k2:
                return node
            newhash = self.__delete_state(v2, key[len(k2):])
            if not newhash:
                # The whole child subtree vanished, so this node goes too.
                return ''
            childnode = rlp.decode(self.db.get(newhash))
            if len(childnode) == 2:
                # Child collapsed into a key node: merge the two key runs.
                newkey = k2 + bin_to_hexarraykey(childnode[0])
                newnode = [hexarraykey_to_bin(newkey), childnode[1]]
            else:
                newnode = [curnode[0], newhash]
            return self.__put(newnode)
        newnode = [curnode[i] for i in range(17)]
        newnode[key[0]] = self.__delete_state(newnode[key[0]], key[1:])
        occupied = [i for i in range(17) if newnode[i]]
        if not occupied:
            # Nothing left under this node.
            return ''
        if len(occupied) > 1:
            return self.__put(newnode)
        # Exactly one slot remains: collapse the 17-slot node into a key node.
        onlynode = occupied[0]
        if onlynode == 16:
            return self.__put([hexarraykey_to_bin([16]), newnode[onlynode]])
        childnode = rlp.decode(self.db.get(newnode[onlynode]))
        if not childnode:
            raise Exception("?????")
        if len(childnode) == 17:
            newnode2 = [hexarraykey_to_bin([onlynode]), newnode[onlynode]]
        elif len(childnode) == 2:
            newkey = [onlynode] + bin_to_hexarraykey(childnode[0])
            newnode2 = [hexarraykey_to_bin(newkey), childnode[1]]
        else:
            # Previously left newnode2 unbound and failed with a NameError.
            raise Exception("bad curnode! " + repr(childnode))
        return self.__put(newnode2)

    def __get_size(self, node):
        """Return the number of values stored in the subtree at ``node``."""
        if not node:
            return 0
        # Nodes are stored RLP-encoded and must be decoded before inspection.
        curnode = rlp.decode(self.db.get(node))
        if not curnode:
            raise Exception("node not found in database")
        if len(curnode) == 2:
            key = bin_to_hexarraykey(curnode[0])
            if key and key[-1] == 16:
                return 1
            return self.__get_size(curnode[1])
        if len(curnode) == 17:
            total = sum(self.__get_size(curnode[i]) for i in range(16))
            if curnode[16]:
                total += 1
            return total
        raise Exception("bad curnode! " + repr(curnode))

    def __to_dict(self, node):
        """Return ``{packed_key: value}`` for every value under ``node``.

        Keys are nibble runs relative to ``node``, packed with
        ``hexarraykey_to_bin`` (terminator included).
        """
        if not node:
            return {}
        curnode = rlp.decode(self.db.get(node))
        if not curnode:
            raise Exception("node not found in database")
        if len(curnode) == 2:
            lkey = bin_to_hexarraykey(curnode[0])
            o = {}
            if lkey and lkey[-1] == 16:
                o[curnode[0]] = curnode[1]
            else:
                for subpacked, subvalue in self.__to_dict(curnode[1]).items():
                    subkey = bin_to_hexarraykey(subpacked)
                    o[hexarraykey_to_bin(lkey + subkey)] = subvalue
            return o
        if len(curnode) == 17:
            o = {}
            for i in range(16):
                for subpacked, subvalue in self.__to_dict(curnode[i]).items():
                    subkey = bin_to_hexarraykey(subpacked)
                    o[hexarraykey_to_bin([i] + subkey)] = subvalue
            if curnode[16]:
                # The key ending here is just the terminator; it must be
                # packed like every other key so that parents can unpack it.
                o[hexarraykey_to_bin([16])] = curnode[16]
            return o
        raise Exception("bad curnode! " + repr(curnode))

    def to_dict(self, as_hex=False):
        """Return every key/value pair in the trie as a dict.

        Keys are the original strings, or their hex spelling when
        ``as_hex`` is true.
        """
        o = {}
        for packed, value in self.__to_dict(self.root).items():
            # Drop the trailing terminator nibble before spelling the key.
            nibbles = bin_to_hexarraykey(packed)[:-1]
            v2 = ''.join(['0123456789abcdef'[x] for x in nibbles])
            if not as_hex:
                v2 = v2.decode('hex')
            o[v2] = value
        return o

    def get(self, key):
        """Return the value stored under ``key``, or '' when it is absent."""
        return self.__get_state(self.root, self.__key_to_nibbles(key))

    def get_size(self):
        """Return the number of values stored in the trie."""
        return self.__get_size(self.root)

    def update(self, key, value):
        """Set ``key`` to ``value`` and update ``self.root``.

        An empty ``value`` deletes the key.  Raises ``Exception`` when
        either argument is not a string.
        """
        if not isinstance(key, (str, unicode)) or \
                not isinstance(value, (str, unicode)):
            raise Exception("Key and value must be strings")
        key2 = self.__key_to_nibbles(key)
        self.root = self.__update_state(self.root, key2, str(value))