3 from json import dumps, loads
5 from Queue import Queue
13 from backends.bitcoind import deserialize
14 from processor import Processor, print_log
17 from storage import Storage
20 class BlockchainProcessor(Processor):
# Constructor: initialises in-memory state, opens storage, builds the bitcoind
# RPC URL, starts catch-up on a timer thread and schedules main_iteration.
# NOTE(review): the embedded line numbers skip values throughout this method,
# so some statements (e.g. try/except or sleep lines) are not visible here.
22 def __init__(self, config, shared):
23 Processor.__init__(self)
25 self.mtimes = {} # monitoring
28 self.up_to_date = False
# Subscription bookkeeping; read and written under watch_lock in
# do_subscribe / do_unsubscribe.
30 self.watch_lock = threading.Lock()
31 self.watch_blocks = []
32 self.watch_headers = []
33 self.watched_addresses = {}
# Per-address history cache, accessed under cache_lock.
35 self.history_cache = {}
37 self.cache_lock = threading.Lock()
# headers_data buffers serialized headers until flush_headers() writes them.
38 self.headers_data = ''
39 self.headers_path = config.get('leveldb', 'path_fulltree')
# Mempool indexes; rebuilt by memorypool_update().
41 self.mempool_addresses = {}
42 self.mempool_hist = {}
43 self.mempool_hashes = set([])
44 self.mempool_lock = threading.Lock()
# Filled by invalidate_cache() and drained by main_iteration().
46 self.address_queue = Queue()
# NOTE(review): test_reorgs is assigned from config and then to False; the
# control flow between the two assignments is not visible here (presumably a
# try/except fallback) -- confirm.
49 self.test_reorgs = config.getboolean('leveldb', 'test_reorgs') # simulate random blockchain reorgs
51 self.test_reorgs = False
52 self.storage = Storage(config, shared, self.test_reorgs)
54 self.dblock = threading.Lock()
# JSON-RPC endpoint with the credentials embedded in the URL.
56 self.bitcoind_url = 'http://%s:%s@%s:%s/' % (
57 config.get('bitcoind', 'user'),
58 config.get('bitcoind', 'password'),
59 config.get('bitcoind', 'host'),
60 config.get('bitcoind', 'port'))
# Probe bitcoind; the log line below presumably belongs to a failure branch
# whose surrounding statements are not visible -- confirm.
64 self.bitcoind('getinfo')
67 print_log('cannot contact bitcoind...')
72 self.sent_header = None
75 self.init_headers(self.storage.height)
# Run catch_up(sync=False) on a timer thread, then loop here until the chain
# is up to date or shutdown is requested (loop body not visible).
77 threading.Timer(0, lambda: self.catch_up(sync=False)).start()
78 while not shared.stopped() and not self.up_to_date:
82 print "keyboard interrupt: stopping threads"
86 print_log("Blockchain is up to date.")
87 self.memorypool_update()
88 print_log("Memory pool initialized.")
# Schedule the first main_iteration call in 10 seconds.
90 threading.Timer(10, self.main_iteration).start()
# Add the time elapsed since self.now to the running total kept under `name`
# in self.mtimes.
# NOTE(review): `now` is assigned on a line that is not visible in this view
# (presumably time.time()) -- confirm.
94 def mtime(self, name):
97 delta = now - self.now
98 t = self.mtimes.get(name, 0)
99 self.mtimes[name] = t + delta
# Format every accumulated timer in self.mtimes as 'name:seconds ' (two
# decimals) and append it to `s`.
# NOTE(review): the initialisation and the final use of `s` are not visible
# in this view.
102 def print_mtime(self):
104 for k, v in self.mtimes.items():
105 s += k+':'+"%.2f"%v+' '
# Call a bitcoind JSON-RPC `method` with `params` and return the response's
# 'result' field. Raises BaseException carrying the RPC error object when the
# response's 'error' field is not None.
# NOTE(review): `params=[]` is a mutable default argument; in the visible
# lines it is only serialised, never mutated.
# NOTE(review): the assignment of `r` is not visible here (presumably
# loads(respdata)) -- confirm.
109 def bitcoind(self, method, params=[]):
110 postdata = dumps({"method": method, 'params': params, 'id': 'jsonrpc'})
112 respdata = urllib.urlopen(self.bitcoind_url, postdata).read()
# The traceback goes to stdout; the try/except lines around it are not visible.
114 traceback.print_exc(file=sys.stdout)
118 if r['error'] is not None:
119 raise BaseException(r['error'])
120 return r.get('result')
# Map the fields of a bitcoind getblock result dict `b` onto the header key
# names used by this server.
# NOTE(review): the enclosing dict literal / return lines are not visible in
# this view.
123 def block2header(self, b):
125 "block_height": b.get('height'),
126 "version": b.get('version'),
127 "prev_block_hash": b.get('previousblockhash'),
128 "merkle_root": b.get('merkleroot'),
129 "timestamp": b.get('time'),
# 'bits' is parsed as a base-16 string.
130 "bits": int(b.get('bits'), 16),
131 "nonce": b.get('nonce'),
def get_header(self, height):
    """Return the header dict for the block at ``height``.

    The block hash is looked up with the ``getblockhash`` RPC, the block is
    fetched with ``getblock``, and the result is converted by
    ``block2header``.
    """
    block = self.bitcoind('getblock', [self.bitcoind('getblockhash', [height])])
    return self.block2header(block)
# Prepare the on-disk headers file under self.headers_path and extend it with
# headers fetched from bitcoind until it reaches db_height.
# Headers are treated as fixed 80-byte records: the current height is derived
# from the file size divided by 80.
# NOTE(review): several statements (else/try lines, height increments) are not
# visible in this view.
139 def init_headers(self, db_height):
140 self.chunk_cache = {}
141 self.headers_filename = os.path.join(self.headers_path, 'blockchain_headers')
143 if os.path.exists(self.headers_filename):
144 height = os.path.getsize(self.headers_filename)/80 - 1 # the current height
146 prev_hash = self.hash_header(self.read_header(height))
# Creates (or truncates) an empty headers file -- presumably the branch taken
# when the file does not exist yet; the else line is not visible.
150 open(self.headers_filename, 'wb').close()
154 if height < db_height:
155 print_log("catching up missing headers:", height, db_height)
158 while height < db_height:
160 header = self.get_header(height)
# Each fetched header must chain onto the hash of the previous one.
162 assert prev_hash == header.get('prev_block_hash')
# sync=False buffers the header instead of forcing a flush on every write.
163 self.write_header(header, sync=False)
164 prev_hash = self.hash_header(header)
165 if (height % 1000) == 0:
166 print_log("headers file:", height)
167 except KeyboardInterrupt:
def hash_header(self, header):
    """Return the hash of ``header`` as a hex string.

    The header is serialized with ``header_to_string``, decoded from hex to
    raw bytes, hashed with ``Hash``, hex-encoded again and finally passed
    through ``rev_hex``.
    """
    raw_header = header_to_string(header).decode('hex')
    digest_hex = Hash(raw_header).encode('hex')
    return rev_hex(digest_hex)
# Seek to record `block_height` (80 bytes per header) in the headers file and
# decode the header with header_from_string.
# NOTE(review): the read and return statements are not visible in this view,
# nor is the behaviour when the file does not exist.
176 def read_header(self, block_height):
177 if os.path.exists(self.headers_filename):
178 with open(self.headers_filename, 'rb') as f:
179 f.seek(block_height * 80)
182 h = header_from_string(h)
def read_chunk(self, index):
    """Return chunk number ``index`` of the headers file, hex-encoded.

    A chunk spans 2016 headers of 80 bytes each; fewer bytes are returned
    when the file ends before the chunk does.
    """
    chunk_bytes = 2016 * 80
    with open(self.headers_filename, 'rb') as headers_file:
        headers_file.seek(index * chunk_bytes)
        raw_chunk = headers_file.read(chunk_bytes)
    return raw_chunk.encode('hex')
# Append a serialized header to the in-memory buffer self.headers_data and
# drop the cached chunk that the header belongs to.
191 def write_header(self, header, sync=True):
# When the buffer is empty, remember the height of its first header;
# flush_headers() seeks to headers_offset*80 before writing.
192 if not self.headers_data:
193 self.headers_offset = header.get('block_height')
195 self.headers_data += header_to_string(header).decode('hex')
# NOTE(review): the statement guarded by this condition is not visible in this
# view (presumably a call to flush_headers()) -- confirm.
196 if sync or len(self.headers_data) > 40*100:
# Chunks cover 2016 headers each; the cached copy of the affected chunk is
# discarded under cache_lock.
199 with self.cache_lock:
200 chunk_index = header.get('block_height')/2016
201 if self.chunk_cache.get(chunk_index):
202 self.chunk_cache.pop(chunk_index)
204 def pop_header(self):
205 # we need to do this only if we have not flushed
206 if self.headers_data:
207 self.headers_data = self.headers_data[:-40]
# Write the buffered headers to the headers file at record offset
# self.headers_offset (80 bytes per record), then clear the buffer.
# NOTE(review): the statement under `if not self.headers_data:` is not visible
# in this view (presumably an early return) -- confirm.
209 def flush_headers(self):
210 if not self.headers_data:
# 'rb+' opens the existing file for in-place update without truncating it.
212 with open(self.headers_filename, 'rb+') as f:
213 f.seek(self.headers_offset*80)
214 f.write(self.headers_data)
215 self.headers_data = ''
# Look up chunk `i` in self.chunk_cache under cache_lock; the result of
# read_chunk(i) is stored back into the cache.
# NOTE(review): the condition guarding the read (presumably a cache miss) and
# the return statement are not visible in this view.
217 def get_chunk(self, i):
218 # store them on disk; store the current chunk in memory
219 with self.cache_lock:
220 chunk = self.chunk_cache.get(i)
222 chunk = self.read_chunk(i)
223 self.chunk_cache[i] = chunk
# Fetch the raw transaction `txid` from bitcoind (getrawtransaction with
# verbosity 0) and parse it with deserialize.parse_Transaction as a
# non-coinbase transaction.
# NOTE(review): the try/except lines are not visible; the 'cannot parse' log
# presumably belongs to an except branch -- confirm what is returned there.
227 def get_mempool_transaction(self, txid):
229 raw_tx = self.bitcoind('getrawtransaction', [txid, 0])
233 vds = deserialize.BCDataStream()
234 vds.write(raw_tx.decode('hex'))
236 return deserialize.parse_Transaction(vds, is_coinbase=False)
238 print_log("ERROR: cannot parse", txid)
# Build the history of `addr` from storage plus the mempool and store it in
# self.history_cache.
# NOTE(review): the cache-hit / cache_only handling, the definition of
# `is_known` and the return statement are not visible in this view.
241 def get_history(self, addr, cache_only=False):
# Cached value is read under cache_lock.
242 with self.cache_lock:
243 hist = self.history_cache.get(addr)
251 h = self.storage.get_history(str((addr)))
252 hist = self.storage.deserialize(h)
263 # sort history, because redeeming transactions are next to the corresponding txout
264 hist.sort(key=lambda tup: tup[2])
# Mempool transactions are appended as (txid, 0, 0) tuples.
267 with self.mempool_lock:
268 for txid in self.mempool_hist.get(addr, []):
269 hist.append((txid, 0, 0))
# Deduplicate on (first element, third element) of each tuple.
272 hist = set(map(lambda x: (x[0], x[2]), hist))
# Convert each pair to the dict form {'tx_hash', 'height'}.
275 hist = map(lambda x: {'tx_hash': x[0], 'height': x[1]}, hist)
277 # add something to distinguish between unused and empty addresses
278 if hist == [] and is_known:
281 with self.cache_lock:
282 self.history_cache[addr] = hist
# Compute the status of `addr`: the hex-encoded SHA-256 digest of a string
# built from 'tx_hash:height:' entries of its history.
# NOTE(review): the bodies of the two special-case branches, the
# initialisation of `status` and the loop header are not visible in this view.
285 def get_status(self, addr, cache_only=False):
286 tx_points = self.get_history(addr, cache_only)
# -1 is the cache-miss marker in cache_only mode (see add_request).
287 if cache_only and tx_points == -1:
292 if tx_points == ['*']:
296 status += tx.get('tx_hash') + ':%d:' % tx.get('height')
297 return hashlib.sha256(status).digest().encode('hex')
# Build the merkle branch of `tx_hash` within the block at `height`.
# Returns a dict with the block height, the list of hex-encoded sibling hashes
# collected in `s`, and the position of the transaction in the block.
# NOTE(review): the initialisation of `s`, the inner loop that consumes
# `merkle` pairwise and several conditions are not visible in this view.
299 def get_merkle(self, tx_hash, height):
301 block_hash = self.bitcoind('getblockhash', [height])
302 b = self.bitcoind('getblock', [block_hash])
303 tx_list = b.get('tx')
# list.index raises ValueError when tx_hash is not part of the block.
304 tx_pos = tx_list.index(tx_hash)
306 merkle = map(hash_decode, tx_list)
307 target_hash = hash_decode(tx_hash)
309 while len(merkle) != 1:
# Duplicates the last hash (the guarding condition is not visible; presumably
# applied when the level has an odd number of entries -- confirm).
311 merkle.append(merkle[-1])
314 new_hash = Hash(merkle[0] + merkle[1])
# When one side of the pair is the hash being tracked, record its sibling and
# continue tracking the parent hash.
315 if merkle[0] == target_hash:
316 s.append(hash_encode(merkle[1]))
317 target_hash = new_hash
318 elif merkle[1] == target_hash:
319 s.append(hash_encode(merkle[0]))
320 target_hash = new_hash
325 return {"block_height": height, "merkle": s, "pos": tx_pos}
# Insert a serialized history item for (tx_hash, tx_pos, tx_height) into the
# batched history of `addr`, and record the output -> address mapping in
# self.batch_txio.
# NOTE(review): the loop's exit (break/else) lines are not visible in this
# view, so the exact condition for the prepend at the end is unconfirmed.
328 def add_to_history(self, addr, tx_hash, tx_pos, tx_height):
# The serialized item is padded with 40 zero bytes; items are sliced below as
# 80-byte records.
330 s = self.serialize_item(tx_hash, tx_pos, tx_height) + 40*chr(0)
333 serialized_hist = self.batch_list[addr]
335 l = len(serialized_hist)/80
# Scan from the newest record backwards.
336 for i in range(l-1, -1, -1):
337 item = serialized_hist[80*i:80*(i+1)]
# The height is decoded from bytes 36..38 of the record via rev_hex.
338 item_height = int(rev_hex(item[36:39].encode('hex')), 16)
# Insert right after the record whose height does not exceed tx_height.
339 if item_height <= tx_height:
340 serialized_hist = serialized_hist[0:80*(i+1)] + s + serialized_hist[80*(i+1):]
343 serialized_hist = s + serialized_hist
345 self.batch_list[addr] = serialized_hist
# Key is the raw tx hash followed by the 4-byte hex-encoded output index.
348 txo = (tx_hash + int_to_hex(tx_pos, 4)).decode('hex')
349 self.batch_txio[txo] = addr
# Parse every raw transaction listed in block['tx'] and return
# (tx_hashes, txdict): the ordered transaction ids and a dict of parsed
# transactions.
# NOTE(review): the assignment of `is_coinbase`, the try/except lines and the
# statement that fills `txdict` are not visible in this view.
356 def deserialize_block(self, block):
357 txlist = block.get('tx')
358 tx_hashes = [] # ordered txids
359 txdict = {} # deserialized tx
361 for raw_tx in txlist:
# The transaction id is computed from the raw bytes, not taken from the block.
362 tx_hash = hash_encode(Hash(raw_tx.decode('hex')))
363 vds = deserialize.BCDataStream()
364 vds.write(raw_tx.decode('hex'))
366 tx = deserialize.parse_Transaction(vds, is_coinbase)
368 print_log("ERROR: cannot parse", tx_hash)
370 tx_hashes.append(tx_hash)
373 return tx_hashes, txdict
# Apply the transactions of `block` to storage, or undo them when `revert` is
# set, then persist undo info / height and invalidate the history cache of
# every touched address.
# NOTE(review): the branch lines selecting between import and revert, the
# lookup of `tx` and the conditions around the storage writes are not visible
# in this view.
377 def import_block(self, block, block_hash, block_height, sync, revert=False):
379 touched_addr = set([])
381 # deserialize transactions
382 tx_hashes, txdict = self.deserialize_block(block)
# Undo info for this height is loaded from storage (presumably only on the
# revert path -- confirm).
386 undo_info = self.storage.get_undo_info(block_height)
391 for txid in tx_hashes: # must be ordered
# Import path: remember the undo record produced for each transaction.
394 undo = self.storage.import_transaction(txid, tx, block_height, touched_addr)
395 undo_info[txid] = undo
# Revert path: consume the stored undo record of each transaction.
397 undo = undo_info.pop(txid)
398 self.storage.revert_transaction(txid, tx, block_height, touched_addr, undo)
# Every undo record must have been consumed.
401 assert undo_info == {}
405 self.storage.write_undo_info(block_height, self.bitcoind_height, undo_info)
408 self.storage.db_undo.put('height', repr( (block_hash, block_height, self.storage.db_version) ))
410 for addr in touched_addr:
411 self.invalidate_cache(addr)
413 self.storage.update_hashes()
def add_request(self, session, request):
    """Answer ``request`` from cache when possible, otherwise enqueue it.

    ``process`` is first run in cache-only mode; a return value of ``-1``
    signals a cache miss, in which case the ``(session, request)`` pair is
    put on ``self.queue`` for later processing.
    """
    # see if we can get if from cache. if not, add to queue
    cached_outcome = self.process(session, request, cache_only=True)
    if cached_outcome == -1:
        self.queue.put((session, request))
# Register `session` for notifications of the given subscription `method`.
# All bookkeeping is done while holding watch_lock.
# NOTE(review): the assignment of `address`, the test for a missing entry and
# the append for an existing entry are not visible in this view.
422 def do_subscribe(self, method, params, session):
423 with self.watch_lock:
424 if method == 'blockchain.numblocks.subscribe':
425 if session not in self.watch_blocks:
426 self.watch_blocks.append(session)
428 elif method == 'blockchain.headers.subscribe':
429 if session not in self.watch_headers:
430 self.watch_headers.append(session)
432 elif method == 'blockchain.address.subscribe':
# watched_addresses maps an address to the list of sessions watching it.
434 l = self.watched_addresses.get(address)
436 self.watched_addresses[address] = [session]
437 elif session not in l:
# Remove `session` from the watchers of the given subscription `method`.
# All bookkeeping is done while holding watch_lock.
# NOTE(review): most of the address branch (assignment of `addr`, removal of
# the session, the condition for dropping the entry) is not visible here.
441 def do_unsubscribe(self, method, params, session):
442 with self.watch_lock:
443 if method == 'blockchain.numblocks.subscribe':
444 if session in self.watch_blocks:
445 self.watch_blocks.remove(session)
446 elif method == 'blockchain.headers.subscribe':
447 if session in self.watch_headers:
448 self.watch_headers.remove(session)
449 elif method == "blockchain.address.subscribe":
451 l = self.watched_addresses.get(addr)
# Drops the address entry entirely (presumably once no session is left --
# confirm against the hidden condition).
460 self.watched_addresses.pop(addr)
# Dispatch a client `request` by its 'method' name and push either a result
# or an error response to `session`.
# With cache_only=True, lookups that miss the cache yield -1 (add_request
# relies on this method returning -1 in that case).
# NOTE(review): the try lines, parameter extraction (address, height, index,
# tx_hash), initialisation of `result`/`error`, and the branch deciding
# between the two push_response calls are not visible in this view.
463 def process(self, session, request, cache_only=False):
465 message_id = request['id']
466 method = request['method']
467 params = request.get('params', [])
471 if method == 'blockchain.numblocks.subscribe':
472 result = self.storage.height
474 elif method == 'blockchain.headers.subscribe':
477 elif method == 'blockchain.address.subscribe':
480 result = self.get_status(address, cache_only)
# Python 2 `except X, e` syntax; BaseException also covers KeyboardInterrupt
# and SystemExit.
481 except BaseException, e:
482 error = str(e) + ': ' + address
483 print_log("error:", error)
485 elif method == 'blockchain.address.get_history':
488 result = self.get_history(address, cache_only)
489 except BaseException, e:
490 error = str(e) + ': ' + address
491 print_log("error:", error)
493 elif method == 'blockchain.block.get_header':
499 result = self.get_header(height)
500 except BaseException, e:
501 error = str(e) + ': %d' % height
502 print_log("error:", error)
504 elif method == 'blockchain.block.get_chunk':
510 result = self.get_chunk(index)
511 except BaseException, e:
512 error = str(e) + ': %d' % index
513 print_log("error:", error)
515 elif method == 'blockchain.transaction.broadcast':
517 txo = self.bitcoind('sendrawtransaction', params)
518 print_log("sent tx:", txo)
# Broadcast failures are reported through `result`, not `error`.
520 except BaseException, e:
521 result = str(e) # do not send an error
522 print_log("error:", result, params)
524 elif method == 'blockchain.transaction.get_merkle':
530 tx_height = params[1]
531 result = self.get_merkle(tx_hash, tx_height)
532 except BaseException, e:
533 error = str(e) + ': ' + repr(params)
534 print_log("get_merkle error:", error)
536 elif method == 'blockchain.transaction.get':
539 result = self.bitcoind('getrawtransaction', [tx_hash, 0])
540 except BaseException, e:
541 error = str(e) + ': ' + repr(params)
542 print_log("tx get error:", error)
545 error = "unknown method:%s" % method
# Cache miss in cache_only mode; the statement that follows is not visible
# (presumably `return -1`) -- confirm.
547 if cache_only and result == -1:
551 self.push_response(session, {'id': message_id, 'error': error})
553 self.push_response(session, {'id': message_id, 'result': result})
# Fetch the block `block_hash` from bitcoind and replace its list of txids in
# block['tx'] with the raw transactions obtained via getrawtransaction.
# Raises BaseException with the RPC error when any transaction lookup fails.
# NOTE(review): construction of `rawtxreq` and `rawtxdata`, decoding of the
# response into per-transaction items `ir`, the try/except lines and the
# return statement are not visible in this view.
556 def getfullblock(self, block_hash):
557 block = self.bitcoind('getblock', [block_hash])
561 for txid in block['tx']:
563 "method": "getrawtransaction",
# The collected requests are serialised and posted with one urlopen call.
569 postdata = dumps(rawtxreq)
571 respdata = urllib.urlopen(self.bitcoind_url, postdata).read()
573 traceback.print_exc(file=sys.stdout)
579 if ir['error'] is not None:
581 print_log("Error: make sure you run bitcoind with txindex=1; use -reindex if needed.")
582 raise BaseException(ir['error'])
583 rawtxdata.append(ir['result'])
584 block['tx'] = rawtxdata
# Bring storage in line with bitcoind: import the next block while it extends
# the stored tip, otherwise revert the current tip block (reorg handling).
# NOTE(review): timing calls, break/else lines, the initialisation of `prh`
# and the database shutdown call are not visible in this view.
587 def catch_up(self, sync=True):
590 while not self.shared.stopped():
# Compare bitcoind's tip hash with the last hash recorded in storage.
595 info = self.bitcoind('getinfo')
596 self.bitcoind_height = info.get('blocks')
597 bitcoind_block_hash = self.bitcoind('getblockhash', [self.bitcoind_height])
598 if self.storage.last_hash == bitcoind_block_hash:
599 self.up_to_date = True
603 self.up_to_date = False
604 next_block_hash = self.bitcoind('getblockhash', [self.storage.height + 1])
605 next_block = self.getfullblock(next_block_hash)
608 # fixme: this is unsafe, if we revert when the undo info is not yet written
# With test_reorgs enabled, a revert is forced with probability 1/100.
609 revert = (random.randint(1, 100) == 1) if self.test_reorgs else False
# The next block extends our tip: import it and advance height / last_hash.
611 if (next_block.get('previousblockhash') == self.storage.last_hash) and not revert:
613 self.import_block(next_block, next_block_hash, self.storage.height+1, sync)
614 self.storage.height = self.storage.height + 1
615 self.write_header(self.block2header(next_block), sync)
616 self.storage.last_hash = next_block_hash
# Progress report every 1000 blocks during the initial (non-sync) catch-up;
# the accumulated timers are reset afterwards.
619 if self.storage.height % 1000 == 0 and not sync:
620 t_daemon = self.mtimes.get('daemon')
621 t_import = self.mtimes.get('import')
622 print_log("catch_up: block %d (%.3fs %.3fs)" % (self.storage.height, t_daemon, t_import), self.storage.get_root_hash().encode('hex'))
623 self.mtimes['daemon'] = 0
624 self.mtimes['import'] = 0
# Root-hash consistency check against a previously recorded value `prh`
# (presumably only active with test_reorgs -- confirm).
627 assert prh == self.storage.get_root_hash().encode('hex')
631 prh = self.storage.get_root_hash().encode('hex')
633 # revert current block
634 block = self.getfullblock(self.storage.last_hash)
635 print_log("blockchain reorg", self.storage.height, block.get('previousblockhash'), self.storage.last_hash)
636 self.import_block(block, self.storage.last_hash, self.storage.height, sync, revert=True)
640 self.storage.height -= 1
642 # read previous header from disk
643 self.header = self.read_header(self.storage.height)
644 self.storage.last_hash = self.hash_header(self.header)
# self.header is refreshed from bitcoind for the current tip hash.
647 self.header = self.block2header(self.bitcoind('getblock', [self.storage.last_hash]))
649 if self.shared.stopped():
650 print_log( "closing database" )
# Synchronise the mempool indexes with bitcoind's getrawmempool: index new
# transactions by address, drop vanished ones, rebuild self.mempool_hist and
# invalidate the history cache of every touched address.
# NOTE(review): the `continue` lines, the appends to `mpa` and `h`, and the
# handling of unparsable transactions are not visible in this view.
654 def memorypool_update(self):
655 mempool_hashes = set(self.bitcoind('getrawmempool'))
656 touched_addresses = set([])
658 for tx_hash in mempool_hashes:
# Already-known transactions are detected here (presumably skipped).
659 if tx_hash in self.mempool_hashes:
662 tx = self.get_mempool_transaction(tx_hash)
666 mpa = self.mempool_addresses.get(tx_hash, [])
667 for x in tx.get('inputs'):
668 # we assume that the input address can be parsed by deserialize(); this is true for Electrum transactions
669 addr = x.get('address')
670 if addr and addr not in mpa:
672 touched_addresses.add(addr)
674 for x in tx.get('outputs'):
675 addr = x.get('address')
676 if addr and addr not in mpa:
678 touched_addresses.add(addr)
680 self.mempool_addresses[tx_hash] = mpa
681 self.mempool_hashes.add(tx_hash)
683 # remove older entries from mempool_hashes
684 self.mempool_hashes = mempool_hashes
686 # remove deprecated entries from mempool_addresses
# Under Python 2, items() returns a list copy, so popping while looping is
# safe here; it would not be with a Python 3 dict view.
687 for tx_hash, addresses in self.mempool_addresses.items():
688 if tx_hash not in self.mempool_hashes:
689 self.mempool_addresses.pop(tx_hash)
690 for addr in addresses:
691 touched_addresses.add(addr)
693 # rebuild mempool histories
694 new_mempool_hist = {}
695 for tx_hash, addresses in self.mempool_addresses.items():
696 for addr in addresses:
697 h = new_mempool_hist.get(addr, [])
700 new_mempool_hist[addr] = h
# The rebuilt index is swapped in under mempool_lock (get_history reads it
# under the same lock).
702 with self.mempool_lock:
703 self.mempool_hist = new_mempool_hist
705 # invalidate cache for touched addresses
706 for addr in touched_addresses:
707 self.invalidate_cache(addr)
# Drop the cached history of `address` and queue the address together with
# its watching sessions on self.address_queue for notification.
# NOTE(review): the condition guarding the queue put is not visible in this
# view (presumably `if sessions:`) -- confirm.
710 def invalidate_cache(self, address):
711 with self.cache_lock:
712 if address in self.history_cache:
713 print_log("cache: invalidating", address)
714 self.history_cache.pop(address)
# The watcher list is read under watch_lock; the put happens after the lookup.
716 with self.watch_lock:
717 sessions = self.watched_addresses.get(address)
720 # TODO: update cache here. if new value equals cached value, do not send notification
721 self.address_queue.put((address,sessions))
# Periodic tick: refresh the mempool, notify subscribers about a new height,
# a new header and changed address statuses, then re-arm itself on a
# 10-second timer unless shutdown was requested.
# NOTE(review): the early return after the first shutdown check, the catch_up
# call with its t1/t2 timing, the 'id' entries of the pushed messages and the
# loop / exception handling around the address queue are not visible here.
723 def main_iteration(self):
724 if self.shared.stopped():
725 print_log("blockchain processor terminating")
734 self.memorypool_update()
# NOTE(review): self.sent_height is not initialised in the visible lines of
# __init__ -- confirm it is set before the first tick.
736 if self.sent_height != self.storage.height:
737 self.sent_height = self.storage.height
738 for session in self.watch_blocks:
739 self.push_response(session, {
741 'method': 'blockchain.numblocks.subscribe',
742 'params': [self.storage.height],
745 if self.sent_header != self.header:
746 print_log("blockchain: %d (%.3fs)" % (self.storage.height, t2 - t1))
747 self.sent_header = self.header
748 for session in self.watch_headers:
749 self.push_response(session, {
751 'method': 'blockchain.headers.subscribe',
752 'params': [self.header],
# Non-blocking get: Queue.get(False) raises Queue.Empty when nothing is queued.
757 addr, sessions = self.address_queue.get(False)
761 status = self.get_status(addr)
762 for session in sessions:
763 self.push_response(session, {
765 'method': 'blockchain.address.subscribe',
766 'params': [addr, status],
769 if not self.shared.stopped():
770 threading.Timer(10, self.main_iteration).start()
772 print_log("blockchain processor terminating")