fix abe crash (blockindexing stops) on limit reached for get_address_out_rows in...
[electrum-server.git] / backends / abe / __init__.py
index 65bd284..7a2cb02 100644 (file)
@@ -10,6 +10,29 @@ from Queue import Queue
 import time, threading
 
 
+import hashlib
+# Hex <-> raw-byte helpers that also reverse the byte order; they rely on
+# the Python 2 'hex' string codec.
+encode = lambda x: x[::-1].encode('hex')
+decode = lambda x: x.decode('hex')[::-1]
+# Double SHA-256: raw digest of sha256(sha256(x)).
+Hash = lambda x: hashlib.sha256(hashlib.sha256(x).digest()).digest()
+
+def rev_hex(s):
+    # Reverse the byte order of hex string `s`: decode it to raw bytes,
+    # reverse them, and encode the result back to hex.
+    return s.decode('hex')[::-1].encode('hex')
+
+def int_to_hex(i, length=1):
+    # Format integer `i` as hex, left-padded with zeros to 2*length digits
+    # (`length` bytes), then byte-reversed through rev_hex.
+    # NOTE(review): for a negative `i`, hex() yields '-0x...', so the slice
+    # below would keep a stray 'x' - presumably callers only pass values >= 0.
+    # The rstrip drops the trailing 'L' that Python 2 appends to hex() of a long.
+    s = hex(i)[2:].rstrip('L')
+    # The repeat count is <= 0 when s already has 2*length digits or more,
+    # in which case no padding is added (and nothing is truncated).
+    s = "0"*(2*length - len(s)) + s
+    return rev_hex(s)
+
+def header_to_string(res):
+    # Build a hex string from the header dict `res` by concatenating, in this
+    # order: version, prev_block_hash, merkle_root, timestamp, bits, nonce.
+    # The integer fields are written as 4-byte values via int_to_hex; the two
+    # hash fields are byte-reversed via rev_hex.
+    # Presumably 160 hex digits (80 bytes) when both hashes are 64 hex digits
+    # long - confirm against callers.
+    s = int_to_hex(res.get('version'),4) \
+        + rev_hex(res.get('prev_block_hash')) \
+        + rev_hex(res.get('merkle_root')) \
+        + int_to_hex(int(res.get('timestamp')),4) \
+        + int_to_hex(int(res.get('bits')),4) \
+        + int_to_hex(int(res.get('nonce')),4)
+    return s
+
+
 class AbeStore(Datastore_class):
 
     def __init__(self, config):
@@ -26,30 +49,34 @@ class AbeStore(Datastore_class):
         coin = config.get('server', 'coin')
         self.addrtype = 0
         if coin == 'litecoin':
-            print 'Litecoin settings:'
+            print_log ('Litecoin settings:')
             datadir = config.get('server','datadir')
-            print '  datadir = ' + datadir
+            print_log ('  datadir = ' + datadir)
             args.datadir = [{"dirname":datadir,"chain":"Litecoin","code3":"LTC","address_version":"\u0030"}]
-            print '  addrtype = 48'
+            print_log ('  addrtype = 48')
             self.addrtype = 48
 
         Datastore_class.__init__(self,args)
 
         # Use 1 (Bitcoin) if chain_id is not sent
         self.chain_id = self.datadirs[0]["chain_id"] or 1
-        print 'Coin chain_id = %d' % self.chain_id
+        print_log ('Coin chain_id = %d' % self.chain_id)
 
         self.sql_limit = int( config.get('database','limit') )
 
         self.tx_cache = {}
         self.bitcoind_url = 'http://%s:%s@%s:%s/' % ( config.get('bitcoind','user'), config.get('bitcoind','password'), config.get('bitcoind','host'), config.get('bitcoind','port'))
 
+        self.chunk_cache = {}
+
         self.address_queue = Queue()
 
-        self.dblock = thread.allocate_lock()
+        self.lock = threading.Lock()        # for the database
+        self.cache_lock = threading.Lock()  # for the cache
         self.last_tx_id = 0
         self.known_mempool_hashes = []
 
+
     
     def import_tx(self, tx, is_coinbase):
         tx_id = super(AbeStore, self).import_tx(tx, is_coinbase)
@@ -60,7 +87,7 @@ class AbeStore(Datastore_class):
 
 
     def import_block(self, b, chain_ids=frozenset()):
-        #print "import block"
+        #print_log ("import block")
         block_id = super(AbeStore, self).import_block(b, chain_ids)
         for pos in xrange(len(b['transactions'])):
             tx = b['transactions'][pos]
@@ -70,7 +97,7 @@ class AbeStore(Datastore_class):
             if tx_id:
                 self.update_tx_cache(tx_id)
             else:
-                print "error: import_block: no tx_id"
+                print_log ("error: import_block: no tx_id")
         return block_id
 
 
@@ -79,39 +106,43 @@ class AbeStore(Datastore_class):
         for row in inrows:
             _hash = self.binout(row[6])
             if not _hash:
-                #print "WARNING: missing tx_in for tx", txid
+                #print_log ("WARNING: missing tx_in for tx", txid)
                 continue
 
             address = hash_to_address(chr(self.addrtype), _hash)
-            if self.tx_cache.has_key(address):
-                print "cache: invalidating", address
-                self.tx_cache.pop(address)
+            with self.cache_lock:
+                if self.tx_cache.has_key(address):
+                    print_log ("cache: invalidating", address)
+                    self.tx_cache.pop(address)
+
             self.address_queue.put(address)
 
         outrows = self.get_tx_outputs(txid, False)
         for row in outrows:
             _hash = self.binout(row[6])
             if not _hash:
-                #print "WARNING: missing tx_out for tx", txid
+                #print_log ("WARNING: missing tx_out for tx", txid)
                 continue
 
             address = hash_to_address(chr(self.addrtype), _hash)
-            if self.tx_cache.has_key(address):
-                print "cache: invalidating", address
-                self.tx_cache.pop(address)
+            with self.cache_lock:
+                if self.tx_cache.has_key(address):
+                    print_log ("cache: invalidating", address)
+                    self.tx_cache.pop(address)
+
             self.address_queue.put(address)
 
     def safe_sql(self,sql, params=(), lock=True):
 
         error = False
         try:
-            if lock: self.dblock.acquire()
+            if lock: self.lock.acquire()
             ret = self.selectall(sql,params)
         except:
             error = True
             traceback.print_exc(file=sys.stdout)
         finally:
-            if lock: self.dblock.release()
+            if lock: self.lock.release()
 
         if error: 
             raise BaseException('sql error')
@@ -243,11 +274,15 @@ class AbeStore(Datastore_class):
             raise BaseException('limit reached')
         return out
 
-    def get_history(self, addr):
 
-        cached_version = self.tx_cache.get( addr )
-        if cached_version is not None:
-            return cached_version
+
+    def get_history(self, addr, cache_only=False):
+        with self.cache_lock:
+            cached_version = self.tx_cache.get( addr )
+            if cached_version is not None:
+                return cached_version
+
+        if cache_only: return -1
 
         version, binaddr = decode_check_address(addr)
         if binaddr is None:
@@ -265,7 +300,7 @@ class AbeStore(Datastore_class):
             try:
                 nTime, chain_id, height, is_in, blk_hash, tx_hash, tx_id, pos, value = row
             except:
-                print "cannot unpack row", row
+                print_log ("cannot unpack row", row)
                 break
             tx_hash = self.hashout_hex(tx_hash)
             txpoint = {
@@ -300,13 +335,13 @@ class AbeStore(Datastore_class):
 
             # discard transactions that are too old
             if self.last_tx_id - tx_id > 50000:
-                print "discarding tx id", tx_id
+                print_log ("discarding tx id", tx_id)
                 continue
 
             # this means that pending transactions were added to the db, even if they are not returned by getmemorypool
             address_has_mempool = True
 
-            #print "mempool", tx_hash
+            #print_log ("mempool", tx_hash)
             txpoint = {
                     "timestamp":    0,
                     "height":   0,
@@ -328,7 +363,7 @@ class AbeStore(Datastore_class):
             for row in inrows:
                 _hash = self.binout(row[6])
                 if not _hash:
-                    #print "WARNING: missing tx_in for tx", tx_id, addr
+                    #print_log ("WARNING: missing tx_in for tx", tx_id, addr)
                     continue
                 address = hash_to_address(chr(self.addrtype), _hash)
                 txinputs.append(address)
@@ -338,7 +373,7 @@ class AbeStore(Datastore_class):
             for row in outrows:
                 _hash = self.binout(row[6])
                 if not _hash:
-                    #print "WARNING: missing tx_out for tx", tx_id, addr
+                    #print_log ("WARNING: missing tx_out for tx", tx_id, addr)
                     continue
                 address = hash_to_address(chr(self.addrtype), _hash)
                 txoutputs.append(address)
@@ -359,26 +394,31 @@ class AbeStore(Datastore_class):
 
             txpoint.pop('tx_id')
 
+
+        txpoints = map(lambda x: {'tx_hash':x['tx_hash'], 'height':x['height']}, txpoints)
+        out = []
+        for item in txpoints:
+            if item not in out: out.append(item)
+
         # cache result
-        # do not cache mempool results because statuses are ambiguous
-        if not address_has_mempool:
-            self.tx_cache[addr] = txpoints
+        ## do not cache mempool results because statuses are ambiguous
+        #if not address_has_mempool:
+        with self.cache_lock:
+            self.tx_cache[addr] = out
         
-        return txpoints
+        return out
 
 
-    def get_status(self,addr):
-        # get address status, i.e. the last block for that address.
-        tx_points = self.get_history(addr)
-        if not tx_points:
-            status = None
-        else:
-            lastpoint = tx_points[-1]
-            status = lastpoint['block_hash']
-            # this is a temporary hack; move it up once old clients have disappeared
-            if status == 'mempool': # and session['version'] != "old":
-                status = status + ':%d'% len(tx_points)
-        return status
+    def get_status(self, addr, cache_only=False):
+        # for 0.5 clients
+        # Return a status string for `addr` derived from its history: the hex
+        # SHA-256 of every "tx_hash:height:" entry concatenated in history
+        # order, or None when the history is empty.
+        # With cache_only=True, a -1 coming back from get_history is returned
+        # unchanged so the caller can tell that nothing was cached.
+        tx_points = self.get_history(addr, cache_only)
+        if cache_only and tx_points == -1: return -1
+
+        if not tx_points: return None
+        status = ''
+        for tx in tx_points:
+            status += tx.get('tx_hash') + ':%d:' % tx.get('height')
+        return hashlib.sha256( status ).digest().encode('hex')
 
 
     def get_block_header(self, block_height):
@@ -406,6 +446,57 @@ class AbeStore(Datastore_class):
         return out
         
 
+    def get_chunk(self, index):
+        # Return the concatenated hex headers (see header_to_string) of the
+        # longest-chain blocks whose height lies in
+        # [index*2016, (index+1)*2016), ordered by height.
+        # Results are memoised in self.chunk_cache under self.cache_lock.
+        with self.cache_lock:
+            msg = self.chunk_cache.get(index)
+            # A cached empty string is falsy, so an empty chunk is re-queried.
+            if msg: return msg
+
+        # The bounds are interpolated with %d, so `index` must be numeric.
+        # block_height is selected twice (columns 6 and 8).
+        sql = """
+            SELECT
+                block_hash,
+                block_version,
+                block_hashMerkleRoot,
+                block_nTime,
+                block_nBits,
+                block_nNonce,
+                block_height,
+                prev_block_hash,
+                block_height
+              FROM chain_summary
+             WHERE block_height >= %d AND block_height< %d AND in_longest = 1 ORDER BY block_height"""%(index*2016, (index+1)*2016)
+
+        out = self.safe_sql(sql)
+        msg = ''
+        for row in out:
+            # block_hash and height are unpacked but not used below.
+            (block_hash, block_version, hashMerkleRoot, nTime, nBits, nNonce, height, prev_block_hash, block_height) \
+                = ( self.hashout_hex(row[0]), int(row[1]), self.hashout_hex(row[2]), int(row[3]), int(row[4]), int(row[5]), int(row[6]), self.hashout_hex(row[7]), int(row[8]) )
+            h = {"block_height":block_height, "version":block_version, "prev_block_hash":prev_block_hash, 
+                   "merkle_root":hashMerkleRoot, "timestamp":nTime, "bits":nBits, "nonce":nNonce}
+
+            # The block at height 0 gets an all-zero previous hash.
+            if h.get('block_height')==0: h['prev_block_hash'] = "0"*64
+            msg += header_to_string(h)
+
+            #print_log ("hash", encode(Hash(msg.decode('hex'))))
+            #if h.get('block_height')==1:break
+
+        with self.cache_lock:
+            self.chunk_cache[index] = msg
+        print_log ("get_chunk", index, len(msg))
+        return msg
+
+
+
+    def get_raw_tx(self, tx_hash, height):
+        # POST a 'getrawtransaction' JSON-RPC request with params
+        # [tx_hash, 0, height] to self.bitcoind_url and return the 'result'
+        # field of the reply.
+        # Raises BaseException carrying the reply's 'error' value when it is
+        # not None.
+        # NOTE(review): dumps/loads/urllib are not imported in the visible part
+        # of the file - presumably JSON helpers imported elsewhere; confirm.
+        postdata = dumps({"method": 'getrawtransaction', 'params': [tx_hash, 0, height], 'id':'jsonrpc'})
+        respdata = urllib.urlopen(self.bitcoind_url, postdata).read()
+        r = loads(respdata)
+        if r['error'] != None:
+            raise BaseException(r['error'])
+
+        hextx = r.get('result')
+        return hextx
+
+
     def get_tx_merkle(self, tx_hash):
 
         out = self.safe_sql("""
@@ -413,7 +504,9 @@ class AbeStore(Datastore_class):
              JOIN block_tx on tx.tx_id = block_tx.tx_id 
              JOIN chain_summary on chain_summary.block_id = block_tx.block_id
              WHERE tx_hash='%s' AND in_longest = 1"""%tx_hash)
-        block_id = out[0]
+
+        if not out: raise BaseException("not in a block")
+        block_id = int(out[0][0])
 
         # get block height
         out = self.safe_sql("SELECT block_height FROM chain_summary WHERE block_id = %d AND in_longest = 1"%block_id)
@@ -422,21 +515,20 @@ class AbeStore(Datastore_class):
         block_height = int(out[0][0])
 
         merkle = []
+        tx_pos = None
+
         # list all tx in block
         for row in self.safe_sql("""
             SELECT DISTINCT tx_id, tx_pos, tx_hash
               FROM txin_detail
              WHERE block_id = ?
              ORDER BY tx_pos""", (block_id,)):
-            tx_id, tx_pos, tx_h = row
-            merkle.append(tx_h)
+            _id, _pos, _hash = row
+            merkle.append(_hash)
+            if _hash == tx_hash: tx_pos = int(_pos)
 
         # find subset.
         # TODO: do not compute this on client request, better store the hash tree of each block in a database...
-        import hashlib
-        encode = lambda x: x[::-1].encode('hex')
-        decode = lambda x: x.decode('hex')[::-1]
-        Hash = lambda x: hashlib.sha256(hashlib.sha256(x).digest()).digest()
 
         merkle = map(decode, merkle)
         target_hash = decode(tx_hash)
@@ -448,17 +540,17 @@ class AbeStore(Datastore_class):
             while merkle:
                 new_hash = Hash( merkle[0] + merkle[1] )
                 if merkle[0] == target_hash:
-                    s.append( "L" + encode(merkle[1]))
+                    s.append( encode(merkle[1]))
                     target_hash = new_hash
                 elif merkle[1] == target_hash:
-                    s.append( "R" + encode(merkle[0]))
+                    s.append( encode(merkle[0]))
                     target_hash = new_hash
                 n.append( new_hash )
                 merkle = merkle[2:]
             merkle = n
 
         # send result
-        return {"block_height":block_height,"merkle":s}
+        return {"block_height":block_height, "merkle":s, "pos":tx_pos}
 
 
 
@@ -468,16 +560,20 @@ class AbeStore(Datastore_class):
         ds = BCDataStream.BCDataStream()
         postdata = dumps({"method": 'getrawmempool', 'params': [], 'id':'jsonrpc'})
         respdata = urllib.urlopen(store.bitcoind_url, postdata).read()
+
         r = loads(respdata)
         if r['error'] != None:
-            print r['error']
+            print_log (r['error'])
             return
 
         mempool_hashes = r.get('result')
+        num_new_tx = 0 
+
         for tx_hash in mempool_hashes:
 
             if tx_hash in store.known_mempool_hashes: continue
             store.known_mempool_hashes.append(tx_hash)
+            num_new_tx += 1
 
             postdata = dumps({"method": 'getrawtransaction', 'params': [tx_hash], 'id':'jsonrpc'})
             respdata = urllib.urlopen(store.bitcoind_url, postdata).read()
@@ -495,10 +591,11 @@ class AbeStore(Datastore_class):
             else:
                 tx_id = store.import_tx(tx, False)
                 store.update_tx_cache(tx_id)
-                #print tx_hash
+                #print_log (tx_hash)
 
         store.commit()
         store.known_mempool_hashes = mempool_hashes
+        return num_new_tx
 
 
     def send_tx(self,tx):
@@ -513,12 +610,24 @@ class AbeStore(Datastore_class):
         return out
 
 
-    def main_iteration(store):
-        with store.dblock:
-            store.catch_up()
-            store.memorypool_update()
-            block_number = store.get_block_number(store.chain_id)
-            return block_number
+    def main_iteration(self):
+        # Run one update cycle and return the tuple
+        # (block_header, time_catch_up, time_mempool, n):
+        #   block_header  - result of get_block_header for the current height
+        #   time_catch_up - seconds spent in catch_up()
+        #   time_mempool  - seconds spent in memorypool_update()
+        #   n             - return value of memorypool_update(): the number of
+        #                   new mempool transactions, or None when the mempool
+        #                   RPC reported an error
+        # catch_up, the mempool update and the height lookup all run while
+        # holding the database lock.
+        with self.lock:
+            t1 = time.time()
+            self.catch_up()
+            t2 = time.time()
+            time_catch_up = t2 - t1
+            n = self.memorypool_update()
+            time_mempool = time.time() - t2
+            height = self.get_block_number( self.chain_id )
+
+        # Drop the cached chunk that contains the current height so the next
+        # get_chunk call rebuilds it. A missing key - or any other error, since
+        # the except is bare - is ignored.
+        # Assumes `height` is an int, so height/2016 is Python 2 integer division.
+        with self.cache_lock:
+            try: 
+                self.chunk_cache.pop(height/2016) 
+            except: 
+                pass
+
+        # Called after self.lock has been released.
+        block_header = self.get_block_header( height )
+        return block_header, time_catch_up, time_mempool, n
 
 
 
@@ -536,24 +645,32 @@ class AbeStore(Datastore_class):
 
 
 
-from processor import Processor
+from processor import Processor, print_log
 
 class BlockchainProcessor(Processor):
 
-    def __init__(self, config):
+    def __init__(self, config, shared):
         Processor.__init__(self)
         self.store = AbeStore(config)
-        self.block_number = -1
         self.watched_addresses = []
+        self.shared = shared
 
         # catch_up first
-        n = self.store.main_iteration()
-        print "blockchain: %d blocks"%n
+        self.block_header, time_catch_up, time_mempool, n = self.store.main_iteration()
+        self.block_number = self.block_header.get('block_height')
+        print_log ("blockchain: %d blocks"%self.block_number)
 
         threading.Timer(10, self.run_store_iteration).start()
 
-    def process(self, request):
-        #print "abe process", request
+
+    def add_request(self, request):
+        # See if we can answer it from cache; if not, add it to the queue.
+        # process() returns -1 in cache_only mode when it has no result
+        # available without doing the full lookup.
+        if self.process( request, cache_only = True) == -1:
+            self.queue.put(request)
+
+
+    def process(self, request, cache_only = False):
+        #print_log ("abe process", request)
 
         message_id = request['id']
         method = request['method']
@@ -564,47 +681,77 @@ class BlockchainProcessor(Processor):
         if method == 'blockchain.numblocks.subscribe':
             result = self.block_number
 
+        elif method == 'blockchain.headers.subscribe':
+            result = self.block_header
+
         elif method == 'blockchain.address.subscribe':
             try:
                 address = params[0]
-                result = self.store.get_status(address)
+                result = self.store.get_status(address, cache_only)
                 self.watch_address(address)
             except BaseException, e:
                 error = str(e) + ': ' + address
-                print "error:", error
+                print_log ("error:", error)
 
         elif method == 'blockchain.address.get_history':
             try:
                 address = params[0]
-                result = self.store.get_history( address ) 
+                result = self.store.get_history( address, cache_only )
             except BaseException, e:
                 error = str(e) + ': ' + address
-                print "error:", error
+                print_log ("error:", error)
 
         elif method == 'blockchain.block.get_header':
-            try:
-                height = params[0]
-                result = self.store.get_block_header( height ) 
-            except BaseException, e:
-                error = str(e) + ': %d'% height
-                print "error:", error
-
+            if cache_only: 
+                result = -1
+            else:
+                try:
+                    height = params[0]
+                    result = self.store.get_block_header( height ) 
+                except BaseException, e:
+                    error = str(e) + ': %d'% height
+                    print_log ("error:", error)
+                    
+        elif method == 'blockchain.block.get_chunk':
+            if cache_only:
+                result = -1
+            else:
+                try:
+                    index = params[0]
+                    result = self.store.get_chunk( index ) 
+                except BaseException, e:
+                    error = str(e) + ': %d'% index
+                    print_log ("error:", error)
+                    
         elif method == 'blockchain.transaction.broadcast':
             txo = self.store.send_tx(params[0])
-            print "sent tx:", txo
+            print_log ("sent tx:", txo)
             result = txo 
 
         elif method == 'blockchain.transaction.get_merkle':
+            if cache_only:
+                result = -1
+            else:
+                try:
+                    tx_hash = params[0]
+                    result = self.store.get_tx_merkle(tx_hash ) 
+                except BaseException, e:
+                    error = str(e) + ': ' + tx_hash
+                    print_log ("error:", error)
+                    
+        elif method == 'blockchain.transaction.get':
             try:
                 tx_hash = params[0]
-                result = self.store.get_tx_merkle(tx_hash ) 
+                height = params[1]
+                result = self.store.get_raw_tx(tx_hash, height ) 
             except BaseException, e:
                 error = str(e) + ': ' + tx_hash
-                print "error:", error
+                print_log ("error:", error)
 
         else:
             error = "unknown method:%s"%method
 
+        if cache_only and result == -1: return -1
 
         if error:
             response = { 'id':message_id, 'error':error }
@@ -622,29 +769,39 @@ class BlockchainProcessor(Processor):
     def run_store_iteration(self):
         
         try:
-            block_number = self.store.main_iteration()
+            block_header, time_catch_up, time_mempool, n = self.store.main_iteration()
         except:
             traceback.print_exc(file=sys.stdout)
-            print "terminating"
+            print_log ("terminating")
             self.shared.stop()
 
         if self.shared.stopped(): 
-            print "exit timer"
+            print_log ("exit timer")
             return
 
-        if self.block_number != block_number:
-            self.block_number = block_number
-            print "block number:", self.block_number
+        #print_log ("block number: %d  (%.3fs)  mempool:%d (%.3fs)"%(self.block_number, time_catch_up, n, time_mempool))
+
+        if self.block_number != block_header.get('block_height'):
+            self.block_number = block_header.get('block_height')
+            print_log ("block number: %d  (%.3fs)"%(self.block_number, time_catch_up))
             self.push_response({ 'id': None, 'method':'blockchain.numblocks.subscribe', 'params':[self.block_number] })
 
+        if self.block_header != block_header:
+            self.block_header = block_header
+            self.push_response({ 'id': None, 'method':'blockchain.headers.subscribe', 'params':[self.block_header] })
+
+
         while True:
             try:
                 addr = self.store.address_queue.get(False)
             except:
                 break
             if addr in self.watched_addresses:
-                status = self.store.get_status( addr )
-                self.push_response({ 'id': None, 'method':'blockchain.address.subscribe', 'params':[addr, status] })
+                try:
+                    status = self.store.get_status( addr )
+                    self.push_response({ 'id': None, 'method':'blockchain.address.subscribe', 'params':[addr, status] })
+                except:
+                    break
 
         threading.Timer(10, self.run_store_iteration).start()