fixed bug in tail ranking where output was essentially reversed
[p2pool.git] / p2pool / data.py
1 from __future__ import division
2
3 import itertools
4 import random
5 import time
6 import os
7
8 from twisted.python import log
9
10 import p2pool
11 from p2pool import skiplists
12 from p2pool.bitcoin import data as bitcoin_data, script
13 from p2pool.util import memoize, expiring_dict, math, forest
14
15
# Serialization schemas for shares, built from the bitcoin_data type combinators.
# Instances are used below via .pack() / .unpack() / .hash256().

# Fields of a share that generate_transaction() and Share.__init__() read directly.
# - donation is weighed against 65535 in generate_transaction().
# - stale_frac == 255 is decoded as None by Share.__init__(); any other value is divided by 254.
share_data_type = bitcoin_data.ComposedType([
    ('previous_share_hash', bitcoin_data.PossiblyNoneType(0, bitcoin_data.HashType())),
    ('coinbase', bitcoin_data.VarStrType()),
    ('nonce', bitcoin_data.VarStrType()),
    ('new_script', bitcoin_data.VarStrType()),
    ('subsidy', bitcoin_data.StructType('<Q')),
    ('donation', bitcoin_data.StructType('<H')),
    ('stale_frac', bitcoin_data.StructType('<B')),
])

# share_data plus the target and timestamp computed by generate_transaction().
# The hash256 of this structure is embedded in the first output of the generation transaction.
share_info_type = bitcoin_data.ComposedType([
    ('share_data', share_data_type),
    ('target', bitcoin_data.FloatingIntegerType()),
    ('timestamp', bitcoin_data.StructType('<I')),
])

# Share carried with a merkle branch instead of the full transaction list.
# Share.hash is always computed over this form.
share1a_type = bitcoin_data.ComposedType([
    ('header', bitcoin_data.block_header_type),
    ('share_info', share_info_type),
    ('merkle_branch', bitcoin_data.merkle_branch_type),
])

# Share carried with every non-generation transaction (enough to rebuild a block).
share1b_type = bitcoin_data.ComposedType([
    ('header', bitcoin_data.block_header_type),
    ('share_info', share_info_type),
    ('other_txs', bitcoin_data.ListType(bitcoin_data.tx_type)),
])

# type:
# 0: share1a - Share.from_share() requires pow_hash >  header['target']
# 1: share1b - Share.from_share() requires pow_hash <= header['target']

# Envelope: a type tag followed by the packed share1a/share1b contents.
share_type = bitcoin_data.ComposedType([
    ('type', bitcoin_data.VarIntType()),
    ('contents', bitcoin_data.VarStrType()),
])
52
class Share(object):
    """A share: a block header together with the share_info it commits to.

    Construction validates field sizes, the merkle branch length, the proof
    of work against the share target and the sigop count of new_script (see
    __init__).  Consistency with the rest of the share chain is checked
    separately by check().
    """
    __slots__ = 'header previous_block share_info merkle_branch other_txs timestamp share_data new_script subsidy previous_hash previous_share_hash target nonce pow_hash header_hash hash time_seen peer donation stale_frac'.split(' ')

    @classmethod
    def from_share(cls, share, net):
        """Build a Share from an unpacked share_type dict.

        Type 0 contents are decoded as share1a and must NOT meet the header
        target; type 1 contents are decoded as share1b and MUST meet it.

        Raises ValueError for an unknown type, or when the proof of work does
        not match what the declared type requires.
        """
        if share['type'] == 0:
            res = cls.from_share1a(share1a_type.unpack(share['contents']), net)
            if not (res.pow_hash > res.header['target']):
                raise ValueError('invalid share type')
            return res
        elif share['type'] == 1:
            res = cls.from_share1b(share1b_type.unpack(share['contents']), net)
            if not (res.pow_hash <= res.header['target']):
                raise ValueError('invalid share type')
            return res
        else:
            raise ValueError('unknown share type: %r' % (share['type'],))

    @classmethod
    def from_share1a(cls, share1a, net):
        """Build a Share from an unpacked share1a dict (header, share_info, merkle_branch)."""
        return cls(net, **share1a)

    @classmethod
    def from_share1b(cls, share1b, net):
        """Build a Share from an unpacked share1b dict (header, share_info, other_txs)."""
        return cls(net, **share1b)

    def __init__(self, net, header, share_info, merkle_branch=None, other_txs=None):
        """Validate the share's fields and cache derived values.

        At least one of merkle_branch / other_txs must be given.  When
        other_txs is given, the merkle branch for index 0 is recomputed from
        it (an empty placeholder transaction stands in for the generation
        transaction), and an explicitly supplied merkle_branch must equal the
        recomputed one.

        net must provide BITCOIN_POW_FUNC(header).

        Raises ValueError when neither merkle_branch nor other_txs is given,
        when both are given but disagree, when merkle_branch has more than 16
        entries, when new_script, nonce or coinbase exceed 100 bytes, when
        the proof-of-work hash is above the share target, or when new_script
        contains more than one sigop.
        """
        if merkle_branch is None and other_txs is None:
            raise ValueError('need either merkle_branch or other_txs')
        if other_txs is not None:
            new_merkle_branch = bitcoin_data.calculate_merkle_branch([dict(version=0, tx_ins=[], tx_outs=[], lock_time=0)] + other_txs, 0)
            if merkle_branch is not None:
                # Compare the caller's branch with the one implied by other_txs.
                if merkle_branch != new_merkle_branch:
                    raise ValueError('invalid merkle_branch and other_txs')
            merkle_branch = new_merkle_branch

        if len(merkle_branch) > 16:
            raise ValueError('merkle_branch too long!')

        self.header = header
        self.previous_block = header['previous_block']
        self.share_info = share_info
        self.merkle_branch = merkle_branch
        self.other_txs = other_txs

        self.share_data = self.share_info['share_data']
        self.target = self.share_info['target']
        self.timestamp = self.share_info['timestamp']

        self.new_script = self.share_data['new_script']
        self.subsidy = self.share_data['subsidy']
        self.donation = self.share_data['donation']

        if len(self.new_script) > 100:
            raise ValueError('new_script too long!')

        self.previous_hash = self.previous_share_hash = self.share_data['previous_share_hash']
        self.nonce = self.share_data['nonce']

        if len(self.nonce) > 100:
            raise ValueError('nonce too long!')

        if len(self.share_data['coinbase']) > 100:
            raise ValueError('''coinbase too large! %i bytes''' % (len(self.share_data['coinbase']),))

        self.pow_hash = net.BITCOIN_POW_FUNC(header)
        self.header_hash = bitcoin_data.block_header_type.hash256(header)

        # The share's identity is always the hash of its share1a form, even
        # when it was received as (or will be sent as) share1b.
        self.hash = share1a_type.hash256(self.as_share1a())

        if self.pow_hash > self.target:
            print('hash %x' % self.pow_hash)
            print('targ %x' % self.target)
            raise ValueError('not enough work!')

        if script.get_sigop_count(self.new_script) > 1:
            raise ValueError('too many sigops!')

        # 255 is the "unknown" marker; other values are a fraction out of 254.
        self.stale_frac = self.share_data['stale_frac']/254 if self.share_data['stale_frac'] != 255 else None

        # XXX eww
        self.time_seen = time.time()
        self.peer = None

    def __repr__(self):
        return '<Share %s>' % (' '.join('%s=%r' % (k, getattr(self, k)) for k in self.__slots__),)

    def check(self, tracker, now, net):
        """Verify this share against the share chain held by tracker.

        Regenerates share_info and the generation transaction with
        generate_transaction() and requires that the regenerated share_info
        equals the stored one and that the generation transaction hashes up
        to the header's merkle root through merkle_branch.

        now is accepted but not used by this method.

        Raises ValueError on either mismatch.
        """
        share_info, gentx = generate_transaction(tracker, self.share_info['share_data'], self.header['target'], self.share_info['timestamp'], net)
        if share_info != self.share_info:
            raise ValueError('share difficulty invalid')

        if bitcoin_data.check_merkle_branch(gentx, 0, self.merkle_branch) != self.header['merkle_root']:
            raise ValueError('''gentx doesn't match header via merkle_branch''')

    def as_share(self):
        """Return the share_type dict for this share.

        Shares that do not meet the header target are packed as share1a
        (type 0); shares that do are packed as share1b (type 1), which
        requires other_txs to be present.
        """
        if self.pow_hash > self.header['target']: # share1a
            return dict(type=0, contents=share1a_type.pack(self.as_share1a()))
        elif self.pow_hash <= self.header['target']: # share1b
            return dict(type=1, contents=share1b_type.pack(self.as_share1b()))
        else:
            raise AssertionError()

    def as_share1a(self):
        """Return the share1a dict (header, share_info, merkle_branch)."""
        return dict(header=self.header, share_info=self.share_info, merkle_branch=self.merkle_branch)

    def as_share1b(self):
        """Return the share1b dict (header, share_info, other_txs).

        Raises ValueError when the share was built without other_txs.
        """
        if self.other_txs is None:
            raise ValueError('share does not contain all txs')

        return dict(header=self.header, share_info=self.share_info, other_txs=self.other_txs)

    def as_block(self, tracker, net):
        """Return a dict(header=..., txs=...) with the regenerated generation
        transaction followed by other_txs.

        Raises ValueError when the share was built without other_txs.
        """
        if self.other_txs is None:
            raise ValueError('share does not contain all txs')

        share_info, gentx = generate_transaction(tracker, self.share_info['share_data'], self.header['target'], self.share_info['timestamp'], net)
        assert share_info == self.share_info

        return dict(header=self.header, txs=[gentx] + self.other_txs)
173
def get_pool_attempts_per_second(tracker, previous_share_hash, dist):
    """Estimate the pool's hash attempts per second.

    The estimate is the work difference between the share at
    previous_share_hash and its (dist - 1)th ancestor, floor-divided by the
    difference of their timestamps.  A zero timestamp difference is treated
    as one second to avoid dividing by zero.
    """
    newest = tracker.shares[previous_share_hash]
    oldest_hash = tracker.get_nth_parent_hash(previous_share_hash, dist - 1)
    oldest = tracker.shares[oldest_hash]
    work_done = tracker.get_work(newest.hash) - tracker.get_work(oldest.hash)
    elapsed = (newest.timestamp - oldest.timestamp) or 1
    return work_done // elapsed
182
def generate_transaction(tracker, share_data, block_target, desired_timestamp, net):
    """Compute the share_info and generation transaction for a share.

    tracker supplies the share chain that share_data['previous_share_hash']
    refers to; net supplies the chain parameters read below
    (REAL_CHAIN_LENGTH or REAL_CHAIN_LENGTH_FUNC, TARGET_LOOKBEHIND,
    MAX_TARGET, SHARE_PERIOD, SPREAD).

    Returns (share_info, gentx): share_info is a dict with share_data, the
    computed target and the (possibly clipped) timestamp; gentx is a
    transaction dict whose first output commits to the hash of share_info
    and whose remaining outputs pay out the subsidy.

    Raises ValueError if the coinbase is longer than 100 bytes or if the
    computed payouts do not sum to the subsidy or include a negative amount.
    Several invariants are checked with assert.
    """
    previous_share_hash = share_data['previous_share_hash']
    new_script = share_data['new_script']
    subsidy = share_data['subsidy']
    donation = share_data['donation']
    assert 0 <= donation <= 65535

    if len(share_data['coinbase']) > 100:
        raise ValueError('coinbase too long!')

    previous_share = tracker.shares[previous_share_hash] if previous_share_hash is not None else None

    # Use net.REAL_CHAIN_LENGTH_FUNC(previous timestamp) when the network defines it,
    # otherwise the constant net.REAL_CHAIN_LENGTH.
    chain_length = getattr(net, 'REAL_CHAIN_LENGTH_FUNC', lambda _: net.REAL_CHAIN_LENGTH)(previous_share.timestamp if previous_share is not None else None)

    height, last = tracker.get_height_and_last(previous_share_hash)
    assert height >= chain_length or last is None
    if height < net.TARGET_LOOKBEHIND:
        # Not enough history to estimate the pool rate: use the maximum target.
        target = bitcoin_data.FloatingInteger.from_target_upper_bound(net.MAX_TARGET)
    else:
        # Target that would yield one share per SHARE_PERIOD at the measured rate,
        # limited to 9/10..11/10 of the previous share's target and to [0, MAX_TARGET].
        attempts_per_second = get_pool_attempts_per_second(tracker, previous_share_hash, net.TARGET_LOOKBEHIND)
        pre_target = 2**256//(net.SHARE_PERIOD*attempts_per_second) - 1
        pre_target2 = math.clip(pre_target, (previous_share.target*9//10, previous_share.target*11//10))
        pre_target3 = math.clip(pre_target2, (0, net.MAX_TARGET))
        target = bitcoin_data.FloatingInteger.from_target_upper_bound(pre_target3)

    attempts_to_block = bitcoin_data.target_to_average_attempts(block_target)
    max_att = net.SPREAD * attempts_to_block

    # Weight of this share (capped at max_att) plus the cumulative weights of earlier shares;
    # all weights are scaled by 65535 so the donation fraction stays integral.
    this_att = min(bitcoin_data.target_to_average_attempts(target), max_att)
    other_weights, other_total_weight, other_donation_weight = tracker.get_cumulative_weights(previous_share_hash, min(height, chain_length), 65535*max(0, max_att - this_att))
    assert other_total_weight == sum(other_weights.itervalues()) + other_donation_weight, (other_total_weight, sum(other_weights.itervalues()) + other_donation_weight)
    weights, total_weight, donation_weight = math.add_dicts([{new_script: this_att*(65535-donation)}, other_weights]), this_att*65535 + other_total_weight, this_att*donation + other_donation_weight
    assert total_weight == sum(weights.itervalues()) + donation_weight, (total_weight, sum(weights.itervalues()) + donation_weight)

    # Output script that receives donations and rounding leftovers.
    SCRIPT = '4104ffd03de44a6e11b9917f3a29f9443283d9871c9d743ef30d5eddcd37094b64d1b3d8090496b53256786bf5c82932ec23c3b74d9f05a6f95a8b5529352656664bac'.decode('hex')

    # 1 satoshi is always donated so that a list of p2pool generated blocks can be easily found by looking at the donation address
    # 199/200 of (subsidy - 1) is split by weight, 1/200 goes to this share's new_script,
    # and the donation weight's portion plus whatever integer division left over goes to SCRIPT.
    amounts = dict((script, (subsidy-1)*(199*weight)//(200*total_weight)) for (script, weight) in weights.iteritems())
    amounts[new_script] = amounts.get(new_script, 0) + (subsidy-1)//200
    amounts[SCRIPT] = amounts.get(SCRIPT, 0) + (subsidy-1)*(199*donation_weight)//(200*total_weight)
    amounts[SCRIPT] = amounts.get(SCRIPT, 0) + subsidy - sum(amounts.itervalues()) # collect any extra satoshis :P

    if sum(amounts.itervalues()) != subsidy:
        raise ValueError()
    if any(x < 0 for x in amounts.itervalues()):
        raise ValueError()

    # Ascending by (amount, script); keeping the tail keeps the largest payouts.
    dests = sorted(amounts.iterkeys(), key=lambda script: (amounts[script], script))
    dests = dests[-4000:] # block length limit, unlikely to ever be hit

    share_info = dict(
        share_data=share_data,
        target=target,
        # The timestamp may differ from the previous share's by at most 60 in either direction.
        timestamp=math.clip(desired_timestamp, (previous_share.timestamp - 60, previous_share.timestamp + 60)) if previous_share is not None else desired_timestamp,
    )

    return share_info, dict(
        version=1,
        tx_ins=[dict(
            previous_output=None,
            sequence=None,
            # The coinbase script is padded with NUL bytes to at least 2 bytes.
            script=share_data['coinbase'].ljust(2, '\x00'),
        )],
        # First output: zero value, script is '\x20' followed by the packed hash of share_info.
        # Remaining outputs: one per destination with a non-zero amount.
        tx_outs=[dict(value=0, script='\x20' + bitcoin_data.HashType().pack(share_info_type.hash256(share_info)))] + [dict(value=amounts[script], script=script) for script in dests if amounts[script]],
        lock_time=0,
    )
249
250
251 class OkayTracker(forest.Tracker):
252     def __init__(self, net):
253         forest.Tracker.__init__(self)
254         self.net = net
255         self.verified = forest.Tracker()
256         self.verified.get_nth_parent_hash = self.get_nth_parent_hash # self is a superset of self.verified
257         
258         self.get_cumulative_weights = skiplists.WeightsSkipList(self)
259     
260     def attempt_verify(self, share, now):
261         if share.hash in self.verified.shares:
262             return True
263         height, last = self.get_height_and_last(share.hash)
264         if height < self.net.CHAIN_LENGTH + 1 and last is not None:
265             raise AssertionError()
266         try:
267             share.check(self, now, self.net)
268         except:
269             log.err(None, 'Share check failed:')
270             return False
271         else:
272             self.verified.add(share)
273             return True
274     
275     def think(self, ht, previous_block, now):
276         desired = set()
277         
278         # O(len(self.heads))
279         #   make 'unverified heads' set?
280         # for each overall head, attempt verification
281         # if it fails, attempt on parent, and repeat
282         # if no successful verification because of lack of parents, request parent
283         bads = set()
284         for head in set(self.heads) - set(self.verified.heads):
285             head_height, last = self.get_height_and_last(head)
286             
287             for share in itertools.islice(self.get_chain_known(head), None if last is None else min(5, max(0, head_height - self.net.CHAIN_LENGTH))):
288                 if self.attempt_verify(share, now):
289                     break
290                 if share.hash in self.heads:
291                     bads.add(share.hash)
292             else:
293                 if last is not None:
294                     desired.add((self.shares[random.choice(list(self.reverse_shares[last]))].peer, last))
295         for bad in bads:
296             assert bad not in self.verified.shares
297             assert bad in self.heads
298             if p2pool.DEBUG:
299                 print "BAD", bad
300             self.remove(bad)
301         
302         # try to get at least CHAIN_LENGTH height for each verified head, requesting parents if needed
303         for head in list(self.verified.heads):
304             head_height, last_hash = self.verified.get_height_and_last(head)
305             last_height, last_last_hash = self.get_height_and_last(last_hash)
306             # XXX review boundary conditions
307             want = max(self.net.CHAIN_LENGTH - head_height, 0)
308             can = max(last_height - 1 - self.net.CHAIN_LENGTH, 0) if last_last_hash is not None else last_height
309             get = min(want, can)
310             #print 'Z', head_height, last_hash is None, last_height, last_last_hash is None, want, can, get
311             for share in itertools.islice(self.get_chain_known(last_hash), get):
312                 if not self.attempt_verify(share, now):
313                     break
314             if head_height < self.net.CHAIN_LENGTH and last_last_hash is not None:
315                 desired.add((self.verified.shares[random.choice(list(self.verified.reverse_shares[last_hash]))].peer, last_last_hash))
316         if p2pool.DEBUG:
317             print len(self.verified.tails), "tails:"
318             for x in self.verified.tails:
319                 print format_hash(x), self.score(max(self.verified.tails[x], key=self.verified.get_height), ht)
320         
321         # decide best tree
322         best_tail = max(self.verified.tails, key=lambda h: self.score(max(self.verified.tails[h], key=self.verified.get_height), ht)) if self.verified.tails else None
323         # decide best verified head
324         scores = sorted(self.verified.tails.get(best_tail, []), key=lambda h: (
325             self.verified.get_work(self.verified.get_nth_parent_hash(h, min(5, self.verified.get_height(h)))),
326             #self.verified.shares[h].peer is None,
327             ht.get_min_height(self.verified.shares[h].previous_block),
328             -self.verified.shares[h].time_seen
329         ))
330         
331         
332         if p2pool.DEBUG:
333             print len(self.verified.tails), "chain tails and", len(self.verified.tails.get(best_tail, [])), 'chain heads. Top 10 heads:'
334             if len(scores) > 10:
335                 print '    ...'
336             for h in scores[-10:]:
337                 print '   ', format_hash(h), format_hash(self.verified.shares[h].previous_hash), (
338                     self.verified.get_work(self.verified.get_nth_parent_hash(h, min(5, self.verified.get_height(h)))),
339                     self.verified.shares[h].peer is None,
340                     ht.get_min_height(self.verified.shares[h].previous_block),
341                     -self.verified.shares[h].time_seen
342                 )
343         
344         # eat away at heads
345         if scores:
346             for i in xrange(1000):
347                 to_remove = set()
348                 for share_hash, tail in self.heads.iteritems():
349                     if share_hash in scores[-5:]:
350                         #print 1
351                         continue
352                     if self.shares[share_hash].time_seen > time.time() - 300:
353                         #print 2
354                         continue
355                     if share_hash not in self.verified.shares and max(self.shares[after_tail_hash].time_seen for after_tail_hash in self.reverse_shares.get(tail)) > time.time() - 120: # XXX stupid
356                         #print 3
357                         continue
358                     to_remove.add(share_hash)
359                 if not to_remove:
360                     break
361                 for share_hash in to_remove:
362                     self.remove(share_hash)
363                     if share_hash in self.verified.shares:
364                         self.verified.remove(share_hash)
365                 #print "_________", to_remove
366         
367         # drop tails
368         for i in xrange(1000):
369             to_remove = set()
370             for tail, heads in self.tails.iteritems():
371                 if min(self.get_height(head) for head in heads) < 2*self.net.CHAIN_LENGTH + 10:
372                     continue
373                 for aftertail in self.reverse_shares.get(tail, set()):
374                     if len(self.reverse_shares[self.shares[aftertail].previous_hash]) > 1: # XXX
375                         print "raw"
376                         continue
377                     to_remove.add(aftertail)
378             if not to_remove:
379                 break
380             # if removed from this, it must be removed from verified
381             #start = time.time()
382             for aftertail in to_remove:
383                 if self.shares[aftertail].previous_hash not in self.tails:
384                     print "erk", aftertail, self.shares[aftertail].previous_hash
385                     continue
386                 self.remove(aftertail)
387                 if aftertail in self.verified.shares:
388                     self.verified.remove(aftertail)
389             #end = time.time()
390             #print "removed! %i %f" % (len(to_remove), (end - start)/len(to_remove))
391         
392         best = scores[-1] if scores else None
393         
394         if best is not None:
395             best_share = self.verified.shares[best]
396             if ht.get_min_height(best_share.header['previous_block']) < ht.get_min_height(previous_block) and best_share.header_hash != previous_block and best_share.peer is not None:
397                 if p2pool.DEBUG:
398                     print 'Stale detected! %x < %x' % (best_share.header['previous_block'], previous_block)
399                 best = best_share.previous_hash
400         
401         return best, desired
402     
403     @memoize.memoize_with_backing(expiring_dict.ExpiringDict(5, get_touches=False))
404     def score(self, share_hash, ht):
405         head_height, last = self.verified.get_height_and_last(share_hash)
406         score2 = 0
407         block_height = 0
408         max_height = min(self.net.CHAIN_LENGTH, head_height)
409         for share in reversed(list(itertools.islice(self.verified.get_chain_known(self.verified.get_nth_parent_hash(share_hash, max_height//2)), max_height//2))):
410             block_height = max(block_height, ht.get_min_height(share.header['previous_block']))
411             this_score = (self.verified.get_work(share_hash) - self.verified.get_work(share.hash))//(ht.get_highest_height() - block_height + 1)
412             if this_score > score2:
413                 score2 = this_score
414         return min(head_height, self.net.CHAIN_LENGTH), score2
415
def format_hash(x):
    """Return the low 32 bits of hash x as 8 hex digits, or 'xxxxxxxx' for None."""
    return 'xxxxxxxx' if x is None else '%08x' % (x % 2**32)
420
class ShareStore(object):
    """On-disk store of shares and verified-share hashes.

    Records are appended one per line, as "<type_id> <hex data>", to files
    named <prefix><N> (N a decimal counter) in the prefix's directory.
    self.known tracks, per file, which share hashes and verified hashes it
    still holds, so a file can be deleted once everything in it has been
    forgotten.
    """

    def __init__(self, prefix, net):
        abs_prefix = os.path.abspath(prefix)
        self.dirname = os.path.dirname(abs_prefix)
        self.filename = os.path.basename(abs_prefix)
        self.net = net
        self.known = None # will be filename -> set of share hashes, set of verified hashes

    def get_shares(self):
        """Generator over all stored records.

        Yields ('verified_hash', int) for type 2 records and ('share', Share)
        for type 5 records; types 0 and 1 are recognised but skipped.  A line
        that fails to parse is logged and skipped.  self.known is populated
        only after the generator has been fully consumed.

        Raises AssertionError if self.known has already been populated.
        """
        if self.known is not None:
            raise AssertionError()
        known = {}
        filenames, _ = self.get_filenames_and_next()
        for filename in filenames:
            share_hashes, verified_hashes = known.setdefault(filename, (set(), set()))
            with open(filename, 'rb') as f:
                for line in f:
                    try:
                        type_id_str, data_hex = line.strip().split(' ')
                        type_id = int(type_id_str)
                        if type_id == 0:
                            pass
                        elif type_id == 1:
                            pass
                        elif type_id == 2:
                            verified_hash = int(data_hex, 16)
                            yield 'verified_hash', verified_hash
                            verified_hashes.add(verified_hash)
                        elif type_id == 5:
                            share = Share.from_share(share_type.unpack(data_hex.decode('hex')), self.net)
                            yield 'share', share
                            share_hashes.add(share.hash)
                        else:
                            raise NotImplementedError("share type %i" % (type_id,))
                    except Exception:
                        log.err(None, "Error while reading saved shares, continuing where left off:")
        self.known = known

    def _add_line(self, line):
        """Append line to the newest file, starting a new file once the
        newest one reaches 10e6 bytes.  Returns the file name written to."""
        filenames, next_filename = self.get_filenames_and_next()
        if filenames and os.path.getsize(filenames[-1]) < 10e6:
            filename = filenames[-1]
        else:
            filename = next_filename

        with open(filename, 'ab') as f:
            f.write(line + '\n')

        return filename

    def add_share(self, share):
        """Persist share as a type 5 record and remember which file holds it."""
        type_id, data = 5, share_type.pack(share.as_share())
        filename = self._add_line("%i %s" % (type_id, data.encode('hex')))
        share_hashes, verified_hashes = self.known.setdefault(filename, (set(), set()))
        share_hashes.add(share.hash)

    def add_verified_hash(self, share_hash):
        """Persist share_hash as a type 2 record and remember which file holds it."""
        filename = self._add_line("%i %x" % (2, share_hash))
        share_hashes, verified_hashes = self.known.setdefault(filename, (set(), set()))
        verified_hashes.add(share_hash)

    def get_filenames_and_next(self):
        """Return (existing store files ordered by numeric suffix, path of the next file to create)."""
        prefix_len = len(self.filename)
        suffixes = sorted(int(x[prefix_len:]) for x in os.listdir(self.dirname) if x.startswith(self.filename) and x[prefix_len:].isdigit())
        next_suffix = suffixes[-1] + 1 if suffixes else 0
        existing = [os.path.join(self.dirname, self.filename + str(suffix)) for suffix in suffixes]
        return existing, os.path.join(self.dirname, self.filename + str(next_suffix))

    def forget_share(self, share_hash):
        """Stop tracking share_hash as a stored share, then delete any emptied files."""
        for share_hashes, verified_hashes in self.known.itervalues():
            share_hashes.discard(share_hash)
        self.check_remove()

    def forget_verified_share(self, share_hash):
        """Stop tracking share_hash as a stored verified hash, then delete any emptied files."""
        for share_hashes, verified_hashes in self.known.itervalues():
            verified_hashes.discard(share_hash)
        self.check_remove()

    def check_remove(self):
        """Delete every file that no longer holds any tracked share or verified hash."""
        to_remove = set()
        for filename, (share_hashes, verified_hashes) in self.known.iteritems():
            #print filename, len(share_hashes) + len(verified_hashes)
            if not share_hashes and not verified_hashes:
                to_remove.add(filename)
        for filename in to_remove:
            self.known.pop(filename)
            os.remove(filename)
            print("REMOVED %s" % (filename,))