Implement reorg logic

parent 76748d2673
commit 5c63cd40de

query.py (20 changed lines)
@@ -11,11 +11,31 @@ from server.block_processor import BlockProcessor
from lib.hash import hash_to_str


def count_entries(db):
    utxos = 0
    for key in db.iterator(prefix=b'u', include_value=False):
        utxos += 1
    print("UTXO count:", utxos)

    hash168 = 0
    for key in db.iterator(prefix=b'h', include_value=False):
        hash168 += 1
    print("Hash168 count:", hash168)

    hist = 0
    for key in db.iterator(prefix=b'H', include_value=False):
        hist += 1
    print("History addresses:", hist)


def main():
    env = Env()
    coin = env.coin
    os.chdir(env.db_dir)
    bp = BlockProcessor(env, None)
    if len(sys.argv) == 1:
        count_entries(bp.db)
        return
    argc = 1
    try:
        limit = int(sys.argv[argc])
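
The three counting loops above differ only in the key prefix they scan: b'u' for UTXOs, b'h' for the hash168 lookup table and b'H' for history, matching the keys written elsewhere in this commit. A hedged sketch of a reusable helper doing the same count; the function name and the example database path are illustrative, not part of the commit:

import plyvel

def count_prefix(db, prefix):
    '''Count the keys in an open plyvel DB that start with the given prefix.'''
    return sum(1 for _ in db.iterator(prefix=prefix, include_value=False))

# Usage sketch against an existing database directory:
# db = plyvel.DB('Bitcoin-mainnet')
# print('UTXO count:', count_prefix(db, b'u'))
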

server/block_processor.py

@@ -6,15 +6,17 @@ import ast
import asyncio
import struct
import time
from bisect import bisect_left
from collections import defaultdict, namedtuple
from functools import partial

import plyvel

from server.cache import FSCache, UTXOCache
from server.cache import FSCache, UTXOCache, NO_CACHE_ENTRY
from server.daemon import DaemonError
from lib.hash import hash_to_str
from lib.util import LoggedClass
from lib.script import ScriptPubKey
from lib.util import chunks, LoggedClass


def formatted_time(t):
@@ -124,24 +126,28 @@ class BlockProcessor(LoggedClass):
        self.next_cache_check = 0
        self.last_flush = time.time()
        self.coin = env.coin
        self.caught_up = False
        self.reorg_limit = env.reorg_limit

        # Chain state (initialize to genesis in case of new DB)
        self.db_height = -1
        self.db_tx_count = 0
        self.db_tip = b'\0' * 32
        self.flush_count = 0
        self.utxo_flush_count = 0
        self.wall_time = 0
        self.tip = b'\0' * 32

        # Open DB and metadata files. Record some of its state.
        self.db = self.open_db(self.coin)
        self.tx_count = self.db_tx_count
        self.height = self.db_height
        self.tip = self.db_tip

        # Caches to be flushed later. Headers and tx_hashes have one
        # entry per block
        self.history = defaultdict(partial(array.array, 'I'))
        self.history_size = 0
        self.backup_hash168s = set()
        self.utxo_cache = UTXOCache(self, self.db, self.coin)
        self.fs_cache = FSCache(self.coin, self.height, self.tx_count)
        self.prefetcher = Prefetcher(daemon, self.height)
@@ -157,13 +163,20 @@ class BlockProcessor(LoggedClass):
                                 self.tx_count, self.flush_count,
                                 self.utxo_flush_count,
                                 formatted_time(self.wall_time)))
        self.logger.info('reorg limit of {:,d} blocks'
                         .format(self.reorg_limit))
        self.logger.info('flushing UTXO cache at {:,d} MB'
                         .format(self.utxo_MB))
        self.logger.info('flushing history cache at {:,d} MB'
                         .format(self.hist_MB))

    def coros(self):
        return [self.start(), self.prefetcher.start()]
        self.clean_db()

    def coros(self, force_backup=False):
        if force_backup:
            return [self.force_chain_reorg(True), self.prefetcher.start()]
        else:
            return [self.start(), self.prefetcher.start()]

    async def start(self):
        '''External entry point for block processing.
@@ -178,30 +191,49 @@ class BlockProcessor(LoggedClass):

    async def advance_blocks(self):
        '''Loop forever processing blocks in the forward direction.'''
        caught_up = False
        while True:
            blocks = await self.prefetcher.get_blocks()
            for block in blocks:
                if not self.advance_block(block):
                    await self.handle_chain_reorg()
                    caught_up = False
                    self.caught_up = False
                    break
                await asyncio.sleep(0)  # Yield

            if not caught_up and self.height == self.daemon.cached_height():
                caught_up = True
            if self.height != self.daemon.cached_height():
                continue

            if not self.caught_up:
                self.caught_up = True
                self.logger.info('caught up to height {:,d}'
                                 .format(self.height))

    async def handle_chain_reorg(self):
        hashes = await self.reorg_hashes(self)
        hex_hashes = [hash_to_str(hash) for hash in hashes]
        blocks = await self.daemon.raw_blocks(hex_hashes)
        for block in reversed(blocks):
            self.backup_block(block)
        await self.prefetcher.clear()
        # Flush everything when in caught-up state as queries
        # are performed on DB not in-memory
        self.flush(True)

    async def reorg_hashes(self):
    async def force_chain_reorg(self, to_genesis):
        try:
            await self.handle_chain_reorg(to_genesis)
        finally:
            self.flush(True)

    async def handle_chain_reorg(self, to_genesis=False):
        # First get all state on disk
        self.logger.info('chain reorg detected')
        self.flush(True)
        self.logger.info('finding common height...')
        hashes = await self.reorg_hashes(to_genesis)
        # Reverse and convert to hex strings.
        hashes = [hash_to_str(hash) for hash in reversed(hashes)]
        for hex_hashes in chunks(hashes, 50):
            blocks = await self.daemon.raw_blocks(hex_hashes)
            self.backup_blocks(blocks)
        self.logger.info('backed up to height {:,d}'.format(self.height))
        await self.prefetcher.clear(self.height)
        self.logger.info('prefetcher reset')

    async def reorg_hashes(self, to_genesis):
        '''Return the list of hashes to back up beacuse of a reorg.

        The hashes are returned in order of increasing height.'''
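
handle_chain_reorg above fetches the raw blocks to unwind in batches of 50 using chunks from lib.util. That helper is presumably a simple fixed-size slicer along these lines (a sketch, not the library's actual code):

def chunks(items, size):
    '''Yield successive slices of items, each at most size elements long.'''
    for i in range(0, len(items), size):
        yield items[i:i + size]

# e.g. list(chunks([1, 2, 3, 4, 5], 2)) == [[1, 2], [3, 4], [5]]
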
@@ -211,27 +243,26 @@ class BlockProcessor(LoggedClass):
                    return n
            return -1

        self.logger.info('chain reorg detected; finding common height...')

        start = self.height - 1
        count = 1
        while True:
        while start > 0:
            self.logger.info('start: {:,d} count: {:,d}'.format(start, count))
            hashes = self.fs_cache.block_hashes(start, count)
            hex_hashes = [hash_to_str(hash) for hash in hashes]
            d_hex_hashes = await self.daemon.block_hex_hashes(start, count)
            d_hashes = [bytes.fromhex(hex_hash) for hex_hash in d_hex_hashes]
            n = match_pos(hashes, d_hashes)
            if n >= 0:
            n = match_pos(hex_hashes, d_hex_hashes)
            if n >= 0 and not to_genesis:
                start += n + 1
                break
            assert start > 0
            count = min(count * 2, start)
            start -= count

        # Hashes differ from height 'start'
        start += n + 1
        count = (self.height - start) + 1

        self.logger.info('chain was reorganised for {:,d} blocks starting '
                         'at height {:,d}', start, count)
        self.logger.info('chain was reorganised for {:,d} blocks from '
                         'height {:,d} to height {:,d}'
                         .format(count, start, start + count - 1))

        return self.fs_cache.block_hashes(start, count)
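
The loop above looks for the most recent height at which our stored block hashes still agree with the daemon's, starting one block below the tip and doubling the look-back window each time no match is found. A self-contained sketch of that search, under the assumption that the two chains share the genesis block; match_pos here is a simplified stand-in, not the exact helper used in the commit:

def find_first_differing_height(our_hashes, their_hashes, tip_height):
    '''Return the lowest height whose block hash differs between the chains.

    our_hashes(start, count) and their_hashes(start, count) each return a
    list of block hashes for heights start .. start + count - 1.
    '''
    def match_pos(a, b):
        # Last index at which the two hash lists agree contiguously from 0.
        n = -1
        for i, (x, y) in enumerate(zip(a, b)):
            if x != y:
                break
            n = i
        return n

    start, count = tip_height - 1, 1
    while start > 0:
        n = match_pos(our_hashes(start, count), their_hashes(start, count))
        if n >= 0:
            return start + n + 1          # chains agree up to start + n
        count = min(count * 2, start)     # widen the window
        start -= count                    # and step further back
    return 0                              # genesis assumed common
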
@@ -244,11 +275,9 @@ class BlockProcessor(LoggedClass):
            db = plyvel.DB(db_name, create_if_missing=True,
                           error_if_exists=True, compression=None)
            self.logger.info('created new database {}'.format(db_name))
            self.flush_state(db)
        else:
            self.logger.info('successfully opened database {}'.format(db_name))
            self.read_state(db)
            self.delete_excess_history(db)

        return db
@@ -261,37 +290,58 @@ class BlockProcessor(LoggedClass):
                                         self.coin.GENESIS_HASH))
        self.db_height = state['height']
        self.db_tx_count = state['tx_count']
        self.tip = state['tip']
        self.db_tip = state['tip']
        self.flush_count = state['flush_count']
        self.utxo_flush_count = state['utxo_flush_count']
        self.wall_time = state['wall_time']

    def delete_excess_history(self, db):
        '''Clear history flushed since the most recent UTXO flush.'''
        utxo_flush_count = self.utxo_flush_count
        diff = self.flush_count - utxo_flush_count
        if diff == 0:
            return
        if diff < 0:
            raise ChainError('DB corrupt: flush_count < utxo_flush_count')
    def clean_db(self):
        '''Clean out stale DB items.

        self.logger.info('DB not shut down cleanly. Scanning for most '
                         'recent {:,d} history flushes'.format(diff))
        Stale DB items are excess history flushed since the most
        recent UTXO flush (only happens on unclean shutdown), and aged
        undo information.
        '''
        if self.flush_count < self.utxo_flush_count:
            raise ChainError('DB corrupt: flush_count < utxo_flush_count')
        with self.db.write_batch(transaction=True) as batch:
            if self.flush_count > self.utxo_flush_count:
                self.logger.info('DB shut down uncleanly. Scanning for '
                                 'excess history flushes...')
                self.remove_excess_history(batch)
                self.utxo_flush_count = self.flush_count
            self.remove_stale_undo_items(batch)
            self.flush_state(batch)

    def remove_excess_history(self, batch):
        prefix = b'H'
        unpack = struct.unpack
        keys = []
        for key, hist in db.iterator(prefix=prefix):
        for key, hist in self.db.iterator(prefix=prefix):
            flush_id, = unpack('>H', key[-2:])
            if flush_id > self.utxo_flush_count:
                keys.append(key)

        self.logger.info('deleting {:,d} history entries'.format(len(keys)))
        with db.write_batch(transaction=True) as batch:
            for key in keys:
                db.delete(key)
            self.utxo_flush_count = self.flush_count
            self.flush_state(batch)
        self.logger.info('deletion complete')
        self.logger.info('deleting {:,d} history entries'
                         .format(len(keys)))
        for key in keys:
            batch.delete(key)

    def remove_stale_undo_items(self, batch):
        prefix = b'U'
        unpack = struct.unpack
        cutoff = self.db_height - self.reorg_limit
        keys = []
        for key, hist in self.db.iterator(prefix=prefix):
            height, = unpack('>I', key[-4:])
            if height > cutoff:
                break
            keys.append(key)

        self.logger.info('deleting {:,d} stale undo entries'
                         .format(len(keys)))
        for key in keys:
            batch.delete(key)

    def flush_state(self, batch):
        '''Flush chain state to the batch.'''
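
clean_db leans on the key layouts used throughout this commit: history rows are keyed b'H' + hash168 + a 2-byte big-endian flush id, and undo blobs are keyed b'U' + a 4-byte big-endian height, so both can be scanned by prefix and filtered on the trailing bytes. A small sketch of building and parsing those keys (helper names are illustrative):

import struct

def history_key(hash168, flush_count):
    '''b'H' + 21-byte hash168 + 2-byte big-endian flush id.'''
    return b'H' + hash168 + struct.pack('>H', flush_count)

def undo_key(height):
    '''b'U' + 4-byte big-endian height.'''
    return b'U' + struct.pack('>I', height)

def flush_id_of(history_db_key):
    flush_id, = struct.unpack('>H', history_db_key[-2:])
    return flush_id

def height_of(undo_db_key):
    height, = struct.unpack('>I', undo_db_key[-4:])
    return height

key = history_key(b'\x00' * 21, 7)
assert flush_id_of(key) == 7
assert height_of(undo_key(421000)) == 421000
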
@@ -302,7 +352,7 @@ class BlockProcessor(LoggedClass):
            'genesis': self.coin.GENESIS_HASH,
            'height': self.db_height,
            'tx_count': self.db_tx_count,
            'tip': self.tip,
            'tip': self.db_tip,
            'flush_count': self.flush_count,
            'utxo_flush_count': self.utxo_flush_count,
            'wall_time': self.wall_time,
@@ -317,63 +367,83 @@ class BlockProcessor(LoggedClass):
        self.utxo_flush_count = self.flush_count
        self.db_tx_count = self.tx_count
        self.db_height = self.height
        self.db_tip = self.tip

    def assert_flushed(self):
        '''Asserts state is fully flushed.'''
        assert self.tx_count == self.db_tx_count
        assert not self.history
        assert not self.utxo_cache.cache
        assert not self.utxo_cache.db_cache
        assert not self.backup_hash168s

    def flush(self, flush_utxos=False):
        '''Flush out cached state.

        History is always flushed. UTXOs are flushed if flush_utxos.'''
        if self.height == self.db_height:
            self.logger.info('nothing to flush')
            self.assert_flushed()
            return

        flush_start = time.time()
        last_flush = self.last_flush
        tx_diff = self.tx_count - self.db_tx_count

        # Write out the files to the FS before flushing to the DB. If
        # the DB transaction fails, the files being too long doesn't
        # matter. But if writing the files fails we do not want to
        # have updated the DB.
        tx_diff = self.fs_cache.flush(self.height, self.tx_count)
        if self.height > self.db_height:
            self.fs_cache.flush(self.height, self.tx_count)

        with self.db.write_batch(transaction=True) as batch:
            # History first - fast and frees memory. Flush state last
            # as it reads the wall time.
            self.flush_history(batch)
            if self.height > self.db_height:
                self.flush_history(batch)
            else:
                self.backup_history(batch)
            if flush_utxos:
                self.flush_utxos(batch)
            self.flush_state(batch)
            self.logger.info('committing transaction...')

        # Update and put the wall time again - otherwise we drop the
        # time it took leveldb to commit the batch
        # time it took to commit the batch
        self.flush_state(self.db)

        flush_time = int(self.last_flush - flush_start)
        self.logger.info('flush #{:,d} to height {:,d} took {:,d}s'
                         .format(self.flush_count, self.height, flush_time))
        self.logger.info('flush #{:,d} to height {:,d} txs: {:,d} took {:,d}s'
                         .format(self.flush_count, self.height, self.tx_count,
                                 flush_time))

        # Log handy stats
        daemon_height = self.daemon.cached_height()
        txs_per_sec = int(self.tx_count / self.wall_time)
        this_txs_per_sec = 1 + int(tx_diff / (self.last_flush - last_flush))
        if self.height > self.coin.TX_COUNT_HEIGHT:
            tx_est = (daemon_height - self.height) * self.coin.TX_PER_BLOCK
        else:
            tx_est = ((daemon_height - self.coin.TX_COUNT_HEIGHT)
                      * self.coin.TX_PER_BLOCK
                      + (self.coin.TX_COUNT - self.tx_count))
        # Catch-up stats
        if not self.caught_up and tx_diff > 0:
            daemon_height = self.daemon.cached_height()
            txs_per_sec = int(self.tx_count / self.wall_time)
            this_txs_per_sec = 1 + int(tx_diff / (self.last_flush - last_flush))
            if self.height > self.coin.TX_COUNT_HEIGHT:
                tx_est = (daemon_height - self.height) * self.coin.TX_PER_BLOCK
            else:
                tx_est = ((daemon_height - self.coin.TX_COUNT_HEIGHT)
                          * self.coin.TX_PER_BLOCK
                          + (self.coin.TX_COUNT - self.tx_count))

        self.logger.info('txs: {:,d} tx/sec since genesis: {:,d}, '
                         'since last flush: {:,d}'
                         .format(self.tx_count, txs_per_sec, this_txs_per_sec))
        self.logger.info('sync time: {} ETA: {}'
                         .format(formatted_time(self.wall_time),
                                 formatted_time(tx_est / this_txs_per_sec)))
            self.logger.info('tx/sec since genesis: {:,d}, '
                             'since last flush: {:,d}'
                             .format(txs_per_sec, this_txs_per_sec))
            self.logger.info('sync time: {} ETA: {}'
                             .format(formatted_time(self.wall_time),
                                     formatted_time(tx_est / this_txs_per_sec)))

    def flush_history(self, batch):
        self.logger.info('flushing history')

        # Drop any None entry
        self.history.pop(None, None)
        assert not self.backup_hash168s

        self.flush_count += 1
        flush_id = struct.pack('>H', self.flush_count)

        for hash168, hist in self.history.items():
            key = b'H' + hash168 + flush_id
            batch.put(key, hist.tobytes())
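
The catch-up statistics above estimate the number of transactions still to index from the coin's TX_COUNT / TX_COUNT_HEIGHT / TX_PER_BLOCK constants and divide by the tx/sec rate seen since the last flush. A worked sketch with made-up constants (the real per-coin values live on the coin class and are not shown in this diff):

# Purely illustrative constants, not the real figures used by the coin class.
TX_COUNT = 150_000_000        # chain-wide tx count measured at TX_COUNT_HEIGHT
TX_COUNT_HEIGHT = 420_000
TX_PER_BLOCK = 1_800          # assumed average above that height

def remaining_txs(height, tx_count, daemon_height):
    '''Rough count of transactions left to index.'''
    if height > TX_COUNT_HEIGHT:
        return (daemon_height - height) * TX_PER_BLOCK
    return ((daemon_height - TX_COUNT_HEIGHT) * TX_PER_BLOCK
            + (TX_COUNT - tx_count))

# ETA in seconds is then remaining_txs(...) / this_txs_per_sec, exactly as
# formatted by formatted_time() in the flush log above.
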
@@ -384,6 +454,39 @@ class BlockProcessor(LoggedClass):
        self.history = defaultdict(partial(array.array, 'I'))
        self.history_size = 0

    def backup_history(self, batch):
        self.logger.info('backing up history to height {:,d} tx_count {:,d}'
                         .format(self.height, self.tx_count))

        # Drop any NO_CACHE entry
        self.backup_hash168s.discard(NO_CACHE_ENTRY)
        assert not self.history

        nremoves = 0
        for hash168 in sorted(self.backup_hash168s):
            prefix = b'H' + hash168
            deletes = []
            puts = {}
            for key, hist in self.db.iterator(reverse=True, prefix=prefix):
                a = array.array('I')
                a.frombytes(hist)
                # Remove all history entries >= self.tx_count
                idx = bisect_left(a, self.tx_count)
                nremoves += len(a) - idx
                if idx > 0:
                    puts[key] = a[:idx].tobytes()
                    break
                deletes.append(key)

            for key in deletes:
                batch.delete(key)
            for key, value in puts.items():
                batch.put(key, value)

        self.logger.info('removed {:,d} history entries from {:,d} addresses'
                         .format(nremoves, len(self.backup_hash168s)))
        self.backup_hash168s = set()

    def cache_sizes(self):
        '''Returns the approximate size of the cache, in MB.'''
        # Good average estimates based on traversal of subobjects and
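
backup_history walks each affected address's history rows newest-first; every row is a packed array of uint32 tx numbers in increasing order, so bisect_left gives the point at which tx numbers reach the rolled-back tx count. A minimal illustration of trimming one row (the helper name is made up for the example):

import array
from bisect import bisect_left

def trim_history_row(row_bytes, new_tx_count):
    '''Drop tx numbers >= new_tx_count from one packed history row.

    Returns (kept_bytes_or_None, number_removed); None means the whole
    row should be deleted.
    '''
    a = array.array('I')
    a.frombytes(row_bytes)
    idx = bisect_left(a, new_tx_count)
    removed = len(a) - idx
    return (a[:idx].tobytes() if idx else None), removed

row = array.array('I', [10, 25, 40]).tobytes()
kept, removed = trim_history_row(row, 30)   # keeps 10 and 25, removes 40
assert removed == 1
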
@@ -400,15 +503,27 @@ class BlockProcessor(LoggedClass):
        self.logger.info('cache stats at height {:,d} daemon height: {:,d}'
                         .format(self.height, self.daemon.cached_height()))
        self.logger.info(' entries: UTXO: {:,d} DB: {:,d} '
                         'hist addrs: {:,d} hist size: {:,d}'
                         'hist addrs: {:,d} hist size {:,d}'
                         .format(len(self.utxo_cache.cache),
                                 len(self.utxo_cache.db_cache),
                                 len(self.history),
                                 self.history_size))
                                 self.history_size,
                                 len(self.history)))
        self.logger.info(' size: {:,d}MB (UTXOs {:,d}MB hist {:,d}MB)'
                         .format(utxo_MB + hist_MB, utxo_MB, hist_MB))
        return utxo_MB, hist_MB

    def undo_key(self, height):
        '''DB key for undo information at the given height.'''
        return b'U' + struct.pack('>I', height)

    def write_undo_info(self, height, undo_info):
        '''Write out undo information for the current height.'''
        self.db.put(self.undo_key(height), undo_info)

    def read_undo_info(self, height):
        '''Read undo information from a file for the current height.'''
        return self.db.get(self.undo_key(height))

    def advance_block(self, block):
        # We must update the fs_cache before calling advance_txs() as
        # the UTXO cache uses the fs_cache via get_tx_hash() to
@@ -421,7 +536,9 @@ class BlockProcessor(LoggedClass):

        self.tip = header_hash
        self.height += 1
        self.advance_txs(tx_hashes, txs)
        undo_info = self.advance_txs(tx_hashes, txs)
        if self.daemon.cached_height() - self.height <= self.reorg_limit:
            self.write_undo_info(self.height, b''.join(undo_info))

        # Check if we're getting full and time to flush?
        now = time.time()
@@ -434,28 +551,105 @@ class BlockProcessor(LoggedClass):
        return True

    def advance_txs(self, tx_hashes, txs):
        cache = self.utxo_cache
        tx_num = self.tx_count
        put_utxo = self.utxo_cache.put
        spend_utxo = self.utxo_cache.spend
        undo_info = []

        for tx_hash, tx in zip(tx_hashes, txs):
            # Add the outputs as new UTXOs; spend the inputs
            hash168s = cache.add_many(tx_hash, tx_num, tx.outputs)
        # Use local vars for speed in the loops
        history = self.history
        tx_num = self.tx_count
        coin = self.coin
        parse_script = ScriptPubKey.from_script
        pack = struct.pack

        for tx, tx_hash in zip(txs, tx_hashes):
            hash168s = set()
            tx_numb = pack('<I', tx_num)

            # Spend the inputs
            if not tx.is_coinbase:
                for txin in tx.inputs:
                    hash168s.add(cache.spend(txin))
                    cache_value = spend_utxo(txin.prev_hash, txin.prev_idx)
                    undo_info.append(cache_value)
                    hash168s.add(cache_value[:21])

            # Add the new UTXOs
            for idx, txout in enumerate(tx.outputs):
                # Get the hash168. Ignore scripts we can't grok.
                hash168 = parse_script(txout.pk_script, coin).hash168
                if hash168:
                    hash168s.add(hash168)
                    put_utxo(tx_hash + pack('<H', idx),
                             hash168 + tx_numb + pack('<Q', txout.value))

            # Drop any NO_CACHE entry
            hash168s.discard(NO_CACHE_ENTRY)
            for hash168 in hash168s:
                self.history[hash168].append(tx_num)
                history[hash168].append(tx_num)
            self.history_size += len(hash168s)
            tx_num += 1

        self.tx_count = tx_num

    def backup_block(self, block):
        pass
        return undo_info

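advance_txs now collects one 33-byte undo record per spent input: the spent UTXO's 21-byte hash168, its 4-byte little-endian tx number and its 8-byte little-endian value, which is the same layout UTXOCache stores as a cache value. A small sketch of packing and unpacking that record (helper names are illustrative):

import struct

def pack_cache_value(hash168, tx_num, value):
    '''21-byte hash168 + 4-byte LE tx number + 8-byte LE value = 33 bytes.'''
    assert len(hash168) == 21
    return hash168 + struct.pack('<I', tx_num) + struct.pack('<Q', value)

def unpack_cache_value(record):
    hash168 = record[:21]
    tx_num, = struct.unpack('<I', record[21:25])
    value, = struct.unpack('<Q', record[25:33])
    return hash168, tx_num, value

record = pack_cache_value(b'\x00' * 21, 123456, 50_000_000)
assert len(record) == 33
assert unpack_cache_value(record) == (b'\x00' * 21, 123456, 50_000_000)
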
    def undo_txs(self, tx_hashes, txs):
        pass
    def backup_blocks(self, blocks):
        '''Backup the blocks and flush.

        The blocks should be in order of decreasing height.
        A flush is performed once the blocks are backed up.
        '''
        self.logger.info('backing up {:,d} blocks'.format(len(blocks)))
        self.assert_flushed()

        for block in blocks:
            header, tx_hashes, txs = self.coin.read_block(block)
            prev_hash, header_hash = self.coin.header_hashes(header)
            if header_hash != self.tip:
                raise ChainError('backup block {} is not tip {} at height {:,d}'
                                 .format(hash_to_str(header_hash),
                                         hash_to_str(self.tip), self.height))

            self.backup_txs(tx_hashes, txs)
            self.fs_cache.backup_block()
            self.tip = prev_hash
            self.height -= 1

        self.logger.info('backed up to height {:,d}'.format(self.height))
        self.flush(True)

    def backup_txs(self, tx_hashes, txs):
        # Prevout values, in order down the block (coinbase first if present)
        # undo_info is in reverse block order
        undo_info = self.read_undo_info(self.height)
        n = len(undo_info)

        # Use local vars for speed in the loops
        pack = struct.pack
        put_utxo = self.utxo_cache.put
        spend_utxo = self.utxo_cache.spend
        hash168s = self.backup_hash168s

        rtxs = reversed(txs)
        rtx_hashes = reversed(tx_hashes)

        for tx_hash, tx in zip(rtx_hashes, rtxs):
            # Spend the outputs
            for idx, txout in enumerate(tx.outputs):
                cache_value = spend_utxo(tx_hash, idx)
                hash168s.add(cache_value[:21])

            # Restore the inputs
            if not tx.is_coinbase:
                for txin in reversed(tx.inputs):
                    n -= 33
                    undo_item = undo_info[n:n+33]
                    put_utxo(txin.prev_hash + pack('<H', txin.prev_idx),
                             undo_item)
                    hash168s.add(undo_item[:21])

        assert n == 0
        self.tx_count -= len(txs)

    @staticmethod
    def resolve_limit(limit):

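Because the undo records were appended in forward block order while backup_txs walks the transactions backwards, the blob is consumed from its end in 33-byte steps (the n -= 33 above). A tiny illustration of that reverse slicing:

RECORD_SIZE = 33   # bytes per undo record in this commit

def undo_records_reversed(undo_info):
    '''Yield the fixed-size undo records from last to first.'''
    n = len(undo_info)
    assert n % RECORD_SIZE == 0
    while n:
        n -= RECORD_SIZE
        yield undo_info[n:n + RECORD_SIZE]
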
server/cache.py (108 changed lines)

@@ -7,7 +7,6 @@ import os
import struct
from bisect import bisect_right

from lib.script import ScriptPubKey
from lib.util import chunks, LoggedClass
from lib.hash import double_sha256, hash_to_str

@@ -17,6 +16,8 @@ HIST_ENTRIES_PER_KEY = 1024
HIST_VALUE_BYTES = HIST_ENTRIES_PER_KEY * 4
ADDR_TX_HASH_LEN = 4
UTXO_TX_HASH_LEN = 4
NO_HASH_168 = bytes([255]) * 21
NO_CACHE_ENTRY = NO_HASH_168 + bytes(12)


class UTXOCache(LoggedClass):
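
NO_CACHE_ENTRY is shaped exactly like a real cache value: a 21-byte hash168 placeholder of 0xff bytes followed by 12 zero bytes for the tx number and value, 33 bytes in total, so spend() can return it wherever a genuine record is expected and callers can simply discard it. A quick check of that size assumption:

NO_HASH_168 = bytes([255]) * 21
NO_CACHE_ENTRY = NO_HASH_168 + bytes(12)
assert len(NO_CACHE_ENTRY) == 33
assert NO_CACHE_ENTRY[:21] == NO_HASH_168
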
@@ -76,84 +77,47 @@ class UTXOCache(LoggedClass):
        self.parent = parent
        self.coin = coin
        self.cache = {}
        self.put = self.cache.__setitem__
        self.db = db
        self.db_cache = {}
        # Statistics
        self.adds = 0
        self.cache_hits = 0
        self.cache_spends = 0
        self.db_deletes = 0

    def add_many(self, tx_hash, tx_num, txouts):
        '''Add a sequence of UTXOs to the cache, return the set of hash168s
        seen.

        Pass the hash of the TX it appears in, its TX number, and the
        TX outputs.
        '''
        parse_script = ScriptPubKey.from_script
        pack = struct.pack
        tx_numb = pack('<I', tx_num)
        hash168s = set()

        self.adds += len(txouts)
        for idx, txout in enumerate(txouts):
            # Get the hash168. Ignore scripts we can't grok.
            pk = parse_script(txout.pk_script, self.coin)
            hash168 = pk.hash168
            if not hash168:
                continue

            hash168s.add(hash168)
            key = tx_hash + pack('<H', idx)

            # Well-known duplicate coinbases from heights 91722-91880
            # that destoyed 100 BTC forever:
            # e3bf3d07d4b0375638d5f1db5255fe07ba2c4cb067cd81b84ee974b6585fb468
            # d5d27987d2a3dfc724e359870c6644b40e497bdc0589a033220fe15429d88599
            #if key in self.cache:
            #    self.logger.info('duplicate tx hash {}'
            #                     .format(hash_to_str(tx_hash)))

            self.cache[key] = hash168 + tx_numb + pack('<Q', txout.value)

        return hash168s

    def spend(self, txin):
        '''Spend a UTXO and return the address spent.
    def spend(self, prev_hash, prev_idx):
        '''Spend a UTXO and return the cache's value.

        If the UTXO is not in the cache it must be on disk.
        '''
        # Fast track is it's in the cache
        pack = struct.pack
        key = txin.prev_hash + pack('<H', txin.prev_idx)
        value = self.cache.pop(key, None)
        idx_packed = pack('<H', prev_idx)
        value = self.cache.pop(prev_hash + idx_packed, None)
        if value:
            self.cache_hits += 1
            return value[:21]
            self.cache_spends += 1
            return value

        # Oh well. Find and remove it from the DB.
        hash168 = self.hash168(txin.prev_hash, txin.prev_idx)
        hash168 = self.hash168(prev_hash, idx_packed)
        if not hash168:
            return None
            return NO_CACHE_ENTRY

        self.db_deletes += 1

        # Read the UTXO through the cache from the disk. We have to
        # go through the cache because compressed keys can collide.
        key = (b'u' + hash168 + txin.prev_hash[:UTXO_TX_HASH_LEN]
               + pack('<H', txin.prev_idx))
        key = b'u' + hash168 + prev_hash[:UTXO_TX_HASH_LEN] + idx_packed
        data = self.cache_get(key)
        if data is None:
            # Uh-oh, this should not happen...
            self.logger.error('found no UTXO for {} / {:d} key {}'
                              .format(hash_to_str(txin.prev_hash),
                                      txin.prev_idx, bytes(key).hex()))
            return hash168
                              .format(hash_to_str(prev_hash), prev_idx,
                                      bytes(key).hex()))
            return NO_CACHE_ENTRY

        if len(data) == 12:
            (tx_num, ) = struct.unpack('<I', data[:4])
            self.cache_delete(key)
            return hash168
            return hash168 + data

        # Resolve the compressed key collison. These should be
        # extremely rare.
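
The on-disk UTXO key truncates the tx hash to its first UTXO_TX_HASH_LEN (4) bytes, so two different transactions paying the same hash168 can share a key; that is why spend() reads the record back through the cache and resolves collisions by checking full tx hashes below. A sketch of the key construction and of such a collision (values are illustrative):

import struct

UTXO_TX_HASH_LEN = 4

def utxo_db_key(hash168, tx_hash, idx):
    '''b'u' + 21-byte hash168 + truncated tx hash + 2-byte LE output index.'''
    return b'u' + hash168 + tx_hash[:UTXO_TX_HASH_LEN] + struct.pack('<H', idx)

hash168 = b'\x01' * 21
tx_a = bytes.fromhex('aabbccdd' + '00' * 28)   # two distinct 32-byte hashes
tx_b = bytes.fromhex('aabbccdd' + 'ff' * 28)   # sharing their first 4 bytes
assert tx_a != tx_b
assert utxo_db_key(hash168, tx_a, 0) == utxo_db_key(hash168, tx_b, 0)
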
@@ -161,26 +125,25 @@ class UTXOCache(LoggedClass):
        for n in range(0, len(data), 12):
            (tx_num, ) = struct.unpack('<I', data[n:n+4])
            tx_hash, height = self.parent.get_tx_hash(tx_num)
            if txin.prev_hash == tx_hash:
                data = data[:n] + data[n + 12:]
            if prev_hash == tx_hash:
                result = hash168 + data[n: n+12]
                data = data[:n] + data[n+12:]
                self.cache_write(key, data)
                return hash168
                return result

        raise Exception('could not resolve UTXO key collision')

    def hash168(self, tx_hash, idx):
    def hash168(self, tx_hash, idx_packed):
        '''Return the hash168 paid to by the given TXO.

        Refers to the database. Returns None if not found (which is
        indicates a non-standard script).
        '''
        key = b'h' + tx_hash[:ADDR_TX_HASH_LEN] + struct.pack('<H', idx)
        key = b'h' + tx_hash[:ADDR_TX_HASH_LEN] + idx_packed
        data = self.cache_get(key)
        if data is None:
            # Assuming the DB is not corrupt, this indicates a
            # successful spend of a non-standard script
            # self.logger.info('ignoring spend of non-standard UTXO {} / {:d}'
            #                  .format(hash_to_str(tx_hash), idx)))
            return None

        if len(data) == 25:
@@ -222,6 +185,7 @@ class UTXOCache(LoggedClass):
        # may be in the DB already.
        hcolls = ucolls = 0
        new_utxos = len(self.cache)

        for cache_key, cache_value in self.cache.items():
            # Frist write to the hash168 lookup table
            key = b'h' + cache_key[:ADDR_TX_HASH_LEN] + cache_key[-2:]
@@ -244,6 +208,7 @@ class UTXOCache(LoggedClass):

        # GC-ing this now can only help the levelDB write.
        self.cache = {}
        self.put = self.cache.__setitem__

        # Now we can update to the batch.
        for key, value in self.db_cache.items():
@@ -254,13 +219,15 @@ class UTXOCache(LoggedClass):

        self.db_cache = {}

        adds = new_utxos + self.cache_spends

        self.logger.info('UTXO cache adds: {:,d} spends: {:,d} '
                         .format(self.adds, self.cache_hits))
                         .format(adds, self.cache_spends))
        self.logger.info('UTXO DB adds: {:,d} spends: {:,d}. '
                         'Collisions: hash168: {:,d} UTXO: {:,d}'
                         .format(new_utxos, self.db_deletes,
                                 hcolls, ucolls))
        self.adds = self.cache_hits = self.db_deletes = 0
        self.cache_spends = self.db_deletes = 0


class FSCache(LoggedClass):
@@ -311,9 +278,15 @@ class FSCache(LoggedClass):
        self.tx_hashes.append(tx_hashes)
        self.tx_counts.append(prior_tx_count + len(txs))

    def backup_block(self, block):
        '''Revert a block and return (header, tx_hashes, txs)'''
        pass
    def backup_block(self):
        '''Revert a block.'''
        assert not self.headers
        assert not self.tx_hashes
        assert self.height >= 0
        # Just update in-memory. It doesn't matter if disk files are
        # too long, they will be overwritten when advancing.
        self.height -= 1
        self.tx_counts.pop()

    def flush(self, new_height, new_tx_count):
        '''Flush the things stored on the filesystem.
@@ -326,9 +299,10 @@ class FSCache(LoggedClass):
        txs_done = cur_tx_count - prior_tx_count

        assert self.height + blocks_done == new_height
        assert cur_tx_count == new_tx_count
        assert len(self.tx_hashes) == blocks_done
        assert len(self.tx_counts) == new_height + 1
        assert cur_tx_count == new_tx_count, \
            'cur: {:,d} new: {:,d}'.format(cur_tx_count, new_tx_count)

        # First the headers
        headers = b''.join(self.headers)
@@ -364,8 +338,6 @@ class FSCache(LoggedClass):
        self.headers = []
        self.height += blocks_done

        return txs_done

    def read_headers(self, height, count):
        read_count = min(count, self.height + 1 - height)

server/env.py

@@ -25,6 +25,7 @@ class Env(LoggedClass):
        self.tcp_port = self.integer('TCP_PORT', None)
        self.ssl_port = self.integer('SSL_PORT', None)
        self.rpc_port = self.integer('RPC_PORT', 8000)
        self.reorg_limit = self.integer('REORG_LIMIT', 200)
        self.daemon_url = self.build_daemon_url()
        self.max_subscriptions = self.integer('MAX_SUBSCRIPTIONS', 10000)
        self.banner_file = self.default('BANNER_FILE', None)
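
The new REORG_LIMIT setting is read through Env's integer() helper, so the number of blocks of undo information kept around is controlled by an environment variable and defaults to 200. integer() is not shown in this diff; it presumably behaves roughly like this sketch:

import os

def integer(envvar, default):
    '''Return the environment variable as an int, or default when unset.'''
    value = os.environ.get(envvar)
    if value is None:
        return default
    try:
        return int(value)
    except ValueError:
        raise Exception('cannot convert envvar {} value {} to an integer'
                        .format(envvar, value))

# With REORG_LIMIT unset this yields the 200-block default:
# reorg_limit = integer('REORG_LIMIT', 200)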