#!/usr/bin/env python3
# Copyright (c) 2014-2016 The Bitcoin Core developers
# Distributed under the MIT software license, see the accompanying
# file COPYING or http://www.opensource.org/licenses/mit-license.php.
""" Run regression test suite.
This module calls down into individual test cases via subprocess . It will
forward all unrecognized arguments onto the individual test scripts .
Functional tests are disabled on Windows by default . Use - - force to run them anyway .
For a description of arguments recognized by test scripts , see
` test / functional / test_framework / test_framework . py : BitcoinTestFramework . main ` .
"""
import argparse
import configparser
import os
import time
import shutil
import sys
import subprocess
import tempfile
import re
import logging
# Formatting. Default colors to empty strings.
BOLD , BLUE , RED , GREY = ( " " , " " ) , ( " " , " " ) , ( " " , " " ) , ( " " , " " )
try :
# Make sure python thinks it can write unicode to its stdout
" \u2713 " . encode ( " utf_8 " ) . decode ( sys . stdout . encoding )
TICK = " ✓ "
CROSS = " ✖ "
CIRCLE = " ○ "
except UnicodeDecodeError :
TICK = " P "
CROSS = " x "
CIRCLE = " o "
if os . name == ' posix ' :
# primitive formatting on supported
# terminal via ANSI escape sequences:
BOLD = ( ' \033 [0m ' , ' \033 [1m ' )
BLUE = ( ' \033 [0m ' , ' \033 [0;34m ' )
RED = ( ' \033 [0m ' , ' \033 [0;31m ' )
GREY = ( ' \033 [0m ' , ' \033 [1;30m ' )
TEST_EXIT_PASSED = 0
TEST_EXIT_SKIPPED = 77
BASE_SCRIPTS = [
# Scripts that are run by the travis build process.
# Longest test should go first, to favor running tests in parallel
' wallet-hd.py ' ,
' walletbackup.py ' ,
# vv Tests less than 5m vv
' p2p-fullblocktest.py ' ,
' fundrawtransaction.py ' ,
' p2p-compactblocks.py ' ,
' segwit.py ' ,
# vv Tests less than 2m vv
' wallet.py ' ,
' wallet-accounts.py ' ,
' p2p-segwit.py ' ,
' wallet-dump.py ' ,
' listtransactions.py ' ,
# vv Tests less than 60s vv
' sendheaders.py ' ,
' zapwallettxes.py ' ,
' importmulti.py ' ,
' mempool_limit.py ' ,
' merkle_blocks.py ' ,
' receivedby.py ' ,
' abandonconflict.py ' ,
' bip68-112-113-p2p.py ' ,
' rawtransactions.py ' ,
' reindex.py ' ,
# vv Tests less than 30s vv
" zmq_test.py " ,
' mempool_resurrect_test.py ' ,
' txn_doublespend.py --mineblock ' ,
' txn_clone.py ' ,
' getchaintips.py ' ,
' rest.py ' ,
' mempool_spendcoinbase.py ' ,
' mempool_reorg.py ' ,
' mempool_persist.py ' ,
' httpbasics.py ' ,
' multi_rpc.py ' ,
' proxy_test.py ' ,
' signrawtransactions.py ' ,
' disconnect_ban.py ' ,
' decodescript.py ' ,
' blockchain.py ' ,
' disablewallet.py ' ,
' net.py ' ,
' keypool.py ' ,
' p2p-mempool.py ' ,
' prioritise_transaction.py ' ,
' invalidblockrequest.py ' ,
' invalidtxrequest.py ' ,
' p2p-versionbits-warning.py ' ,
' preciousblock.py ' ,
' importprunedfunds.py ' ,
' signmessages.py ' ,
' nulldummy.py ' ,
' import-rescan.py ' ,
' bumpfee.py ' ,
' rpcnamedargs.py ' ,
' listsinceblock.py ' ,
' p2p-leaktests.py ' ,
' import-abort-rescan.py ' ,
]
EXTENDED_SCRIPTS = [
# These tests are not run by the travis build process.
# Longest test should go first, to favor running tests in parallel
' pruning.py ' ,
# vv Tests less than 20m vv
' smartfees.py ' ,
# vv Tests less than 5m vv
' maxuploadtarget.py ' ,
' mempool_packages.py ' ,
# vv Tests less than 2m vv
' bip68-sequence.py ' ,
' getblocktemplate_longpoll.py ' ,
' p2p-timeouts.py ' ,
# vv Tests less than 60s vv
' bip9-softforks.py ' ,
' p2p-feefilter.py ' ,
' rpcbind_test.py ' ,
# vv Tests less than 30s vv
' assumevalid.py ' ,
' bip65-cltv.py ' ,
' bip65-cltv-p2p.py ' ,
' bipdersig-p2p.py ' ,
' bipdersig.py ' ,
' getblocktemplate_proposals.py ' ,
' txn_doublespend.py ' ,
' txn_clone.py --mineblock ' ,
' forknotify.py ' ,
' invalidateblock.py ' ,
' p2p-acceptblock.py ' ,
' replace-by-fee.py ' ,
]
# Place EXTENDED_SCRIPTS first since it has the 3 longest running tests
ALL_SCRIPTS = EXTENDED_SCRIPTS + BASE_SCRIPTS
NON_SCRIPTS = [
# These are python files that live in the functional tests directory, but are not test scripts.
" combine_logs.py " ,
" create_cache.py " ,
" test_runner.py " ,
]
def main ( ) :
# Parse arguments and pass through unrecognised args
parser = argparse . ArgumentParser ( add_help = False ,
usage = ' %(prog)s [test_runner.py options] [script options] [scripts] ' ,
description = __doc__ ,
epilog = '''
Help text and arguments for individual test script : ''' ,
formatter_class = argparse . RawTextHelpFormatter )
parser . add_argument ( ' --coverage ' , action = ' store_true ' , help = ' generate a basic coverage report for the RPC interface ' )
parser . add_argument ( ' --exclude ' , ' -x ' , help = ' specify a comma-seperated-list of scripts to exclude. Do not include the .py extension in the name. ' )
parser . add_argument ( ' --extended ' , action = ' store_true ' , help = ' run the extended test suite in addition to the basic tests ' )
parser . add_argument ( ' --force ' , ' -f ' , action = ' store_true ' , help = ' run tests even on platforms where they are disabled by default (e.g. windows). ' )
parser . add_argument ( ' --help ' , ' -h ' , ' -? ' , action = ' store_true ' , help = ' print help text and exit ' )
parser . add_argument ( ' --jobs ' , ' -j ' , type = int , default = 4 , help = ' how many test scripts to run in parallel. Default=4. ' )
parser . add_argument ( ' --keepcache ' , ' -k ' , action = ' store_true ' , help = ' the default behavior is to flush the cache directory on startup. --keepcache retains the cache from the previous testrun. ' )
parser . add_argument ( ' --quiet ' , ' -q ' , action = ' store_true ' , help = ' only print results summary and failure logs ' )
args , unknown_args = parser . parse_known_args ( )
# Create a set to store arguments and create the passon string
tests = set ( arg for arg in unknown_args if arg [ : 2 ] != " -- " )
passon_args = [ arg for arg in unknown_args if arg [ : 2 ] == " -- " ]
# Read config generated by configure.
config = configparser . ConfigParser ( )
configfile = os . path . abspath ( os . path . dirname ( __file__ ) ) + " /config.ini "
config . read_file ( open ( configfile ) )
passon_args . append ( " --configfile= %s " % configfile )
# Set up logging
logging_level = logging . INFO if args . quiet else logging . DEBUG
logging . basicConfig ( format = ' %(message)s ' , level = logging_level )
enable_wallet = config [ " components " ] . getboolean ( " ENABLE_WALLET " )
enable_utils = config [ " components " ] . getboolean ( " ENABLE_UTILS " )
enable_bitcoind = config [ " components " ] . getboolean ( " ENABLE_BITCOIND " )
if config [ " environment " ] [ " EXEEXT " ] == " .exe " and not args . force :
# https://github.com/bitcoin/bitcoin/commit/d52802551752140cf41f0d9a225a43e84404d3e9
# https://github.com/bitcoin/bitcoin/pull/5677#issuecomment-136646964
print ( " Tests currently disabled on Windows by default. Use --force option to enable " )
sys . exit ( 0 )
if not ( enable_wallet and enable_utils and enable_bitcoind ) :
print ( " No functional tests to run. Wallet, utils, and bitcoind must all be enabled " )
print ( " Rerun `configure` with -enable-wallet, -with-utils and -with-daemon and rerun make " )
sys . exit ( 0 )
# Build list of tests
if tests :
# Individual tests have been specified. Run specified tests that exist
# in the ALL_SCRIPTS list. Accept the name with or without .py extension.
test_list = [ t for t in ALL_SCRIPTS if
( t in tests or re . sub ( " .py$ " , " " , t ) in tests ) ]
else :
# No individual tests have been specified.
# Run all base tests, and optionally run extended tests.
test_list = BASE_SCRIPTS
if args . extended :
# place the EXTENDED_SCRIPTS first since the three longest ones
# are there and the list is shorter
test_list = EXTENDED_SCRIPTS + test_list
# Remove the test cases that the user has explicitly asked to exclude.
if args . exclude :
for exclude_test in args . exclude . split ( ' , ' ) :
if exclude_test + " .py " in test_list :
test_list . remove ( exclude_test + " .py " )
if not test_list :
print ( " No valid test scripts specified. Check that your test is in one "
" of the test lists in test_runner.py, or run test_runner.py with no arguments to run all tests " )
sys . exit ( 0 )
if args . help :
# Print help for test_runner.py, then print help of the first script (with args removed) and exit.
parser . print_help ( )
subprocess . check_call ( [ ( config [ " environment " ] [ " SRCDIR " ] + ' /test/functional/ ' + test_list [ 0 ] . split ( ) [ 0 ] ) ] + [ ' -h ' ] )
sys . exit ( 0 )
check_script_list ( config [ " environment " ] [ " SRCDIR " ] )
if not args . keepcache :
shutil . rmtree ( " %s /test/cache " % config [ " environment " ] [ " BUILDDIR " ] , ignore_errors = True )
run_tests ( test_list , config [ " environment " ] [ " SRCDIR " ] , config [ " environment " ] [ " BUILDDIR " ] , config [ " environment " ] [ " EXEEXT " ] , args . jobs , args . coverage , passon_args )
def run_tests ( test_list , src_dir , build_dir , exeext , jobs = 1 , enable_coverage = False , args = [ ] ) :
# Warn if bitcoind is already running (unix only)
try :
if subprocess . check_output ( [ " pidof " , " bitcoind " ] ) is not None :
print ( " %s WARNING! %s There is already a bitcoind process running on this system. Tests may fail unexpectedly due to resource contention! " % ( BOLD [ 1 ] , BOLD [ 0 ] ) )
except ( OSError , subprocess . SubprocessError ) :
pass
# Warn if there is a cache directory
cache_dir = " %s /test/cache " % build_dir
if os . path . isdir ( cache_dir ) :
print ( " %s WARNING! %s There is a cache directory here: %s . If tests fail unexpectedly, try deleting the cache directory. " % ( BOLD [ 1 ] , BOLD [ 0 ] , cache_dir ) )
#Set env vars
if " BITCOIND " not in os . environ :
os . environ [ " BITCOIND " ] = build_dir + ' /src/bitcoind ' + exeext
tests_dir = src_dir + ' /test/functional/ '
flags = [ " --srcdir= {} /src " . format ( build_dir ) ] + args
flags . append ( " --cachedir= %s " % cache_dir )
if enable_coverage :
coverage = RPCCoverage ( )
flags . append ( coverage . flag )
logging . debug ( " Initializing coverage directory at %s " % coverage . dir )
else :
coverage = None
if len ( test_list ) > 1 and jobs > 1 :
# Populate cache
subprocess . check_output ( [ tests_dir + ' create_cache.py ' ] + flags )
#Run Tests
job_queue = TestHandler ( jobs , tests_dir , test_list , flags )
time0 = time . time ( )
test_results = [ ]
max_len_name = len ( max ( test_list , key = len ) )
for _ in range ( len ( test_list ) ) :
test_result , stdout , stderr = job_queue . get_next ( )
test_results . append ( test_result )
if test_result . status == " Passed " :
logging . debug ( " \n %s %s %s passed, Duration: %s s " % ( BOLD [ 1 ] , test_result . name , BOLD [ 0 ] , test_result . time ) )
elif test_result . status == " Skipped " :
logging . debug ( " \n %s %s %s skipped " % ( BOLD [ 1 ] , test_result . name , BOLD [ 0 ] ) )
else :
print ( " \n %s %s %s failed, Duration: %s s \n " % ( BOLD [ 1 ] , test_result . name , BOLD [ 0 ] , test_result . time ) )
print ( BOLD [ 1 ] + ' stdout: \n ' + BOLD [ 0 ] + stdout + ' \n ' )
print ( BOLD [ 1 ] + ' stderr: \n ' + BOLD [ 0 ] + stderr + ' \n ' )
print_results ( test_results , max_len_name , ( int ( time . time ( ) - time0 ) ) )
if coverage :
coverage . report_rpc_coverage ( )
logging . debug ( " Cleaning up coverage data " )
coverage . cleanup ( )
all_passed = all ( map ( lambda test_result : test_result . was_successful , test_results ) )
sys . exit ( not all_passed )
def print_results ( test_results , max_len_name , runtime ) :
results = " \n " + BOLD [ 1 ] + " %s | %s | %s \n \n " % ( " TEST " . ljust ( max_len_name ) , " STATUS " , " DURATION " ) + BOLD [ 0 ]
test_results . sort ( key = lambda result : result . name . lower ( ) )
all_passed = True
time_sum = 0
for test_result in test_results :
all_passed = all_passed and test_result . was_successful
time_sum + = test_result . time
test_result . padding = max_len_name
results + = str ( test_result )
status = TICK + " Passed " if all_passed else CROSS + " Failed "
results + = BOLD [ 1 ] + " \n %s | %s | %s s (accumulated) \n " % ( " ALL " . ljust ( max_len_name ) , status . ljust ( 9 ) , time_sum ) + BOLD [ 0 ]
results + = " Runtime: %s s \n " % ( runtime )
print ( results )
class TestHandler :
"""
Trigger the testscrips passed in via the list .
"""
def __init__ ( self , num_tests_parallel , tests_dir , test_list = None , flags = None ) :
assert ( num_tests_parallel > = 1 )
self . num_jobs = num_tests_parallel
self . tests_dir = tests_dir
self . test_list = test_list
self . flags = flags
self . num_running = 0
# In case there is a graveyard of zombie bitcoinds, we can apply a
# pseudorandom offset to hopefully jump over them.
# (625 is PORT_RANGE/MAX_NODES)
self . portseed_offset = int ( time . time ( ) * 1000 ) % 625
self . jobs = [ ]
def get_next ( self ) :
while self . num_running < self . num_jobs and self . test_list :
# Add tests
self . num_running + = 1
t = self . test_list . pop ( 0 )
port_seed = [ " --portseed= {} " . format ( len ( self . test_list ) + self . portseed_offset ) ]
log_stdout = tempfile . SpooledTemporaryFile ( max_size = 2 * * 16 )
log_stderr = tempfile . SpooledTemporaryFile ( max_size = 2 * * 16 )
test_argv = t . split ( )
self . jobs . append ( ( t ,
time . time ( ) ,
subprocess . Popen ( [ self . tests_dir + test_argv [ 0 ] ] + test_argv [ 1 : ] + self . flags + port_seed ,
universal_newlines = True ,
stdout = log_stdout ,
stderr = log_stderr ) ,
log_stdout ,
log_stderr ) )
if not self . jobs :
raise IndexError ( ' pop from empty list ' )
while True :
# Return first proc that finishes
time . sleep ( .5 )
for j in self . jobs :
( name , time0 , proc , log_out , log_err ) = j
if proc . poll ( ) is not None :
log_out . seek ( 0 ) , log_err . seek ( 0 )
[ stdout , stderr ] = [ l . read ( ) . decode ( ' utf-8 ' ) for l in ( log_out , log_err ) ]
log_out . close ( ) , log_err . close ( )
if proc . returncode == TEST_EXIT_PASSED and stderr == " " :
status = " Passed "
elif proc . returncode == TEST_EXIT_SKIPPED :
status = " Skipped "
else :
status = " Failed "
self . num_running - = 1
self . jobs . remove ( j )
return TestResult ( name , status , int ( time . time ( ) - time0 ) ) , stdout , stderr
print ( ' . ' , end = ' ' , flush = True )
class TestResult ( ) :
def __init__ ( self , name , status , time ) :
self . name = name
self . status = status
self . time = time
self . padding = 0
def __repr__ ( self ) :
if self . status == " Passed " :
color = BLUE
glyph = TICK
elif self . status == " Failed " :
color = RED
glyph = CROSS
elif self . status == " Skipped " :
color = GREY
glyph = CIRCLE
return color [ 1 ] + " %s | %s %s | %s s \n " % ( self . name . ljust ( self . padding ) , glyph , self . status . ljust ( 7 ) , self . time ) + color [ 0 ]
@property
def was_successful ( self ) :
return self . status != " Failed "
def check_script_list ( src_dir ) :
""" Check scripts directory.
Check that there are no scripts in the functional tests directory which are
not being run by pull - tester . py . """
script_dir = src_dir + ' /test/functional/ '
python_files = set ( [ t for t in os . listdir ( script_dir ) if t [ - 3 : ] == " .py " ] )
missed_tests = list ( python_files - set ( map ( lambda x : x . split ( ) [ 0 ] , ALL_SCRIPTS + NON_SCRIPTS ) ) )
if len ( missed_tests ) != 0 :
print ( " %s WARNING! %s The following scripts are not being run: %s . Check the test lists in test_runner.py. " % ( BOLD [ 1 ] , BOLD [ 0 ] , str ( missed_tests ) ) )
if os . getenv ( ' TRAVIS ' ) == ' true ' :
# On travis this warning is an error to prevent merging incomplete commits into master
sys . exit ( 1 )
class RPCCoverage ( object ) :
"""
Coverage reporting utilities for test_runner .
Coverage calculation works by having each test script subprocess write
coverage files into a particular directory . These files contain the RPC
commands invoked during testing , as well as a complete listing of RPC
commands per ` bitcoin - cli help ` ( ` rpc_interface . txt ` ) .
After all tests complete , the commands run are combined and diff ' d against
the complete list to calculate uncovered RPC commands .
See also : test / functional / test_framework / coverage . py
"""
def __init__ ( self ) :
self . dir = tempfile . mkdtemp ( prefix = " coverage " )
self . flag = ' --coveragedir= %s ' % self . dir
def report_rpc_coverage ( self ) :
"""
Print out RPC commands that were unexercised by tests .
"""
uncovered = self . _get_uncovered_rpc_commands ( )
if uncovered :
print ( " Uncovered RPC commands: " )
print ( " " . join ( ( " - %s \n " % i ) for i in sorted ( uncovered ) ) )
else :
print ( " All RPC commands covered. " )
def cleanup ( self ) :
return shutil . rmtree ( self . dir )
def _get_uncovered_rpc_commands ( self ) :
"""
Return a set of currently untested RPC commands .
"""
# This is shared from `test/functional/test-framework/coverage.py`
reference_filename = ' rpc_interface.txt '
coverage_file_prefix = ' coverage. '
coverage_ref_filename = os . path . join ( self . dir , reference_filename )
coverage_filenames = set ( )
all_cmds = set ( )
covered_cmds = set ( )
if not os . path . isfile ( coverage_ref_filename ) :
raise RuntimeError ( " No coverage reference found " )
with open ( coverage_ref_filename , ' r ' ) as f :
all_cmds . update ( [ i . strip ( ) for i in f . readlines ( ) ] )
for root , dirs , files in os . walk ( self . dir ) :
for filename in files :
if filename . startswith ( coverage_file_prefix ) :
coverage_filenames . add ( os . path . join ( root , filename ) )
for filename in coverage_filenames :
with open ( filename , ' r ' ) as f :
covered_cmds . update ( [ i . strip ( ) for i in f . readlines ( ) ] )
return all_cmds - covered_cmds
if __name__ == ' __main__ ' :
main ( )