2019-01-16 11:49:01 -05:00
#!/usr/bin/env python3
2021-07-28 13:57:16 +02:00
# Copyright (c) 2019-2021 The Bitcoin Core developers
2019-01-16 11:49:01 -05:00
# Distributed under the MIT software license, see the accompanying
# file COPYING or http://www.opensource.org/licenses/mit-license.php.
""" Run fuzz test targets.
"""
2020-04-17 15:44:29 -04:00
from concurrent . futures import ThreadPoolExecutor , as_completed
2023-06-20 15:58:21 +02:00
from pathlib import Path
2019-01-16 11:49:01 -05:00
import argparse
import configparser
2020-04-17 15:44:29 -04:00
import logging
2019-01-16 11:49:01 -05:00
import os
import subprocess
2020-04-17 15:44:29 -04:00
import sys
2019-01-16 11:49:01 -05:00
2020-02-19 14:10:22 +00:00
2021-01-26 10:44:32 +01:00
def get_fuzz_env(*, target, source_dir):
    """Return the environment mapping used when launching the fuzz binary.

    The mapping holds exactly three variables:

    * ``FUZZ``: the name of the fuzz target to run.
    * ``UBSAN_OPTIONS``: points at the UBSan suppressions file below
      ``source_dir`` and makes reports fatal, with stack traces.
    * ``ASAN_OPTIONS``: fixed AddressSanitizer settings.
    """
    ubsan_options = ':'.join((
        f'suppressions={source_dir}/test/sanitizer_suppressions/ubsan',
        'print_stacktrace=1',
        'halt_on_error=1',
        'report_error_type=1',
    ))
    # symbolizer disabled due to https://github.com/google/sanitizers/issues/1364#issuecomment-761072085
    asan_options = ':'.join((
        'symbolize=0',
        'detect_stack_use_after_return=1',
        'check_initialization_order=1',
        'strict_init_order=1',
    ))
    return {
        'FUZZ': target,
        'UBSAN_OPTIONS': ubsan_options,
        'ASAN_OPTIONS': asan_options,
    }
2019-01-16 11:49:01 -05:00
def main():
    """Parse the command line, select the fuzz targets and run the requested mode.

    Steps:

    1. Parse arguments and configure logging.
    2. Read ``config.ini`` (located one directory above this file) and
       require that the fuzz binary was enabled in the build.
    3. Ask the fuzz binary for all targets, then narrow the list by the
       positional ``target`` arguments and ``--exclude``.
    4. Probe the binary with ``-help=1`` to detect libFuzzer.
    5. Dispatch to ``generate_corpus`` (``--generate``), ``merge_inputs``
       (``--m_dir``) or ``run_once`` (default) using a thread pool of
       ``--par`` workers.

    Exits with status 1 on configuration errors, when no target remains
    selected, when libFuzzer is required but missing, or when the probe
    times out.
    """
    parser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter,
        description='''Run the fuzz targets with all inputs from the corpus_dir once.''',
    )
    parser.add_argument(
        "-l",
        "--loglevel",
        dest="loglevel",
        default="INFO",
        help="log events at this level and higher to the console. Can be set to DEBUG, INFO, WARNING, ERROR or CRITICAL. Passing --loglevel DEBUG will output all logs to console.",
    )
    parser.add_argument(
        '--valgrind',
        action='store_true',
        help='If true, run fuzzing binaries under the valgrind memory error detector',
    )
    parser.add_argument(
        "--empty_min_time",
        type=int,
        help="If set, run at least this long, if the existing fuzz inputs directory is empty.",
    )
    parser.add_argument(
        '-x',
        '--exclude',
        help="A comma-separated list of targets to exclude",
    )
    parser.add_argument(
        '--par',
        '-j',
        type=int,
        default=4,
        help='How many targets to merge or execute in parallel.',
    )
    parser.add_argument(
        'corpus_dir',
        help='The corpus to run on (must contain subfolders for each fuzz target).',
    )
    parser.add_argument(
        'target',
        nargs='*',
        help='The target(s) to run. Default is to run all targets.',
    )
    parser.add_argument(
        '--m_dir',
        help='Merge inputs from this directory into the corpus_dir.',
    )
    parser.add_argument(
        '-g',
        '--generate',
        action='store_true',
        help='Create new corpus (or extend the existing ones) by running'
             ' the given targets for a finite number of times. Outputs them to'
             ' the passed corpus_dir.'
    )

    args = parser.parse_args()
    args.corpus_dir = Path(args.corpus_dir)

    # Set up logging
    logging.basicConfig(
        format='%(message)s',
        level=int(args.loglevel) if args.loglevel.isdigit() else args.loglevel.upper(),
    )

    # Read config generated by configure.
    config = configparser.ConfigParser()
    configfile = os.path.abspath(os.path.dirname(__file__)) + "/../config.ini"
    # Use a context manager so the file handle is closed deterministically.
    with open(configfile, encoding="utf8") as config_fp:
        config.read_file(config_fp)

    if not config["components"].getboolean("ENABLE_FUZZ_BINARY"):
        logging.error("Must have fuzz executable built")
        sys.exit(1)

    src_dir = config['environment']['SRCDIR']
    build_dir = config["environment"]["BUILDDIR"]
    fuzz_bin = os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz')

    # Build list of tests
    test_list_all = parse_test_list(fuzz_bin=fuzz_bin)

    if not test_list_all:
        logging.error("No fuzz targets found")
        sys.exit(1)

    logging.debug("{} fuzz target(s) found: {}".format(len(test_list_all), " ".join(sorted(test_list_all))))

    args.target = args.target or test_list_all  # By default run all
    test_list_error = list(set(args.target).difference(set(test_list_all)))
    if test_list_error:
        logging.error("Unknown fuzz targets selected: {}".format(test_list_error))
    test_list_selection = list(set(test_list_all).intersection(set(args.target)))

    if args.exclude:
        for excluded_target in args.exclude.split(","):
            if excluded_target not in test_list_selection:
                logging.error("Target \"{}\" not found in current target list.".format(excluded_target))
                continue
            test_list_selection.remove(excluded_target)
    test_list_selection.sort()

    logging.info("{} of {} detected fuzz target(s) selected: {}".format(len(test_list_selection), len(test_list_all), " ".join(test_list_selection)))

    if not test_list_selection:
        # The -help probe below needs test_list_selection[0]; stop with a
        # clear error instead of failing later with an IndexError.
        logging.error("No fuzz targets selected")
        sys.exit(1)

    if not args.generate:
        test_list_missing_corpus = []
        for t in test_list_selection:
            corpus_path = os.path.join(args.corpus_dir, t)
            if not os.path.exists(corpus_path) or not os.listdir(corpus_path):
                test_list_missing_corpus.append(t)
        test_list_missing_corpus.sort()
        if test_list_missing_corpus:
            logging.info(
                "Fuzzing harnesses lacking a corpus: {}".format(
                    " ".join(test_list_missing_corpus)
                )
            )
            logging.info("Please consider adding a fuzz corpus at https://github.com/bitcoin-core/qa-assets")

    # Probe the binary: the help text written to stderr mentions
    # "libFuzzer" when the binary is linked against it.
    try:
        help_output = subprocess.run(
            args=[
                fuzz_bin,
                '-help=1',
            ],
            env=get_fuzz_env(target=test_list_selection[0], source_dir=src_dir),
            timeout=20,
            check=False,
            stderr=subprocess.PIPE,
            text=True,
        ).stderr
    except subprocess.TimeoutExpired:
        logging.error("subprocess timed out: Currently only libFuzzer is supported")
        sys.exit(1)

    using_libfuzzer = "libFuzzer" in help_output
    if (args.generate or args.m_dir) and not using_libfuzzer:
        logging.error("Must be built with libFuzzer")
        sys.exit(1)

    with ThreadPoolExecutor(max_workers=args.par) as fuzz_pool:
        if args.generate:
            return generate_corpus(
                fuzz_pool=fuzz_pool,
                src_dir=src_dir,
                build_dir=build_dir,
                corpus_dir=args.corpus_dir,
                targets=test_list_selection,
            )

        if args.m_dir:
            merge_inputs(
                fuzz_pool=fuzz_pool,
                corpus=args.corpus_dir,
                test_list=test_list_selection,
                src_dir=src_dir,
                build_dir=build_dir,
                merge_dir=args.m_dir,
            )
            return

        run_once(
            fuzz_pool=fuzz_pool,
            corpus=args.corpus_dir,
            test_list=test_list_selection,
            src_dir=src_dir,
            build_dir=build_dir,
            using_libfuzzer=using_libfuzzer,
            use_valgrind=args.valgrind,
            empty_min_time=args.empty_min_time,
        )
2019-01-16 11:49:01 -05:00
2021-03-08 15:40:17 +01:00
def generate_corpus(*, fuzz_pool, src_dir, build_dir, corpus_dir, targets):
    """Generates new corpus.

    Run {targets} without input, and outputs the generated corpus to
    {corpus_dir}.

    The generic "rpc" target, when selected, is replaced by one job per
    command listed in RPC_COMMANDS_SAFE_FOR_FUZZING in
    src/test/fuzz/rpc.cpp; each such job runs the "rpc" target with
    LIMIT_TO_RPC_COMMAND set to that command.

    Args:
        fuzz_pool: executor whose ``submit`` is used to run the jobs.
        src_dir: source tree root (used for sanitizer suppressions and
            for locating rpc.cpp).
        build_dir: build tree root containing ``src/test/fuzz/fuzz``.
        corpus_dir: ``pathlib.Path`` below which one folder per target is
            created.
        targets: list of target names; it is not modified.

    Raises:
        subprocess.CalledProcessError: if ``git grep`` or any fuzz run
            exits with a non-zero status.
    """
    logging.info("Generating corpus to {}".format(corpus_dir))
    rpc_target = "rpc"
    # Work on a copy so the caller's list is left untouched.
    plain_targets = list(targets)
    has_rpc = rpc_target in plain_targets
    if has_rpc:
        plain_targets.remove(rpc_target)
    target_envs = [(t, {}) for t in plain_targets]
    if has_rpc:
        # Run from src_dir with a relative pathspec: git grep prints paths
        # relative to the working directory, so the prefix matched below is
        # stable no matter where this script was started from.
        lines = subprocess.run(
            ["git", "grep", "--function-context", "RPC_COMMANDS_SAFE_FOR_FUZZING{", "--", "src/test/fuzz/rpc.cpp"],
            check=True,
            stdout=subprocess.PIPE,
            text=True,
            cwd=src_dir,
        ).stdout.splitlines()
        # Context lines are printed as "<path>-<source line>". Keep those
        # whose source text starts (after indentation) with a double quote
        # and extract the quoted command name.
        context_prefix = "src/test/fuzz/rpc.cpp-"
        rpc_commands = []
        for line in lines:
            if not line.startswith(context_prefix):
                continue
            entry = line[len(context_prefix):].lstrip()
            if entry.startswith("\""):
                rpc_commands.append(entry.split("\"", 2)[1])
        target_envs += [(rpc_target, {"LIMIT_TO_RPC_COMMAND": r}) for r in rpc_commands]

    def job(command, t, t_env):
        logging.debug(f"Running '{command}'")
        logging.debug("Command '{}' output:\n'{}'\n".format(
            command,
            subprocess.run(
                command,
                env={
                    **t_env,
                    **get_fuzz_env(target=t, source_dir=src_dir),
                },
                check=True,
                stderr=subprocess.PIPE,
                text=True,
            ).stderr,
        ))

    fuzz_bin = os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz')
    futures = []
    for target, t_env in target_envs:
        target_corpus_dir = corpus_dir / target
        os.makedirs(target_corpus_dir, exist_ok=True)
        command = [
            fuzz_bin,
            "-runs=100000",
            target_corpus_dir,
        ]
        futures.append(fuzz_pool.submit(job, command, target, t_env))

    # Propagate the first failure, if any.
    for future in as_completed(futures):
        future.result()
2021-01-26 10:44:32 +01:00
def merge_inputs(*, fuzz_pool, corpus, test_list, src_dir, build_dir, merge_dir):
    """Merge the inputs found below ``merge_dir`` into ``corpus``, per target.

    For every name in ``test_list`` the per-target folders in both
    directories are created if missing, and the fuzz binary is submitted to
    ``fuzz_pool`` with ``-merge=1``. The call blocks until all merges have
    finished; a non-zero exit status surfaces as
    ``subprocess.CalledProcessError``.
    """
    logging.info("Merge the inputs from the passed dir into the corpus_dir. Passed dir {}".format(merge_dir))
    fuzz_bin = os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz')

    def run_merge(name, cmd):
        # Log the command line followed by whatever the binary wrote to stderr.
        banner = 'Run {} with args {}\n'.format(name, " ".join(cmd))
        completed = subprocess.run(
            cmd,
            env=get_fuzz_env(target=name, source_dir=src_dir),
            check=True,
            stderr=subprocess.PIPE,
            text=True,
        )
        logging.debug(banner + completed.stderr)

    pending = []
    for name in test_list:
        target_corpus = os.path.join(corpus, name)
        target_merge = os.path.join(merge_dir, name)
        cmd = [
            fuzz_bin,
            '-merge=1',
            '-shuffle=0',
            '-prefer_small=1',
            '-use_value_profile=1',  # Also done by oss-fuzz https://github.com/google/oss-fuzz/issues/1406#issuecomment-387790487
            target_corpus,
            target_merge,
        ]
        os.makedirs(target_corpus, exist_ok=True)
        os.makedirs(target_merge, exist_ok=True)
        pending.append(fuzz_pool.submit(run_merge, name, cmd))

    for done in as_completed(pending):
        done.result()
2019-02-19 15:46:29 -05:00
2020-04-17 15:44:29 -04:00
2023-06-22 11:49:28 +02:00
def run_once(*, fuzz_pool, corpus, test_list, src_dir, build_dir, using_libfuzzer, use_valgrind, empty_min_time):
    """Run every target in ``test_list`` once over its corpus folder.

    The per-target folder below ``corpus`` (a ``pathlib.Path``) is created
    if missing. With libFuzzer, an empty folder combined with a truthy
    ``empty_min_time`` runs with ``-max_total_time`` instead of replaying
    the folder. ``use_valgrind`` prefixes the command with valgrind.

    The first target seen to exit with a non-zero status is logged and the
    process exits with status 1.
    """
    fuzz_bin = os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz')

    def run_target(name, cmd):
        # Return the log text (command plus captured stderr) and the result.
        log_text = 'Run {} with args {}'.format(name, cmd)
        completed = subprocess.run(
            cmd,
            env=get_fuzz_env(target=name, source_dir=src_dir),
            stderr=subprocess.PIPE,
            text=True,
        )
        return log_text + completed.stderr, completed

    pending = []
    for name in test_list:
        corpus_path = corpus / name
        os.makedirs(corpus_path, exist_ok=True)
        corpus_is_empty = not any(corpus_path.iterdir())

        if not using_libfuzzer:
            extra = [corpus_path]
        elif empty_min_time and corpus_is_empty:
            extra = [f"-max_total_time={empty_min_time}"]
        else:
            extra = ["-runs=1", corpus_path]
        cmd = [fuzz_bin] + extra

        if use_valgrind:
            cmd = ['valgrind', '--quiet', '--error-exitcode=1'] + cmd

        pending.append(fuzz_pool.submit(run_target, name, cmd))

    for done in as_completed(pending):
        output, result = done.result()
        logging.debug(output)
        if result.returncode:
            if result.stdout:
                logging.info(result.stdout)
            if result.stderr:
                logging.info(result.stderr)
            logging.info(f"Target {result.args} failed with exit code {result.returncode}")
            sys.exit(1)
2019-01-16 11:49:01 -05:00
2020-12-03 16:42:49 +01:00
def parse_test_list(*, fuzz_bin):
    """Return the stdout lines printed by ``fuzz_bin`` in listing mode.

    The binary is started with ``PRINT_ALL_FUZZ_TARGETS_AND_ABORT`` as the
    only environment variable; stderr is discarded and the exit status is
    not checked. Presumably each output line is one fuzz target name.
    """
    listing_env = {'PRINT_ALL_FUZZ_TARGETS_AND_ABORT': ''}
    completed = subprocess.run(
        fuzz_bin,
        env=listing_env,
        stdout=subprocess.PIPE,
        stderr=subprocess.DEVNULL,
        text=True,
    )
    return completed.stdout.splitlines()
# Only run the test runner when executed as a script, not on import.
if __name__ == "__main__":
    main()