2019-01-16 17:49:01 +01:00
#!/usr/bin/env python3
2023-08-16 19:27:31 +02:00
# Copyright (c) 2019-2020 The Bitcoin Core developers
2019-01-16 17:49:01 +01:00
# Distributed under the MIT software license, see the accompanying
# file COPYING or http://www.opensource.org/licenses/mit-license.php.
""" Run fuzz test targets.
"""
2020-04-17 21:44:29 +02:00
from concurrent . futures import ThreadPoolExecutor , as_completed
2019-01-16 17:49:01 +01:00
import argparse
import configparser
2020-04-17 21:44:29 +02:00
import logging
2019-01-16 17:49:01 +01:00
import os
2024-02-27 10:03:11 +01:00
import random
2019-01-16 17:49:01 +01:00
import subprocess
2020-04-17 21:44:29 +02:00
import sys
2019-01-16 17:49:01 +01:00
2021-01-29 07:43:05 +01:00
def get_fuzz_env(*, target, source_dir):
    """Return the environment mapping used when spawning the fuzz binary.

    The returned dict is passed as ``env=`` to ``subprocess.run`` by the
    callers in this file, so it replaces (rather than extends) the parent
    environment.

    Args:
        target: Name of the fuzz target, exported through ``FUZZ``.
        source_dir: Root of the source tree; used to locate the UBSan
            suppressions file.

    Returns:
        A dict with the ``FUZZ``, ``UBSAN_OPTIONS`` and ``ASAN_OPTIONS``
        variables.
    """
    return {
        'FUZZ': target,
        'UBSAN_OPTIONS':
            f'suppressions={source_dir}/test/sanitizer_suppressions/ubsan:print_stacktrace=1:halt_on_error=1:report_error_type=1',
        'ASAN_OPTIONS':  # symbolizer disabled due to https://github.com/google/sanitizers/issues/1364#issuecomment-761072085
            'symbolize=0:detect_stack_use_after_return=1:check_initialization_order=1:strict_init_order=1',
    }
2019-01-16 17:49:01 +01:00
def main():
    """Parse the command line and run, merge or generate fuzz corpora.

    Steps, in order:
      1. Parse arguments and configure logging.
      2. Read ``config.ini`` (located one directory above this file) and
         require ``ENABLE_FUZZ``.
      3. Ask the fuzz binary for the list of targets and narrow it down by
         the positional ``target`` arguments and ``--exclude``.
      4. Unless generating, report selected targets that have no corpus.
      5. Check that the binary's ``-help=1`` output mentions libFuzzer.
      6. Dispatch to ``generate_corpus``, ``merge_inputs`` or ``run_once``
         on a thread pool of ``--par`` workers.

    Exits the process with status 1 on configuration errors, when no target
    remains selected, or when the binary does not look like a libFuzzer
    build.
    """
    parser = argparse.ArgumentParser(
        formatter_class=argparse.ArgumentDefaultsHelpFormatter,
        description='''Run the fuzz targets with all inputs from the corpus_dir once.''',
    )
    parser.add_argument(
        "-l",
        "--loglevel",
        dest="loglevel",
        default="INFO",
        help="log events at this level and higher to the console. Can be set to DEBUG, INFO, WARNING, ERROR or CRITICAL. Passing --loglevel DEBUG will output all logs to console.",
    )
    parser.add_argument(
        '--valgrind',
        action='store_true',
        help='If true, run fuzzing binaries under the valgrind memory error detector',
    )
    parser.add_argument(
        '-x',
        '--exclude',
        help="A comma-separated list of targets to exclude",
    )
    parser.add_argument(
        '--par',
        '-j',
        type=int,
        default=4,
        help='How many targets to merge or execute in parallel.',
    )
    parser.add_argument(
        'corpus_dir',
        help='The corpus to run on (must contain subfolders for each fuzz target).',
    )
    parser.add_argument(
        'target',
        nargs='*',
        help='The target(s) to run. Default is to run all targets.',
    )
    parser.add_argument(
        '--m_dir',
        help='Merge inputs from this directory into the corpus_dir.',
    )
    parser.add_argument(
        '-g',
        '--generate',
        action='store_true',
        help='Create new corpus (or extend the existing ones) by running'
             ' the given targets for a finite number of times. Outputs them to'
             ' the passed corpus_dir.'
    )

    args = parser.parse_args()

    # Set up logging. A purely numeric level is passed through as an int,
    # anything else is treated as a level name.
    logging.basicConfig(
        format='%(message)s',
        level=int(args.loglevel) if args.loglevel.isdigit() else args.loglevel.upper(),
    )

    # Read config generated by configure.
    config = configparser.ConfigParser()
    configfile = os.path.abspath(os.path.dirname(__file__)) + "/../config.ini"
    # Use a context manager so the file handle is closed deterministically.
    with open(configfile, encoding="utf8") as config_fp:
        config.read_file(config_fp)

    if not config["components"].getboolean("ENABLE_FUZZ"):
        logging.error("Must have fuzz targets built")
        sys.exit(1)

    src_dir = config['environment']['SRCDIR']
    build_dir = config["environment"]["BUILDDIR"]
    fuzz_bin = os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz')

    # Build list of tests
    test_list_all = parse_test_list(
        fuzz_bin=fuzz_bin,
        source_dir=src_dir,
    )

    if not test_list_all:
        logging.error("No fuzz targets found")
        sys.exit(1)

    logging.debug("{} fuzz target(s) found: {}".format(len(test_list_all), " ".join(sorted(test_list_all))))

    args.target = args.target or test_list_all  # By default run all
    test_list_error = list(set(args.target).difference(set(test_list_all)))
    if test_list_error:
        logging.error("Unknown fuzz targets selected: {}".format(test_list_error))
    test_list_selection = list(set(test_list_all).intersection(set(args.target)))
    if not test_list_selection:
        logging.error("No fuzz targets selected")
        # Nothing to do; continuing would fail later on test_list_selection[0].
        sys.exit(1)

    if args.exclude:
        for excluded_target in args.exclude.split(","):
            if excluded_target not in test_list_selection:
                logging.error("Target \"{}\" not found in current target list.".format(excluded_target))
                continue
            test_list_selection.remove(excluded_target)
        if not test_list_selection:
            # Every selected target was excluded.
            logging.error("No fuzz targets selected")
            sys.exit(1)
    test_list_selection.sort()

    logging.info("{} of {} detected fuzz target(s) selected: {}".format(len(test_list_selection), len(test_list_all), " ".join(test_list_selection)))

    if not args.generate:
        # Collect the selected targets whose corpus folder is missing or empty.
        test_list_missing_corpus = []
        for t in test_list_selection:
            corpus_path = os.path.join(args.corpus_dir, t)
            if not os.path.exists(corpus_path) or len(os.listdir(corpus_path)) == 0:
                test_list_missing_corpus.append(t)
        test_list_missing_corpus.sort()
        if test_list_missing_corpus:
            logging.info(
                "Fuzzing harnesses lacking a corpus: {}".format(
                    " ".join(test_list_missing_corpus)
                )
            )
            logging.info("Please consider adding a fuzz corpus at https://github.com/bitcoin-core/qa-assets")

    # The help text is read from stderr and must mention libFuzzer.
    try:
        help_output = subprocess.run(
            args=[
                fuzz_bin,
                '-help=1',
            ],
            env=get_fuzz_env(target=test_list_selection[0], source_dir=src_dir),
            timeout=20,
            check=True,
            stderr=subprocess.PIPE,
            universal_newlines=True,
        ).stderr
        if "libFuzzer" not in help_output:
            logging.error("Must be built with libFuzzer")
            sys.exit(1)
    except subprocess.TimeoutExpired:
        logging.error("subprocess timed out: Currently only libFuzzer is supported")
        sys.exit(1)

    with ThreadPoolExecutor(max_workers=args.par) as fuzz_pool:
        if args.generate:
            return generate_corpus(
                fuzz_pool=fuzz_pool,
                src_dir=src_dir,
                build_dir=build_dir,
                corpus_dir=args.corpus_dir,
                targets=test_list_selection,
            )

        if args.m_dir:
            merge_inputs(
                fuzz_pool=fuzz_pool,
                corpus=args.corpus_dir,
                test_list=test_list_selection,
                src_dir=src_dir,
                build_dir=build_dir,
                merge_dir=args.m_dir,
            )
            return

        run_once(
            fuzz_pool=fuzz_pool,
            corpus=args.corpus_dir,
            test_list=test_list_selection,
            src_dir=src_dir,
            build_dir=build_dir,
            use_valgrind=args.valgrind,
        )
2019-01-16 17:49:01 +01:00
2021-03-10 07:32:07 +01:00
def generate_corpus(*, fuzz_pool, src_dir, build_dir, corpus_dir, targets):
    """Generates new corpus.

    Run {targets} without input, and outputs the generated corpus to
    {corpus_dir}.

    Args:
        fuzz_pool: Executor-like object; one job per target is submitted to it.
        src_dir: Source tree root, forwarded to ``get_fuzz_env``.
        build_dir: Build tree root; the fuzz binary is looked up at
            ``<build_dir>/src/test/fuzz/fuzz``.
        corpus_dir: Directory receiving one sub-directory per target.
        targets: Iterable of fuzz target names.

    Raises:
        subprocess.CalledProcessError: re-raised from a job whose fuzz
            process exited with a non-zero status (``check=True``).
    """
    logging.info("Generating corpus to {}".format(corpus_dir))

    def job(command, t):
        logging.debug("Running '{}'\n".format(" ".join(command)))
        logging.debug("Command '{}' output:\n'{}'\n".format(
            ' '.join(command),
            subprocess.run(
                command,
                env=get_fuzz_env(target=t, source_dir=src_dir),
                check=True,
                stderr=subprocess.PIPE,
                universal_newlines=True,
            ).stderr))

    futures = []
    for target in targets:
        target_corpus_dir = os.path.join(corpus_dir, target)
        os.makedirs(target_corpus_dir, exist_ok=True)
        # Enable the value profile for roughly 30% of the runs.
        use_value_profile = int(random.random() < .3)
        command = [
            os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz'),
            "-rss_limit_mb=8000",
            "-max_total_time=6000",
            "-reload=0",
            f"-use_value_profile={use_value_profile}",
            target_corpus_dir,
        ]
        futures.append(fuzz_pool.submit(job, command, target))

    # Calling result() surfaces any exception raised inside a job.
    for future in as_completed(futures):
        future.result()
2021-01-29 07:43:05 +01:00
def merge_inputs(*, fuzz_pool, corpus, test_list, src_dir, build_dir, merge_dir):
    """Merge inputs found under ``merge_dir`` into ``corpus``, per target.

    For every target the fuzz binary is invoked with ``-merge=1`` on the
    pair ``<corpus>/<target>`` and ``<merge_dir>/<target>``; both
    directories are created if missing.

    Args:
        fuzz_pool: Executor-like object; one job per target is submitted to it.
        corpus: Root directory of the corpus that receives the inputs.
        test_list: Iterable of fuzz target names.
        src_dir: Source tree root, forwarded to ``get_fuzz_env``.
        build_dir: Build tree root; the fuzz binary is looked up at
            ``<build_dir>/src/test/fuzz/fuzz``.
        merge_dir: Root directory holding the inputs to merge.

    Raises:
        subprocess.CalledProcessError: re-raised from a job whose fuzz
            process exited with a non-zero status (``check=True``).
    """
    logging.info("Merge the inputs from the passed dir into the corpus_dir. Passed dir {}".format(merge_dir))

    # Defined once; the target and its command line are passed explicitly.
    def job(t, args):
        output = 'Run {} with args {}\n'.format(t, " ".join(args))
        output += subprocess.run(
            args,
            env=get_fuzz_env(target=t, source_dir=src_dir),
            check=True,
            stderr=subprocess.PIPE,
            universal_newlines=True,
        ).stderr
        logging.debug(output)

    jobs = []
    for t in test_list:
        args = [
            os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz'),
            '-merge=1',
            '-shuffle=0',
            '-prefer_small=1',
            '-use_value_profile=1',  # Also done by oss-fuzz https://github.com/google/oss-fuzz/issues/1406#issuecomment-387790487
            os.path.join(corpus, t),
            os.path.join(merge_dir, t),
        ]
        os.makedirs(os.path.join(corpus, t), exist_ok=True)
        os.makedirs(os.path.join(merge_dir, t), exist_ok=True)
        jobs.append(fuzz_pool.submit(job, t, args))

    # Calling result() surfaces any exception raised inside a job.
    for future in as_completed(jobs):
        future.result()
2020-03-09 16:21:27 +01:00
2020-04-17 21:44:29 +02:00
2021-01-29 07:43:05 +01:00
def run_once(*, fuzz_pool, corpus, test_list, src_dir, build_dir, use_valgrind):
    """Run every target once over its corpus and stop on the first failure.

    For each target the fuzz binary is invoked with ``-runs=1`` on
    ``<corpus>/<target>`` (created if missing), optionally wrapped in
    valgrind. Results are inspected as the jobs complete.

    Args:
        fuzz_pool: Executor-like object; one job per target is submitted to it.
        corpus: Root directory of the corpus.
        test_list: Iterable of fuzz target names.
        src_dir: Source tree root, forwarded to ``get_fuzz_env``.
        build_dir: Build tree root; the fuzz binary is looked up at
            ``<build_dir>/src/test/fuzz/fuzz``.
        use_valgrind: If true, prefix the command with
            ``valgrind --quiet --error-exitcode=1``.

    Exits the process with status 1 as soon as a completed job reports a
    non-zero return code.
    """
    # Defined once; returns the result instead of raising so that the caller
    # can log the captured output before deciding to exit.
    def job(t, args):
        output = 'Run {} with args {}'.format(t, args)
        result = subprocess.run(
            args,
            env=get_fuzz_env(target=t, source_dir=src_dir),
            stderr=subprocess.PIPE,
            universal_newlines=True,
        )
        output += result.stderr
        return output, result

    jobs = []
    for t in test_list:
        corpus_path = os.path.join(corpus, t)
        os.makedirs(corpus_path, exist_ok=True)
        args = [
            os.path.join(build_dir, 'src', 'test', 'fuzz', 'fuzz'),
            '-runs=1',
            corpus_path,
        ]
        if use_valgrind:
            args = ['valgrind', '--quiet', '--error-exitcode=1'] + args
        jobs.append(fuzz_pool.submit(job, t, args))

    for future in as_completed(jobs):
        output, result = future.result()
        logging.debug(output)
        try:
            result.check_returncode()
        except subprocess.CalledProcessError as e:
            if e.stdout:
                logging.info(e.stdout)
            if e.stderr:
                logging.info(e.stderr)
            # Report the command of the job that actually failed. The loop
            # variables above only hold the last submitted target by now.
            logging.info("Target \"{}\" failed with exit code {}".format(" ".join(result.args), e.returncode))
            sys.exit(1)
2019-01-16 17:49:01 +01:00
2024-03-08 11:13:09 +01:00
def parse_test_list(*, fuzz_bin, source_dir):
    """Return the fuzz target names printed by the fuzz binary.

    The binary is run with ``PRINT_ALL_FUZZ_TARGETS_AND_ABORT`` set (to an
    empty value) in addition to the usual fuzz environment; its stdout is
    split into lines, one entry per line. stderr is discarded and the exit
    status is not checked.

    Args:
        fuzz_bin: Path of the fuzz binary to execute.
        source_dir: Source tree root, forwarded to ``get_fuzz_env``.

    Returns:
        List of the lines written to stdout.
    """
    test_list_all = subprocess.run(
        fuzz_bin,
        env={
            'PRINT_ALL_FUZZ_TARGETS_AND_ABORT': '',
            **get_fuzz_env(target="", source_dir=source_dir)
        },
        stdout=subprocess.PIPE,
        stderr=subprocess.DEVNULL,
        universal_newlines=True,
    ).stdout.splitlines()
    return test_list_all
# Run the test runner only when executed as a script, not when imported.
if __name__ == '__main__':
    main()