name: Fuzz and run valgrind on: push: branches: - master pull_request: schedule: - cron: 23 */8 * * * jobs: build: runs-on: ubuntu-latest env: # fuzzers that use the default implementation defaultimplfuzzers: atpointer dump dump_raw_tape minify parser print_json # fuzzers that loop over the implementations themselves implfuzzers: implementations minifyimpl utf8 implementations: haswell westmere fallback UBSAN_OPTIONS: halt_on_error=1 MAXLEN: -max_len=4000 steps: - name: Install packages necessary for building run: | sudo apt update sudo apt-get install --quiet ninja-build valgrind zip unzip wget https://apt.llvm.org/llvm.sh chmod +x llvm.sh sudo ./llvm.sh 10 - uses: actions/checkout@v1 - name: Create and prepare the initial seed corpus run: | fuzz/build_corpus.sh mv corpus.zip seed_corpus.zip mkdir seedcorpus unzip -q -d seedcorpus seed_corpus.zip - name: Download the corpus from the last run run: | wget --quiet https://dl.bintray.com/pauldreik/simdjson-fuzz-corpus/corpus/corpus.tar tar xf corpus.tar rm corpus.tar - name: List clang versions run: | ls /usr/bin/clang* which clang++ clang++ --version - name: Build all the variants run: fuzz/build_fuzzer_variants.sh - name: Explore fast (release build, default implementation) run: | set -eux for fuzzer in $defaultimplfuzzers $implfuzzers; do mkdir -p out/$fuzzer # in case this is a new fuzzer, or corpus.tar is broken # get input from everyone else (corpus cross pollination) others=$(find out -type d -not -name $fuzzer -not -name out -not -name cmin) build-fast/fuzz/fuzz_$fuzzer out/$fuzzer $others seedcorpus -max_total_time=30 $MAXLEN done - name: Fuzz default impl. fuzzers with sanitizer+asserts (good at detecting errors) run: | set -eux for fuzzer in $defaultimplfuzzers; do # get input from everyone else (corpus cross pollination) others=$(find out -type d -not -name $fuzzer -not -name out -not -name cmin) for implementation in $implementations; do export SIMDJSON_FORCE_IMPLEMENTATION=$implementation build-sanitizers/fuzz/fuzz_$fuzzer out/$fuzzer $others seedcorpus -max_total_time=20 $MAXLEN done echo now have $(ls out/$fuzzer |wc -l) files in corpus done - name: Fuzz differential impl. fuzzers with sanitizer+asserts (good at detecting errors) run: | set -eux for fuzzer in $implfuzzers; do # get input from everyone else (corpus cross pollination) others=$(find out -type d -not -name $fuzzer -not -name out -not -name cmin) build-sanitizers/fuzz/fuzz_$fuzzer out/$fuzzer $others seedcorpus -max_total_time=20 $MAXLEN echo now have $(ls out/$fuzzer |wc -l) files in corpus done - name: Minimize the corpus with the fast fuzzer on the default implementation run: | set -eux for fuzzer in $defaultimplfuzzers $implfuzzers; do mkdir -p out/cmin/$fuzzer # get input from everyone else (corpus cross pollination) others=$(find out -type d -not -name $fuzzer -not -name out -not -name cmin) build-fast/fuzz/fuzz_$fuzzer -merge=1 $MAXLEN out/cmin/$fuzzer out/$fuzzer $others seedcorpus rm -rf out/$fuzzer mv out/cmin/$fuzzer out/$fuzzer done - name: Package the corpus into an artifact run: | for fuzzer in $allfuzzers; do tar rf corpus.tar out/$fuzzer done - name: Save the corpus as a github artifact uses: actions/upload-artifact@v2 with: name: corpus path: corpus.tar # This takes a subset of the minimized corpus and run it through valgrind. It is slow, # therefore take a "random" subset. The random selection is accomplished by sorting on filenames, # which are hashes of the content. - name: Run some of the minimized corpus through valgrind (replay build, default implementation) run: | for fuzzer in $defaultimplfuzzers $implfuzzers; do find out/$fuzzer -type f |sort|head -n200|xargs -n40 valgrind build-replay/fuzz/fuzz_$fuzzer 2>&1|tee valgrind-$fuzzer.txt done - name: Compress the valgrind output run: tar cf valgrind.tar valgrind-*.txt - name: Save valgrind output as a github artifact uses: actions/upload-artifact@v2 if: always() with: name: valgrindresults path: valgrind.tar if-no-files-found: ignore - name: Upload the corpus and results to bintray if we are on master if: ${{ github.event_name == 'schedule' }} run: | echo uploading each artifact twice, otherwise it will not be published curl -T corpus.tar -upauldreik:${{ secrets.bintrayApiKey }} https://api.bintray.com/content/pauldreik/simdjson-fuzz-corpus/corpus/0/corpus/corpus.tar";publish=1;override=1" curl -T corpus.tar -upauldreik:${{ secrets.bintrayApiKey }} https://api.bintray.com/content/pauldreik/simdjson-fuzz-corpus/corpus/0/corpus/corpus.tar";publish=1;override=1" curl -T valgrind.tar -upauldreik:${{ secrets.bintrayApiKey }} https://api.bintray.com/content/pauldreik/simdjson-fuzz-corpus/corpus/0/corpus/valgrind.tar";publish=1;override=1" curl -T valgrind.tar -upauldreik:${{ secrets.bintrayApiKey }} https://api.bintray.com/content/pauldreik/simdjson-fuzz-corpus/corpus/0/corpus/valgrind.tar";publish=1;override=1" - name: Archive any crashes as an artifact uses: actions/upload-artifact@v2 if: always() with: name: crashes path: | crash-* leak-* timeout-* if-no-files-found: ignore