[sledge] Test: Update test infra

Summary: To support: - html report generation via sexp reports (instead of RESULT in stdout) - smt2 benchmarks - local and extra-repo tests - calculation of relative paths to tests Reviewed By: ngorogiannis Differential Revision: D23459514 fbshipit-source-id: f44e51c17
5 years ago · d87d8f7ef2
parent 4c52102882
commit d87d8f7ef2
20 changed files with 223 additions and 18860 deletions
--- a/sledge/.gitignore
+++ b/sledge/.gitignore
@ -2,9 +2,11 @@
 .llvm_install
 /llvm/
 /test/**/*.bc
-/test/**/*.bc.err
+/test/**/*.err
-/test/**/*.bc.out
+/test/**/*.out
-/test/**/*.ll.err
+/test/**/*.sexp
-/test/**/*.ll.out
+/test/*.html
-/test/report.current
+/test/*.sexp
 /test/extra
 /test/local
 _build
--- a/sledge/test/Makefile
+++ b/sledge/test/Makefile
@ -7,18 +7,23 @@
 CLANG_ARGS?=-O0
 # executable to test
-SLEDGE_EXE=$(CURDIR)/../_build/_install/debug/bin/sledge
+SLEDGE_DBG=$(CURDIR)/../_build/debug/bin/sledge_cli.exe
 SLEDGE_OPT=$(CURDIR)/../_build/release/bin/sledge_cli.exe
 # additional arguments to pass to sledge
 SLEDGE_ARGS?=
 # limits for each test run
-TIMEOUT?=30
+TIMEOUT?=90
 MEMOUT?=4096
-SLEDGE=./wrap.sh $(TIMEOUT) $(MEMOUT) $(SLEDGE_EXE)
+sledge_dbg=./wrap.sh $(TIMEOUT) $(MEMOUT) $(SLEDGE_DBG)
 sledge_opt=./wrap.sh $(TIMEOUT) $(MEMOUT) $(SLEDGE_OPT)
-DIFF?=diff
+sledge_report=$(CURDIR)/../_build/debug/report/sledge_report.exe
 # which utilities to use
 diff?=patdiff
 # configure the non-host llvm and clang
 export PATH := $(CURDIR)/../.llvm_install/sledge/bin:$(PATH)
@ -28,130 +33,220 @@ export LANG := C
 default: test
 # all analyze tests
 translate:
 	@find -L llvm -name '*.ll' -or -name '*.bc' \
 	 | parallel --bar $(SLEDGE) llvm translate -no-models -no-internalize $(SLEDGE_ARGS)
 _translate-report-raw:
 	@find -L llvm -name '*.out' \
 	 | xargs grep "RESULT:" \
 	 | sed 's/\.out:/:	/' | sort | sort -s -t':' -k 3,4
 # report all results
 translate-report-full:
 	@$(MAKE) --silent _translate-report-raw | column -ts$$'\t'
 # report all errors
 translate-report-errors:
 	@$(MAKE) --silent _translate-report-raw \
 	 | grep -E -v "RESULT: (Success|Invalid input)" \
 	 | column -ts$$'\t'
 # report errors
 translate-report:
 	@$(MAKE) --silent _translate-report-raw \
 	 | grep -E -v "RESULT: Unimplemented" \
 	 | grep -E -v "RESULT: (Success|Invalid input)" \
 	 | column -ts$$'\t'
 Buckets:=\
  "Invalid input"\
  "Success"\
  "Unimplemented: ConstantAggregateZero of size 0"\
  "Unimplemented: call null"\
  "Unimplemented: coroutines"\
  "Unimplemented: ifuncs"\
  "Unimplemented: inline asm"\
  "Unimplemented: landingpad of type"\
  "Unimplemented: non-integral pointer types"\
  "Unimplemented: opcode kind in call instruction"\
  "Unimplemented: operand kind in call instruction"\
  "Unimplemented: size_of"\
  "Unimplemented: statepoints"\
  "Unimplemented: unsized non-opaque aggregate types"\
  "Unimplemented: vector operations"\
  "Unimplemented: windows exception handling"\
  "segmentation violation"
 report-summary:
 	for b in $(Buckets); do (printf "$$b\t"; grep -E "$$b" report.expected | wc -l); done | sort -t$$'\t' -k 2 -n -r | column -ts$$'\t'
 # compile c to llvm bitcode
 %.bc : %.c
-	@(cd $(dir $*) && clang -g -c -emit-llvm $(CLANG_ARGS) $(notdir $*).c -o $(notdir $*).bc)
+	@(cd $(dir $*) && clang -g -c -emit-llvm -include $(CURDIR)/../model/llair_intrinsics.h -Wno-main-return-type $(CLANG_ARGS) $(notdir $*).c -o $(notdir $*).bc)
 # compile c++ to llvm bitcode
 %.bc : %.cpp
 	@(cd $(dir $*) && clang++ -g -c -emit-llvm $(CLANG_ARGS) $(notdir $*).cpp -o $(notdir $*).bc)
 %.llair : %.bc
-	$(SLEDGE_EXE) llvm translate $< -llair-output $@
+	$(SLEDGE_DBG) llvm translate $< -llair-output $@
 %.llair.txt : %.llair
-	$(SLEDGE_EXE) disassemble $< -llair-txt-output $@
+	$(SLEDGE_DBG) disassemble $< -llair-txt-output $@
 # code to test sledge translate
 TranslateCs:=$(shell find -L {,local/}translate -name '*.c' 2>/dev/null)
 TranslateCPPs:=$(shell find -L {,local/}translate -name '*.cpp' 2>/dev/null)
 TranslateGenBCs:=$(patsubst %.c,%.bc,$(TranslateCs)) $(patsubst %.cpp,%.bc,$(TranslateCPPs))
 TranslateBCs:=$(TranslateGenBCs) $(shell find -L extra/translate -name '*.bc' 2>/dev/null)
 TranslateLLs:=$(shell find -L {,local/}translate -name '*.ll' 2>/dev/null)
 TranslateTests:=$(TranslateBCs) $(TranslateLLs)
 # code to test sledge analyze
 AnalyzeCs:=$(shell find -L {,local/}analyze -name '*.c' 2>/dev/null)
 AnalyzeCPPs:=$(shell find -L {,local/}analyze -name '*.cpp' 2>/dev/null)
 AnalyzeGenBCs:=$(patsubst %.c,%.bc,$(AnalyzeCs)) $(patsubst %.cpp,%.bc,$(AnalyzeCPPs))
 AnalyzeBCs:=$(AnalyzeGenBCs) $(shell find -L extra/analyze -name '*.bc' 2>/dev/null)
 AnalyzeLLs:=$(shell find -L {,local/}analyze -name '*.ll' 2>/dev/null)
 AnalyzeTests:=$(AnalyzeBCs) $(AnalyzeLLs)
-# code to test analyze
+GeneratedBCs:=$(TranslateGenBCs) $(AnalyzeGenBCs)
 AnalyzeCs:=$(shell find * -not -path 'llvm/*' -name '*.c')
 AnalyzeCPPs:=$(shell find * -not -path 'llvm/*' -name '*.cpp')
-AnalyzeBCs:=$(patsubst %.c,%.bc,$(AnalyzeCs)) $(patsubst %.cpp,%.bc,$(AnalyzeCPPs))
+# compile all c/c++ to bc
-AnalyzeLLs:=$(shell find * -not -path 'llvm/*' -name '*.ll')
+compile: $(GeneratedBCs)
 	@if [ -d "extra" ]; then \
 	   $(MAKE) sledge=$(SLEDGE_DBG) -C extra compile; \
 	 fi
-AnalyzeTests:=$(AnalyzeBCs) $(AnalyzeLLs)
+#
 # translation (frontend) tests
 #
-# compile all c/c++ to bc
+# run sledge llvm translate tests
-compile: $(AnalyzeBCs)
+.PHONY: translate
 translate: compile
 	-@parallel --bar $(sledge_dbg) llvm disassemble -no-models -no-internalize $(SLEDGE_ARGS) ::: $(TranslateTests)
 .PHONY: translate.sexp
 translate.sexp:
 	@find -L {,local/,extra/}translate -not -path 'baseline/*' -name '*.sexp' 2>/dev/null \
 	 | xargs cat > translate.sexp
 baseline/translate.sexp: translate.sexp
 	@cp translate.sexp $@
 translate.html: translate.sexp
 	@$(sledge_report) html -baseline baseline/translate.sexp translate.sexp -output $@
 translate-status: translate.sexp
 	@$(sledge_report) status -baseline baseline/translate.sexp translate.sexp | column -ts$$'\t'
 #
 # analyze (backend) tests
 #
-# all analyze tests
+# run analyze tests
 .PHONY: analyze
 analyze: compile
-	@parallel --bar $(SLEDGE) llvm analyze $(SLEDGE_ARGS) ::: $(AnalyzeTests)
+	-@parallel --bar $(sledge_dbg) llvm analyze -bound 5 -trace Report+Control $(SLEDGE_ARGS) ::: $(AnalyzeTests)
-
+
-# run all tests and generate code coverage information
+parallel_sledge_opt=parallel --shuf --bar $(sledge_opt) llvm analyze -append-report -bound 5 $(SLEDGE_ARGS) :::
-BISECT_DIR=$(CURDIR)/../_coverage/out
+
-coverage:
+analyze-perf1: compile
-	@cd ..; dune build _build/_install/coverage/bin/sledge
+	@$(parallel_sledge_opt) $(AnalyzeTests)
-	@mkdir -p $(BISECT_DIR)
+
-	@-$(MAKE) BISECT_FILE=$(BISECT_DIR)/bisect SLEDGE_EXE=$(CURDIR)/../_build/_install/coverage/bin/sledge test -k
+analyze-perf3: compile
-	@find $(BISECT_DIR) -type f | xargs bisect-ppx-report -I ../_build/_install/coverage/ -text ../_coverage/summary.txt -html ../_coverage/
+	@$(parallel_sledge_opt) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests)
-	@echo "open ../_coverage/index.html"
+
-
+analyze-perf5: compile
-_analyze-report-raw:
+	@$(parallel_sledge_opt) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests)
-	@find * -not -path 'llvm/*' -name '*.out' \
+
-	 | xargs grep "RESULT:" \
+analyze-perf7: compile
-	 | sed 's/\.out:/:	/' | sort | sort -s -t':' -k 3,4
+	@$(parallel_sledge_opt) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests) $(AnalyzeTests)
-
+
-# report all results
+.PHONY: analyze.sexp
-analyze-report-full:
+analyze.sexp:
-	@$(MAKE) --silent _analyze-report-raw | column -ts$$'\t'
+	@find -L {,local/,extra/}analyze -not -path 'baseline/*' -name '*.sexp' 2>/dev/null \
-
+	 | xargs cat > analyze.sexp
-# list tests with zero or multiple RESULT lines
+
-report-invalid-results:
+baseline/analyze.sexp: analyze.sexp
-	@find -L * -name '*.out' -exec grep -H -c "RESULT:" {} \; \
+	@cp analyze.sexp $@
-	 | grep -v ":1$$"
+
 analyze.html: analyze.sexp
 	@$(sledge_report) html -baseline baseline/analyze.sexp analyze.sexp -output $@
 analyze-status: analyze.sexp
 	@$(sledge_report) status -baseline baseline/analyze.sexp analyze.sexp | column -ts$$'\t'
 #
 # smt tests
 #
 SmtTests:=$(shell find smt -name '*.smt2' 2>/dev/null)
 # run sledge smt tests
 .PHONY: smt
 smt:
 	-@parallel --bar $(sledge_dbg) smt $(SLEDGE_ARGS) ::: $(SmtTests)
 parallel_sledge_opt_smt=parallel --shuf --bar $(sledge_opt) smt -append-report $(SLEDGE_ARGS) :::
 smt-perf1:
 	@$(parallel_sledge_opt_smt) $(SmtTests)
 smt-perf3:
 	@$(parallel_sledge_opt_smt) $(SmtTests) $(SmtTests) $(SmtTests)
 smt-perf5:
 	@$(parallel_sledge_opt_smt) $(SmtTests) $(SmtTests) $(SmtTests) $(SmtTests) $(SmtTests)
 smt-perf7:
 	@$(parallel_sledge_opt_smt) $(SmtTests) $(SmtTests) $(SmtTests) $(SmtTests) $(SmtTests) $(SmtTests) $(SmtTests)
 .PHONY: smt.sexp
 smt.sexp:
 	@find -L {,local/,extra/}smt -not -path 'baseline/*' -name '*.sexp' 2>/dev/null \
 	 | xargs cat > smt.sexp
 baseline/smt.sexp: smt.sexp
 	@cp smt.sexp $@
 smt.html: smt.sexp
 	@$(sledge_report) html -baseline baseline/smt.sexp smt.sexp -output $@
 smt-status: smt.sexp
 	@$(sledge_report) status -baseline baseline/smt.sexp smt.sexp | column -ts$$'\t'
 #
 # llvm tests
 #
 # run sledge llvm translate tests
 .PHONY: llvm
 llvm:
 	-@find -L llvm -name '*.ll' -or -name '*.bc' 2>/dev/null \
 	 | parallel --bar $(sledge_dbg) llvm translate -no-models -no-internalize $(SLEDGE_ARGS)
 .PHONY: llvm.sexp
 llvm.sexp:
 	@find -L {,local/,extra/}llvm -not -path 'baseline/*' -name '*.sexp' 2>/dev/null \
 	 | xargs cat > llvm.sexp
 baseline/llvm.sexp: llvm.sexp
 	@cp llvm.sexp $@
 llvm.html: llvm.sexp
 	@$(sledge_report) html -baseline baseline/llvm.sexp llvm.sexp -output $@
 llvm-status: llvm.sexp
 	@$(sledge_report) status -baseline baseline/llvm.sexp llvm.sexp | column -ts$$'\t'
 #
 # test workflow
 #
 # report warnings
 warnings:
 	@find -L * -name '*.out' | xargs grep -h "Warning:" | sort
 test-translate:
 	-@find -L {,local/,extra/}translate -name "*.sexp" -or -name "*.out" -or -name '*.err' -or -name '*.llair' -or -name '*.llair.txt' -delete 2>/dev/null
 	-@$(MAKE) --no-print-directory translate
 	@$(MAKE) --no-print-directory translate-status
 test-analyze:
 	-@find -L {,local/,extra/}analyze -name "*.sexp" -or -name "*.out" -or -name '*.err' -delete 2>/dev/null
 	-@$(MAKE) --no-print-directory analyze
 	@$(MAKE) --no-print-directory analyze-status
 test-smt:
 	-@find -L {,local/,extra/}smt -name "*.sexp" -or -name "*.out" -or -name '*.err' -delete 2>/dev/null
 	-@$(MAKE) --no-print-directory smt
 	@$(MAKE) --no-print-directory smt-status
 test-llvm:
 	-@find -L {,local/,extra/}llvm -name "*.sexp" -or -name "*.out" -or -name '*.err' -or -name '*.llair' -delete 2>/dev/null
 	-@$(MAKE) --no-print-directory llvm
 	@$(MAKE) --no-print-directory llvm-status
 # run tests and check against expected results
-test:
+test: test-translate test-analyze test-smt test-llvm
 	-@$(MAKE) --silent --keep-going clean analyze translate
 	@$(MAKE) --silent _analyze-report-raw > report.current
 	@$(MAKE) --silent _translate-report-raw >> report.current
 	@$(DIFF) report.expected report.current
 # set current results as new expected results
-promote:
+promote: baseline/translate.sexp baseline/analyze.sexp baseline/smt.sexp baseline/llvm.sexp
-	@cp report.current report.expected
+
 # copy the current out and err files to the baseline dir
 promote-out:
 	@find -L * -not -path 'baseline/*' \( -name '*.out' -or -name '*.err' \) | xargs gcp --parents -t baseline
 # diff the current out files against the ones in the baseline dir
 diff-out:
 	@$(diff) -mask-uniques -include '.*\.out' baseline -alt-next current .
 # diff the current err files against the ones in the baseline dir
 diff-err:
 	@$(diff) -mask-uniques -include '.*\.err' baseline -alt-next current .
 # remove generated bitcode files
 cleanbc:
-	@rm -f $(AnalyzeBCs)
+	@rm -f $(GeneratedBCs)
 # remove result files
 cleanout:
-	@find -L * -name "*.out" -or -name '*.err' -or -name '*.llair' \
+	@find -L * -not -path 'baseline/*' -name "*.sexp" -or -name "*.out" -or -name '*.err' -or -name '*.llair' -or -name '*.llair.txt'	 \
 	 | xargs rm -f
 clean: cleanbc cleanout
--- a/sledge/test/analyze/arithmetic.c
+++ b/sledge/test/analyze/arithmetic.c
--- a/sledge/test/analyze/arithmetic_loop.c
+++ b/sledge/test/analyze/arithmetic_loop.c
--- a/sledge/test/analyze/global_vars.c
+++ b/sledge/test/analyze/global_vars.c
--- a/sledge/test/analyze/globals.c
+++ b/sledge/test/analyze/globals.c
--- a/sledge/test/analyze/nonreducible_call_graph.c
+++ b/sledge/test/analyze/nonreducible_call_graph.c
--- a/sledge/test/analyze/recursion.c
+++ b/sledge/test/analyze/recursion.c
--- a/sledge/test/analyze/tmp_uaf.cpp
+++ b/sledge/test/analyze/tmp_uaf.cpp
--- a/sledge/test/analyze/wrap_malloc.c
+++ b/sledge/test/analyze/wrap_malloc.c
--- a/sledge/test/report.expected
+++ b/sledge/test/report.expected
--- a/sledge/test/translate/address_of_label.cpp
+++ b/sledge/test/translate/address_of_label.cpp
--- a/sledge/test/translate/cond_alloca.cpp
+++ b/sledge/test/translate/cond_alloca.cpp
--- a/sledge/test/translate/destructor_bases.cpp
+++ b/sledge/test/translate/destructor_bases.cpp
--- a/sledge/test/translate/exceptions.cpp
+++ b/sledge/test/translate/exceptions.cpp
--- a/sledge/test/translate/rethrow.cpp
+++ b/sledge/test/translate/rethrow.cpp
--- a/sledge/test/translate/struct.cpp
+++ b/sledge/test/translate/struct.cpp
--- a/sledge/test/translate/vector.cpp
+++ b/sledge/test/translate/vector.cpp
--- a/sledge/test/translate/virtual.cpp
+++ b/sledge/test/translate/virtual.cpp
--- a/sledge/test/wrap.sh
+++ b/sledge/test/wrap.sh
@ -6,7 +6,7 @@
 # LICENSE file in the root directory of this source tree.
 # wrap execution of sledge with time and memory limits
-# and add RESULT status to output in case of an unexpected exit
+# and add status entries to report in case of an unexpected exit
 # usage: wrap.sh <timeout(sec)> <memout(MB)> <command> <testdir/testname>
@ -15,26 +15,33 @@ set -u
 timeout=$1
 memout=$(( $2*1024 ))
 command=${@: 3: $#-3}
-test=${@: -1}
+test_ext=${@: -1}
 test=${test_ext%.*}
-testdir=$(dirname $test)
+unknown_error () {
-testname=$(basename $test)
+  echo -e "((name $test)(entry(Status(UnknownError \"$1\"))))" >> $test.sexp
 }
 timeout () {
  echo -e "((name $test)(entry(Status Timeout)))" >> $test.sexp
 }
 memout () {
  echo -e "((name $test)(entry(Status Memout)))" >> $test.sexp
 }
 cd $testdir
 (
  ulimit -t $timeout -v $memout
-  $command $testname 1> $testname.out 2> $testname.err
+  $command -report $test.sexp $test_ext 1> $test.out 2> $test.err
-)
+) &> /dev/null
 status=$?
 case $status in
-  ( 132 ) echo -e "RESULT: illegal instruction" >> $testname.out ;;
+  ( 0 | 1 ) ;;
-  ( 136 ) echo -e "RESULT: floating-point exception" >> $testname.out ;;
+  ( 132 ) unknown_error "illegal instruction" ;;
-  ( 139 ) echo -e "RESULT: segmentation violation" >> $testname.out ;;
+  ( 136 ) unknown_error "floating-point exception" ;;
-  ( 127 ) echo -e "RESULT: MEMOUT" >> $testname.out ;;
+  ( 139 ) unknown_error "segmentation violation" ;;
-  ( 137 | 152 ) echo -e "RESULT: TIMEOUT" >> $testname.out ;;
+  ( 127 | 134 ) memout ;;
-  ( * ) ;;
+  ( 137 | 152 ) timeout ;;
  ( * ) unknown_error "exit $status" ;;
 esac
 if ! grep -q 'RESULT:' $testname.out; then
  echo -e "RESULT: Internal error: "$status >> $testname.out
 fi
 exit $status