evanmak · evanmak · Oct 1, 2020 · Sep 27, 2020 · Sep 27, 2020 · Sep 27, 2020
diff --git a/Docker/build_savior.sh b/Docker/build_savior.sh
@@ -106,8 +106,8 @@ function dir_check {
     cd $SOFTWARE_DIR/llvm-3.6
     mkdir build
     cd $SOFTWARE_DIR/llvm-3.6/build
-    cmake -DLLVM_ENABLE_RTTI:BOOL=ON ..
-    make install -j$(nproc)
+    cmake -DCMAKE_BUILD_TYPE=Release -DLLVM_ENABLE_RTTI:BOOL=ON ..
+    make install -j4
 
     PROG=KLEE
     apt-get install -y build-essential curl libcap-dev libncurses5-dev python-minimal unzip
@@ -160,7 +160,7 @@ function dir_check {
     #TODO: open source KLEE concolic executor separately
     #installing klee-3.6
     rm -rf /root/savior/KLEE/klee-build
-    cd ~/work/savior/KLEE
+    cd $WORK_DIR/savior/KLEE
     mkdir klee-build
     cd klee-build
     echo "NOTE: you might need to rebuild libboost for C++ ABI compatibility on Ubuntu 16.04"
@@ -195,12 +195,12 @@ function dir_check {
     mkdir build
     mkdir install
     cd $SOFTWARE_DIR/llvm-4.0/build
-    cmake -DLLVM_ENABLE_RTTI:BOOL=ON -DCMAKE_INSTALL_PREFIX=$SOFTWARE_DIR/llvm-4.0/install ..
-    make install -j$(nproc)
+    cmake -DLLVM_LINK_LLVM_DYLIB=ON -DCMAKE_BUILD_TYPE=Release -DLLVM_ENABLE_RTTI:BOOL=ON -DCMAKE_INSTALL_PREFIX=$SOFTWARE_DIR/llvm-4.0/install ..
+    make install -j4
 
     #install svf
     PROG=svf
-    
+
     #build insertbug pass with llvm-3.6 first
     cd $WORK_DIR/$PROJ/svf/InsertBugPotential
     mkdir build && cd build && cmake .. && make -j$(nproc)
@@ -214,4 +214,3 @@ function dir_check {
     cmake ..
     make -j$(nproc)
     cd .. && ln -sf $(pwd)/Release-build/bin/dma_wrapper.py dma_wrapper.py
-
diff --git a/coordinator/EdgeOracles/avg_bug_potential_oracle.py b/coordinator/EdgeOracles/avg_bug_potential_oracle.py
@@ -58,8 +58,10 @@ def get_fuzzer_queue_dir(self, raw_config, target_bin):
         fuzzer_dir = os.path.join(sync_dir, "slave_000001", "queue")
         return fuzzer_dir
 
+##### PR: filename mismatch
     def read_queue(self):
-        return [f for f in os.listdir(self.fuzzer_input_dir) if os.path.isfile(os.path.join(self.fuzzer_input_dir, f))]
+        return [utils.from_afl_name_to_simple(f) for f in os.listdir(self.fuzzer_input_dir) if os.path.isfile(os.path.join(self.fuzzer_input_dir, f))]
+##### PR: filename mismatch
 
     def get_oracle_config(self):
         config = ConfigParser.ConfigParser()
@@ -141,7 +143,7 @@ def build_input_to_score_cache(self, dummy_all_edges, inputs):
             stat['score'] = 0.0
             stat['first_seen'] = seed
             stat['interesting_edges'] = []
-            stat['size'] = os.path.getsize(seed)
+            stat['size'] = os.path.getsize(utils.from_simple_to_afl_name(seed)) ##### PR: filename mismatch
             contributing_edge_counter = 0
             for e in set(edges):
                 is_interesting_edge = False
@@ -188,13 +190,14 @@ def get_score(self, testcase):
         # even though it contains new coverage
         score2 = "orig:" in testcase
         # Smaller size is better
-        score3 = -os.path.getsize(testcase)
+        score3 = -os.path.getsize(utils.from_simple_to_afl_name(testcase))  ##### PR: filename mismatch
         # Shorter path is better
         score4 = -self.get_path_length(testcase)
         # Since name contains id, so later generated one will be chosen earlier
         score5 = testcase
         return (score1, score2, score3, score4, score5)
 
+
     def testcase_compare(self, a, b):
         a_score = self.get_score(a)
         b_score = self.get_score(b)

diff --git a/coordinator/EdgeOracles/bug_potential_oracle.py b/coordinator/EdgeOracles/bug_potential_oracle.py
@@ -54,8 +54,10 @@ def get_fuzzer_queue_dir(self, raw_config, target_bin):
         fuzzer_dir = os.path.join(sync_dir, "slave_000001", "queue")
         return fuzzer_dir
 
+##### PR: filename mismatch
     def read_queue(self):
-        return [f for f in os.listdir(self.fuzzer_input_dir) if os.path.isfile(os.path.join(self.fuzzer_input_dir, f))]
+        return [utils.from_afl_name_to_simple(f) for f in os.listdir(self.fuzzer_input_dir) if os.path.isfile(os.path.join(self.fuzzer_input_dir, f))]
+##### PR: filename mismatch
 
     def get_oracle_config(self):
         config = ConfigParser.ConfigParser()

diff --git a/coordinator/EdgeOracles/sequential_oracle.py b/coordinator/EdgeOracles/sequential_oracle.py
@@ -1,6 +1,7 @@
 #!/usr/bin/env python
 import sys
 import os
+import utils
 import ConfigParser
 from utils import bcolors
 from operator import itemgetter
@@ -23,9 +24,10 @@ def get_fuzzer_queue_dir(self, raw_config, target_bin):
         sync_dir = config.get("moriarty", "sync_dir").replace("@target", target_dir)
         return os.path.join(sync_dir, "master", "queue")
 
-
+##### PR: filename mismatch
     def read_queue(self):
-        return [f for f in os.listdir(self.fuzzer_input_dir) if os.path.isfile(os.path.join(self.fuzzer_input_dir, f))]
+        return [utils.from_afl_name_to_simple(f) for f in os.listdir(self.fuzzer_input_dir) if os.path.isfile(os.path.join(self.fuzzer_input_dir, f))]
+##### PR: filename mismatch
 
     def get_result(self, raw_data, max_results, edge_threshold=0.8):
         stats = []

diff --git a/coordinator/SEs/klee_conc_explorer.py b/coordinator/SEs/klee_conc_explorer.py
@@ -148,7 +148,9 @@ def run(self, input_id_map_list, cov_file):
         for input_id_map in input_id_map_list:
             #--generate klee seed ktest
             # print input_id_map
-            afl_input = input_id_map['input']
+            afl_input = utils.from_simple_to_afl_name(input_id_map['input'])
+            if not afl_input:
+                continue
             if max_input_size < os.path.getsize(afl_input):
                 max_input_size = os.path.getsize(afl_input)
             klee_seed = klee_seed_dir+"/"+str(input_counter).zfill(6)+".ktest"

diff --git a/coordinator/SEs/klee_sym_explorer.py b/coordinator/SEs/klee_sym_explorer.py
@@ -105,7 +105,9 @@ def run(self, input_id_map_list, cov_file_list):
 
             #--generate klee seed ktest
             # print input_id_map
-            afl_input = input_id_map['input']
+            afl_input = utils.from_simple_to_afl_name(input_id_map['input'])
+            if not afl_input:
+                continue
             klee_seed = self.seed_dir+"/klee_instance_sym_"+str(pid).zfill(6)+".ktest"
             # print "before calling converter"
             # print afl_input

diff --git a/coordinator/utils/utils.py b/coordinator/utils/utils.py
@@ -12,6 +12,7 @@
 import shutil
 import datetime
 import random
+import glob
 
 def error_msg(s):
     print bcolors.FAIL+"[ERROR] {0}".format(s)+bcolors.ENDC
@@ -210,6 +211,18 @@ def merge_coverage_files(data_files, output_name, ftype='branch-only'):
         error_msg("can not merge coverage file {0}".format(output_name))
         return False
 
+##### PR: filename mismatch
+def from_simple_to_afl_name(simple_path):
+    """Resolve a "simple" queue entry name back to the real file on disk.
+
+    The simple form (see from_afl_name_to_simple) keeps only the first
+    characters of the queue file name with ':' turned into '_'.  This does
+    the reverse lookup: '_' becomes ':' again and the directory is searched
+    for a file whose name starts with that prefix.
+
+    Args:
+        simple_path: path whose basename is a simple name; a path that
+            already names an existing file is returned unchanged.
+
+    Returns:
+        The path of the matching file, or "" when nothing matches.
+    """
+    # A path that already names a real file needs no translation; rewriting
+    # its '_' characters would make the lookup below miss it.
+    if os.path.isfile(simple_path):
+        return simple_path
+    afl_prefix = os.path.basename(simple_path).replace("_", ":")
+    candidates = glob.glob(os.path.join(os.path.dirname(simple_path), afl_prefix) + "*")
+    # glob returns matches in arbitrary order: take the smallest name so the
+    # same input always resolves to the same file.
+    return min(candidates) if candidates else ""
 fprintf(f, "%u\t%s/queue/id_%06u\n", i, out_dir, edge_san_first_seen[i]);  
 fprintf(f, "%u\t%s/queue/id_%06u\n", i, out_dir, edge_san_first_seen[i]);  
+
+def from_afl_name_to_simple(afl_name):
+    """Shorten a queue file name to its "simple" form.
+
+    The directory part is kept as is; the basename is cut down to its first
+    nine characters and every ':' left in it is replaced by '_'.
+    """
+    directory, filename = os.path.split(afl_name)
+    simple_name = filename[:9].replace(':', '_')
+    return os.path.join(directory, simple_name)
+##### PR: filename mismatch
 
 def expand_stack_limit():
     """Klee requires ulimit to set stack as unlimited"""
@@ -283,9 +296,9 @@ def gen_loctrace_file(prog, inp, input_mode,outfile=None, timeout=1):
             os.unlink(target_file)
     myenv['AFL_LOC_TRACE_FILE'] = target_file
     if input_mode == "symfile":
-        prog_cmd = prog.replace("INPUT_FILE", inp)
+        prog_cmd = prog.replace("INPUT_FILE", from_simple_to_afl_name(inp))
     elif input_mode == "stdin":
-        prog_cmd = " ".join([prog + " < " + inp])
+        prog_cmd = " ".join([prog + " < " + from_simple_to_afl_name(inp)])
     prog_cmd = "timeout " + str(timeout)+"s " + prog_cmd
     prog_cmd = prog_cmd + " > /dev/null 2> /dev/null"
     p = subprocess.Popen(prog_cmd, shell=True, env=myenv)
@@ -326,7 +339,7 @@ def log_recommend_edges(lst, log, loc_map, find_loc_script, prog, cur_heu):
         return
 
     def _get_src_loc(e, s):
-        cmd = [find_loc_script, e, loc_map, prog + " < " + s]
+        cmd = [find_loc_script, e, loc_map, prog + " < " + from_simple_to_afl_name(s)]
         cmd = " ".join(cmd)
         #we call the find script twice, first to get loctrace, second to get src
         subprocess.call(cmd, shell=True)
@@ -375,7 +388,7 @@ def save_inputs(seed_list, target_dir):
         error_msg("{0} is not a valid directory".format(target_dir))
         return
     for seed in seed_list:
-        shutil.copy2(seed['input'], target_dir)
+        shutil.copy2(from_simple_to_afl_name(seed['input']), target_dir)
 
 def pack_klee_errors(search_dir, target_dir):
     """

diff --git a/example-folder/Makefile b/example-folder/Makefile
@@ -0,0 +1,32 @@
+## Variable storing paths
+SAVIOR_PATH=${HOME}/work/savior
+
+all: seed_folder
+
+example : example.c
+	LLVM_COMPILER=clang wllvm -fsanitize=integer,bounds,shift -g -o example example.c
+
+example.bc : example
+	extract-bc example
+
+# also produces labelmap.csv, locmap.csv and paired_edges.csv
+savior-example :  example.bc
+	${SAVIOR_PATH}/AFL/afl-clang-fast example.bc -o savior-example -lubsan -lm
+
+# also produces savior-example.dma, example.reach.bug and example.edge
+savior-example.bc : savior-example
+	${SAVIOR_PATH}/svf/SVF/Release-build/bin/dma -fspta savior-example.bc -savior-label-only -o example.reach.bug -edge example.edge
+
+savior-example.dma.bc : savior-example.bc
+	opt -load ${SAVIOR_PATH}/svf/InsertBugPotential/build/insertpass/libInsertBugPass.so -InsertBug -i example.reach.bug savior-example.bc -o savior-example.dma.bc
+
+example.conf : savior-example.dma.bc
+	./set-configuration.sh
+
+seed_folder :  example.conf
+	mkdir -p "seed_folder" && echo "a" > seed_folder/seed1.txt
+
+# and run: python ../coordinator/moriarty.py -t $(pwd) -c $(pwd)/example.conf
+
+# clean is a command, not a file: keep it working even if a file named "clean" exists
+.PHONY: clean
+# Remove the build products; -f keeps the rule from failing when some of them are absent
+clean:
+	rm -f example .example* *.bc savior-example savior-example.dma example.conf example.edge example.reach.bug labelmap.csv locmap.csv paired_edges.csv .savior_sanitizer_combination .afl_coverage_combination
diff --git a/example-folder/README.md b/example-folder/README.md
@@ -0,0 +1,15 @@
+# Savior simple example
+
+The example compares its input against a magic number that is large enough to prevent AFL alone from generating test cases that cover the true branch.
+
+Run `make` to:
+- build the SAVIOR instrumented binaries,
+- create a seed in `seed_folder`,
+- set a default configuration file (`example.conf`).
+
+Verify the example's behavior by running a test case that passes the magic number check:
+
+```
+./savior-example < test.in
+Magic number passed
+```
diff --git a/example-folder/example.c b/example-folder/example.c
@@ -0,0 +1,23 @@
+#include <stdio.h>
+#include <unistd.h>
+
+long AFL_STOP = 0x41464c5f53544f50;
+
+/*
+ * Read sizeof(long) bytes from stdin and compare them with AFL_STOP.
+ * Returns 1 when the input is missing, too short or does not match;
+ * otherwise prints a message, reads an int and returns 0.
+ */
+int main(int argc, char *argv[]) {
+ int a = 0; /* stays defined even if the second read is short or fails */
+ ssize_t nb;
+ long magic;
+
+ nb = read(0, &magic, sizeof(long));
+ if (nb == 0) return 1;
+ /* read() returns -1 on error: compare as signed, otherwise -1 is converted
+    to a huge unsigned value and slips past the size check */
+ if (nb < (ssize_t)sizeof(long)) return 1; //add coverage if good size
+
+ if (magic != AFL_STOP) return 1;
+
+ puts("Magic number passed"); 
+
+ nb = read(0, &a, sizeof(int));
+ a = a - 12;
+
+ return 0; 
+}
+
diff --git a/example-folder/set-configuration.sh b/example-folder/set-configuration.sh
@@ -0,0 +1,19 @@
+#!/bin/sh
+# Generate example.conf in the current directory from the coordinator's fuzz.cfg.template.
+
+## Variable storing paths
+# SAVIOR_PATH can be overridden from the environment; the default is unchanged
+SAVIOR_PATH=${SAVIOR_PATH:-$HOME/work/savior}
+SYNC_FOLDER=@target/output_folder
+SEED_FOLDER=@target/seed_folder
+# target directory: $(pwd)
+
+# The template path is quoted so that a SAVIOR_PATH containing spaces still works
+sed s/PROG/example/g "$SAVIOR_PATH/coordinator/fuzz.cfg.template" | \
+    #sed s/inputtype=stdin/inputtype=symfile/g | \
+    #sed "s|target_bin=@target/savior-fuzzer|target_bin=$AFL_CMD|g" | \
+    #sed "s|target_bc=@target/savior-fuzzer.dma.bc|target_bc=$KLEE_CMD|g" | \
+    sed "s|sync_dir=@target/out|sync_dir=$SYNC_FOLDER|g" | \
+    sed "s,in_dir=@target/in,in_dir=$SEED_FOLDER,g" | \
+    sed "s|heuristics=san-guided|heuristics=san-guided:sequential:bug-potential:avg-bug-potential|g" | \
+    sed "s|SAVIOR|$SAVIOR_PATH|g" > example.conf
+
+## Note: to use uncov-edge-bug, generate code_reach_map by running the dma pass without the -savior-label-only option
+## ref: https://github.com/evanmak/savior-source/blob/b419c868e3dd966e77bb2707a7901e6f1872fb92/coordinator/README.md
diff --git a/example-folder/test.in b/example-folder/test.in
@@ -0,0 +1 @@
+POTS_LFA2