Skip to content

Commit

Permalink
Update scripts to support paths with spaces, WIP
Browse files Browse the repository at this point in the history
  • Loading branch information
AndrewQuijano committed Oct 15, 2024
1 parent c5a7300 commit 57bb960
Show file tree
Hide file tree
Showing 7 changed files with 98 additions and 102 deletions.
46 changes: 25 additions & 21 deletions scripts/add_queries.sh
Original file line number Diff line number Diff line change
Expand Up @@ -26,9 +26,6 @@
# and run the bug_mining.py script (which uses PANDA to trace taint).
#

# Load lava-functions and vars
. `dirname $0`/funcs.sh

tick
version="2.0.0"

Expand All @@ -50,13 +47,18 @@ elif [ $# -eq 2 ]; then
ATP_TYPE="-$1"
json="$(readlink -f $2)"
else
USAGE $0
USAGE $0
exit 1
fi

lava="$(dirname $(dirname $(readlink -f $0)))"
absolute_path=$(readlink -f "$0")
scripts_path=$(dirname "$absolute_path")
lava=$(dirname "$scripts_path")
project_name="$1"
. `dirname $0`/vars.sh

# Load lava-functions and vars
source "$scripts_path/funcs.sh"
source "$scripts_path/vars.sh"

progress "queries" 0 "Entering $directory/$name."
mkdir -p "$directory/$name"
Expand Down Expand Up @@ -98,15 +100,15 @@ progress "queries" 0 "Making with btrace..."
rm -f btrace.log
ORIGIN_IFS=$IFS
IFS='&&'
read -ra MAKES <<< $makecmd
for i in ${MAKES[@]}; do
read -ra MAKES <<< "$makecmd"
for i in "${MAKES[@]}"; do
IFS=' '
read -ra ARGS <<< $i
read -ra ARGS <<< "$i"
echo "$lava/tools/btrace/sw-btrace ${ARGS[@]}"
CC=$llvm/bin/clang \
CXX=$llvm/bin/clang++ \
CFLAGS="-O0 -m32 -DHAVE_CONFIG_H -g -gdwarf-2 -fno-stack-protector -D_FORTIFY_SOURCE=0 -I. -I.. -I../include -I./src/" \
$lava/tools/btrace/sw-btrace ${ARGS[@]}
"$lava/tools/btrace/sw-btrace" "${ARGS[@]}"
IFS='&&'
done
IFS=$ORIGIN_IFS
Expand All @@ -119,7 +121,7 @@ bash -c $install
progress "queries" 0 "Creating compile_commands.json..."
# Delete any pre-existing compile commands.json (could be in archive by mistake)
rm -f compile_commands.json
$lava/tools/btrace/sw-btrace-to-compiledb $llvm/lib/clang/11/include
"$lava/tools/btrace/sw-btrace-to-compiledb" $llvm/lib/clang/11/include
if [ -e "$directory/$name/extra_compile_commands.json" ]; then
sed -i '$d' compile_commands.json
echo "," >> compile_commands.json
Expand All @@ -130,23 +132,24 @@ git commit -m 'Add compile_commands.json.'

cd ..

c_files=$($python $lava/tools/lavaTool/get_c_files.py $source)
c_dirs=$(for i in $c_files; do dirname $i; done | sort | uniq)
# Switching IFS to '\n' to support paths with spaces in them.
c_files=$($python "$lava/tools/lavaTool/get_c_files.py" "$source")
IFS=$'\n'
c_dirs=$(for i in $c_files; do dirname "$i"; done | sort | uniq)

progress "queries" 0 "Copying include files..."
for i in $c_dirs; do
echo " $i"
if [ -d $i ]; then
cp $lava/tools/include/*.h $i/
if [ -d "$i" ]; then
cp "$lava"/tools/include/*.h "$i"/
fi
done


# Run another clang tool that provides information about functions,
# i.e., which have only prototypes, which have bodies.
progress "queries" 0 "Figure out functions"
for this_c_file in $c_files; do
$lava/tools/install/bin/lavaFnTool $this_c_file
"$lava/tools/install/bin/lavaFnTool" "$this_c_file"
done

#progress "queries" 0 "Initialize variables..."
Expand All @@ -167,7 +170,7 @@ fninstr=$directory/$name/fninstr

echo "Creating fninstr [$fninstr]"
echo -e "\twith command: \"python $lava/scripts/fninstr.py -d -o $fninstr $fnfiles\""
$python $lava/scripts/fninstr.py -d -o $fninstr $fnfiles
$python "$lava/scripts/fninstr.py" -d -o $fninstr $fnfiles

if [[ ! -z "$df_fn_blacklist" ]]; then
cmd=$(echo "sed -i /${df_fn_blacklist}/d $fninstr")
Expand All @@ -181,7 +184,7 @@ if [ "$dataflow" = "true" ]; then
# Since it's okay to pass the whitelist either way
progress "queries" 0 "Inserting queries for dataflow"
for i in $c_files; do
$lava/tools/install/bin/lavaTool -action=query \
"$lava/tools/install/bin/lavaTool" -action=query \
-lava-db="$directory/$name/lavadb" \
-p="$directory/$name/$source/compile_commands.json" \
-arg_dataflow \
Expand All @@ -195,7 +198,7 @@ else
progress "queries" 0 "Inserting queries..."
# TODO: remove lava-wl here, unless we're using it to limit where we inject
for i in $c_files; do
$lava/tools/install/bin/lavaTool -action=query \
"$lava/tools/install/bin/lavaTool" -action=query \
-lava-db="$directory/$name/lavadb" \
-lava-wl="$fninstr" \
-p="$source/compile_commands.json" \
Expand All @@ -215,7 +218,7 @@ fi
for i in $c_dirs; do
echo "Applying replacements to $i"
pushd $i
$llvm/bin/clang-apply-replacements .
"$llvm/bin/clang-apply-replacements" .
popd
done

Expand All @@ -227,6 +230,7 @@ for this_c_file in $c_files; do
exit 1
fi
done
unset IFS

progress "queries" 0 "Done inserting queries. Time to make and run actuate.py on a 64-BIT machine!"

Expand Down
4 changes: 2 additions & 2 deletions scripts/funcs.sh
Original file line number Diff line number Diff line change
Expand Up @@ -53,15 +53,15 @@ if [ -z "$LAVA_FUNCS_INCLUDED" ]; then
if [ -z "$logfile" ]; then
logfile=/dev/stdout
fi
echo $command >> $logfile;
echo "$command" >> "$logfile";
set +e
docker_map_args="-v $lava:$lava -v $tarfiledir:$tarfiledir"

if [ "$extradockerargs" = "null" ]; then
extradockerargs="";
fi

if [[ "$directory" = "$tarfiledir"* ]]; then true; else
if [[ "$directory" = $tarfiledir* ]]; then true; else
docker_map_args="$docker_map_args -v $directory:$directory"
fi
if [ "$remote_machine" == "localhost" ]; then
Expand Down
26 changes: 15 additions & 11 deletions scripts/lava.sh
Original file line number Diff line number Diff line change
Expand Up @@ -32,7 +32,7 @@

version="2.0.0"
trap '' PIPE
set -e # Exit on error
set -ex # Exit on error

USAGE() {
echo "$0 version $version"
Expand Down Expand Up @@ -72,7 +72,10 @@ fi

# Load lava-functions
. `dirname $0`/funcs.sh
lava=$(dirname $(dirname $(readlink -f "$0")))
absolute_path=$(readlink -f "$0")
scripts_path=$(dirname "$absolute_path")
lava=$(dirname "$scripts_path")
sql="$lava/tools/lavaODB/generated/lava.sql"

# defaults
ok=0
Expand All @@ -99,6 +102,7 @@ parse_args $@
if [ -z "$project_name" ]; then
USAGE
fi

. `dirname $0`/vars.sh

if [[ $demo -eq 1 ]]
Expand Down Expand Up @@ -132,7 +136,7 @@ RESET_DB() {
progress "everything" 1 "Resetting lava db -- logging to $lf"
run_remote "$buildhost" "dropdb -U $pguser -h $dbhost $db || true" "$lf"
run_remote "$buildhost" "createdb -U $pguser -h $dbhost $db || true" "$lf"
run_remote "$buildhost" "psql -d $db -h $dbhost -f $lava/tools/lavaODB/generated/lava.sql -U $pguser" "$lf"
run_remote "$buildhost" "psql -d $db -h $dbhost -f \"$sql\" -U $pguser" "$lf"
run_remote "$buildhost" "echo dbwipe complete" "$lf"
}

Expand Down Expand Up @@ -160,7 +164,7 @@ if [ $add_queries -eq 1 ]; then
lf="$logs/add_queries.log"
truncate "$lf"
progress "everything" 1 "Adding queries to source with type $ATP and $project_name -- logging to $lf"
run_remote "$buildhost" "$scripts/add_queries.sh $ATP_TYPE $project_name" "$lf"
run_remote "$buildhost" "\"$scripts/add_queries.sh\" $ATP_TYPE $project_name" "$lf"
if [ "$fixupscript" != "null" ]; then
lf="$logs/fixups.log"
truncate "$lf"
Expand All @@ -180,16 +184,16 @@ if [ $make -eq 1 ]; then
lf="$logs/make.log"
truncate "$lf"
# Note, adding the static flag is important. We are running the binaries on a PANDA VM, so we have no idea if it will have any libraries we need.
run_remote "$buildhost" "cd $sourcedir && CC=$llvm/bin/clang CXX=$llvm/bin/clang++ CFLAGS='-O0 -m32 -DHAVE_CONFIG_H -g -gdwarf-2 -fno-stack-protector -D_FORTIFY_SOURCE=0 -I. -I.. -I../include -I./src/ -static' $makecmd" "$lf"
run_remote "$buildhost" "cd \"$sourcedir\" && CC=$llvm/bin/clang CXX=$llvm/bin/clang++ CFLAGS='-O0 -m32 -DHAVE_CONFIG_H -g -gdwarf-2 -fno-stack-protector -D_FORTIFY_SOURCE=0 -I. -I.. -I../include -I./src/ -static' $makecmd" "$lf"
run_remote "$buildhost" "cd \"$sourcedir\" && rm -rf lava-install" "$lf"

run_remote "$buildhost" "cd $sourcedir && rm -rf lava-install" "$lf"
if [ "$install_simple" == "null" ]; then
run_remote "$buildhost" "cd $sourcedir && $install" "$lf"
run_remote "$buildhost" "cd \"$sourcedir\" && $install" "$lf"
else
run_remote "$buildhost" "cd $sourcedir && $install_simple" "$lf"
run_remote "$buildhost" "cd \"$sourcedir\" && $install_simple" "$lf"
fi
if [ "$post_install" != "null" ]; then
run_remote "$buildhost" "cd $sourcedir && $post_install" "$lf"
run_remote "$buildhost" "cd \"$sourcedir\" && $post_install" "$lf"
fi
tock
echo "make complete $time_diff seconds"
Expand Down Expand Up @@ -217,7 +221,7 @@ if [ $taint -eq 1 ]; then
lf="$logs/bug_mining-$i.log"
truncate "$lf"
progress "everything" 1 "PANDA taint analysis prospective bug mining -- input $input -- logging to $lf"
run_remote "$buildhost" "$python $scripts/bug_mining.py $hostjson $project_name $input $curtail" "$lf"
run_remote "$buildhost" "$python $scripts/bug_mining.py $hostjson $project_name $input $curtail" "$lf"
echo -n "Num Bugs in db: "
bug_count=$(run_remote "$buildhost" "psql -At $db -U $pguser -h $dbhost -c 'select count(*) from bug'")
if [ "$bug_count" = "0" ]; then
Expand Down Expand Up @@ -246,7 +250,7 @@ if [ $inject -eq 1 ]; then
if [ "$injfixupsscript" != "null" ]; then
fix="--fixupsscript='$injfixupsscript'"
fi
run_remote "$buildhost" "$python $scripts/inject.py -t $bugtypes -m $many -e $exitCode $kt $fix $hostjson $project_name" "$lf"
run_remote "$buildhost" "$python \"$scripts/inject.py\" -t $bugtypes -m $many -e $exitCode $kt $fix $hostjson $project_name" "$lf"
grep yield "$lf" | grep " real bugs "
done
fi
Expand Down
7 changes: 5 additions & 2 deletions scripts/reset_db.sh
Original file line number Diff line number Diff line change
@@ -1,7 +1,10 @@

# Load lava-functions
. `dirname $0`/funcs.sh
lava=$(dirname $(dirname $(readlink -f "$0")))
absolute_path=$(readlink -f "$0")
scripts_path=$(dirname "$absolute_path")
lava=$(dirname "$scripts_path")
sql="$lava/tools/lavaODB/generated/lava.sql"

# defaults
ok=0
Expand Down Expand Up @@ -36,7 +39,7 @@ RESET_DB() {
progress "everything" 1 "Resetting lava db -- logging to $lf"
run_remote "$buildhost" "dropdb -U $pguser -h $dbhost $db || true" "$lf"
run_remote "$buildhost" "createdb -U $pguser -h $dbhost $db || true" "$lf"
run_remote "$buildhost" "psql -d $db -h $dbhost -f $lava/tools/lavaODB/generated/lava.sql -U $pguser" "$lf"
run_remote "$buildhost" "psql -d $db -h $dbhost -f \"$sql\" -U $pguser" "$lf"
run_remote "$buildhost" "echo dbwipe complete" "$lf"
}

Expand Down
66 changes: 33 additions & 33 deletions scripts/vars.sh
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
#!/bin/sh
# Set all our environment variables
# $lava, $json, and must be set prior to calling this
# $lava, "$json", and must be set prior to calling this

if [ -z ${project_name+x} ]; then
echo "Fatal error: project_name variable unset when calling var.sh"
Expand All @@ -13,76 +13,76 @@ if [ -z ${lava+x} ]; then
fi

hostjson="$lava/host.json"
if [ ! -f $hostjson ]; then
if [ ! -f "$hostjson" ]; then
echo "Fatal error: host.json not found. Copy host.json.example to host.json"
exit 1;
fi

# Host Vars
qemu="$(jq -r '.qemu' $hostjson)"
qcow_dir="$(jq -r '.qcow_dir // ""' $hostjson)"
output_dir="$(jq -r '.output_dir // ""' $hostjson)"
config_dir="$(jq -r '.config_dir // ""' $hostjson)/$project_name"
tar_dir="$(jq -r '.tar_dir // ""' $hostjson)"
db_suffix="$(jq -r '.db_suffix // ""' $hostjson)"
buildhost="$(jq -r '.buildhost // "localhost"' $hostjson)"
dockername="$(jq -r '.docker // "lava32"' $hostjson)"
pguser="$(jq -r '.pguser // "postgres"' $hostjson)"
pgpass="$(jq -r '.pgpass // "postgrespostgres"' $hostjson)"
dbhost="$(jq -r '.host // "database"' $hostjson)"
qemu="$(jq -r '.qemu' "$hostjson")"
qcow_dir="$(jq -r '.qcow_dir // ""' "$hostjson")"
output_dir="$(jq -r '.output_dir // ""' "$hostjson")"
config_dir="$(jq -r '.config_dir // ""' "$hostjson")/$project_name"
tar_dir="$(jq -r '.tar_dir // ""' "$hostjson")"
db_suffix="$(jq -r '.db_suffix // ""' "$hostjson")"
buildhost="$(jq -r '.buildhost // "localhost"' "$hostjson")"
dockername="$(jq -r '.docker // "lava32"' "$hostjson")"
pguser="$(jq -r '.pguser // "postgres"' "$hostjson")"
pgpass="$(jq -r '.pgpass // "postgrespostgres"' "$hostjson")"
dbhost="$(jq -r '.host // "database"' "$hostjson")"

export PGUSER=$pguser
export PGPASS=$pgpass

json="${config_dir}/$project_name.json"

if [ ! -f $json ]; then
echo "Fatal error: $json not found. Did you provide the right project name?"
if [ ! -f "$json" ]; then
echo "Fatal error: "$json" not found. Did you provide the right project name?"
exit 1;
fi

# Project specific
name="$(jq -r .name $json)"
db="$(jq -r .db $json)$db_suffix"
extradockerargs="$(jq -r .extra_docker_args $json)"
exitCode="$(jq -r .expected_exit_code $json)"
dataflow="$(jq -r '.dataflow // "false"' $json)" # TODO use everywhere, stop passing as argument
name="$(jq -r .name "$json")"
db="$(jq -r .db "$json")$db_suffix"
extradockerargs="$(jq -r .extra_docker_args "$json")"
exitCode="$(jq -r .expected_exit_code "$json")"
dataflow="$(jq -r '.dataflow // "false"' "$json")" # TODO use everywhere, stop passing as argument
llvm="/usr/lib/llvm-11"

# List of function names to blacklist for data_flow injection, merged as fn1\|fn2\|fn3 so we can use sed
# Or an empty string if not present
df_fn_blacklist=`jq -r '.df_fn_blacklist // ""' $json`
df_fn_blacklist=`jq -r '.df_fn_blacklist // ""' "$json"`
if [[ ! -z $df_fn_blacklist ]]; then
df_fn_blacklist=`jq -r '.df_fn_blacklist // "" | join ("\\\\|")' $json`
df_fn_blacklist=`jq -r '.df_fn_blacklist // "" | join ("\\\\|")' "$json"`
fi

tarfiledir="$tar_dir"
tarfile="$tarfiledir/$(jq -r '.tarfile' $json)"
tarfile="$tarfiledir/$(jq -r '.tarfile' "$json")"
directory=$output_dir

inputs=`jq -r '.inputs' $json | jq 'join (" ")' | sed 's/\"//g' `
inputs=`jq -r '.inputs' "$json" | jq 'join (" ")' | sed 's/\"//g' `

fixupscript="null"
if [ "$(jq -r .fixupscript $json)" != "null" ]; then
fixupscript="$config_dir/$(jq -r .fixupscript $json)"
if [ "$(jq -r .fixupscript "$json")" != "null" ]; then
fixupscript="$config_dir/$(jq -r .fixupscript "$json")"
fi

bug_build="$output_dir/$name/$name/bugs/" # TODO why does this have name twice?
injfixupsscript="null"
if [ "$(jq -r .injfixupsscript $json)" != "null" ]; then
injfixupsscript="$config_dir/$(jq -r .injfixupsscript $json)"
if [ "$(jq -r .injfixupsscript "$json")" != "null" ]; then
injfixupsscript="$config_dir/$(jq -r .injfixupsscript "$json")"
# replace {bug_build} with string
injfixupsscript="${injfixupsscript/\{bug_build\}/$bug_build}"
fi

logs="$output_dir/$name/logs"

makecmd="$(jq -r .make $json)"
install=$(jq -r .install $json)
makecmd="$(jq -r .make "$json")"
install=$(jq -r .install "$json")
install="${install/\{config_dir\}/$config_dir}" # Format string replacement for config_dir
post_install="$(jq -r .post_install $json)"
install_simple=$(jq -r .install_simple $json)
configure_cmd=$(jq -r '.configure // "/bin/true"' $json)
post_install="$(jq -r .post_install "$json")"
install_simple=$(jq -r .install_simple "$json")
configure_cmd=$(jq -r '.configure // "/bin/true"' "$json")

# Constants
scripts="$lava/scripts"
Expand Down
Loading

0 comments on commit 57bb960

Please sign in to comment.