Skip to content

Commit

Permalink
added BENCHMARK_SHELL to found benchmarks
Browse files Browse the repository at this point in the history
  • Loading branch information
EtomicBomb committed Nov 21, 2024
1 parent 55a77c5 commit 94c85da
Show file tree
Hide file tree
Showing 13 changed files with 119 additions and 84 deletions.
10 changes: 6 additions & 4 deletions covid-mts/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -15,8 +15,10 @@ input_file="$input_dir/in$suffix.csv"
output_scoped="$outputs_dir/outputs$suffix"
mkdir -p "$output_scoped"

"$scripts_dir/1.sh" "$input_file" > "$output_scoped/1.out"
"$scripts_dir/2.sh" "$input_file" > "$output_scoped/2.out"
"$scripts_dir/3.sh" "$input_file" > "$output_scoped/3.out"
"$scripts_dir/4.sh" "$input_file" > "$output_scoped/4.out"
BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

$BENCHMARK_SHELL "$scripts_dir/1.sh" "$input_file" > "$output_scoped/1.out"
$BENCHMARK_SHELL "$scripts_dir/2.sh" "$input_file" > "$output_scoped/2.out"
$BENCHMARK_SHELL "$scripts_dir/3.sh" "$input_file" > "$output_scoped/3.out"
$BENCHMARK_SHELL "$scripts_dir/4.sh" "$input_file" > "$output_scoped/4.out"

5 changes: 3 additions & 2 deletions file-enc/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,5 +17,6 @@ if [[ "$1" == "--small" ]]; then
suffix=".small"
fi

$scripts_dir/compress_files.sh $input_pcaps $results_dir/compress_files$suffix
$scripts_dir/encrypt_files.sh $input_pcaps $results_dir/encrypt_files$suffix
BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}
$BENCHMARK_SHELL $scripts_dir/compress_files.sh $input_pcaps $results_dir/compress_files$suffix
$BENCHMARK_SHELL $scripts_dir/encrypt_files.sh $input_pcaps $results_dir/encrypt_files$suffix
6 changes: 4 additions & 2 deletions log-analysis/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,10 +17,12 @@ if [[ "$@" == *"--small"* ]]; then
suffix=".small"
fi

BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

echo "nginx"
time $scripts_dir/nginx.sh $nginx_input $results_dir/nginx$suffix
$BENCHMARK_SHELL $scripts_dir/nginx.sh $nginx_input $results_dir/nginx$suffix
echo $?

echo "pcaps"
time $scripts_dir/pcaps.sh $pcaps_input $results_dir/pcaps$suffix
$BENCHMARK_SHELL $scripts_dir/pcaps.sh $pcaps_input $results_dir/pcaps$suffix
echo $?
4 changes: 3 additions & 1 deletion max-temp/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -18,4 +18,6 @@ export statistics_dir="$results_dir/statistics$suffix"

mkdir -p "$statistics_dir"

${scripts_dir}/temp-analytics.sh
BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

$BENCHMARK_SHELL ${scripts_dir}/temp-analytics.sh
6 changes: 4 additions & 2 deletions media-conv/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -17,10 +17,12 @@ if [[ "$@" == *"--small"* ]]; then
suffix=".small"
fi

BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

echo "img_convert"
time $scripts_dir/img_convert.sh $img_convert_input $results_dir/img_convert$suffix > $results_dir/img_convert$suffix.log
$BENCHMARK_SHELL $scripts_dir/img_convert.sh $img_convert_input $results_dir/img_convert$suffix > $results_dir/img_convert$suffix.log
echo $?

echo "to_mp3"
time $scripts_dir/to_mp3.sh $to_mp3_input $results_dir/to_mp3$suffix > $results_dir/to_mp3$suffix.log
$BENCHMARK_SHELL $scripts_dir/to_mp3.sh $to_mp3_input $results_dir/to_mp3$suffix > $results_dir/to_mp3$suffix.log
echo $?
4 changes: 3 additions & 1 deletion nlp/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,8 @@ else
export IN="$SUITE_DIR/inputs/pg"
fi

BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

mkdir -p "outputs"

# Define the script names in a single variable
Expand Down Expand Up @@ -51,6 +53,6 @@ while IFS= read -r script; do
mkdir -p "$output_dir"

echo "$script"
time "$SHELL" "$script_file" "$output_dir"
$BENCHMARK_SHELL "$SHELL" "$script_file" "$output_dir"
echo "$?"
done <<< "$script_names"
4 changes: 3 additions & 1 deletion oneliners/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,8 @@ export SUITE_DIR=$(realpath $(dirname "$0"))
export TIMEFORMAT=%R
cd $SUITE_DIR

BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

if [[ "$@" == *"--small"* ]]; then
scripts_inputs=(
"nfa-regex;1M"
Expand Down Expand Up @@ -42,6 +44,6 @@ do
output_file="./outputs/${parsed[0]}.out"

echo "$script_file"
time "$SHELL" "$script_file" "$input_file" > "$output_file"
$BENCHMARK_SHELL "$SHELL" "$script_file" "$input_file" > "$output_file"
echo "$?"
done
74 changes: 6 additions & 68 deletions sklearn/run.sh
100755 → 100644
Original file line number Diff line number Diff line change
@@ -1,72 +1,10 @@
#!/bin/bash

PYTHON="python3"
OUT=${OUT:-$PWD/result}
TMP=${TMP:-$PWD/tmp}
#export tmp to env
export TMP
SCRIPTS=${SCRIPTS:-$PWD/scripts}
REPO_TOP=$(git rev-parse --show-toplevel)
eval_dir="${REPO_TOP}/sklearn"
scripts_dir="${eval_dir}/scripts"

# Ideally, we'll move on to piping rather than writing to a file
MODEL=$TMP/model.obj
X=$TMP/X_train.obj
y=$TMP/y_train.obj
CLASSES=$TMP/classes.obj
DUAL=false # should be converted to bool inside script
MAX_SQ_SUM=$TMP/max_squared_sum.obj
WARM_COEF=$TMP/warm_start_coef.obj
C_=$TMP/C_.obj
BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}
cd "$eval_dir" # scripts/run.sh references PWD
$BENCHMARK_SHELL "$scripts_dir/run.sh" $@

echo $PYTHON >&2
echo "DIR: $DIR" >&2
echo "SCRIPTS: $SCRIPTS" >&2
echo "MODEL: $MODEL" >&2
echo "X: $X" >&2
echo "y: $y" >&2
echo "CLASSES: $CLASSES" >&2
echo "DUAL: $DUAL" >&2
echo "MAX_SQ_SUM: $MAX_SQ_SUM" >&2
echo "WARM_COEF: $WARM_COEF" >&2
echo "C_: $C_" >&2

# TODO: Try this out on a larger dataset
# TODO: Benchmark each phase

# Generating model & samples
$PYTHON $SCRIPTS/gen_model.py 100
$PYTHON $SCRIPTS/gen_samples.py

# Validity checking functions
# These functions just check to make sure that the input is valid.
# If not they will raise an error. Otherwise, they do not mutate the data.
$PYTHON $SCRIPTS/check_solver.py $MODEL
penalty=$($PYTHON $SCRIPTS/penalty.py $MODEL)
$PYTHON $SCRIPTS/val_data.py $MODEL $X $y
$PYTHON $SCRIPTS/classes.py $MODEL $y # This should return a classes with just the unique classes in y
echo "$PYTHON $SCRIPTS/check_multiclass.py $MODEL" >&2
multiclass=$($PYTHON $SCRIPTS/check_multiclass.py $MODEL)
echo "------" >&2
# TODO: Benchmark each step of the pipeline
# Make a modified pipeline where each step writes its output to a file

# Calculations functions
$PYTHON $SCRIPTS/rownorm.py $X
n_classes=$($PYTHON $SCRIPTS/reshape_classes.py $MODEL $CLASSES)
$PYTHON $SCRIPTS/warm_start.py $MODEL $multiclass $n_classes # pipes coefficients

# Covtype dataset has 7 classes
echo "WARM_COEF: $WARM_COEF" >&2
echo "MAX_SQ_SUM: $MAX_SQ_SUM" >&2

echo "multiclass: $multiclass" >&2
echo "penalty: $penalty" >&2
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 1
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 2
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 3
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 4
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 5
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 6
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 7

$PYTHON $SCRIPTS/zip_coef.py $MODEL
$PYTHON $SCRIPTS/adjust_coef.py $MODEL $X $multiclass $n_classes $RESULT/trained_model.obj
72 changes: 72 additions & 0 deletions sklearn/scripts/run.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,72 @@
#!/bin/bash

PYTHON="python3"
OUT=${OUT:-$PWD/result}
TMP=${TMP:-$PWD/tmp}
#export tmp to env
export TMP
SCRIPTS=${SCRIPTS:-$PWD/scripts}

# Ideally, we'll move on to piping rather than writing to a file
MODEL=$TMP/model.obj
X=$TMP/X_train.obj
y=$TMP/y_train.obj
CLASSES=$TMP/classes.obj
DUAL=false # should be converted to bool inside script
MAX_SQ_SUM=$TMP/max_squared_sum.obj
WARM_COEF=$TMP/warm_start_coef.obj
C_=$TMP/C_.obj

echo $PYTHON >&2
echo "DIR: $DIR" >&2
echo "SCRIPTS: $SCRIPTS" >&2
echo "MODEL: $MODEL" >&2
echo "X: $X" >&2
echo "y: $y" >&2
echo "CLASSES: $CLASSES" >&2
echo "DUAL: $DUAL" >&2
echo "MAX_SQ_SUM: $MAX_SQ_SUM" >&2
echo "WARM_COEF: $WARM_COEF" >&2
echo "C_: $C_" >&2

# TODO: Try this out on a larger dataset
# TODO: Benchmark each phase

# Generating model & samples
$PYTHON $SCRIPTS/gen_model.py 100
$PYTHON $SCRIPTS/gen_samples.py

# Validity checking functions
# These functions just check to make sure that the input is valid.
# If not they will raise an error. Otherwise, they do not mutate the data.
$PYTHON $SCRIPTS/check_solver.py $MODEL
penalty=$($PYTHON $SCRIPTS/penalty.py $MODEL)
$PYTHON $SCRIPTS/val_data.py $MODEL $X $y
$PYTHON $SCRIPTS/classes.py $MODEL $y # This should return a classes with just the unique classes in y
echo "$PYTHON $SCRIPTS/check_multiclass.py $MODEL" >&2
multiclass=$($PYTHON $SCRIPTS/check_multiclass.py $MODEL)
echo "------" >&2
# TODO: Benchmark each step of the pipeline
# Make a modified pipeline where each step writes its output to a file

# Calculations functions
$PYTHON $SCRIPTS/rownorm.py $X
n_classes=$($PYTHON $SCRIPTS/reshape_classes.py $MODEL $CLASSES)
$PYTHON $SCRIPTS/warm_start.py $MODEL $multiclass $n_classes # pipes coefficients

# Covtype dataset has 7 classes
echo "WARM_COEF: $WARM_COEF" >&2
echo "MAX_SQ_SUM: $MAX_SQ_SUM" >&2

echo "multiclass: $multiclass" >&2
echo "penalty: $penalty" >&2
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 1
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 2
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 3
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 4
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 5
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 6
$PYTHON $SCRIPTS/parallel.py $MODEL $X $y $C_ $WARM_COEF $MAX_SQ_SUM $multiclass $penalty 7

$PYTHON $SCRIPTS/zip_coef.py $MODEL
$PYTHON $SCRIPTS/adjust_coef.py $MODEL $X $multiclass $n_classes $RESULT/trained_model.obj
11 changes: 10 additions & 1 deletion uniq-ips/run.sh
100755 → 100644
Original file line number Diff line number Diff line change
@@ -1 +1,10 @@
cat "logs-popcount-org.txt" | sort | uniq > "out.txt"
#!/bin/bash

REPO_TOP=$(git rev-parse --show-toplevel)
eval_dir="${REPO_TOP}/uniq-ips"
scripts_dir="${eval_dir}/scripts"

BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}
cd "$eval_dir" # scripts/run.sh puts files in its current directory
$BENCHMARK_SHELL "$scripts_dir/run.sh" $@

1 change: 1 addition & 0 deletions uniq-ips/scripts/run.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
cat "logs-popcount-org.txt" | sort | uniq > "out.txt"
3 changes: 2 additions & 1 deletion unix50/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -54,6 +54,7 @@ fi
echo executing unix50 $(date)

mkdir -p "outputs"
BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}

for script_input in ${scripts_inputs[@]};
do
Expand All @@ -67,6 +68,6 @@ do
output_file="./outputs/$script.out"

echo "$script"
time $SHELL $script_file $input_file > $output_file
$BENCHMARK_SHELL $script_file $input_file > $output_file
echo $?
done
3 changes: 2 additions & 1 deletion web-index/run.sh
Original file line number Diff line number Diff line change
Expand Up @@ -2,6 +2,7 @@

cd "$(dirname "$0")"

BENCHMARK_SHELL=${BENCHMARK_SHELL:-bash}
directory_path="inputs/articles"

if [ ! -d "$directory_path" ]; then
Expand All @@ -25,5 +26,5 @@ fi
mkdir -p "$OUTPUT_BASE"

echo "web-index"
time $SHELL ./scripts/ngrams.sh "$OUTPUT_BASE"
$BENCHMARK_SHELL ./scripts/ngrams.sh "$OUTPUT_BASE"
echo $?

0 comments on commit 94c85da

Please sign in to comment.