diff options
| author | Douglas Rumbaugh <dbr4@psu.edu> | 2024-05-14 16:13:18 -0400 |
|---|---|---|
| committer | Douglas Rumbaugh <dbr4@psu.edu> | 2024-05-14 16:13:18 -0400 |
| commit | 47c36d9eba94bd1f1493ec82ebfde46ec0c74590 (patch) | |
| tree | cc7e84c5ed9df1fa9f709ad270197ec4d15a2134 /bin/scripts/run_benchmarks.sh | |
| parent | c49543e5c23af6bee35c7164ba433fc663c79041 (diff) | |
| download | dynamic-extension-47c36d9eba94bd1f1493ec82ebfde46ec0c74590.tar.gz | |
Benchmark helper script
Diffstat (limited to 'bin/scripts/run_benchmarks.sh')
| -rw-r--r-- | bin/scripts/run_benchmarks.sh | 78 |
1 files changed, 78 insertions, 0 deletions
diff --git a/bin/scripts/run_benchmarks.sh b/bin/scripts/run_benchmarks.sh new file mode 100644 index 0000000..069d460 --- /dev/null +++ b/bin/scripts/run_benchmarks.sh @@ -0,0 +1,78 @@ +#!/bin/bash + +dataset_dir='/data/dataset/' +query_dir='/data/queries/' +bench_dir='bin/benchmarks/' + +queries=('sosd_books_queries.tsv' 'sosd_fb_queries.tsv' 'sosd_osm_queries.tsv') +datasets=('books_200M_uint64.bin' 'fb_200M_uint64.bin' 'osm_cellids_200M_uint64.bin') +cnt=199999400 + +benchmarks=('irs_bench' 'pgm_bench' 'ts_bench' 'dynamic_pgm_bench' 'btree_bench' 'alex_bench' 'ts_bsm_bench') + +for bench in ${benchmarks[@]}; do + for (( i=0; i<3; i++)); do + dataset=${datasets[$i]} + query=${queries[$i]} + printf "%20s\t%30s\t" "$bench" "$dataset" + numactl -C1 -m1 "$bench_dir""$bench" "$cnt" "$dataset_dir""$dataset" "$query_dir""$query" + + if [[ ! $? ]]; then + printf "ERROR\n" + fi + done +done + +vector_datasets=('cleaned-vectors.txt') +vector_queries=('sbw_queries.txt') + +vector_benchmarks=('vptree_bench' 'mtree_bench' 'vptree_bsm_bench') +for bench in ${vector_benchmarks[@]}; do + for (( i=0; i<1; i++)); do + dataset=${vector_datasets[$i]} + query=${vector_queries[$i]} + printf "%20s\t%30s\t\t" "$bench" "$dataset" + cnt=$(wc -l "$dataset_dir""$dataset" | cut -d' ' -f1) + numactl -C1 -m1 "$bench_dir""$bench" "$cnt" "$dataset_dir""$dataset" "$query_dir""$query" + + if [[ ! $? ]]; then + printf "ERROR\n" + fi + done +done + +string_datasets=('ursarc2.0.txt' 'english-words.txt') +string_benchmarks=('fst_bench' 'fst_bsm_bench') +for bench in ${string_benchmarks[@]}; do + for (( i=0; i<2; i++)); do + dataset=${string_datasets[$i]} + printf "%20s\t%30s\t\t" "$bench" "$dataset" + cnt=$(wc -l "$dataset_dir""$dataset" | cut -d' ' -f1) + numactl -C1 -m1 "$bench_dir""$bench" "$cnt" "$dataset_dir""$dataset" + + if [[ ! $? ]]; then + printf "ERROR\n" + fi + done +done + +binary_vector_datasets=('bigann.u8bin') +binary_vector_queries=('ann_queries.u8bin') + +binary_vector_benchmarks=('vptree_bench_alt' 'mtree_bench_alt' 'vptree_bsm_bench_alt') + +for bench in ${binary_vector_benchmarks[@]}; do + for (( i=0; i<1; i++)); do + dataset=${binary_vector_datasets[$i]} + query=${binary_vector_queries[$i]} + printf "%20s\t%30s\t\t" "$bench" "$dataset" + cnt=10000000 + numactl -C1 -m1 "$bench_dir""$bench" "$cnt" "$dataset_dir""$dataset" "$query_dir""$query" + + if [[ ! $? ]]; then + printf "ERROR\n" + fi + done +done + + |