diff --git a/datasets/compress.sh b/datasets/compress.sh index c24b800..53f7ea5 100755 --- a/datasets/compress.sh +++ b/datasets/compress.sh @@ -4,6 +4,7 @@ filenames=( $(ls job_codings_v3*.csv) ) filenames=( ${filenames[@]} "clustering_progress.csv" ) filenames=( ${filenames[@]} $(ls job_metadata*.csv) ) filenames=( ${filenames[@]} $( ls job_similarities_*.csv ) ) +filenames=( ${filenames[@]} $( ls sim_computation_times_*.csv ) ) echo "${filenames[*]}" diff --git a/datasets/decompress.sh b/datasets/decompress.sh index f95631e..7607bab 100755 --- a/datasets/decompress.sh +++ b/datasets/decompress.sh @@ -19,6 +19,6 @@ for source_filename in ${source_filenames[@]}; do echo "Decompressing ${source_filename}" tar -xJf "${source_filename}" else - echo "Skipping ${source_filename}" + echo "Skipping decompression of ${source_filename}" fi done diff --git a/datasets/sim_computation_times_4296426.csv.tar.xz b/datasets/sim_computation_times_4296426.csv.tar.xz index 8d2804c..00a7486 100644 Binary files a/datasets/sim_computation_times_4296426.csv.tar.xz and b/datasets/sim_computation_times_4296426.csv.tar.xz differ diff --git a/datasets/sim_computation_times_5024292.csv.tar.xz b/datasets/sim_computation_times_5024292.csv.tar.xz index c137eb3..66d09ab 100644 Binary files a/datasets/sim_computation_times_5024292.csv.tar.xz and b/datasets/sim_computation_times_5024292.csv.tar.xz differ diff --git a/datasets/sim_computation_times_7488914.csv.tar.xz b/datasets/sim_computation_times_7488914.csv.tar.xz index 6f30694..ad6a225 100644 Binary files a/datasets/sim_computation_times_7488914.csv.tar.xz and b/datasets/sim_computation_times_7488914.csv.tar.xz differ diff --git a/scripts/analyse-all.sh b/scripts/analyse-all.sh index 26767dd..80d32a7 100755 --- a/scripts/analyse-all.sh +++ b/scripts/analyse-all.sh @@ -12,11 +12,14 @@ function prepare(){ popd for I in datasets/*.csv ; do - ln -s $I + if [ ! -e $(basename $I) ]; then + echo "Creating symlink $(basename $I)" + ln -s $I + fi done } -# prepare +prepare for I in job_similarities_*.csv ; do rm *.png *.pdf