mistral-io-datasets/datasets/compress.sh

23 lines
675 B
Bash
Raw Normal View History

2020-08-18 13:27:39 +00:00
#!/bin/bash
2020-09-01 10:52:36 +00:00
# Start the list of files to compress with every job_codings_v*.csv match.
# The glob is expanded directly instead of parsing `ls` output, so a matching
# name that contains whitespace stays a single array element. nullglob makes
# a pattern without matches expand to nothing rather than to the literal
# pattern; it is switched off again right after use.
shopt -s nullglob
filenames=( job_codings_v*.csv )
shopt -u nullglob
2020-08-20 17:04:20 +00:00
# Add the fixed-name clustering_progress.csv to the list. Appending with +=
# leaves the entries already collected untouched; rebuilding the array from an
# unquoted expansion would word-split and glob-expand each of them again.
filenames+=( "clustering_progress.csv" )
2020-08-18 17:54:43 +00:00
# Append every job_metadata*.csv match to the list. The glob is expanded
# directly (no `ls` parsing) and added with +=, so neither the new names nor
# the entries already collected are word-split. nullglob makes a pattern
# without matches contribute nothing; it is switched off again afterwards.
shopt -s nullglob
filenames+=( job_metadata*.csv )
shopt -u nullglob
2020-08-18 13:27:39 +00:00
# Append every job_similarities_*.csv match to the list. The glob is expanded
# directly (no `ls` parsing) and added with +=, so neither the new names nor
# the entries already collected are word-split. nullglob makes a pattern
# without matches contribute nothing; it is switched off again afterwards.
shopt -s nullglob
filenames+=( job_similarities_*.csv )
shopt -u nullglob
2020-08-26 10:54:27 +00:00
# Append the sim_computation_times_*.csv matches, then the ks_*.csv matches,
# to the list. The globs are expanded directly (no `ls` parsing) and added
# with +=, so neither the new names nor the entries already collected are
# word-split. nullglob makes a pattern without matches contribute nothing; it
# is switched off again afterwards.
shopt -s nullglob
filenames+=( sim_computation_times_*.csv ks_*.csv )
shopt -u nullglob
2020-08-18 13:27:39 +00:00
# Print the collected file list, then pack each listed file that exists as a
# regular file into "<name>.tar.xz" (tar stream piped through `xz -9`).
# Files whose archive already exists are skipped; entries that are not
# regular files are passed over silently.

# Make the tar | xz pipeline fail when tar fails, not only when xz fails.
set -o pipefail
failures=0

echo "${filenames[*]}"
# The expansion is quoted so an entry containing whitespace stays one word.
for in_fn in "${filenames[@]}"; do
  out_fn="${in_fn}.tar.xz"
  [ -f "${in_fn}" ] || continue
  if [ -f "${out_fn}" ]; then
    echo "Skipping ${out_fn}. File exists."
    continue
  fi
  echo "Compressing ${in_fn}"
  # Compress into a temporary name and rename only on success. Writing
  # straight to ${out_fn} would leave a truncated archive behind after an
  # interrupted or failed run, and the existence check above would then skip
  # that file on every later run.
  part_fn="${out_fn}.part"
  if ! { tar -cf - "${in_fn}" | xz -9 > "${part_fn}" \
      && mv -- "${part_fn}" "${out_fn}"; }; then
    echo "Failed to compress ${in_fn}" >&2
    rm -f -- "${part_fn}"
    failures=$(( failures + 1 ))
  fi
done

# Remaining files are still processed after a failure, but the failure is
# reported through the exit status.
if (( failures > 0 )); then
  exit 1
fi