comparison bin/do_idx.sh @ 110:a0ea1e4a714d

pass in debug flag(s) to merge_date.py
author Henry Thompson <ht@markup.co.uk>
date Tue, 19 Sep 2023 19:40:58 +0100
parents 9403c02d5034
children 5b952d16838c
comparison
equal deleted inserted replaced
109:52c6a9b0fc8c 110:a0ea1e4a714d
1 #!/bin/bash 1 #!/bin/bash
2 while [ "$1" = "-d" ]
3 do
4 shift
5 debug="$debug -d"
6 done
2 export res="$1" 7 export res="$1"
3 orig="$2" 8 orig="$2"
4 # igzip was faster, but produced bigger files, so went to gzip one step 9 # igzip was faster, but produced bigger files, so went to gzip one step
5 # smaller than default (-6), which produces slightly _smaller_ blocks. 10 # smaller than default (-6), which produces slightly _smaller_ blocks.
6 merge_date.py <(LC_ALL=C sort -m -k1,2 -s $res/ks_[0-9]*.tsv) $orig $res/idx |\ 11 merge_date.py $debug <(LC_ALL=C sort -m -k1,2 -s $res/ks_[0-9]*.tsv) $orig $res/idx |\
7 parallel -j 10 'echo {#} {} >$res/merge_{#}.log 12 parallel -j 10 'echo {#} {} >$res/merge_{#}.log
8 echo $(date) {#} {} 13 echo $(date) {#} {}
9 export res 14 export res
10 split -l 3000 --filter="gzip -c -7 --keep | \ 15 split -l 3000 --filter="gzip -c -7 --keep | \
11 tee >(wc -c >> \ 16 tee >(wc -c >> \