Mercurial > hg > cc > cirrus_work
comparison bin/do_idx.sh @ 110:a0ea1e4a714d
pass in debug flag(s) to merge_date.py
author | Henry Thompson <ht@markup.co.uk> |
---|---|
date | Tue, 19 Sep 2023 19:40:58 +0100 |
parents | 9403c02d5034 |
children | 5b952d16838c |
comparison
equal
deleted
inserted
replaced
109:52c6a9b0fc8c | 110:a0ea1e4a714d |
---|---|
1 #!/bin/bash | 1 #!/bin/bash |
| | 2 while [ "$1" = "-d" ] |
| | 3 do |
| | 4 shift |
| | 5 debug="$debug -d" |
| | 6 done |
2 export res="$1" | 7 export res="$1" |
3 orig="$2" | 8 orig="$2" |
4 # igzip was faster, but produced bigger files, so went to gzip one step | 9 # igzip was faster, but produced bigger files, so went to gzip one step |
5 # smaller than default (-6), which produces slightly _smaller_ blocks. | 10 # smaller than default (-6), which produces slightly _smaller_ blocks. |
6 merge_date.py <(LC_ALL=C sort -m -k1,2 -s $res/ks_[0-9]*.tsv) $orig $res/idx |\ | 11 merge_date.py $debug <(LC_ALL=C sort -m -k1,2 -s $res/ks_[0-9]*.tsv) $orig $res/idx |\ |
7 parallel -j 10 'echo {#} {} >$res/merge_{#}.log | 12 parallel -j 10 'echo {#} {} >$res/merge_{#}.log |
8 echo $(date) {#} {} | 13 echo $(date) {#} {} |
9 export res | 14 export res |
10 split -l 3000 --filter="gzip -c -7 --keep | \ | 15 split -l 3000 --filter="gzip -c -7 --keep | \ |
11 tee >(wc -c >> \ | 16 tee >(wc -c >> \ |