Mercurial > hg > cc > cirrus_work
view bin/do_idx.sh @ 125:d864700913b8
readability
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Thu, 28 Sep 2023 14:06:11 +0100 |
parents | 5b952d16838c |
children | 0326805aa6df |
line wrap: on
line source
#!/bin/bash
# Usage: do_idx.sh [-d]... RES_DIR [ORIG]
#
# Merges the (already sorted) RES_DIR/ks_<digit>*.tsv files with `sort -m`,
# feeds the merged stream to merge_date.py, and hands every line that
# merge_date.py prints on stdout to GNU parallel, which treats it as a file
# name.  Each such file is cut into 3000-line pieces, every piece is gzipped
# on its own, the compressed pieces are concatenated into <file>.gz, and the
# uncompressed file is removed if that succeeded.
#
#   -d       may be repeated; each occurrence adds one -d to the
#            merge_date.py command line
#   RES_DIR  directory holding the ks_*.tsv inputs; merge.log and the per-job
#            merge_<n>.log files are written here, and RES_DIR/idx is passed
#            to merge_date.py
#   ORIG     passed through unchanged to merge_date.py; left off its command
#            line when not given (whether merge_date.py needs it cannot be
#            told from this script)
#
# Exit status: 2 on a usage error, otherwise the status of the
# merge/compress pipeline.

# Without pipefail a failing merge_date.py would be hidden behind the exit
# status of parallel.
set -o pipefail

while [ "$1" = "-d" ]; do
  shift
  debug="$debug -d"
done

# An empty RES_DIR would make every path below resolve against "/".
if [ -z "$1" ]; then
  printf 'Usage: %s [-d]... RES_DIR [ORIG]\n' "${0##*/}" >&2
  exit 2
fi

res=$1
orig=$2
# The shells started by parallel and by split --filter read $res from the
# environment.
export res

# igzip was faster, but produced bigger files, so went to gzip one step
#  smaller than default (-6), which produces slightly _smaller_ blocks.
#
# Each job writes its job number and file name to merge_<n>.log, followed by
# one line per 3000-line piece giving that piece's compressed size in bytes
# (the tee/wc pair inside the filter).  The >( ) process substitution in the
# filter needs split to run it under bash (split uses $SHELL, else /bin/sh).
# \$res is escaped so that it is expanded by the filter's own shell, inside
# quotes, rather than being pasted into the filter text unquoted.
#
# shellcheck disable=SC2086  # $debug is deliberately split into separate -d words
merge_date.py $debug \
    <(LC_ALL=C sort -m -k1,3 -s "$res"/ks_[0-9]*.tsv) \
    ${orig:+"$orig"} "$res/idx" 2>"$res/merge.log" |
  parallel -j 10 'echo {#} {} >"$res/merge_{#}.log"
                  echo $(date) {#} {}
                  export res
                  split -l 3000 \
                        --filter="gzip -c -7 --keep | tee >(wc -c >> \"\$res/merge_{#}.log\")" \
                        {} > {}.gz &&
                    rm {}'