view bin/extract.sh @ 172:72b0420167dc

generalised sbatch front-end to cdx2tsv.py
author Henry S. Thompson <ht@inf.ed.ac.uk>
date Thu, 28 Jul 2022 17:24:29 +0100
parents 1e479e3ea9c4
children
line wrap: on
line source

#!/usr/bin/bash
# Launch parallel tasks, one per segment from extract_?.txt
#  First line thereof gives CC identifier
#  The ? in the file name is whatever follows the last 'n' in this
#  host's name (the whole host name if it contains no 'n').
# Writes a start line and an end line (date, host, and on the end line
#  the exit status of the parallel pipeline) to stdout.
echo $(date) $(hostname)
h=$(hostname)
hn=${h##*n}
# Line 1 of the file is read into $cc; every remaining line is handed to
#  one doExtract.sh invocation as its third argument, after $cc and
#  parallel's job sequence number ({#}).  At most 4 jobs run at once.
# \$HOME is escaped so it reaches parallel unexpanded -- presumably so the
#  shell that parallel starts for each job expands it; confirm before changing.
head -1 "extract_${hn}.txt" |\
 { read -r cc ; \
 tail -n +2 "extract_${hn}.txt" |\
    parallel --joblog topjob.log --will-cite  -j 4 -N 1 \$HOME/bin/doExtract.sh "$cc" '{#}' '{}' ; }
# Save the pipeline's status straight away: inside the echo below, $? would
#  be expanded only after $(date) and $(hostname) have run, and would then
#  hold the status of $(hostname) rather than that of the pipeline above.
rc=$?
echo $(date) $(hostname) $rc