view master/src/wecu/run.sh @ 64:b91e44355bbf

fix minor argument passing snafus
author Henry S. Thompson <ht@markup.co.uk>
date Wed, 03 Jun 2020 22:08:01 +0000
parents a3edba8dab11
children
line wrap: on
line source

# Distributed map / sort / reduce over the Common Crawl files listed in
# ./input_paths.
#
# Files read from the current directory:
#   cores.txt    value handed to `parallel --jobs`
#   hosts        ssh login file for GNU parallel (--sshloginfile)
#   input_paths  one entry per line; each replaces {} in the download URL
#   mapper.py    transferred to the workers and run there on each input
#   reducer.py   transferred to the workers as well; also run locally as
#                the last stage of the pipeline
#
# For every input, a worker streams the object with curl, decompresses it
# with a single unpigz thread and pipes it through ./mapper.py.  The
# combined mapper output is sorted locally and fed to ./reducer.py.
cores=$(cat cores.txt)

# Without a value, `--jobs` would swallow the following option as its
# argument and silently shift the rest of the command line.
if [ -z "$cores" ]; then
    printf '%s\n' "run.sh: cores.txt is missing or empty; cannot set --jobs" >&2
    exit 1
fi

# Expansions are quoted so a working directory containing whitespace or
# glob characters reaches parallel as a single argument.
# NOTE(review): under bash the `time` keyword covers the whole pipeline;
# under other shells it may only time `parallel` - confirm the interpreter.
time parallel \
    --sshloginfile hosts \
    --transferfile mapper.py \
    --transferfile reducer.py \
    --will-cite \
    --retries 3 \
    --jobs "$cores" \
    --workdir "$PWD" \
    -a input_paths \
    'curl -s -N "https://commoncrawl.s3.amazonaws.com/{}" | unpigz -dp 1 -c | ./mapper.py' | \
    sort | \
    ./reducer.py