Mercurial > hg > cc > cirrus_work
changeset 171:143d2c6d56da
cross-language confusion :-)
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Wed, 15 Nov 2023 09:36:23 +0000 |
parents | 4870e14ec237 |
children | bc66c6098e5e |
files | bin/getcc_multi.aws |
diffstat | 1 files changed, 1 insertions(+), 1 deletions(-) [+] |
line wrap: on
line diff
--- a/bin/getcc_multi.aws Mon Nov 06 15:55:57 2023 +0000
+++ b/bin/getcc_multi.aws Wed Nov 15 09:36:23 2023 +0000
@@ -37,7 +37,7 @@
 s=$(grep -Eow "[0-9]*\.$SEG" $wf | head -1)
 mkdir -p $s/orig/warc
-fgrep -v -f <(cd $s/orig/warc && ls *.warc.gz || pass) <(fgrep -w $s warc.paths) > /tmp/hst/$s
+fgrep -v -f <(cd $s/orig/warc && ls *.warc.gz || :) <(fgrep -w $s warc.paths) > /tmp/hst/$s
 split -a 1 --numeric-suffixes=1 -n l/$nthreads /tmp/hst/$s /tmp/hst/${s}_