view workers/bin/count1.sh @ 19:d4f186655bcc

lots of tweaking, reached the 80/20 point
author Henry S. Thompson <ht@markup.co.uk>
date Sat, 20 Oct 2018 16:11:29 +0000
parents 36b5d379909a
children
line wrap: on
line source

#!/bin/bash
# Tally the leading ':'-delimited field (the scheme part) of every
# WARC-Target-URI value extracted from the JSON read on stdin.
#
# Usage:   count1.sh TAG < input
# Reads:   $1  - tag appended after "$ID." in the two marker lines
#          $ID - not assigned in this script; comes from the caller's
#                environment (expands to empty when unset)
# Outputs: on stdout, a "# <date> > ..." marker, then one "<key> <count>"
#          line per distinct key (in awk's unspecified for-in order), then a
#          "# <date> < ..." marker.

# Print a timestamped marker line: $1 is the direction sign, $2 the tag.
marker() {
  echo "# $(date) $1 $ID.$2"
}

marker '>' "$1"

# jq runs without -r, so each URI is printed JSON-encoded (or as null when
# absent); the key that cut isolates therefore keeps its opening quote.
jq '.Envelope | .["WARC-Header-Metadata"] | .["WARC-Target-URI"]' \
  | cut -d ':' -f 1 \
  | awk '
      { tally[$1]++ }
      END {
        for (key in tally)
          print key, tally[key]
      }'

marker '<' "$1"