view workers/bin/count1.sh @ 51:26e18c66ce36

final merge
author Henry S. Thompson <ht@markup.co.uk>
date Sun, 16 Dec 2018 14:25:42 +0000
parents 36b5d379909a
children
line wrap: on
line source

#!/bin/bash
# Tally WARC target URIs by the text that precedes their first ':'.
#
# Reads a stream of JSON records on stdin, extracts
# .Envelope["WARC-Header-Metadata"]["WARC-Target-URI"] from each one, keeps
# the part before the first ':' and prints one "<key> <count>" line per
# distinct key.  The counts are bracketed by two "# <date> ..." marker lines
# tagged with "$ID.$1".
#
# Arguments: $1 - tag appended to $ID in the marker lines
# Globals:   ID (read) - not set here; presumably exported by the caller
# Outputs:   marker lines and "<key> <count>" lines on stdout
# Returns:   0 on success, otherwise the status of the failing pipeline stage
#
# NOTE: jq runs without -r, so keys are JSON-encoded: string values keep their
# leading double quote (e.g. "http) and a missing URI is counted as null.
# That output format is kept as-is because consumers may depend on it.

# Without pipefail the pipeline would report awk's status only, and a jq
# failure (bad JSON, jq not installed) would pass unnoticed.
set -o pipefail

count_schemes() {
  local status=0

  echo "# $(date) > $ID.$1"

  # awk's "for (k in c)" visits keys in an unspecified order.
  jq '.Envelope|.["WARC-Header-Metadata"]["WARC-Target-URI"]' \
    | cut -f 1 -d ':' \
    | awk '{c[$1]+=1} END {for (k in c) {print k, c[k]}}' || status=$?

  # Always emit the closing marker so the log shows the run ended, then
  # hand the pipeline's status back instead of echo's.
  echo "# $(date) < $ID.$1"

  return "$status"
}

count_schemes "$@"