comparison workers/bin/_timedWhich.sh @ 18:9631fca89cc6

F2-related stuff, and new experiment
author Henry S. Thompson <ht@markup.co.uk>
date Fri, 19 Oct 2018 14:25:19 +0000
parents 2a2c1fb03c54
children d4f186655bcc
comparison
legend: equal | deleted | inserted | replaced
17:2a2c1fb03c54 18:9631fca89cc6
1 #!/bin/bash 1 #!/bin/bash
2 egrep -o'("WARC-Target-URI":"https?:|"Last-Modified":"[^"]*")'|\ 2 egrep -o '("WARC-Target-URI":"https?:|"Last-Modified":"[^"]*")'|\
3 egrep -o '(https?:|:".*"$)' |\ 3 egrep -o '(https?:|:".*"$)' |\
4 tr '\012' \# | sed 's/:#:/ /g'|tr \# '\012' | tr -d \"|\ 4 tr '\012' \# | sed 's/:#:/ /g'|tr \# '\012' | tr -d \"|\
5 sed 's/ [[:digit:]][[:digit:]]\?:[[:digit:]][[:digit:]]:[[:digit:]][[:digit:]] / /;s/\(https\? \)\(: \)\?[MTWFSa-z]..\.\?, \?/\1/;s/ \([-+][[:digit:]]\{4\}\|[[:upper:]]\{2,3\}\)$//;s/ [[:digit:]]\{1,2\} / /;s/\/[[:digit:]]\{1,2\}\/\([[:digit:]]\{4\}\)$/ \1/'|\ 5 sed 's/ [[:digit:]][[:digit:]]\?:[[:digit:]][[:digit:]]:[[:digit:]][[:digit:]] / /;s/\(https\? \)\(: \)\?[MTWFSa-z]..\.\?, \?/\1/;s/ \([-+][[:digit:]]\{4\}\|[[:upper:]]\{2,3\}\)$//;s/ [[:digit:]]\{1,2\} / /;s/\/[[:digit:]]\{1,2\}\/\([[:digit:]]\{4\}\)$/ \1/'|\
6 awk '{c[$0]+=1} END {for (k in c) {print k, c[k]}}' 6 awk '{c[$0]+=1} END {for (k in c) {print k, c[k]}}'
7 7