Mercurial > hg > cc > cirrus_home
view bin/unfold.sh @ 121:863ea87be6bb
support field edit
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Mon, 28 Jun 2021 15:40:10 +0000 |
parents | a82c325e8b32 |
children |
line wrap: on
line source
#!/bin/bash
# Usage: unfold.sh links_...
#
# Re-joins ("unfolds") records that were wrapped over several lines.
#
# A record starts on the first input line, and on every later line whose
# first whitespace-separated field is "annot" or "scrape"; the first two
# fields of that line are kept.  Any other line is a continuation: its first
# field is appended, with no separator, to the second field of the record
# currently being collected.  One line per record is written to stdout.
#
# Arguments: $1 - file to read; "-" is handed to awk unchanged, which per
#                 POSIX makes it read standard input
# Outputs:   unfolded records on stdout, usage message on stderr
# Returns:   2 when no file is given, otherwise awk's exit status

#######################################
# Unfold the records of one file.
# Arguments: $1 - path of the file to read
# Outputs:   one "<field1> \t <field2>" line per record on stdout
# Returns:   awk's exit status
#######################################
unfold() {
  # "print a, b, c" joins its operands with OFS (a single space), so the tab
  # is emitted with a space on either side.  That exact layout is kept so
  # existing consumers of the output see no change.
  awk '
    NR == 1 || $1 == "annot" || $1 == "scrape" {
      # A new record begins: flush the one collected so far, if any.
      if (NR > 1) print kind, "\t", url
      kind = $1
      url = $2
      next
    }
    # Continuation line: glue its first field onto the current record.
    { url = url $1 }
    # Flush the last record, but emit nothing at all for empty input.
    END { if (NR > 0) print kind, "\t", url }
  ' "$1"
}

#######################################
# Entry point: validate the command line, then unfold the named file.
# Arguments: $1 - file to read
# Returns:   2 on a missing or empty argument, else the status of unfold
#######################################
main() {
  if (( $# < 1 )) || [[ -z "$1" ]]; then
    printf 'Usage: %s links_...\n' "${0##*/}" >&2
    return 2
  fi
  unfold "$1"
}

main "$@"