Mercurial > hg > cc > cirrus_work
changeset 211:0ffa655efc21
add some debugging info
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Thu, 11 Jan 2024 16:44:45 +0000 |
parents | 6faed9e5d9c9 |
children | 443b3a6f0b41 |
files | lib/python/cc/lmh/lmh.py |
diffstat | 1 files changed, 5 insertions(+), 1 deletions(-) [+] |
line wrap: on
line diff
--- a/lib/python/cc/lmh/lmh.py Thu Jan 11 16:43:16 2024 +0000
+++ b/lib/python/cc/lmh/lmh.py Thu Jan 11 16:44:45 2024 +0000
@@ -48,7 +48,11 @@
   infile_pat='/beegfs/common_crawl/CC-MAIN-%s/*.%s/orig/%s/*%s.warc.gz'%(
     CCdate, segment, filetype, fileno)
-  infile_name=glob.glob(infile_pat)[0]
+  try:
+    infile_name=glob.glob(infile_pat)[0]
+  except IndexError:
+    print(infile_pat,CCdata,segment,filetype,fileno,file=sys.stderr)
+    raise
   (_,_,_,_,_,_,_,ff)=infile_name.split('/')