changeset 211:0ffa655efc21

add some debugging info
author Henry S. Thompson <ht@inf.ed.ac.uk>
date Thu, 11 Jan 2024 16:44:45 +0000
parents 6faed9e5d9c9
children 443b3a6f0b41
files lib/python/cc/lmh/lmh.py
diffstat 1 files changed, 5 insertions(+), 1 deletions(-) [+]
line wrap: on
line diff
--- a/lib/python/cc/lmh/lmh.py	Thu Jan 11 16:43:16 2024 +0000
+++ b/lib/python/cc/lmh/lmh.py	Thu Jan 11 16:44:45 2024 +0000
@@ -48,7 +48,11 @@
 
   infile_pat='/beegfs/common_crawl/CC-MAIN-%s/*.%s/orig/%s/*%s.warc.gz'%(
     CCdate, segment, filetype, fileno)
-  infile_name=glob.glob(infile_pat)[0]
+  try:
+    infile_name=glob.glob(infile_pat)[0]
+  except IndexError:
+    print(infile_pat,CCdata,segment,filetype,fileno,file=sys.stderr)
+    raise
 
   (_,_,_,_,_,_,_,ff)=infile_name.split('/')