Mercurial > hg > cc > cirrus_work
comparison bin/test_warc.py @ 45:212da3fe3b19
make test 1 idempotent
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Wed, 05 Jul 2023 19:32:02 +0100 |
parents | 689a0e311cd2 |
children | e20c64917805 |
comparison
equal
deleted
inserted
replaced
44:083229195d12 | 45:212da3fe3b19 |
---|---|
4 | 4 |
5 if (debug:=(sys.argv[1]=='-d')): | 5 if (debug:=(sys.argv[1]=='-d')): |
6 sys.argv.pop(1) | 6 sys.argv.pop(1) |
7 | 7 |
8 def showme(wtype,buf,part): | 8 def showme(wtype,buf,part): |
| 9 # This should exactly reproduce a complete warc file if called |
| 10 # as per version 1 below |
9 if debug: | 11 if debug: |
10 breakpoint() | 12 OUT.write(b"%d\n%b"%(part,buf)) |
11 OUT.write(b"%d\n%b"%(part,buf)) | 13 else: |
| 14 OUT.write(buf) |
| 15 if buf[-1]!=b'\n': |
| 16 OUT.write(b'\r\n') |
| 17 if part==7: |
| 18 OUT.write(b'\r\n') # to match complete file formatting |
12 | 19 |
| 20 # 1 warc.warc(sys.argv[1],showme,[b'response','warcinfo','request','metadata'],whole=True) |
13 | 21 |
14 #warc(showme,[b'response','warcinfo','request','metadata'],int(sys.argv[2])) | 22 # 2 |
15 #warc(showme,[b'response'],whole=True) | |
16 | |
17 warc.warc(sys.argv[1],showme,[b'response'],parts=int(sys.argv[2]),debug=debug) | 23 warc.warc(sys.argv[1],showme,[b'response'],parts=int(sys.argv[2]),debug=debug) |