Mercurial > hg > cc > cirrus_work
annotate bin/do_idx.sh @ 103:7d58dc01f329
re-instate logging splits for .idx
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Wed, 13 Sep 2023 12:40:39 +0100 |
parents | e2e64c3d763e |
children | 9403c02d5034 |
rev | line source |
---|---|
101
e2e64c3d763e
bug4 fixed, but that created a new, earlier bug
Henry S. Thompson <ht@inf.ed.ac.uk>
parents:
diff
changeset
|
#!/bin/bash
# do_idx.sh -- merge the sorted ks_*.tsv key files and compress the results.
#
# Usage: do_idx.sh RES_DIR ORIG
#   RES_DIR  directory holding the ks_[0-9]*.tsv inputs; also receives the
#            merge_<job#>.log files and is the prefix of the "idx" argument
#            handed to merge_date.py
#   ORIG     passed through unchanged as merge_date.py's second argument
#
# Pipeline:
#   1. The ks_[0-9]*.tsv files are merged with a byte-wise (LC_ALL=C),
#      stable, merge-only sort on fields 1-2 (inputs must already be sorted)
#      and fed to merge_date.py through a process substitution.
#   2. Every line merge_date.py prints is treated by GNU parallel as one
#      input item ({}), processed by up to 10 concurrent jobs.
#      NOTE(review): presumably each line is the path of a file written by
#      merge_date.py -- confirm against merge_date.py.
#   3. Each job:
#        - starts $res/merge_<job#>.log with "<job#> <item>",
#        - prints a timestamped "<job#> <item>" line on stdout,
#        - cuts the item into 3000-line pieces, compresses every piece with
#          igzip, concatenates the compressed pieces into <item>.gz and
#          appends each piece's compressed byte count to the job log,
#        - removes the uncompressed item only if split succeeded.

if [[ $# -lt 2 || -z "$1" || -z "$2" ]]; then
  # An empty RES_DIR would make the script write to /idx and /merge_N.log;
  # an empty ORIG would silently shift merge_date.py's arguments.
  printf 'Usage: %s RES_DIR ORIG\n' "${0##*/}" >&2
  exit 2
fi

# res must be exported: the parallel jobs and the split filter below expand
# $res in their own shells.
export res="$1"
orig="$2"

# Quoting notes for the parallel command string (single-quoted, so nothing in
# it is expanded by this shell):
#   - {} and {#} are substituted by parallel, which shell-quotes {} itself,
#     so they must not be wrapped in extra quotes.
#   - Inside --filter the log path is written as \"\$res/...\" so that $res is
#     expanded, quoted, by the filter's own shell rather than pasted in as
#     unquoted text; this keeps directories containing spaces intact.
#   - The >( ) in the filter requires split's filter shell ($SHELL) to be bash.
#   - $(date) is deliberately left unquoted to keep the existing log format.
merge_date.py <(LC_ALL=C sort -m -k1,2 -s "$res"/ks_[0-9]*.tsv) "$orig" "$res/idx" |
  parallel -j 10 'echo {#} {} >"$res/merge_{#}.log"
  echo $(date) {#} {}
  export res
  split -l 3000 --filter="igzip -c | \
     tee >(wc -c >> \
    \"\$res/merge_{#}.log\")" \
   {} > {}.gz && \
  rm {}'