Mercurial > hg > python
view cluster.py @ 61:19262b15a099
merge
author | Henry S. Thompson <ht@inf.ed.ac.uk> |
---|---|
date | Wed, 13 Dec 2023 17:32:38 +0000 |
parents | 668d788cac47 |
children |
line wrap: on
line source
#!/usr/bin/python3 '''Read a minutor block lockation tsv and resort it to show clusters''' import sys from util import * if len(sys.argv)==1 or sys.argv[1]=='-h': print("""Usage: cluster.py [-h] [-c n] [-s] infile.tsv [outfile.tsv] n is cluster diameter, default is 5 -s for strict circle distance, reduces number of candidates default outfile is [infile]_c[n].tsv""") exit(1) if sys.argv[1]=='-c': sys.argv.pop(1) n=float(sys.argv.pop(1)) else: n=5.0 if sys.argv[1]=='-s': sys.argv.pop(1) strict=True else: strict=False infile_name=sys.argv.pop(1) if len(sys.argv)>1: outfile_name=sys.argv.pop(1) else: outfile_name="%s_c%s.tsv"%(infile_name.split('.')[0],n) cc=[] with open(infile_name,'r') as infile: with open(outfile_name,'w') as outfile: l=infile.readline().rstrip() print(l,file=outfile) ff=PPAT.split(l) (nr,ox,oy,oz)=intsMaybe(ff) home=(float(ox),float(oy),float(oz)) et=ff[9] l=infile.readline().rstrip() print(l,file=outfile) l2=PPAT.split(l) if l2[-1]=='bounded': orad=int(l2[1]) ymin=ymax=-1 else: (orad,ymin,ymax)=intsMaybe(l2) _=infile.readline() for l in infile: found=False (_,td,qd)=l.rstrip().split('\t') q=[float(i) for i in qd.split(',')] td=float(td) if strict and td>orad: # Enforce a circular region, not square print(td,orad,file=sys.stderr) break for c in cc: for p in c: if d(p,q)<=n: c.append(q) found=True break if found: break if not found: cc.append([q]) oc=cc cc=[] # lose w=0 ow=-1 nc=[] # win while True: for i,c in enumerate(oc): win=False for p in c: for g in oc[i+1:]: for q in g: if d(p,q)<=n: win=True w+=1 nc.append(c+g) break if win: break if win: break if not win: cc.append(c) print(len(cc),len(nc),ow,w,file=sys.stderr) if ow==w: break ow=w oc=nc nc=[] for c in sorted(cc,reverse=True,key=lambda x:len(x)): print(c,file=outfile)