view cluster.py @ 57:057b52746850 simple

use Run and Space classes in Vector.runs
author Henry Thompson <ht@markup.co.uk>
date Thu, 01 Jun 2023 18:21:56 +0100
parents 668d788cac47
children
line wrap: on
line source

#!/usr/bin/python3
'''Read a minutor block lockation tsv and resort it to show clusters'''
import sys

from util import *

if len(sys.argv)==1 or sys.argv[1]=='-h':
  print("""Usage: cluster.py [-h] [-c n] [-s] infile.tsv [outfile.tsv]
           n is cluster diameter, default is 5
           -s for strict circle distance, reduces number of candidates
           default outfile is [infile]_c[n].tsv""")
  exit(1)
if sys.argv[1]=='-c':
  sys.argv.pop(1)
  n=float(sys.argv.pop(1))
else:
  n=5.0

if sys.argv[1]=='-s':
  sys.argv.pop(1)
  strict=True
else:
  strict=False

infile_name=sys.argv.pop(1)
if len(sys.argv)>1:
  outfile_name=sys.argv.pop(1)
else:
  outfile_name="%s_c%s.tsv"%(infile_name.split('.')[0],n)

cc=[]

with open(infile_name,'r') as infile:
  with open(outfile_name,'w') as outfile:
    l=infile.readline().rstrip()
    print(l,file=outfile)
    ff=PPAT.split(l)
    (nr,ox,oy,oz)=intsMaybe(ff)
    home=(float(ox),float(oy),float(oz))
    et=ff[9]
    l=infile.readline().rstrip()
    print(l,file=outfile)
    l2=PPAT.split(l)
    if l2[-1]=='bounded':
      orad=int(l2[1])
      ymin=ymax=-1
    else:
      (orad,ymin,ymax)=intsMaybe(l2)
    _=infile.readline()
    for l in infile:
      found=False
      (_,td,qd)=l.rstrip().split('\t')
      q=[float(i) for i in qd.split(',')]
      td=float(td)
      if strict and td>orad:
        # Enforce a circular region, not square
        print(td,orad,file=sys.stderr)
        break
      for c in cc:
        for p in c:
          if d(p,q)<=n:
            c.append(q)
            found=True
            break
        if found:
          break
      if not found:
        cc.append([q])
    oc=cc
    cc=[] # lose
    w=0
    ow=-1
    nc=[] # win
    while True:
      for i,c in enumerate(oc):
        win=False
        for p in c:
          for g in oc[i+1:]:
            for q in g:
              if d(p,q)<=n:
                win=True
                w+=1
                nc.append(c+g)
                break
            if win:
              break
          if win:
            break
        if not win:
          cc.append(c)
      print(len(cc),len(nc),ow,w,file=sys.stderr)
      if ow==w:
        break
      ow=w
      oc=nc
      nc=[]
    for c in sorted(cc,reverse=True,key=lambda x:len(x)):
      print(c,file=outfile)