Commit eb4f9627, authored by Mathieu Giraud: compute and display stats on clusters

class Analysis(VidjilJson):
def __init__(self):
def __init__(self, data=None): = data
self.clones = {}
lw_clones = set([c.d['id'] for c in lw])
return my_clones.difference(lw_clones)
def cluster_stats(self, point=0):
    """Print, per cluster, the share of reads held by its largest member.

    For every cluster in ``self.d['clusters']``, the ``d["reads"][point]``
    value of each member is collected. One line is then printed giving
    max/sum of the collected values and how many values were collected.
    Members whose lookup raises ``AttributeError`` are reported and left
    out of the statistics.

    Args:
        point: index used to select one entry of each member's
            ``d["reads"]`` (default 0).
    """
    for cluster in self.d['clusters']:
        sizes = []
        for c in cluster:
            # NOTE(review): the receiver of this lookup was lost in the
            # visible source (it read `s =[c].d[...]`). `self.data` is
            # assumed from the constructor's `data` argument -- confirm.
            try:
                s = self.data[c].d["reads"][point]
            except AttributeError:
                # Single-string form prints the same text under both the
                # Python 2 print statement and the Python 3 print function.
                print("!! missing from cluster %s" % (c,))
            else:
                sizes.append(s)
        if sizes:
            total = float(sum(sizes))
            # A cluster whose members all have zero reads would otherwise
            # raise ZeroDivisionError; report a ratio of 0 instead.
            ratio = float(max(sizes)) / total if total else 0.0
            print("%% cluster: max is %.3f of the sum, len %d" % (ratio, len(sizes)))
def info_of_clone(self, w):
    """Return the entry stored in ``self.clones`` for the clone ``w``.

    The lookup key is ``w.d['id']``. When that id is not a key of
    ``self.clones``, the visible code falls through without an explicit
    return.

    Args:
        w: object exposing a ``d`` mapping with an ``'id'`` entry.
    """
    clone_id = w.d['id']
    if clone_id in self.clones:
        return self.clones[clone_id]
# TODO: the '.analysis' path below is hardcoded for one specific output layout;
# it should be more flexible
ii = 'data.vidjil/' + 'pat-' + i_short +'.analysis'
data_analysis = analysis.Analysis()
data_analysis = analysis.Analysis(data)
if str(data_analysis.d['samples']['run_timestamp']) == str(data.d['samples'].d['run_timestamp']):
print("%% timestamps: OK")
print("%% timestamps: XXX", i, data.d['samples'].d['run_timestamp'], "instead of", data_analysis.d['samples']['run_timestamp'])
data_analysis = None
