Context Navigation

source: mds-and-trees/tree-genealogy.py @ 712

Last change on this file since 712 was 712, checked in by Maciej Komosinski, 7 years ago
Improved status and error messages
File size: 40.0 KB

Line
1	import json
2	import math
3	import random
4	import argparse
5	import bisect
6	import copy
7	import time as timelib
8	from PIL import Image, ImageDraw, ImageFont
9	from scipy import stats
10	from matplotlib import colors
11	import numpy as np
12
13	class LoadingError(Exception):
14	pass
15
16	class Drawer:
17
18	def __init__(self, design, config_file, w=600, h=800, w_margin=10, h_margin=20):
19	self.design = design
20	self.width = w
21	self.height = h
22	self.w_margin = w_margin
23	self.h_margin = h_margin
24	self.w_no_margs = w - 2* w_margin
25	self.h_no_margs = h - 2* h_margin
26
27	self.color_converter = colors.ColorConverter()
28
29	self.settings = {
30	'colors_of_kinds': ['red', 'green', 'blue', 'magenta', 'yellow', 'cyan', 'orange', 'purple'],
31	'dots': {
32	'color': {
33	'meaning': 'Lifespan',
34	'normalize_cmap': False,
35	'cmap': {},
36	'start': 'red',
37	'end': 'green',
38	'bias': 1
39	},
40	'size': {
41	'meaning': 'EnergyEaten',
42	'start': 1,
43	'end': 6,
44	'bias': 0.5
45	},
46	'opacity': {
47	'meaning': 'EnergyEaten',
48	'start': 0.2,
49	'end': 1,
50	'bias': 1
51	}
52	},
53	'lines': {
54	'color': {
55	'meaning': 'adepth',
56	'normalize_cmap': False,
57	'cmap': {},
58	'start': 'black',
59	'end': 'red',
60	'bias': 3
61	},
62	'width': {
63	'meaning': 'adepth',
64	'start': 0.1,
65	'end': 4,
66	'bias': 3
67	},
68	'opacity': {
69	'meaning': 'adepth',
70	'start': 0.1,
71	'end': 0.8,
72	'bias': 5
73	}
74	}
75	}
76
77	def merge(source, destination):
78	for key, value in source.items():
79	if isinstance(value, dict):
80	node = destination.setdefault(key, {})
81	merge(value, node)
82	else:
83	destination[key] = value
84	return destination
85
86	if config_file != "":
87	with open(config_file) as config:
88	c = json.load(config)
89	self.settings = merge(c, self.settings)
90	#print(json.dumps(self.settings, indent=4, sort_keys=True))
91
92	self.compile_cmaps()
93
94	def compile_cmaps(self):
95	def normalize_and_compile_cmap(cmap):
96	for key in cmap:
97	for arr in cmap[key]:
98	arr[0] = (arr[0] - cmap[key][0][0]) / (cmap[key][-1][0] - cmap[key][0][0])
99	return colors.LinearSegmentedColormap('Custom', cmap)
100
101	for part in ['dots', 'lines']:
102	if self.settings[part]['color']['cmap']:
103	if self.settings[part]['color']['normalize_cmap']:
104	cmap = self.settings[part]['color']['cmap']
105	min = self.design.props[self.settings[part]['color']['meaning'] + "_min"]
106	max = self.design.props[self.settings[part]['color']['meaning'] + "_max"]
107
108	for key in cmap:
109	if cmap[key][0][0] > min:
110	cmap[key].insert(0, cmap[key][0][:])
111	cmap[key][0][0] = min
112	if cmap[key][-1][0] < max:
113	cmap[key].append(cmap[key][-1][:])
114	cmap[key][-1][0] = max
115
116	og_cmap = normalize_and_compile_cmap(copy.deepcopy(cmap))
117
118	col2key = {'red':0, 'green':1, 'blue':2}
119	for key in cmap:
120	# for color from (r/g/b) #n's should be the same for all keys!
121	n_min = (min - cmap[key][0][0]) / (cmap[key][-1][0] - cmap[key][0][0])
122	n_max = (max - cmap[key][0][0]) / (cmap[key][-1][0] - cmap[key][0][0])
123
124	min_col = og_cmap(n_min)
125	max_col = og_cmap(n_max)
126
127	cmap[key][0] = [min, min_col[col2key[key]], min_col[col2key[key]]]
128	cmap[key][-1] = [max, max_col[col2key[key]], max_col[col2key[key]]]
129	print(self.settings[part]['color']['cmap'])
130	self.settings[part]['color']['cmap'] = normalize_and_compile_cmap(self.settings[part]['color']['cmap'])
131
132	def draw_dots(self, file, min_width, max_width, max_height):
133	for i in range(len(self.design.positions)):
134	node = self.design.positions[i]
135	if 'x' not in node:
136	continue
137	dot_style = self.compute_dot_style(node=i)
138	self.add_dot(file, (self.w_margin+self.w_no_margs*(node['x']-min_width)/(max_width-min_width),
139	self.h_margin+self.h_no_margs*node['y']/max_height), dot_style)
140
141	def draw_lines(self, file, min_width, max_width, max_height):
142	for parent in range(len(self.design.positions)):
143	par_pos = self.design.positions[parent]
144	if not 'x' in par_pos:
145	continue
146	for child in self.design.tree.children[parent]:
147	chi_pos = self.design.positions[child]
148	if 'x' not in chi_pos:
149	continue
150	line_style = self.compute_line_style(parent, child)
151	self.add_line(file, (self.w_margin+self.w_no_margs*(par_pos['x']-min_width)/(max_width-min_width),
152	self.h_margin+self.h_no_margs*par_pos['y']/max_height),
153	(self.w_margin+self.w_no_margs*(chi_pos['x']-min_width)/(max_width-min_width),
154	self.h_margin+self.h_no_margs*chi_pos['y']/max_height), line_style)
155
156	def draw_scale(self, file, filenames):
157	self.add_text(file, "Generated from " + filenames[0].split("\\")[-1]
158	+ (" and " + str(len(filenames)-1) + " more" if len(filenames) > 1 else ""), (5, 5), "start")
159
160	start_text = ""
161	end_text = ""
162	if self.design.TIME == "BIRTHS":
163	start_text = "Birth #0"
164	end_text = "Birth #" + str(len(self.design.positions)-1)
165	if self.design.TIME == "REAL":
166	start_text = "Time " + str(min(self.design.tree.time))
167	end_text = "Time " + str(max(self.design.tree.time))
168	if self.design.TIME == "GENERATIONAL":
169	start_text = "Depth " + str(self.design.props['adepth_min'])
170	end_text = "Depth " + str(self.design.props['adepth_max'])
171
172	self.add_dashed_line(file, (self.width*0.7, self.h_margin), (self.width, self.h_margin))
173	self.add_text(file, start_text, (self.width, self.h_margin), "end")
174	self.add_dashed_line(file, (self.width*0.7, self.height-self.h_margin), (self.width, self.height-self.h_margin))
175	self.add_text(file, end_text, (self.width, self.height-self.h_margin), "end")
176
177	def compute_property(self, part, prop, node):
178	start = self.settings[part][prop]['start']
179	end = self.settings[part][prop]['end']
180	value = (self.design.props[self.settings[part][prop]['meaning']][node]
181	if self.settings[part][prop]['meaning'] in self.design.props else 0 )
182	bias = self.settings[part][prop]['bias']
183	if prop == "color":
184	if not self.settings[part][prop]['cmap']:
185	return self.compute_color(start, end, value, bias)
186	else:
187	return self.compute_color_from_cmap(self.settings[part][prop]['cmap'], value, bias)
188	else:
189	return self.compute_value(start, end, value, bias)
190
191	def compute_color_from_cmap(self, cmap, value, bias=1):
192	value = 1 - (1-value)**bias
193	rgba = cmap(value)
194	return (100rgba[0], 100rgba[1], 100*rgba[2])
195
196
197	def compute_color(self, start, end, value, bias=1):
198	if isinstance(value, str):
199	value = int(value)
200	r, g, b = self.color_converter.to_rgb(self.settings['colors_of_kinds'][value])
201	else:
202	start_color = self.color_converter.to_rgb(start)
203	end_color = self.color_converter.to_rgb(end)
204	value = 1 - (1-value)**bias
205	r = start_color[0](1-value)+end_color[0]value
206	g = start_color[1](1-value)+end_color[1]value
207	b = start_color[2](1-value)+end_color[2]value
208	return (100r, 100g, 100*b)
209
210	def compute_value(self, start, end, value, bias=1):
211	value = 1 - (1-value)**bias
212	return start(1-value) + endvalue
213
214	class PngDrawer(Drawer):
215
216	def scale_up(self):
217	self.width *= self.multi
218	self.height *= self.multi
219	self.w_margin *= self.multi
220	self.h_margin *= self.multi
221	self.h_no_margs *= self.multi
222	self.w_no_margs *= self.multi
223
224	def scale_down(self):
225	self.width /= self.multi
226	self.height /= self.multi
227	self.w_margin /= self.multi
228	self.h_margin /= self.multi
229	self.h_no_margs /= self.multi
230	self.w_no_margs /= self.multi
231
232	def draw_design(self, filename, input_filename, multi=1, scale="SIMPLE"):
233	print("Drawing...")
234
235	self.multi=multi
236	self.scale_up()
237
238	back = Image.new('RGBA', (self.width, self.height), (255,255,255,0))
239
240	min_width = min([x['x'] for x in self.design.positions if 'x' in x])
241	max_width = max([x['x'] for x in self.design.positions if 'x' in x])
242	max_height = max([x['y'] for x in self.design.positions if 'y' in x])
243
244	self.draw_lines(back, min_width, max_width, max_height)
245	self.draw_dots(back, min_width, max_width, max_height)
246
247	if scale == "SIMPLE":
248	self.draw_scale(back, input_filename)
249
250	#back.show()
251	self.scale_down()
252
253	back.thumbnail((self.width, self.height), Image.ANTIALIAS)
254
255	back.save(filename)
256
257	def add_dot(self, file, pos, style):
258	x, y = int(pos[0]), int(pos[1])
259	r = style['r']*self.multi
260	offset = (int(x - r), int(y - r))
261	size = (2int(r), 2int(r))
262
263	c = style['color']
264
265	img = Image.new('RGBA', size)
266	ImageDraw.Draw(img).ellipse((1, 1, size[0]-1, size[1]-1),
267	(int(2.55c[0]), int(2.55c[1]), int(2.55c[2]), int(255style['opacity'])))
268	file.paste(img, offset, mask=img)
269
270	def add_line(self, file, from_pos, to_pos, style):
271	fx, fy, tx, ty = int(from_pos[0]), int(from_pos[1]), int(to_pos[0]), int(to_pos[1])
272	w = int(style['width'])*self.multi
273
274	offset = (min(fx-w, tx-w), min(fy-w, ty-w))
275	size = (abs(fx-tx)+2w, abs(fy-ty)+2w)
276	if size[0] == 0 or size[1] == 0:
277	return
278
279	c = style['color']
280
281	img = Image.new('RGBA', size)
282	ImageDraw.Draw(img).line((w, w, size[0]-w, size[1]-w) if (fx-tx)*(fy-ty)>0 else (size[0]-w, w, w, size[1]-w),
283	(int(2.55c[0]), int(2.55c[1]), int(2.55c[2]), int(255style['opacity'])), w)
284	file.paste(img, offset, mask=img)
285
286	def add_dashed_line(self, file, from_pos, to_pos):
287	style = {'color': (0,0,0), 'width': 1, 'opacity': 1}
288	sublines = 50
289	# TODO could be faster: compute delta and only add delta each time (but currently we do not use it often)
290	normdiv = 2*sublines-1
291	for i in range(sublines):
292	from_pos_sub = (self.compute_value(from_pos[0], to_pos[0], 2*i/normdiv, 1),
293	self.compute_value(from_pos[1], to_pos[1], 2*i/normdiv, 1))
294	to_pos_sub = (self.compute_value(from_pos[0], to_pos[0], (2*i+1)/normdiv, 1),
295	self.compute_value(from_pos[1], to_pos[1], (2*i+1)/normdiv, 1))
296	self.add_line(file, from_pos_sub, to_pos_sub, style)
297
298	def add_text(self, file, text, pos, anchor, style=''):
299	font = ImageFont.truetype("Vera.ttf", 16*self.multi)
300
301	img = Image.new('RGBA', (self.width, self.height))
302	draw = ImageDraw.Draw(img)
303	txtsize = draw.textsize(text, font=font)
304	pos = pos if anchor == "start" else (pos[0]-txtsize[0], pos[1])
305	draw.text(pos, text, (0,0,0), font=font)
306	file.paste(img, (0,0), mask=img)
307
308	def compute_line_style(self, parent, child):
309	return {'color': self.compute_property('lines', 'color', child),
310	'width': self.compute_property('lines', 'width', child),
311	'opacity': self.compute_property('lines', 'opacity', child)}
312
313	def compute_dot_style(self, node):
314	return {'color': self.compute_property('dots', 'color', node),
315	'r': self.compute_property('dots', 'size', node),
316	'opacity': self.compute_property('dots', 'opacity', node)}
317
318	class SvgDrawer(Drawer):
319	def draw_design(self, filename, input_filename, multi=1, scale="SIMPLE"):
320	print("Drawing...")
321	file = open(filename, "w")
322
323	min_width = min([x['x'] for x in self.design.positions if 'x' in x])
324	max_width = max([x['x'] for x in self.design.positions if 'x' in x])
325	max_height = max([x['y'] for x in self.design.positions if 'y' in x])
326
327	file.write('<svg xmlns:svg="http://www.w3.org/2000/svg" xmlns="http://www.w3.org/2000/svg" '
328	'xmlns:xlink="http://www.w3.org/1999/xlink" version="1.0" '
329	'width="' + str(self.width) + '" height="' + str(self.height) + '">')
330
331	self.draw_lines(file, min_width, max_width, max_height)
332	self.draw_dots(file, min_width, max_width, max_height)
333
334	if scale == "SIMPLE":
335	self.draw_scale(file, input_filename)
336
337	file.write("</svg>")
338	file.close()
339
340	def add_text(self, file, text, pos, anchor, style=''):
341	style = (style if style != '' else 'style="font-family: Arial; font-size: 12; fill: #000000;"')
342	# assuming font size 12, it should be taken from the style string!
343	file.write('<text ' + style + ' text-anchor="' + anchor + '" x="' + str(pos[0]) + '" y="' + str(pos[1]+12) + '" >' + text + '</text>')
344
345	def add_dot(self, file, pos, style):
346	file.write('<circle ' + style + ' cx="' + str(pos[0]) + '" cy="' + str(pos[1]) + '" />')
347
348	def add_line(self, file, from_pos, to_pos, style):
349	file.write('<line ' + style + ' x1="' + str(from_pos[0]) + '" x2="' + str(to_pos[0]) +
350	'" y1="' + str(from_pos[1]) + '" y2="' + str(to_pos[1]) + '" fill="none"/>')
351
352	def add_dashed_line(self, file, from_pos, to_pos):
353	style = 'stroke="black" stroke-width="0.5" stroke-opacity="1" stroke-dasharray="5, 5"'
354	self.add_line(file, from_pos, to_pos, style)
355
356	def compute_line_style(self, parent, child):
357	return self.compute_stroke_color('lines', child) + ' ' \
358	+ self.compute_stroke_width('lines', child) + ' ' \
359	+ self.compute_stroke_opacity(child)
360
361	def compute_dot_style(self, node):
362	return self.compute_dot_size(node) + ' ' \
363	+ self.compute_fill_opacity(node) + ' ' \
364	+ self.compute_dot_fill(node)
365
366	def compute_stroke_color(self, part, node):
367	color = self.compute_property(part, 'color', node)
368	return 'stroke="rgb(' + str(color[0]) + '%,' + str(color[1]) + '%,' + str(color[2]) + '%)"'
369
370	def compute_stroke_width(self, part, node):
371	return 'stroke-width="' + str(self.compute_property(part, 'width', node)) + '"'
372
373	def compute_stroke_opacity(self, node):
374	return 'stroke-opacity="' + str(self.compute_property('lines', 'opacity', node)) + '"'
375
376	def compute_fill_opacity(self, node):
377	return 'fill-opacity="' + str(self.compute_property('dots', 'opacity', node)) + '"'
378
379	def compute_dot_size(self, node):
380	return 'r="' + str(self.compute_property('dots', 'size', node)) + '"'
381
382	def compute_dot_fill(self, node):
383	color = self.compute_property('dots', 'color', node)
384	return 'fill="rgb(' + str(color[0]) + '%,' + str(color[1]) + '%,' + str(color[2]) + '%)"'
385
386	class Designer:
387
388	def __init__(self, tree, jitter=False, time="GENERATIONAL", balance="DENSITY"):
389	self.props = {}
390
391	self.tree = tree
392
393	self.TIME = time
394	self.JITTER = jitter
395
396	if balance == "RANDOM":
397	self.xmin_crowd = self.xmin_crowd_random
398	elif balance == "MIN":
399	self.xmin_crowd = self.xmin_crowd_min
400	elif balance == "DENSITY":
401	self.xmin_crowd = self.xmin_crowd_density
402	else:
403	raise ValueError("Error, the value of BALANCE does not match any expected value.")
404
405	def calculate_measures(self):
406	print("Calculating measures...")
407	self.compute_depth()
408	self.compute_maxdepth()
409	self.compute_adepth()
410	self.compute_children()
411	self.compute_kind()
412	self.compute_time()
413	self.compute_progress()
414	self.compute_custom()
415
416	def xmin_crowd_random(self, x1, x2, y):
417	return (x1 if random.randrange(2) == 0 else x2)
418
419	def xmin_crowd_min(self, x1, x2, y):
420	x1_closest = 999999
421	x2_closest = 999999
422	miny = y-3
423	maxy = y+3
424	i = bisect.bisect_left(self.y_sorted, miny)
425	while True:
426	if len(self.positions_sorted) <= i or self.positions_sorted[i]['y'] > maxy:
427	break
428	pos = self.positions_sorted[i]
429
430	x1_closest = min(x1_closest, abs(x1-pos['x']))
431	x2_closest = min(x2_closest, abs(x2-pos['x']))
432
433	i += 1
434	return (x1 if x1_closest > x2_closest else x2)
435
436	def xmin_crowd_density(self, x1, x2, y):
437	# TODO experimental - requires further work to make it less 'jumpy' and more predictable
438	CONST_LOCAL_AREA_RADIUS = 5
439	CONST_GLOBAL_AREA_RADIUS = 10
440	CONST_WINDOW_SIZE = 20000 #TODO should depend on the maxY ?
441	x1_dist_loc = 0
442	x2_dist_loc = 0
443	count_loc = 1
444	x1_dist_glob = 0
445	x2_dist_glob = 0
446	count_glob = 1
447	miny = y-CONST_WINDOW_SIZE
448	maxy = y+CONST_WINDOW_SIZE
449	i_left = bisect.bisect_left(self.y_sorted, miny)
450	i_right = bisect.bisect_right(self.y_sorted, maxy)
451	#TODO test: maxy=y should give the same results, right?
452
453	def include_pos(pos):
454	nonlocal x1_dist_loc, x2_dist_loc, x1_dist_glob, x2_dist_glob, count_loc, count_glob
455
456	dysq = (pos['y']-y)**2 + 1 #+1 so 1/dysq is at most 1
457	dx1 = math.fabs(pos['x']-x1)
458	dx2 = math.fabs(pos['x']-x2)
459
460	d = math.fabs(pos['x'] - (x1+x2)/2)
461
462	if d < CONST_LOCAL_AREA_RADIUS:
463	x1_dist_loc += math.sqrt(dx1/dysq + dx1**2)
464	x2_dist_loc += math.sqrt(dx2/dysq + dx2**2)
465	count_loc += 1
466	elif d > CONST_GLOBAL_AREA_RADIUS:
467	x1_dist_glob += math.sqrt(dx1/dysq + dx1**2)
468	x2_dist_glob += math.sqrt(dx2/dysq + dx2**2)
469	count_glob += 1
470
471	# optimized to draw from all the nodes, if less than 10 nodes in the range
472	if len(self.positions_sorted) > i_left:
473	if i_right - i_left < 10:
474	for j in range(i_left, i_right):
475	include_pos(self.positions_sorted[j])
476	else:
477	for j in range(10):
478	pos = self.positions_sorted[random.randrange(i_left, i_right)]
479	include_pos(pos)
480
481	return (x1 if (x1_dist_loc-x2_dist_loc)/count_loc-(x1_dist_glob-x2_dist_glob)/count_glob > 0 else x2)
482	#return (x1 if x1_dist +random.gauss(0, 0.00001) > x2_dist +random.gauss(0, 0.00001) else x2)
483	#print(x1_dist, x2_dist)
484	#x1_dist = x1_dist**2
485	#x2_dist = x2_dist**2
486	#return x1 if x1_dist+x2_dist==0 else (x1x1_dist + x2x2_dist) / (x1_dist+x2_dist) + random.gauss(0, 0.01)
487	#return (x1 if random.randint(0, int(x1_dist+x2_dist)) < x1_dist else x2)
488
489	def calculate_node_positions(self, ignore_last=0):
490	print("Calculating positions...")
491
492	def add_node(node):
493	index = bisect.bisect_left(self.y_sorted, node['y'])
494	self.y_sorted.insert(index, node['y'])
495	self.positions_sorted.insert(index, node)
496	self.positions[node['id']] = node
497
498	self.positions_sorted = [{'x':0, 'y':0, 'id':0}]
499	self.y_sorted = [0]
500	self.positions = [{} for x in range(len(self.tree.parents))]
501	self.positions[0] = {'x':0, 'y':0, 'id':0}
502
503	# order by maximum depth of the parent guarantees that co child is evaluated before its parent
504	visiting_order = [i for i in range(0, len(self.tree.parents))]
505	visiting_order = sorted(visiting_order, key=lambda q:\
506	0 if q == 0 else self.props["maxdepth"][q])
507
508	start_time = timelib.time()
509
510	# for each child of the current node
511	for node_counter,child in enumerate(visiting_order, start=1):
512	# debug info - elapsed time
513	if node_counter % 100000 == 0:
514	print("%d%%\t%d\t%g" % (node_counter*100/len(self.tree.parents), node_counter, timelib.time()-start_time))
515	start_time = timelib.time()
516
517	# using normalized adepth
518	if self.props['adepth'][child] >= ignore_last/self.props['adepth_max']:
519
520	ypos = 0
521	if self.TIME == "BIRTHS":
522	ypos = child
523	elif self.TIME == "GENERATIONAL":
524	# one more than its parent (what if more than one parent?)
525	ypos = max([self.positions[par]['y'] for par, v in self.tree.parents[child].items()])+1 \
526	if self.tree.parents[child] else 0
527	elif self.TIME == "REAL":
528	ypos = self.tree.time[child]
529
530	if len(self.tree.parents[child]) == 1:
531	# if current_node is the only parent
532	parent, similarity = [(par, v) for par, v in self.tree.parents[child].items()][0]
533
534	if self.JITTER:
535	dissimilarity = (1-similarity) + random.gauss(0, 0.01) + 0.001
536	else:
537	dissimilarity = (1-similarity) + 0.001
538	add_node({'id':child, 'y':ypos, 'x':
539	self.xmin_crowd(self.positions[parent]['x']-dissimilarity,
540	self.positions[parent]['x']+dissimilarity, ypos)})
541	else:
542	# position weighted by the degree of inheritence from each parent
543	total_inheretance = sum([v for k, v in self.tree.parents[child].items()])
544	xpos = sum([self.positions[k]['x']*v/total_inheretance
545	for k, v in self.tree.parents[child].items()])
546	if self.JITTER:
547	add_node({'id':child, 'y':ypos, 'x':xpos + random.gauss(0, 0.1)})
548	else:
549	add_node({'id':child, 'y':ypos, 'x':xpos})
550
551
552	def compute_custom(self):
553	for prop in self.tree.props:
554	self.props[prop] = [None for x in range(len(self.tree.children))]
555
556	for i in range(len(self.props[prop])):
557	self.props[prop][i] = self.tree.props[prop][i]
558
559	self.normalize_prop(prop)
560
561	def compute_time(self):
562	# simple rewrite from the tree
563	self.props["time"] = [0 for x in range(len(self.tree.children))]
564
565	for i in range(len(self.props['time'])):
566	self.props['time'][i] = self.tree.time[i]
567
568	self.normalize_prop('time')
569
570	def compute_kind(self):
571	# simple rewrite from the tree
572	self.props["kind"] = [0 for x in range(len(self.tree.children))]
573
574	for i in range (len(self.props['kind'])):
575	self.props['kind'][i] = str(self.tree.kind[i])
576
577	def compute_depth(self):
578	self.props["depth"] = [999999999 for x in range(len(self.tree.children))]
579	visited = [0 for x in range(len(self.tree.children))]
580
581	nodes_to_visit = [0]
582	visited[0] = 1
583	self.props["depth"][0] = 0
584	while True:
585	current_node = nodes_to_visit[0]
586
587	for child in self.tree.children[current_node]:
588	if visited[child] == 0:
589	visited[child] = 1
590	nodes_to_visit.append(child)
591	self.props["depth"][child] = self.props["depth"][current_node]+1
592	nodes_to_visit = nodes_to_visit[1:]
593	if len(nodes_to_visit) == 0:
594	break
595
596	self.normalize_prop('depth')
597
598	def compute_maxdepth(self):
599	self.props["maxdepth"] = [999999999 for x in range(len(self.tree.children))]
600	visited = [0 for x in range(len(self.tree.children))]
601
602	nodes_to_visit = [0]
603	visited[0] = 1
604	self.props["maxdepth"][0] = 0
605	while True:
606	current_node = nodes_to_visit[0]
607
608	for child in self.tree.children[current_node]:
609	if visited[child] == 0:
610	visited[child] = 1
611	nodes_to_visit.append(child)
612	self.props["maxdepth"][child] = self.props["maxdepth"][current_node]+1
613	elif self.props["maxdepth"][child] < self.props["maxdepth"][current_node]+1:
614	self.props["maxdepth"][child] = self.props["maxdepth"][current_node]+1
615	if child not in nodes_to_visit:
616	nodes_to_visit.append(child)
617
618	nodes_to_visit = nodes_to_visit[1:]
619	if len(nodes_to_visit) == 0:
620	break
621
622	self.normalize_prop('maxdepth')
623
624	def compute_adepth(self):
625	self.props["adepth"] = [0 for x in range(len(self.tree.children))]
626
627	# order by maximum depth of the parent guarantees that co child is evaluated before its parent
628	visiting_order = [i for i in range(0, len(self.tree.parents))]
629	visiting_order = sorted(visiting_order, key=lambda q: self.props["maxdepth"][q])[::-1]
630
631	for node in visiting_order:
632	children = self.tree.children[node]
633	if len(children) != 0:
634	# 0 by default
635	self.props["adepth"][node] = max([self.props["adepth"][child] for child in children])+1
636	self.normalize_prop('adepth')
637
638	def compute_children(self):
639	self.props["children"] = [0 for x in range(len(self.tree.children))]
640	for i in range (len(self.props['children'])):
641	self.props['children'][i] = len(self.tree.children[i])
642
643	self.normalize_prop('children')
644
645	def compute_progress(self):
646	self.props["progress"] = [0 for x in range(len(self.tree.children))]
647	for i in range(len(self.props['children'])):
648	times = sorted([self.props["time"][self.tree.children[i][j]]*100000 for j in range(len(self.tree.children[i]))])
649	if len(times) > 4:
650	times = [times[i+1] - times[i] for i in range(len(times)-1)]
651	#print(times)
652	slope, intercept, r_value, p_value, std_err = stats.linregress(range(len(times)), times)
653	self.props['progress'][i] = slope if not np.isnan(slope) and not np.isinf(slope) else 0
654
655	for i in range(0, 5):
656	self.props['progress'][self.props['progress'].index(min(self.props['progress']))] = 0
657	self.props['progress'][self.props['progress'].index(max(self.props['progress']))] = 0
658
659	mini = min(self.props['progress'])
660	maxi = max(self.props['progress'])
661	for k in range(len(self.props['progress'])):
662	if self.props['progress'][k] == 0:
663	self.props['progress'][k] = mini
664
665	#for k in range(len(self.props['progress'])):
666	# self.props['progress'][k] = 1-self.props['progress'][k]
667
668	self.normalize_prop('progress')
669
670	def normalize_prop(self, prop):
671	noneless = [v for v in self.props[prop] if (type(v)!=str and type(v)!=list)]
672	if len(noneless) > 0:
673	max_val = max(noneless)
674	min_val = min(noneless)
675	print("%s: [%g, %g]" % (prop, min_val, max_val))
676	self.props[prop +'_max'] = max_val
677	self.props[prop +'_min'] = min_val
678	for i in range(len(self.props[prop])):
679	if self.props[prop][i] is not None:
680	qqq = self.props[prop][i]
681	self.props[prop][i] = 0 if max_val == min_val else (self.props[prop][i] - min_val) / (max_val - min_val)
682
683	class TreeData:
684	simple_data = None
685
686	children = []
687	parents = []
688	time = []
689	kind = []
690
691	def __init__(self): #, simple_data=False):
692	#self.simple_data = simple_data
693	pass
694
695	def load(self, filenames, max_nodes=0):
696	print("Loading...")
697
698	CLI_PREFIX = "Script.Message:"
699	default_props = ["Time", "FromIDs", "ID", "Operation", "Inherited"]
700
701	merged_with_virtual_parent = [] #this list will contain individuals for which the parent could not be found
702
703	self.ids = {}
704	def get_id(id, createOnError = True):
705	if createOnError:
706	if id not in self.ids:
707	self.ids[id] = len(self.ids)
708	else:
709	if id not in self.ids:
710	return None
711
712	return self.ids[id]
713
714	def try_to_load(input):
715	creature = False
716	try:
717	creature = json.loads(input)
718	except ValueError:
719	print("Json format error: the line cannot be read. Breaking the loading loop.")
720	# fixing arrays by removing the last element
721	# ! assuming that only the last line is broken !
722	self.parents.pop()
723	self.children.pop()
724	self.time.pop()
725	self.kind.pop()
726	self.life_lenght.pop()
727	return creature
728
729	def load_creature_props(creature):
730	creature_id = get_id(creature["ID"])
731	for prop in creature:
732	if prop not in default_props:
733	if prop not in self.props:
734	self.props[prop] = [0 for i in range(nodes)]
735	self.props[prop][creature_id] = creature[prop]
736
737	def load_born_props(creature):
738	nonlocal max_time
739	creature_id = get_id(creature["ID"])
740	if "Time" in creature:
741	self.time[creature_id] = creature["Time"] + time_offset
742	max_time = max(self.time[creature_id], max_time)
743
744	def load_offspring_props(creature):
745	creature_id = get_id(creature["ID"])#, False)
746	if "FromIDs" in creature:
747	# make sure that ID's of parents are lower than that of their children
748	for i in range(0, len(creature["FromIDs"])):
749	if creature["FromIDs"][i] not in self.ids:
750	get_id("virtual_parent")
751
752
753	# we assign to each parent its contribution to the genotype of the child
754	for i in range(0, len(creature["FromIDs"])):
755	if creature["FromIDs"][i] in self.ids:
756	parent_id = get_id(creature["FromIDs"][i])
757	else:
758	if creature["FromIDs"][i] not in merged_with_virtual_parent:
759	merged_with_virtual_parent.append(creature["FromIDs"][i])
760	parent_id = get_id("virtual_parent")
761	inherited = (creature["Inherited"][i] if 'Inherited' in creature else 1)
762	self.parents[creature_id][parent_id] = inherited
763
764	if "Kind" in creature:
765	self.kind[creature_id] = creature["Kind"]
766	else:
767	raise LoadingError("[OFFSPRING] misses the 'FromIDs' field!")
768
769	# counting the number of expected nodes
770	nodes_born, nodes_offspring = 0, 0
771	for filename in filenames:
772	file = open(filename)
773	for line in file:
774	line_arr = line.split(' ', 1)
775	if len(line_arr) == 2:
776	if line_arr[0] == CLI_PREFIX:
777	line_arr = line_arr[1].split(' ', 1)
778	if line_arr[0] == "[BORN]":
779	nodes_born += 1
780	if line_arr[0] == "[OFFSPRING]":
781	nodes_offspring += 1
782	# assuming that either BORN or OFFSPRING, or both, are present for each individual
783	nodes = max(nodes_born, nodes_offspring)
784	nodes = min(nodes, max_nodes if max_nodes != 0 else nodes)+1
785
786	self.parents = [{} for x in range(nodes)]
787	self.children = [[] for x in range(nodes)]
788	self.time = [0] * nodes
789	self.kind = [0] * nodes
790	self.life_lenght = [0] * nodes
791	self.props = {}
792
793	print("nodes: %d" % len(self.parents))
794
795
796	get_id("virtual_parent")
797	loaded_so_far = 0
798	max_time = 0
799	# rewind the file
800
801	for filename in filenames:
802	file = open(filename)
803	time_offset = max_time
804	if max_time != 0:
805	print("NOTE: merging files, assuming cumulative time offset for '%s' to be %d" % (filename, time_offset))
806
807	lasttime = timelib.time()
808
809	for line in file:
810	line_arr = line.split(' ', 1)
811	if len(line_arr) == 2:
812	if line_arr[0] == CLI_PREFIX:
813	line_arr = line_arr[1].split(' ', 1)
814	if line_arr[0] == "[BORN]":
815	creature = try_to_load(line_arr[1])
816	if not creature:
817	nodes -= 1
818	break
819
820	if get_id(creature["ID"], False) is None:
821	loaded_so_far += 1
822
823	load_born_props(creature)
824	load_creature_props(creature)
825
826	if line_arr[0] == "[OFFSPRING]":
827	creature = try_to_load(line_arr[1])
828	if not creature:
829	nodes -= 1
830	break
831
832	if get_id(creature["ID"], False) is None:
833	loaded_so_far += 1
834	# load time only if there was no [BORN] yet
835	load_born_props(creature)
836
837	load_offspring_props(creature)
838
839	if line_arr[0] == "[DIED]":
840	creature = try_to_load(line_arr[1])
841	if not creature:
842	nodes -= 1
843	break
844	if get_id(creature["ID"], False) is not None:
845	load_creature_props(creature)
846	else:
847	print("NOTE: encountered [DIED] entry for individual " + creature["ID"] + " before it was born")
848
849	# debug
850	if loaded_so_far%1000 == 0:
851	#print(". " + str(creature_id) + " " + str(timelib.time() - lasttime))
852	lasttime = timelib.time()
853
854	# breaking both loops
855	if loaded_so_far >= max_nodes and max_nodes != 0:
856	break
857	if loaded_so_far >= max_nodes and max_nodes != 0:
858	break
859
860	print("NOTE: all individuals with parent not provided or missing were connected to a single 'virtual parent' node: " + str(merged_with_virtual_parent))
861
862	for c_id in range(1, nodes):
863	if not self.parents[c_id]:
864	self.parents[c_id][get_id("virtual_parent")] = 1
865
866	for k in range(len(self.parents)):
867	v = self.parents[k]
868	for val in self.parents[k]:
869	self.children[val].append(k)
870
871	depth = {}
872	kind = {}
873
874	def main():
875
876	parser = argparse.ArgumentParser(description='Draws a genealogical tree (generates a SVG file) based on parent-child relationship '
877	'information from a text file. Supports files generated by Framsticks experiments.')
878	parser.add_argument('-i', '--in', nargs='+', dest='input', required=True, help='input file name with stuctured evolutionary data (or a list of input files)')
879	parser.add_argument('-o', '--out', dest='output', required=True, help='output file name for the evolutionary tree (SVG/PNG/JPG/BMP)')
880	parser.add_argument('-c', '--config', dest='config', default="", help='config file name ')
881
882	parser.add_argument('-W', '--width', default=600, type=int, dest='width', help='width of the output image (600 by default)')
883	parser.add_argument('-H', '--height', default=800, type=int, dest='height', help='height of the output image (800 by default)')
884	parser.add_argument('-m', '--multi', default=1, type=int, dest='multi', help='multisampling factor (applicable only for raster images)')
885
886	parser.add_argument('-t', '--time', default='GENERATIONAL', dest='time', help='values on vertical axis (BIRTHS/GENERATIONAL(d)/REAL); '
887	'BIRTHS: time measured as the number of births since the beginning; '
888	'GENERATIONAL: time measured as number of ancestors; '
889	'REAL: real time of the simulation')
890	parser.add_argument('-b', '--balance', default='DENSITY', dest='balance', help='method of placing nodes in the tree (RANDOM/MIN/DENSITY(d))')
891	parser.add_argument('-s', '--scale', default='SIMPLE', dest='scale', help='type of timescale added to the tree (NONE(d)/SIMPLE)')
892	parser.add_argument('-j', '--jitter', dest="jitter", action='store_true', help='draw horizontal positions of children from the normal distribution')
893	parser.add_argument('-p', '--skip', dest="skip", type=int, default=0, help='skip last P levels of the tree (0 by default)')
894	parser.add_argument('-x', '--max-nodes', type=int, default=0, dest='max_nodes', help='maximum number of nodes drawn (starting from the first one)')
895	parser.add_argument('--seed', type=int, dest='seed', help='seed for the random number generator (-1 for random)')
896
897	parser.set_defaults(draw_tree=True)
898	parser.set_defaults(draw_skeleton=False)
899	parser.set_defaults(draw_spine=False)
900
901	parser.set_defaults(seed=-1)
902
903	args = parser.parse_args()
904
905	TIME = args.time.upper()
906	BALANCE = args.balance.upper()
907	SCALE = args.scale.upper()
908	JITTER = args.jitter
909	if not TIME in ['BIRTHS', 'GENERATIONAL', 'REAL']\
910	or not BALANCE in ['RANDOM', 'MIN', 'DENSITY']\
911	or not SCALE in ['NONE', 'SIMPLE']:
912	print("Incorrect value of one of the parameters! (time or balance or scale).") #user has to figure out which parameter is wrong...
913	return
914
915	dir = args.input
916
917	seed = args.seed
918	if seed == -1:
919	seed = random.randint(0, 10000)
920	random.seed(seed)
921	print("randomseed:", seed)
922
923	tree = TreeData()
924	tree.load(dir, max_nodes=args.max_nodes)
925
926
927	designer = Designer(tree, jitter=JITTER, time=TIME, balance=BALANCE)
928	designer.calculate_measures()
929	designer.calculate_node_positions(ignore_last=args.skip)
930
931	if args.output.endswith(".svg"):
932	drawer = SvgDrawer(designer, args.config, w=args.width, h=args.height)
933	else:
934	drawer = PngDrawer(designer, args.config, w=args.width, h=args.height)
935	drawer.draw_design(args.output, args.input, multi=args.multi, scale=SCALE)
936
937
938	main()

Note: See TracBrowser for help on using the repository browser.

Download in other formats: