annotate venn_diagram.py @ 2:5ac986568a3d draft

planemo upload commit ba044b029418f46b923830e8eaa1088833e6ef6b-dirty
author proteore
date Wed, 28 Nov 2018 09:58:46 -0500
parents b17f0fbbd6c9
children 1645a66fd0ee
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
1 #!/usr/bin/env python2.7
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
2
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
3 import os
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
4 import sys
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
5 import json
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
6 import operator
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
7 import argparse
1
b17f0fbbd6c9 planemo upload commit ba044b029418f46b923830e8eaa1088833e6ef6b-dirty
proteore
parents: 0
diff changeset
8 import re, csv
0
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
9 from itertools import combinations
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
10
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
11 CURRENT_DIR = os.path.dirname(os.path.abspath(__file__))
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
12
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
13 ##################################################################################################################################################
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
14 # FUNCTIONS
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
15 ##################################################################################################################################################
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
16
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
def isnumber(format, n):
    """
    Check if a string is written as an integer or as a float.

    format: "int" or "float"; any other value makes the function return False.
    n: the string to check.

    "int" accepts an optionally negative integer without leading zero, so "0"
    itself is refused (this function is used to validate 1-based column
    numbers). "float" accepts an optionally negative decimal number such as
    "12", "0.5" or "-3.25".

    Returns True when `n` matches the requested format, False otherwise.
    """
    # Starts with [1-9]: "0" and zero-padded values are deliberately refused.
    int_format = re.compile(r"^-?[1-9][0-9]*$")
    # The dot is escaped so that it only matches a decimal point (unescaped,
    # it accepted any character, e.g. "1a5"); the fractional part is optional
    # and a single leading "0" is allowed so that "0.5" and "5" are valid.
    float_format = re.compile(r"^-?(?:0|[1-9][0-9]*)(?:\.[0-9]+)?$")

    if format == "int":
        pattern = int_format
    elif format == "float":
        pattern = float_format
    else:
        return False
    return pattern.match(n) is not None
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
32
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
def input_to_dict(inputs):
    """
    Parse input and return a dictionary of name and data of each lists/files

    inputs: one entry per list, in one of two forms:
        [path, name, "file", header, ncol]
            IDs are read from column `ncol` ("c1", "c2", ... 1-based) of the
            tab-separated file `path`; the first line is skipped when
            `header` is "true". Only the text before the first ";" of each
            cell is kept.
        [ids, name, <any other type>]
            `ids` is a whitespace-separated string of IDs.

    Returns (comp_dict, title_dict). Both are keyed by the letters "A" to "F",
    assigned to the inputs in order: comp_dict maps a letter to its set of IDs
    ('NA' removed), title_dict maps it to the list name.

    Raises ValueError when more than six inputs are given or when a column
    number is not a positive integer.
    """
    letters = ["A", "B", "C", "D", "E", "F"]
    if len(inputs) > len(letters):
        raise ValueError("At most %d lists can be compared" % len(letters))

    comp_dict = {}
    title_dict = {}
    for title, entry in zip(letters, inputs):
        source, name, input_type = entry[0], entry[1], entry[2]
        title_dict[title] = name

        if input_type == "file":
            header = entry[3]
            column = entry[4].replace("c", "")

            # Check if column number is in right form; a negative number
            # would otherwise silently index the row from its end.
            if not isnumber("int", column) or int(column) < 1:
                raise ValueError("Please fill in the right format of column number")
            index = int(column) - 1

            with open(source, "r") as handle:
                rows = handle.readlines()
            if header == "true":
                rows = rows[1:]
            # take only first IDs
            file_content = [row.split("\t")[index].split(";")[0].strip() for row in rows]
        else:
            file_content = source.split()

        ids = set(file_content)
        ids.discard('NA')
        comp_dict[title] = ids

    return comp_dict, title_dict
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
69
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
def intersect(comp_dict):
    """
    Calculate the intersections of input

    comp_dict: dictionary mapping each list key to its set of IDs.

    Generator going through every non-empty combination of the keys, by
    increasing size and in sorted key order. For each combination it yields
    (group, intersected, difference) where:
        group: tuple of the keys in the combination
        intersected: list of the IDs shared by every list of the group
        difference: list of the IDs of `intersected` found in none of the
            lists outside the group
    """
    names = sorted(comp_dict)
    for size in range(1, len(names) + 1):
        for group in combinations(names, size):
            intersected = set.intersection(*(comp_dict[k] for k in group))
            others = [name for name in names if name not in group]
            if others:
                difference = intersected.difference(set.union(*(comp_dict[k] for k in others)))
            else:
                # No list is left outside the group: nothing to subtract, so
                # the whole intersection is exclusive to the group.
                difference = intersected
            yield group, list(intersected), list(difference)
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
84
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
def diagram(comp_dict, title_dict):
    """
    Create the data structure of the jvenn diagram plot

    comp_dict: dictionary mapping each list key to its set of IDs.
    title_dict: dictionary mapping each list key to its display name.

    Returns a dictionary with three entries:
        "name": display name of each list key
        "data": for each region (keys of the group joined, e.g. "AB"), the
            list of IDs belonging to it
        "values": for each region, the number of IDs of "data"

    Raises KeyError when a key of comp_dict is missing from title_dict.
    """
    result = {}
    result["name"] = dict((k, title_dict[k]) for k in comp_dict)
    result["data"] = {}
    result["values"] = {}

    total = len(comp_dict)
    for group, intersected, difference in intersect(comp_dict):
        region = "".join(group)
        # The region shared by all lists takes the plain intersection. This is
        # checked before anything else so that a single input list (group of
        # size 1 that is also the full group) keeps its IDs; every other
        # region only takes the IDs found in no other list.
        if len(group) == total:
            members = intersected
        else:
            members = difference
        result["data"][region] = members
        result["values"][region] = len(members)

    return result
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
108
1
b17f0fbbd6c9 planemo upload commit ba044b029418f46b923830e8eaa1088833e6ef6b-dirty
proteore
parents: 0
diff changeset
def write_text_venn(json_result):
    """
    Write intersections of input to text output file

    json_result: dictionary with a "name" entry (list key -> display name)
        and a "data" entry (region key -> list of IDs).

    Writes "venn_diagram_text_output.tsv" in the current directory: one
    column per non-empty region, headed by the names of its lists joined
    with "_", the IDs below, shorter columns padded with 'NA'. The file is
    left empty when no region contains any ID. The lists of json_result are
    not modified.
    """
    # Only the regions holding at least one ID get a column; 'NA' is not an ID.
    result = dict((k, [x for x in v if x != 'NA'])
                  for k, v in json_result["data"].items() if v != [])
    list_names = dict((k, v) for k, v in json_result["name"].items() if v != [])
    nb_lines_max = max(len(v) for v in result.values()) if result else 0

    #construct tsv
    lines = []
    for key, ids in result.items():
        #get list names associated to each column
        if key in list_names:
            title = list_names[key]
        else:
            # region key such as "AB": one character per list key
            title = "_".join([list_names[k] for k in key])
        line = [title] + ids
        # Every column must hold the header plus nb_lines_max cells: zip()
        # stops at the shortest column, so a short padding drops real IDs.
        line.extend(['NA'] * (nb_lines_max + 1 - len(line)))
        lines.append(line)

    #transpose tsv
    rows = zip(*lines)

    with open("venn_diagram_text_output.tsv", "w") as output:
        tsv_output = csv.writer(output, delimiter='\t')
        tsv_output.writerows(rows)
0
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
141
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
def write_summary(summary_file, inputs):
    """
    Paste json string into template file

    summary_file: path of the HTML file to write.
    inputs: description of the lists to compare, as expected by input_to_dict.

    Computes the diagram data, writes the text output through
    write_text_venn, then copies "jvenn_template.html" (read from the
    directory of this script) to `summary_file`, replacing the
    "###JVENN_DATA###" marker by the JSON settings of the plot.
    """
    comp_dict, title_dict = input_to_dict(inputs)
    data = diagram(comp_dict, title_dict)
    write_text_venn(data)

    to_replace = {
        "series": [data],
        "displayStat": "true",
        "displaySwitch": "true",
        "shortNumber": "true",
    }
    # Serialised once, whatever the number of lines holding the marker.
    # NOTE(review): list names and IDs are pasted as they are into the HTML
    # template; confirm whether they need escaping there.
    json_data = json.dumps(to_replace)

    template_path = os.path.join(CURRENT_DIR, "jvenn_template.html")
    # "with" closes both files even if reading or writing fails.
    with open(template_path) as FH_summary_tpl, open(summary_file, "w") as FH_summary_out:
        for line in FH_summary_tpl:
            FH_summary_out.write(line.replace("###JVENN_DATA###", json_data))
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
166
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
def process(args):
    """
    Run the comparison described by the parsed command line.

    args: object with a `summary` attribute (path of the HTML output) and an
        `input` attribute (description of the lists), both passed to
        write_summary.
    """
    summary_path = args.summary
    input_lists = args.input
    write_summary(summary_path, input_lists)
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
169
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
170
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
171 ##################################################################################################################################################
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
172 # MAIN
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
173 ##################################################################################################################################################
8d61f5ca50a4 planemo upload commit 9760cde192a15cdf3d2dbec05dd867eaa0392bcd-dirty
proteore
parents:
diff changeset
if __name__ == '__main__':
    # Parse parameters
    parser = argparse.ArgumentParser(description='Compare up to six lists of IDs and draw their Venn diagram')
    group_input = parser.add_argument_group('Inputs')
    # Given once per list; each occurrence collects its own list of values.
    group_input.add_argument('--input', nargs="+", action="append", required=True,
                             help="One list to compare, to repeat for each list: "
                                  "either 'FILE NAME file HEADER COLUMN' (tabular file, HEADER is true or false, "
                                  "COLUMN is written c1, c2, ...) or 'IDS NAME list' (IDS separated by spaces).")
    group_output = parser.add_argument_group('Outputs')
    group_output.add_argument('--summary', default="summary.html", help="The HTML file containing the graphs. [Default: %(default)s]")
    args = parser.parse_args()

    # Process
    process(args)