Mercurial > repos > recetox > matchms_formatter
comparison formatter.py @ 1:364976b9aba6 draft
"planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit 67040e686204e86c07ec46ca90129e50e40eb737"
author | recetox |
---|---|
date | Tue, 11 Jan 2022 15:13:57 +0000 |
parents | 0a08bed94964 |
children | 4ca9807c56e6 |
comparison
equal
deleted
inserted
replaced
0:0a08bed94964 | 1:364976b9aba6 |
---|---|
71 matches_filename (str): Path to matches table. | 71 matches_filename (str): Path to matches table. |
72 | 72 |
73 Returns: | 73 Returns: |
74 DataFrame: Joined dataframe on compounds containing scores an matches in long format. | 74 DataFrame: Joined dataframe on compounds containing scores an matches in long format. |
75 """ | 75 """ |
76 matches = read_csv(matches_filename, sep='\t', index_col=0) | 76 matches = read_csv(matches_filename, sep=None, index_col=0) |
77 scores = read_csv(scores_filename, sep='\t', index_col=0) | 77 scores = read_csv(scores_filename, sep=None, index_col=0) |
78 | 78 |
79 scores_long = create_long_table(scores, 'score') | 79 scores_long = create_long_table(scores, 'score') |
80 matches_long = create_long_table(matches, 'matches') | 80 matches_long = create_long_table(matches, 'matches') |
81 | 81 |
82 combined = join_df(matches_long, scores_long, on=['compound'], how='inner') | 82 combined = join_df(matches_long, scores_long, on=['compound'], how='inner') |
111 return result | 111 return result |
112 | 112 |
113 | 113 |
114 @cli.resultcallback() | 114 @cli.resultcallback() |
115 def write_output(result: DataFrame, scores_filename, matches_filename, output_filename): | 115 def write_output(result: DataFrame, scores_filename, matches_filename, output_filename): |
116 input_file = read_csv(scores_filename, sep=None, iterator=True) | |
117 sep = input_file._engine.data.dialect.delimiter | |
118 | |
116 result = result.reset_index().rename(columns={'level_0': 'query', 'compound': 'reference'}) | 119 result = result.reset_index().rename(columns={'level_0': 'query', 'compound': 'reference'}) |
117 result.to_csv(output_filename, sep="\t", index=False) | 120 result.to_csv(output_filename, sep=sep, index=False) |
118 | 121 |
119 | 122 |
120 if __name__ == '__main__': | 123 if __name__ == '__main__': |
121 cli(obj={}) | 124 cli(obj={}) |