Mercurial > repos > greg > cwpair2
comparison cwpair2_util.py @ 2:279cdc63bcff draft
Uploaded
| author | greg |
|---|---|
| date | Sat, 21 Nov 2015 09:01:24 -0500 |
| parents | 4d86371aafa8 |
| children | 2e0ddcc726f9 |
comparison
equal
deleted
inserted
replaced
| 1:4d86371aafa8 | 2:279cdc63bcff |
|---|---|
| 20 COLORS = 'krg' | 20 COLORS = 'krg' |
| 21 Y_LABEL = 'Peak-pair counts' | 21 Y_LABEL = 'Peak-pair counts' |
| 22 X_LABEL = 'Peak-pair distance (bp)' | 22 X_LABEL = 'Peak-pair distance (bp)' |
| 23 TICK_WIDTH = 3 | 23 TICK_WIDTH = 3 |
| 24 ADJUST = [0.140, 0.9, 0.9, 0.1] | 24 ADJUST = [0.140, 0.9, 0.9, 0.1] |
| 25 PLOT_FORMAT = 'pdf' | |
| 25 pyplot.rc('xtick.major', size=10.00) | 26 pyplot.rc('xtick.major', size=10.00) |
| 26 pyplot.rc('ytick.major', size=10.00) | 27 pyplot.rc('ytick.major', size=10.00) |
| 27 pyplot.rc('lines', linewidth=4.00) | 28 pyplot.rc('lines', linewidth=4.00) |
| 28 pyplot.rc('axes', linewidth=3.00) | 29 pyplot.rc('axes', linewidth=3.00) |
| 29 pyplot.rc('font', family='Bitstream Vera Sans', size=32.0) | 30 pyplot.rc('font', family='Bitstream Vera Sans', size=32.0) |
| 221 os.mkdir('%s_%s' % (match_method, PREVIEW_PLOTS)) | 222 os.mkdir('%s_%s' % (match_method, PREVIEW_PLOTS)) |
| 222 os.mkdir('%s_%s' % (match_method, SIMPLES)) | 223 os.mkdir('%s_%s' % (match_method, SIMPLES)) |
| 223 os.mkdir('%s_%s' % (match_method, STATS_GRAPH)) | 224 os.mkdir('%s_%s' % (match_method, STATS_GRAPH)) |
| 224 | 225 |
| 225 | 226 |
| 226 def process_file(dataset_path, galaxy_hid, method, threshold, up_distance, down_distance, | 227 def process_file(dataset_path, galaxy_hid, method, threshold, up_distance, |
| 227 binsize, output_files, plot_format, sort_chromosome, sort_score): | 228 down_distance, binsize, output_files, sort_chromosome, sort_score): |
| 228 if method == 'all': | 229 if method == 'all': |
| 229 match_methods = METHODS.keys() | 230 match_methods = METHODS.keys() |
| 230 else: | 231 else: |
| 231 match_methods = [method] | 232 match_methods = [method] |
| 232 statistics = [] | 233 statistics = [] |
| 237 threshold, | 238 threshold, |
| 238 up_distance, | 239 up_distance, |
| 239 down_distance, | 240 down_distance, |
| 240 binsize, | 241 binsize, |
| 241 output_files, | 242 output_files, |
| 242 plot_format, | |
| 243 sort_chromosome, | 243 sort_chromosome, |
| 244 sort_score) | 244 sort_score) |
| 245 statistics.append(stats) | 245 statistics.append(stats) |
| 246 if output_files == 'all' and method == 'all': | 246 if output_files == 'all' and method == 'all': |
| 247 frequency_plot([s['dist'] for s in statistics], | 247 frequency_plot([s['dist'] for s in statistics], |
| 249 labels=METHODS.keys()) | 249 labels=METHODS.keys()) |
| 250 return statistics | 250 return statistics |
| 251 | 251 |
| 252 | 252 |
| 253 def perform_process(dataset_path, galaxy_hid, method, threshold, up_distance, | 253 def perform_process(dataset_path, galaxy_hid, method, threshold, up_distance, |
| 254 down_distance, binsize, output_files, plot_format, sort_chromosome, sort_score): | 254 down_distance, binsize, output_files, sort_chromosome, sort_score): |
| 255 output_details = output_files in ["all", "simple_orphan_detail"] | 255 output_details = output_files in ["all", "simple_orphan_detail"] |
| 256 output_plots = output_files in ["all"] | 256 output_plots = output_files in ["all"] |
| 257 output_orphans = output_files in ["all", "simple_orphan", "simple_orphan_detail"] | 257 output_orphans = output_files in ["all", "simple_orphan", "simple_orphan_detail"] |
| 258 # Keep track of statistics for the output file | 258 # Keep track of statistics for the output file |
| 259 statistics = {} | 259 statistics = {} |
| 284 # Details | 284 # Details |
| 285 detailed_output = td_writer('%s_%s' % (method, DETAILS), extension=TABULAR_EXT) | 285 detailed_output = td_writer('%s_%s' % (method, DETAILS), extension=TABULAR_EXT) |
| 286 detailed_output.writerow(('chrom', 'start', 'end', 'value', 'strand') * 2 + ('midpoint', 'c-w reads sum', 'c-w distance (bp)')) | 286 detailed_output.writerow(('chrom', 'start', 'end', 'value', 'strand') * 2 + ('midpoint', 'c-w reads sum', 'c-w distance (bp)')) |
| 287 if output_plots: | 287 if output_plots: |
| 288 # Final Plot | 288 # Final Plot |
| 289 final_plot_path = make_path('%s_%s' % (method, FINAL_PLOTS), plot_format) | 289 final_plot_path = make_path('%s_%s' % (method, FINAL_PLOTS), PLOT_FORMAT) |
| 290 if output_orphans: | 290 if output_orphans: |
| 291 # Orphans | 291 # Orphans |
| 292 orphan_output = td_writer('%s_%s' % (method, ORPHANS), extension=TABULAR_EXT) | 292 orphan_output = td_writer('%s_%s' % (method, ORPHANS), extension=TABULAR_EXT) |
| 293 orphan_output.writerow(('chrom', 'strand', 'start', 'end', 'value')) | 293 orphan_output.writerow(('chrom', 'strand', 'start', 'end', 'value')) |
| 294 if output_plots: | 294 if output_plots: |
| 295 # Preview Plot | 295 # Preview Plot |
| 296 preview_plot_path = make_path('%s_%s' % (method, PREVIEW_PLOTS), plot_format) | 296 preview_plot_path = make_path('%s_%s' % (method, PREVIEW_PLOTS), PLOT_FORMAT) |
| 297 # Simple | 297 # Simple |
| 298 simple_output = td_writer('%s_%s' % (method, SIMPLES), extension=GFF_EXT) | 298 simple_output = td_writer('%s_%s' % (method, SIMPLES), extension=GFF_EXT) |
| 299 statistics['stats_path'] = 'statistics.%s' % TABULAR_EXT | 299 statistics['stats_path'] = 'statistics.%s' % TABULAR_EXT |
| 300 if output_plots: | 300 if output_plots: |
| 301 statistics['graph_path'] = make_path('%s_%s' % (method, STATS_GRAPH), plot_format) | 301 statistics['graph_path'] = make_path('%s_%s' % (method, STATS_GRAPH), PLOT_FORMAT) |
| 302 statistics['perc95'] = perc95(chromosomes) | 302 statistics['perc95'] = perc95(chromosomes) |
| 303 if threshold > 0: | 303 if threshold > 0: |
| 304 # Apply filter | 304 # Apply filter |
| 305 filter(chromosomes, threshold) | 305 filter(chromosomes, threshold) |
| 306 if method == 'mode': | 306 if method == 'mode': |
