annotate BEDTools-Version-2.14.3/src/unionBedGraphs/unionBedGraphsMain.cpp @ 0:dfcd8b6c1bda

Uploaded
author aaronquinlan
date Thu, 03 Nov 2011 10:25:04 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
1 /*****************************************************************************
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
2 unionBedGraphsMain.cpp
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
3
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
4 (c) 2010 - Assaf Gordon, CSHL
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
5 - Aaron Quinlan, UVA
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
6 Hall Laboratory
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
7 Department of Biochemistry and Molecular Genetics
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
8 University of Virginia
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
9 aaronquinlan@gmail.com
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
10
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
11 Licenced under the GNU General Public License 2.0 license.
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
12 ******************************************************************************/
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
13 #include <climits>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
14 #include <cstring>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
15 #include <cstdlib>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
16 #include <vector>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
17 #include <string>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
18 #include <iostream>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
19 #include <getopt.h>
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
20 #include <libgen.h> //for basename()
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
21 #include "version.h"
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
22
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
23 #include "genomeFile.h"
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
24 #include "unionBedGraphs.h"
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
25
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
26 using namespace std;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
27
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
28 // define our program name
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
29 #define PROGRAM_NAME "unionBedGraphs"
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
30
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
31 // define our parameter checking macro
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
32 #define PARAMETER_CHECK(param, paramLen, actualLen) (strncmp(argv[i], param, min(actualLen, paramLen))== 0) && (actualLen == paramLen)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
33
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
34 //STLized version of basename()
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
35 // (because POSIX basename() modifies the input string pointer)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
36 // Additionally: removes any extension the basename might have.
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
37 std::string stl_basename(const std::string& path);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
38
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
39 // function declarations
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
40 void ShowHelp(void);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
41 void ShowExamples(void);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
42
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
43
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
44 int main(int argc, char* argv[])
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
45 {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
46 bool haveFiles = false;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
47 bool haveTitles = false;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
48 bool haveGenome = false;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
49 bool haveFiller = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
50 bool printHeader = false;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
51 bool printEmptyRegions = false;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
52 bool showHelp = false;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
53 string genomeFile;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
54 string basePath;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
55 string noCoverageValue = "0";
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
56 vector<string> inputFiles;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
57 vector<string> inputTitles;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
58
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
59 //Parse command line options
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
60 if(argc <= 1)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
61 ShowHelp();
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
62
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
63 for(int i = 1; i < argc; i++) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
64 int parameterLength = (int)strlen(argv[i]);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
65
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
66 if((PARAMETER_CHECK("-h", 2, parameterLength)) ||
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
67 (PARAMETER_CHECK("--help", 5, parameterLength))) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
68 showHelp = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
69 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
70 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
71
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
72 if(showHelp == true) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
73 ShowHelp();
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
74 exit(1);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
75 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
76
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
77 // do some parsing (all of these parameters require 2 strings)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
78 for(int i = 1; i < argc; i++) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
79
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
80 int parameterLength = (int)strlen(argv[i]);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
81
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
82 if(PARAMETER_CHECK("-i", 2, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
83 if ((i+1) < argc) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
84 haveFiles = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
85 i = i+1;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
86 string file = argv[i];
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
87 while (file[0] != '-' && i < argc) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
88 inputFiles.push_back(file);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
89 i++;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
90 if (i < argc)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
91 file = argv[i];
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
92 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
93 i--;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
94 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
95 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
96 else if(PARAMETER_CHECK("-names", 6, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
97 if ((i+1) < argc) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
98 haveTitles = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
99 i = i+1;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
100 string title = argv[i];
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
101 while (title[0] != '-' && i < argc) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
102 inputTitles.push_back(title);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
103 i++;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
104 if (i < argc)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
105 title = argv[i];
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
106 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
107 i--;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
108 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
109 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
110 else if(PARAMETER_CHECK("-g", 2, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
111 if ((i+1) < argc) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
112 haveGenome = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
113 genomeFile = argv[i + 1];
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
114 i++;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
115 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
116 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
117 else if(PARAMETER_CHECK("-filler", 7, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
118 if ((i+1) < argc) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
119 haveFiller = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
120 noCoverageValue = argv[i + 1];
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
121 i++;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
122 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
123 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
124 else if(PARAMETER_CHECK("-header", 7, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
125 printHeader = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
126 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
127 else if(PARAMETER_CHECK("-empty", 6, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
128 printEmptyRegions = true;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
129 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
130 else if(PARAMETER_CHECK("-examples", 9, parameterLength)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
131 ShowHelp();
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
132 ShowExamples();
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
133 exit(1);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
134 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
135 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
136
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
137 //Sanity checks
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
138 if (inputFiles.empty() == true) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
139 cerr << "Error: missing BedGraph file names (-i) to combine." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
140 exit(1);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
141 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
142 if (inputFiles.size() == 1) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
143 cerr << "Error: Only a single BedGraph file was specified. Nothing to combine, exiting." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
144 exit(1);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
145 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
146 if (printEmptyRegions && (genomeFile.empty() == true)) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
147 cerr << "Error: when using -empty, the genome sizes file (-g) must be specified using '-g FILE'." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
148 exit(1);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
149 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
150 if ((haveTitles == true) && (inputFiles.size() != inputTitles.size())) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
151 cerr << "Error: The number of file titles (-names) does not match the number of files (-i)." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
152 exit(1);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
153 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
154
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
155 UnionBedGraphs ubg(cout, inputFiles, inputTitles, printEmptyRegions, genomeFile, noCoverageValue);
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
156 if (printHeader)
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
157 ubg.PrintHeader();
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
158 ubg.Union();
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
159 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
160
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
161 void ShowHelp(void) {
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
162
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
163 cerr << endl << "Program: " << PROGRAM_NAME << " (v" << VERSION << ")" << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
164
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
165 cerr << "Authors: Assaf Gordon, CSHL" << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
166 cerr << " Aaron Quinlan (aaronquinlan@gmail.com)" << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
167
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
168 cerr << "Summary: Combines multiple BedGraph files into a single file," << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
169 cerr << "\t allowing coverage comparisons between them." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
170
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
171 cerr << "Usage: " << PROGRAM_NAME << " [OPTIONS] -i FILE1 FILE2 .. FILEn" << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
172 cerr << "\t Assumes that each BedGraph file is sorted by chrom/start " << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
173 cerr << "\t and that the intervals in each are non-overlapping." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
174
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
175 cerr << "Options: " << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
176
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
177 cerr << "\t-header\t\t" << "Print a header line." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
178 cerr << "\t\t\t(chrom/start/end + names of each file)." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
179
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
180 cerr << "\t-names\t\t" << "A list of names (one / file) to describe each file in -i." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
181 cerr << "\t\t\tThese names will be printed in the header line." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
182
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
183 cerr << "\t-g\t\t" << "Use genome file to calculate empty regions." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
184 cerr << "\t\t\t- STRING." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
185
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
186 cerr << "\t-empty\t\t" << "Report empty regions (i.e., start/end intervals w/o" << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
187 cerr << "\t\t\tvalues in all files)." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
188 cerr << "\t\t\t- Requires the '-g FILE' parameter.\n" << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
189
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
190 cerr << "\t-filler TEXT\t" << "Use TEXT when representing intervals having no value." << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
191 cerr << "\t\t\t- Default is '0', but you can use 'N/A' or any other text." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
192
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
193 cerr << "\t-examples\t" << "Show detailed usage examples." << endl << endl;
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
194 }
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
195
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
196
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
197
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
/**
 * Writes a set of worked usage examples (sample input files followed by the
 * output of several typical invocations) to standard error.
 *
 * The text is a single string literal assembled from adjacent literals, one
 * per output line. The genome file is called "sizes.txt" both where it is
 * shown and where it is passed to -g, so the example commands can be run
 * verbatim on a case-sensitive file system.
 */
void ShowExamples()
{
    std::cerr <<
        "Example usage:\n\n"
        "== Input files: ==\n"
        "\n"
        " $ cat 1.bg\n"
        " chr1 1000 1500 10\n"
        " chr1 2000 2100 20\n"
        "\n"
        " $ cat 2.bg\n"
        " chr1 900 1600 60\n"
        " chr1 1700 2050 50\n"
        "\n"
        " $ cat 3.bg\n"
        " chr1 1980 2070 80\n"
        " chr1 2090 2100 20\n"
        "\n"
        " $ cat sizes.txt\n"
        " chr1 5000\n"
        "\n"
        "== Union/combine the files: ==\n"
        "\n"
        " $ unionBedGraphs -i 1.bg 2.bg 3.bg\n"
        " chr1 900 1000 0 60 0\n"
        " chr1 1000 1500 10 60 0\n"
        " chr1 1500 1600 0 60 0\n"
        " chr1 1700 1980 0 50 0\n"
        " chr1 1980 2000 0 50 80\n"
        " chr1 2000 2050 20 50 80\n"
        " chr1 2050 2070 20 0 80\n"
        " chr1 2070 2090 20 0 0\n"
        " chr1 2090 2100 20 0 20\n"
        "\n"
        "== Union/combine the files, with a header line (titles are the file names): ==\n"
        "\n"
        " $ unionBedGraphs -header -i 1.bg 2.bg 3.bg\n"
        " chrom start end 1 2 3\n"
        " chr1 900 1000 0 60 0\n"
        " chr1 1000 1500 10 60 0\n"
        " chr1 1500 1600 0 60 0\n"
        " chr1 1700 1980 0 50 0\n"
        " chr1 1980 2000 0 50 80\n"
        " chr1 2000 2050 20 50 80\n"
        " chr1 2050 2070 20 0 80\n"
        " chr1 2070 2090 20 0 0\n"
        " chr1 2090 2100 20 0 20\n"
        "\n"
        "== Union/combine the files, with a header line and custom names: ==\n"
        "\n"
        " $ unionBedGraphs -header -i 1.bg 2.bg 3.bg -names WT-1 WT-2 KO-1\n"
        " chrom start end WT-1 WT-2 KO-1\n"
        " chr1 900 1000 0 60 0\n"
        " chr1 1000 1500 10 60 0\n"
        " chr1 1500 1600 0 60 0\n"
        " chr1 1700 1980 0 50 0\n"
        " chr1 1980 2000 0 50 80\n"
        " chr1 2000 2050 20 50 80\n"
        " chr1 2050 2070 20 0 80\n"
        " chr1 2070 2090 20 0 0\n"
        " chr1 2090 2100 20 0 20\n"
        "\n"
        "== Union/combine, showing empty regions (note, requires -g): ==\n"
        "\n"
        " $ unionBedGraphs -header -empty -g sizes.txt -i 1.bg 2.bg 3.bg\n"
        " chrom start end 1 2 3\n"
        " chr1 0 900 0 0 0\n"
        " chr1 900 1000 0 60 0\n"
        " chr1 1000 1500 10 60 0\n"
        " chr1 1500 1600 0 60 0\n"
        " chr1 1600 1700 0 0 0\n"
        " chr1 1700 1980 0 50 0\n"
        " chr1 1980 2000 0 50 80\n"
        " chr1 2000 2050 20 50 80\n"
        " chr1 2050 2070 20 0 80\n"
        " chr1 2070 2090 20 0 0\n"
        " chr1 2090 2100 20 0 20\n"
        " chr1 2100 5000 0 0 0\n"
        "\n";
}
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
278
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
/**
 * Returns the final component of `path` with its extension removed.
 *
 * The extension is everything from the last '.' of the final component
 * onwards. A '.' that is the very first character of the component (a
 * "hidden file" such as ".profile") is not treated as an extension
 * separator, so such names are returned unchanged instead of becoming empty.
 *
 * @param path  File path; may be empty.
 * @return      The stripped base name; an empty string for an empty path.
 */
std::string stl_basename(const std::string& path)
{
    if (path.empty())
        return std::string();

    // basename() is allowed to modify the buffer it is given, so it gets a
    // private NUL-terminated copy. The vector owns that copy, which means it
    // is released on every exit path, including when a string operation
    // below throws.
    std::vector<char> scratch(path.begin(), path.end());
    scratch.push_back('\0');

    std::string result = basename(&scratch[0]);

    // Drop the extension, but keep names whose only dot is the leading one.
    const std::string::size_type dot = result.find_last_of('.');
    if (dot != std::string::npos && dot != 0)
        result.erase(dot);

    return result;
}
dfcd8b6c1bda Uploaded
aaronquinlan
parents:
diff changeset
294