Mercurial > repos > aaronquinlan > multi_intersect
comparison BEDTools-Version-2.14.3/src/utils/genomeFile/genomeFile.cpp @ 0:dfcd8b6c1bda
Uploaded
author | aaronquinlan |
---|---|
date | Thu, 03 Nov 2011 10:25:04 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:dfcd8b6c1bda |
---|---|
1 /***************************************************************************** | |
2 genomeFile.cpp | |
3 | |
4 (c) 2009 - Aaron Quinlan | |
5 Hall Laboratory | |
6 Department of Biochemistry and Molecular Genetics | |
7 University of Virginia | |
8 aaronquinlan@gmail.com | |
9 | |
10 Licensed under the GNU General Public License 2.0 license. | |
11 ******************************************************************************/ | |
12 #include "lineFileUtilities.h" | |
13 #include "genomeFile.h" | |
14 | |
15 | |
16 GenomeFile::GenomeFile(const string &genomeFile) { | |
17 _genomeFile = genomeFile; | |
18 loadGenomeFileIntoMap(); | |
19 } | |
20 | |
21 GenomeFile::GenomeFile(const RefVector &genome) { | |
22 for (size_t i = 0; i < genome.size(); ++i) { | |
23 string chrom = genome[i].RefName; | |
24 int length = genome[i].RefLength; | |
25 | |
26 _chromSizes[chrom] = length; | |
27 _chromList.push_back(chrom); | |
28 } | |
29 } | |
30 | |
31 // Destructor | |
32 GenomeFile::~GenomeFile(void) { | |
33 } | |
34 | |
35 | |
36 void GenomeFile::loadGenomeFileIntoMap() { | |
37 | |
38 string genomeLine; | |
39 int lineNum = 0; | |
40 vector<string> genomeFields; // vector for a GENOME entry | |
41 | |
42 // open the GENOME file for reading | |
43 ifstream genome(_genomeFile.c_str(), ios::in); | |
44 if ( !genome ) { | |
45 cerr << "Error: The requested genome file (" << _genomeFile << ") could not be opened. Exiting!" << endl; | |
46 exit (1); | |
47 } | |
48 | |
49 while (getline(genome, genomeLine)) { | |
50 | |
51 Tokenize(genomeLine,genomeFields); // load the fields into the vector | |
52 lineNum++; | |
53 | |
54 // ignore a blank line | |
55 if (genomeFields.size() > 0) { | |
56 if (genomeFields[0].find("#") == string::npos) { | |
57 | |
58 // we need at least 2 columns | |
59 if (genomeFields.size() >= 2) { | |
60 char *p2End; | |
61 long c2; | |
62 // make sure the second column is numeric. | |
63 c2 = strtol(genomeFields[1].c_str(), &p2End, 10); | |
64 | |
65 // strtol will set p2End to the start of the string if non-integral, base 10 | |
66 if (p2End != genomeFields[1].c_str()) { | |
67 string chrom = genomeFields[0]; | |
68 int size = atoi(genomeFields[1].c_str()); | |
69 _chromSizes[chrom] = size; | |
70 _chromList.push_back(chrom); | |
71 } | |
72 } | |
73 else { | |
74 cerr << "Less than the req'd two fields were encountered in the genome file (" << _genomeFile << ")"; | |
75 cerr << " at line " << lineNum << ". Exiting." << endl; | |
76 exit (1); | |
77 } | |
78 } | |
79 } | |
80 genomeFields.clear(); | |
81 } | |
82 } | |
83 | |
84 | |
85 int GenomeFile::getChromSize(const string &chrom) { | |
86 chromToSizes::const_iterator chromIt = _chromSizes.find(chrom); | |
87 if (chromIt != _chromSizes.end()) | |
88 return _chromSizes[chrom]; | |
89 else | |
90 return -1; // chrom not found. | |
91 } | |
92 | |
93 vector<string> GenomeFile::getChromList() { | |
94 return _chromList; | |
95 } | |
96 | |
97 int GenomeFile::getNumberOfChroms() { | |
98 return _chromList.size(); | |
99 } | |
100 | |
101 string GenomeFile::getGenomeFileName() { | |
102 return _genomeFile; | |
103 } |