1 #include "globaldata.hpp"
3 #include "sparsematrix.hpp"
5 /*******************************************************/
7 /******************************************************/
8 GlobalData* GlobalData::getInstance() {
9 if( _uniqueInstance == 0) {
10 _uniqueInstance = new GlobalData();
12 return _uniqueInstance;
14 /*******************************************************/
16 /******************************************************/
17 //This function parses through the option string of the command to remove its parameters
18 void GlobalData::parseGlobalData(string commandString, string optionText){
20 commandName = commandString; //save command name to be used by other classes
22 //set all non filename paramters to default
25 //clears out data from previous read
26 if((commandName == "read.dist") || (commandName == "read.otu") || (commandName == "read.tree")) {
33 labels.clear(); lines.clear(); Groups.clear();
38 if(commandName =="help") {
39 helpRequest = optionText;
42 if(commandName == "libshuff") {
47 //set default value for cutoff
48 if(commandName == "dist.seqs") { cutoff = "1.0"; }
51 //reads in parameters and values
52 if((optionText != "") && (commandName != "help")){
53 while((optionText.find_first_of(',') != -1)) { //while there are parameters
54 splitAtComma(value, optionText);
55 splitAtEquals(key, value);
57 if(key == "phylip") { phylipfile = value; inputFileName = value; fileroot = value; format = "phylip"; }
58 if(key == "column") { columnfile = value; inputFileName = value; fileroot = value; format = "column"; }
59 if(key == "list") { listfile = value; inputFileName = value; fileroot = value; format = "list"; }
60 if(key == "rabund") { rabundfile = value; inputFileName = value; fileroot = value; format = "rabund"; }
61 if(key == "sabund") { sabundfile = value; inputFileName = value; fileroot = value; format = "sabund"; }
62 if(key == "fasta") { fastafile = value; inputFileName = value; fileroot = value; format = "fasta"; }
63 if(key == "tree") { treefile = value; inputFileName = value; fileroot = value; format = "tree"; }
64 if(key == "shared") { sharedfile = value; inputFileName = value; fileroot = value; format = "sharedfile"; }
65 if(key == "name") { namefile = value; }
66 if(key == "order") { orderfile = value; }
67 if(key == "group") { groupfile = value; }
68 if(key == "cutoff") { cutoff = value; }
69 if(key == "precision") { precision = value; }
70 if(key == "iters") { iters = value; }
71 if(key == "jumble") { jumble = value; }
72 if(key == "freq") { freq = value; }
73 if(key == "method") { method = value; }
74 if(key == "fileroot") { fileroot = value; }
75 if(key == "abund") { abund = value; }
76 if(key == "random") { randomtree = value; }
77 if(key == "calc") { calc = value; }
78 if(key == "step") { step = value; }
79 if(key == "form") { form = value; }
80 if(key == "sorted") { sorted = value; }
81 if(key == "vertical") { vertical = value; }
82 if(key == "trump") { trump = value; }
83 if(key == "hard") { hard = value; }
84 if(key == "soft") { soft = value; }
85 if(key == "scale") { scale = value; }
86 if(key == "countends") { countends = value; }
87 if(key == "processors") { processors = value; }
88 if(key == "size") { size = value; }
89 if(key == "candidate") { candidatefile = value; }
90 if(key == "search") { search = value; }
91 if(key == "ksize") { ksize = value; }
92 if(key == "align") { align = value; }
93 if(key == "match") { match = value; }
94 if(key == "mismatch") { mismatch = value; }
95 if(key == "gapopen") { gapopen = value; }
96 if(key == "gapextend") { gapextend = value; }
97 if(key == "start") { startPos = value; }
98 if(key == "end") { endPos = value; }
99 if(key == "maxambig") { maxAmbig = value; }
100 if(key == "maxhomop") { maxHomoPolymer = value; }
101 if(key == "minlength") { minLength = value; }
102 if(key == "maxlength") { maxLength = value; }
103 if(key == "flip" ) { flip = value; }
104 if(key == "oligos" ) { oligoFile = value; }
105 if(key == "forward" ) { forMismatch = value; }
106 if(key == "reverse" ) { revMismatch = value; }
107 if(key == "barcode" ) { barMismatch = value; }
109 if(key == "line") {//stores lines to be used in a vector
114 if(line != "all") { splitAtDash(value, lines); allLines = 0; }
115 else { allLines = 1; }
118 if(key == "label") {//stores lines to be used in a vector
123 if(label != "all") { splitAtDash(value, labels); allLines = 0; }
124 else { allLines = 1; }
127 if(key == "groups") {//stores groups to be used in a vector
130 splitAtDash(value, Groups);
135 //saves the last parameter ==> this seems silly...
137 splitAtEquals(key, value);
138 if(key == "phylip") { phylipfile = value; inputFileName = value; fileroot = value; format = "phylip"; }
139 if(key == "column") { columnfile = value; inputFileName = value; fileroot = value; format = "column"; }
140 if(key == "list") { listfile = value; inputFileName = value; fileroot = value; format = "list"; }
141 if(key == "rabund") { rabundfile = value; inputFileName = value; fileroot = value; format = "rabund"; }
142 if(key == "sabund") { sabundfile = value; inputFileName = value; fileroot = value; format = "sabund"; }
143 if(key == "fasta") { fastafile = value; inputFileName = value; fileroot = value; format = "fasta"; }
144 if(key == "tree") { treefile = value; inputFileName = value; fileroot = value; format = "tree"; }
145 if(key == "shared") { sharedfile = value; inputFileName = value; fileroot = value; format = "sharedfile"; }
146 if(key == "name") { namefile = value; }
147 if(key == "order") { orderfile = value; }
148 if(key == "group") { groupfile = value; }
149 if(key == "cutoff") { cutoff = value; }
150 if(key == "precision") { precision = value; }
151 if(key == "iters") { iters = value; }
152 if(key == "jumble") { jumble = value; }
153 if(key == "freq") { freq = value; }
154 if(key == "method") { method = value; }
155 if(key == "fileroot") { fileroot = value; }
156 if(key == "abund") { abund = value; }
157 if(key == "random") { randomtree = value; }
158 if(key == "calc") { calc = value; }
159 if(key == "step") { step = value; }
160 if(key == "form") { form = value; }
161 if(key == "sorted") { sorted = value; }
162 if(key == "vertical") { vertical = value; }
163 if(key == "trump") { trump = value; }
164 if(key == "hard") { hard = value; }
165 if(key == "soft") { soft = value; }
166 if(key == "scale") { scale = value; }
167 if(key == "countends") { countends = value; }
168 if(key == "processors") { processors = value; }
169 if(key == "size") { size = value; }
170 if(key == "candidate") { candidatefile = value; }
171 if(key == "search") { search = value; }
172 if(key == "ksize") { ksize = value; }
173 if(key == "align") { align = value; }
174 if(key == "match") { match = value; }
175 if(key == "mismatch") { mismatch = value; }
176 if(key == "gapopen") { gapopen = value; }
177 if(key == "gapextend") { gapextend = value; }
178 if(key == "start") { startPos = value; }
179 if(key == "end") { endPos = value; }
180 if(key == "maxambig") { maxAmbig = value; }
181 if(key == "maxhomop") { maxHomoPolymer = value; }
182 if(key == "minlength") { minLength = value; }
183 if(key == "maxlength") { maxLength = value; }
184 if(key == "flip" ) { flip = value; }
185 if(key == "oligos" ) { oligoFile = value; }
186 if(key == "forward" ) { forMismatch = value; }
187 if(key == "reverse" ) { revMismatch = value; }
188 if(key == "barcode" ) { barMismatch = value; }
191 if(key == "line") {//stores lines to be used in a vector
196 if(line != "all") { splitAtDash(value, lines); allLines = 0; }
197 else { allLines = 1; }
200 if(key == "label") {//stores lines to be used in a vector
205 if(label != "all") { splitAtDash(value, labels); allLines = 0; }
206 else { allLines = 1; }
209 if(key == "groups") {//stores groups to be used in a vector
212 splitAtDash(value, Groups);
216 //set format for shared
217 if((listfile != "") && (groupfile != "")) { format = "shared"; }
218 if((phylipfile != "") && (groupfile != "")) { format = "matrix"; }
220 //input defaults for calculators
221 if(commandName == "collect.single") {
223 if((calc == "default") || (calc == "")) { calc = "sobs-chao-ace-jack-shannon-npshannon-simpson"; }
225 splitAtDash(calc, Estimators);
227 if(commandName == "rarefaction.single") {
228 if((calc == "default") || (calc == "")) { calc = "sobs"; }
230 splitAtDash(calc, Estimators);
232 if(commandName == "collect.shared") {
233 if((calc == "default") || (calc == "")) { calc = "sharedsobs-sharedchao-sharedace-jabund-sorabund-jclass-sorclass-jest-sorest-thetayc-thetan"; }
235 splitAtDash(calc, Estimators);
237 if(commandName == "summary.single") {
238 if((calc == "default") || (calc == "")) { calc = "sobs-chao-ace-jack-shannon-npshannon-simpson"; }
240 splitAtDash(calc, Estimators);
242 if(commandName == "summary.shared") {
243 if((calc == "default") || (calc == "")) { calc = "sharedsobs-sharedchao-sharedace-jabund-sorabund-jclass-sorclass-jest-sorest-thetayc-thetan"; }
245 splitAtDash(calc, Estimators);
247 if(commandName == "rarefaction.shared") {
248 if((calc == "default") || (calc == "")) { calc = "sharedobserved"; }
250 splitAtDash(calc, Estimators);
252 if(commandName == "dist.seqs") {
253 if((calc == "default") || (calc == "")) { calc = "onegap"; }
254 if(countends == "") { countends = "T"; }
256 splitAtDash(calc, Estimators);
258 if(commandName == "venn") {
259 if((calc == "default") || (calc == "")) {
260 if(format == "list") { calc = "sobs"; }
261 else { calc = "sharedsobs"; }
264 splitAtDash(calc, Estimators);
266 if((commandName == "tree.shared") || (commandName == "bootstrap.shared") || (commandName == "dist.shared")) {
267 if((calc == "default") || (calc == "")) {
268 calc = "jclass-thetayc";
271 splitAtDash(calc, Estimators);
274 if(commandName == "filter.seqs"){
275 if(trump == "" && vertical == "" && hard == "" && soft == ""){
281 //ifyou have done a read.otu with a groupfile but don't want to use it anymore because you want to do single commands
282 if((commandName == "collect.single") || (commandName == "rarefaction.single") || (commandName == "summary.single")) {
283 if(listfile != "") { format = "list"; }
284 else if(sabundfile != "") { format = "sabund"; }
285 else if(rabundfile != "") { format = "rabund"; }
288 catch(exception& e) {
289 cout << "Standard Error: " << e.what() << " has occurred in the GlobalData class Function parseGlobalData. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
293 cout << "An unknown error has occurred in the GlobalData class function parseGlobalData. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
297 /*******************************************************/
299 /******************************************************/
300 // These functions give you the option parameters of the commands
301 string GlobalData::getPhylipFile() { return phylipfile; }
302 string GlobalData::getColumnFile() { return columnfile; }
303 string GlobalData::getListFile() { return listfile; }
304 string GlobalData::getRabundFile() { return rabundfile; }
305 string GlobalData::getSabundFile() { return sabundfile; }
306 string GlobalData::getNameFile() { return namefile; }
307 string GlobalData::getGroupFile() { return groupfile; }
308 string GlobalData::getOrderFile() { return orderfile; }
309 string GlobalData::getTreeFile() { return treefile; }
310 string GlobalData::getSharedFile() { return sharedfile; }
311 string GlobalData::getFastaFile() { return fastafile; }
312 string GlobalData::getCutOff() { return cutoff; }
313 string GlobalData::getFormat() { return format; }
314 string GlobalData::getPrecision() { return precision; }
315 string GlobalData::getMethod() { return method; }
316 string GlobalData::getFileRoot() { return fileroot; }
317 string GlobalData::getIters() { return iters; }
318 string GlobalData::getJumble() { return jumble; }
319 string GlobalData::getFreq() { return freq; }
320 string GlobalData::getAbund() { return abund; }
321 string GlobalData::getRandomTree() { return randomtree; }
322 string GlobalData::getGroups() { return groups; }
323 string GlobalData::getStep() { return step; }
324 string GlobalData::getForm() { return form; }
325 string GlobalData::getSorted() { return sorted; }
326 string GlobalData::getVertical() { return vertical; }
327 string GlobalData::getTrump() { return trump; }
328 string GlobalData::getSoft() { return soft; }
329 string GlobalData::getHard() { return hard; }
330 string GlobalData::getScale() { return scale; }
331 string GlobalData::getCountEnds() { return countends; }
332 string GlobalData::getProcessors() { return processors; }
333 string GlobalData::getSize() { return size; }
334 string GlobalData::getCandidateFile() { return candidatefile; }
335 string GlobalData::getSearch() { return search; }
336 string GlobalData::getKSize() { return ksize; }
337 string GlobalData::getAlign() { return align; }
338 string GlobalData::getMatch() { return match; }
339 string GlobalData::getMismatch() { return mismatch; }
340 string GlobalData::getGapopen() { return gapopen; }
341 string GlobalData::getGapextend() { return gapextend; }
342 string GlobalData::getStartPos() { return startPos; }
343 string GlobalData::getEndPos() { return endPos; }
344 string GlobalData::getMaxAmbig() { return maxAmbig; }
345 string GlobalData::getMaxHomoPolymer() { return maxHomoPolymer; }
346 string GlobalData::getMinLength() { return minLength; }
347 string GlobalData::getMaxLength() { return maxLength; }
348 string GlobalData::getFlip() { return flip; }
349 string GlobalData::getOligosFile() { return oligoFile; }
350 string GlobalData::getForwardMismatch() { return forMismatch; }
351 string GlobalData::getReverseMismatch() { return revMismatch; }
352 string GlobalData::getBarcodeMismatch() { return barMismatch; }
355 void GlobalData::setListFile(string file) { listfile = file; inputFileName = file; }
356 void GlobalData::setRabundFile(string file) { rabundfile = file; inputFileName = file; }
357 void GlobalData::setSabundFile(string file) { sabundfile = file; inputFileName = file; }
358 void GlobalData::setPhylipFile(string file) { phylipfile = file; inputFileName = file; }
359 void GlobalData::setColumnFile(string file) { columnfile = file; inputFileName = file; }
360 void GlobalData::setGroupFile(string file) { groupfile = file; }
361 void GlobalData::setSharedFile(string file) { sharedfile = file; inputFileName = file; fileroot = file; }
362 void GlobalData::setNameFile(string file) { namefile = file; }
363 void GlobalData::setFormat(string Format) { format = Format; }
364 void GlobalData::setRandomTree(string Random) { randomtree = Random; }
365 void GlobalData::setGroups(string g) { groups = g; }
366 void GlobalData::setCalc(string Calc) { calc = Calc; }
367 void GlobalData::setCountEnds(string e) { countends = e; }
368 void GlobalData::setProcessors(string p) { processors = p; }
371 /*******************************************************/
373 /******************************************************/
374 GlobalData::GlobalData() {
375 //option definitions should go here...
379 gSparseMatrix = NULL;
381 /*******************************************************/
383 /******************************************************/
384 void GlobalData::clear() {
385 //option definitions should go here...
405 jumble = "1"; //0 means don't jumble, 1 means jumble.
406 randomtree = ""; //"" means user will enter some user trees, "outputfile" means they just want the random tree distribution to be outputted to outputfile.
413 sorted = "T"; //F means don't sort, T means sort.
419 countends = "T"; //yes
432 maxHomoPolymer = "-1";
442 //*******************************************************/
444 /******************************************************/
445 void GlobalData::reset() {
452 jumble = "1"; //0 means don't jumble, 1 means jumble.
453 sorted = "T"; //F means don't sort, T means sort.
454 randomtree = ""; //"" means user will enter some user trees, "outputfile" means they just want the random tree distribution to be outputted to outputfile.
478 maxHomoPolymer = "-1";
488 /*******************************************************/
490 /******************************************************/
491 GlobalData::~GlobalData() {
493 if(gListVector != NULL) { delete gListVector; }
494 if(gSparseMatrix != NULL) { delete gSparseMatrix; }
495 if(gorder != NULL) { delete gorder; }
497 /*******************************************************/
499 /*******************************************************/
500 void GlobalData::parseTreeFile() {
501 //Why is THIS in GlobalData??? - PDS
503 //only takes names from the first tree and assumes that all trees use the same names.
505 string filename = treefile;
507 openInputFile(filename, filehandle);
511 //ifyou are not a nexus file
512 if((c = filehandle.peek()) != '#') {
513 while((c = filehandle.peek()) != ';') {
514 while ((c = filehandle.peek()) != ';') {
522 if((c == '(') && (comment != 1)){ break; }
526 readTreeString(filehandle);
528 //ifyou are a nexus file
529 }else if((c = filehandle.peek()) == '#') {
533 while(holder != "translate" && holder != "Translate"){
534 if(holder == "[" || holder == "[!"){
540 filehandle >> holder;
542 //ifthere is no translate then you must read tree string otherwise use translate to get names
543 if(holder == "tree" && comment != 1){
544 //pass over the "tree rep.6878900 = "
545 while (((c = filehandle.get()) != '(') && ((c = filehandle.peek()) != EOF)) {;}
547 if(c == EOF) { break; }
548 filehandle.putback(c); //put back first ( of tree.
549 readTreeString(filehandle);
554 //use nexus translation rather than parsing tree to save time
555 if((holder == "translate") || (holder == "Translate")) {
557 string number, name, h;
558 h = ""; // so it enters the loop the first time
559 while((h != ";") && (number != ";")) {
560 filehandle >> number;
563 //c = , until done with translation then c = ;
564 h = name.substr(name.length()-1, name.length());
565 name.erase(name.end()-1); //erase the comma
566 Treenames.push_back(number);
568 if(number == ";") { Treenames.pop_back(); } //in case ';' from translation is on next line instead of next to last name
573 catch(exception& e) {
574 cout << "Standard Error: " << e.what() << " has occurred in the GlobalData class Function parseTreeFile. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
578 cout << "An unknown error has occurred in the GlobalData class function parseTreeFile. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
582 /*******************************************************/
584 /*******************************************************/
585 void GlobalData::readTreeString(ifstream& filehandle) {
590 while((c = filehandle.peek()) != ';') {
592 if((c != '(') && (c != ')') && (c != ',') && (c != ':') && (c != '\n') && (c != '\t') && (c != 32)) { //32 is space
594 c = filehandle.get();
597 while ((c != '(') && (c != ')') && (c != ',') && (c != ':') && (c != '\n') && (c != 32) && (c != '\t')) {
599 c = filehandle.get();
601 //cout << " in name while " << k << endl;
604 //cout << "name = " << name << endl;
605 Treenames.push_back(name);
606 filehandle.putback(c);
608 //cout << " after putback" << k << endl;
611 if(c == ':') { //read until you reach the end of the branch length
612 while ((c != '(') && (c != ')') && (c != ',') && (c != ';') && (c != '\n') && (c != '\t') && (c != 32)) {
613 c = filehandle.get();
615 //cout << " in branch while " << k << endl;
617 filehandle.putback(c);
619 c = filehandle.get();
620 if(c == ';') { break; }
626 catch(exception& e) {
627 cout << "Standard Error: " << e.what() << " has occurred in the GlobalData class Function parseTreeFile. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
631 cout << "An unknown error has occurred in the GlobalData class function parseTreeFile. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
636 /*******************************************************/
638 /*******************************************************/