added errorchecking and help info on new unifrac and treeclimber code

author westcott <westcott>

Wed, 11 Feb 2009 18:14:23 +0000 (18:14 +0000)

committer westcott <westcott>

Wed, 11 Feb 2009 18:14:23 +0000 (18:14 +0000)
author westcott <westcott>
Wed, 11 Feb 2009 18:14:23 +0000 (18:14 +0000)
committer westcott <westcott>
Wed, 11 Feb 2009 18:14:23 +0000 (18:14 +0000)
diff --git a/errorchecking.cpp b/errorchecking.cpp

index 03844d5fa5b132e21ad1ae60e1c9e7b43e343aa2..067d246d4c50f1427840c3879be04bac2ff7cdf8 100644 (file)
--- a/errorchecking.cpp
+++ b/errorchecking.cpp
@@ -90,7 +90,7 @@ bool ErrorCheck::checkInput(string input) {
                                 if (parameter == "name" )               { namefile = value; }
                                 if (parameter == "order" )              { orderfile = value; }
                                 if (parameter == "fasta" )              { fastafile = value; }
-                               if (parameter == "treefile" )           { treefile = value; }
+                               if (parameter == "tree" )               { treefile = value; }
                                 if (parameter == "group" )              { groupfile = value; }
                                 if (parameter == "cutoff" )                     { cutoff = value; }
                                 if (parameter == "precision" )          { precision = value; }
@@ -161,7 +161,7 @@ bool ErrorCheck::checkInput(string input) {
                                 if (parameter == "order" )              { orderfile = value; }
                                 if (parameter == "group" )              { groupfile = value; }
                                 if (parameter == "fasta" )              { fastafile = value; }
-                               if (parameter == "treefile" )           { treefile = value; }
+                               if (parameter == "tree" )               { treefile = value; }
                                 if (parameter == "cutoff" )                     { cutoff = value; }
                                 if (parameter == "precision" )          { precision = value; }
                                 if (parameter == "iters" )                      { iters = value; }
@@ -254,6 +254,11 @@ bool ErrorCheck::checkInput(string input) {
                         }
                 }
                 
+               if ((commandName == "unifrac.weighted") || (commandName == "unifrac.unweighted")) {
+                       if (globaldata->gTree.size() == 0) {//no trees were read
+                               cout << "You must execute the read.tree command, before you may execute the unifrac.weighted or unifrac.unweighted command." << endl; return false;  }
+               }
+               
                 //check for valid method
                 if (commandName == "cluster") {
                         if ((method == "furthest") || (method == "nearest") || (method == "average")) { }
diff --git a/globaldata.cpp b/globaldata.cpp

index bc836e854cb3c4f1b7cc184789b0d49d6e8e3f45..d4eb9980c9051919eecb25e18a0c7b685dae65a1 100644 (file)
--- a/globaldata.cpp
+++ b/globaldata.cpp
@@ -103,7 +103,7 @@ void GlobalData::parseGlobalData(string commandString, string optionText){
                                 if (key == "rabund" )   { rabundfile = value; inputFileName = value; fileroot = value; format = "rabund";       }
                                 if (key == "sabund" )   { sabundfile = value; inputFileName = value; fileroot = value; format = "sabund";       } 
                                 if (key == "fasta" )    { fastafile = value; inputFileName = value; fileroot = value; format = "fasta";         } 
-                               if (key == "treefile" )         { treefile = value; inputFileName = value; fileroot = value; format = "tree";           }
+                               if (key == "tree" )             { treefile = value; inputFileName = value; fileroot = value; format = "tree";           }
                                 if (key == "name" )             { namefile = value;             }
                                 if (key == "order" )    { orderfile = value;    }
                                 if (key == "group" )    { groupfile = value;    }
@@ -154,14 +154,14 @@ void GlobalData::parseGlobalData(string commandString, string optionText){
                                         splitAtDash(value, lines);
                                         allLines = 0;
                                 }
-                               if (key == "label") {//stores lines to be used in a set
+                               if (key == "label") {//stores labels to be used in a set
                                         labels.clear();
                                         label = value;
                                         line = "";
                                         splitAtDash(value, labels);
                                         allLines = 0;
                                 }
-                               if (key == "groups") {//stores lines to be used in a vector
+                               if (key == "groups") {//stores groups to be used in a vector
                                         Groups.clear();
                                         groups = value;
                                         splitAtDash(value, Groups);
@@ -178,7 +178,7 @@ void GlobalData::parseGlobalData(string commandString, string optionText){
                         if (key == "rabund" )   { rabundfile = value; inputFileName = value; fileroot = value; format = "rabund";       }
                         if (key == "sabund" )   { sabundfile = value; inputFileName = value; fileroot = value; format = "sabund";       }
                         if (key == "fasta" )    { fastafile = value; inputFileName = value; fileroot = value; format = "fasta";         }
-                       if (key == "treefile" )         { treefile = value; inputFileName = value; fileroot = value; format = "tree";           }  
+                       if (key == "tree" )             { treefile = value; inputFileName = value; fileroot = value; format = "tree";           }  
                         if (key == "name" )             { namefile = value;             }
                         if (key == "order" )    { orderfile = value;    }
                         if (key == "group" )    { groupfile = value;    }
@@ -190,6 +190,8 @@ void GlobalData::parseGlobalData(string commandString, string optionText){
                         if (key == "method" )           { method = value;               }
                         if (key == "fileroot" )         { fileroot = value;             }
                         if (key == "randomtree" )       { randomtree = value;   }
+                       if (key == "groups" )           { groups = value;       }
+
                         
                         if (key == "single") {//stores estimators in a vector
                                 singleEstimators.clear(); //clears out old values
@@ -236,6 +238,12 @@ void GlobalData::parseGlobalData(string commandString, string optionText){
                                 splitAtDash(value, labels);
                                 allLines = 0;
                         }
+                       if (key == "groups") {//stores groups to be used in a vector
+                                       Groups.clear();
+                                       groups = value;
+                                       splitAtDash(value, Groups);
+                       }
+
                 }
                 
                 //set format for shared
@@ -345,6 +353,7 @@ void GlobalData::clear() {
         iters                   =       "1000"; 
         line                    =   "";
         label                   =       "";
+       groups                  =       "";
         jumble                  =       "1";    //0 means don't jumble, 1 means jumble.
         randomtree              =       "0";  //0 means user will enter some user trees, 1 means they just want the random tree distribution.
         freq                    =       "100";
diff --git a/helpcommand.cpp b/helpcommand.cpp

index 6fe793175f930c4ea44a3fdbad6caf7b2a068227..bc17dbed4c95d7c74b04e03fc470078b8bc67496 100644 (file)
--- a/helpcommand.cpp
+++ b/helpcommand.cpp
@@ -42,6 +42,12 @@ int HelpCommand::execute(){
                 cout << "The list parameter and group paramaters are required. When using the command the second way read.otu command parses the .list file" << "\n";
                 cout << "and separates it into groups.  It outputs a .shared file containing the OTU information for each group. The read.otu command also outputs a .list file for each group. " << "\n";
                 cout << "Note: No spaces between parameter labels (i.e. list), '=' and parameters (i.e.yourListfile)." << "\n" << "\n";
+       }else if (globaldata->helpRequest == "read.tree") {
+               cout << "The read.tree command must be run before you execute a unifrac.weighted, unifrac.unweighted. " << "\n";
+               cout << "It also must be run before using the parsimony command, unless you are using the randomtree parameter." << "\n";
+               cout << "The read.tree command should be in the following format: read.tree(tree=yourTreeFile, group=yourGroupFile)." << "\n";
+               cout << "The tree and group parameters are both required." << "\n";
+               cout << "Note: No spaces between parameter labels (i.e. list), '=' and parameters (i.e.yourListfile)." << "\n" << "\n";
         }else if (globaldata->helpRequest == "cluster") {
                 cout << "The cluster command can only be executed after a successful read.dist command." << "\n";
                 cout << "The cluster command parameter options are method, cuttoff and precision. No parameters are required." << "\n";
@@ -112,17 +118,45 @@ int HelpCommand::execute(){
                 cout << "The default value for jumble is 1 (meaning jumble, if it’s set to 0 then it will not jumble) and sharedsummary is sharedsobs-sharedChao-sharedAce-sharedJabund-sharedSorensonAbund-sharedJclass-sharedSorClass-sharedJest-sharedSorEst-SharedThetaYC-SharedThetaN" << "\n";
                 cout << "The label and line parameters are used to analyze specific lines in your input." << "\n";
                 cout << "Note: No spaces between parameter labels (i.e. list), '=' and parameters (i.e.yourListfile)." << "\n" << "\n";
+       }else if (globaldata->helpRequest == "parsimony") { 
+               cout << "The parsimony command can only be executed after a successful read.tree command, unless you use the randomtree parameter." << "\n";
+               cout << "The parsimony command parameters are randomtree and iters.  No parameters are required." << "\n";
+               cout << "The parsimony command should be in the following format: parsimony(randomtree=yourRandomTreeValue, iters=yourIters)." << "\n";
+               cout << "Example parsimony(randomtree=1, iters=500)." << "\n";
+               cout << "The default value for randomTree is 0 (meaning you want to use the trees in your inputfile, randomtree=1 means you just want the random distribution of trees)," << "\n";
+               cout << "and iters is 1000.  The parsimony command output three files: .parsimony, .psummary and .pdistrib, their descriptions are in the manual." << "\n";
+               cout << "Note: No spaces between parameter labels (i.e. list), '=' and parameters (i.e.yourListfile)." << "\n" << "\n";
+       }else if (globaldata->helpRequest == "unifrac.weighted") { 
+               cout << "The unifrac.weighted command can only be executed after a successful read.tree command." << "\n";
+               cout << "The unifrac.weighted command parameters are groups and iters.  No parameters are required." << "\n";
+               cout << "The groups paramter allows you to specify which of the groups in your groupfile you would like analyzed.  You must enter at least 2 valid groups." << "\n";
+               cout << "The group names are separated by dashes.  The iters parameter allows you to specify how many random trees you would like compared to your tree." << "\n";
+               cout << "The unifrac.weighted command should be in the following format: unifrac.weighted(groups=yourGroups, iters=yourIters)." << "\n";
+               cout << "Example unifrac.weighted(groups=A-B-C, iters=500)." << "\n";
+               cout << "The default value for groups is all the groups in your groupfile, and iters is 1000." << "\n";
+               cout << "The unifrac.weighted command output three files: .weighted, .wsummary and .wdistrib, their descriptions are in the manual." << "\n";
+               cout << "Note: No spaces between parameter labels (i.e. list), '=' and parameters (i.e.yourListfile)." << "\n" << "\n";
+       }else if (globaldata->helpRequest == "unifrac.unweighted") { 
+               cout << "The unifrac.unweighted command can only be executed after a successful read.tree command." << "\n";
+               cout << "The unifrac.unweighted command parameters are groups and iters.  No parameters are required." << "\n";
+               cout << "The groups paramter allows you to specify which of the groups in your groupfile you would like analyzed.  You must enter at least 1 valid group." << "\n";
+               cout << "The group names are separated by dashes.  The iters parameter allows you to specify how many random trees you would like compared to your tree." << "\n";
+               cout << "The unifrac.unweighted command should be in the following format: unifrac.unweighted(groups=yourGroups, iters=yourIters)." << "\n";
+               cout << "Example unifrac.unweighted(groups=A-B-C, iters=500)." << "\n";
+               cout << "The default value for groups is all the groups in your groupfile, and iters is 1000." << "\n";
+               cout << "The unifrac.unweighted command output three files: .unweighted, .uwsummary and .uwdistrib, their descriptions are in the manual." << "\n";
+               cout << "Note: No spaces between parameter labels (i.e. list), '=' and parameters (i.e.yourListfile)." << "\n" << "\n";
         }else if (globaldata->helpRequest == "quit") {
                 cout << "The quit command will terminate Dotur and should be in the following format: " << "\n";
                 cout << "quit()" << "\n" << "\n";
         }else if (globaldata->helpRequest == "") {
-               cout << "Valid commands are read.dist(), read.otu(), cluster(), deconvolute(), collect.single(), rarefaction.single(), summary.single(), collect.shared(), rarefaction.shared(), summary.shared(), quit(), help()." << "\n";
+               cout << "Valid commands are read.dist(), read.otu(), read.tree(), cluster(), deconvolute(), collect.single(), rarefaction.single(), summary.single(), collect.shared(), rarefaction.shared(), summary.shared(), parsimony(), unifrac.weighted(), unifrac.unweighted(), quit(), help()." << "\n";
                 cout << "For more information about a specific command type 'help(commandName)' i.e. 'help(read.dist)'" << endl;
         }else {
                 cout << globaldata->helpRequest << " is not a valid command" << endl;
         }
         
-       cout << endl << "For further assistance please refer to the Mothur manual, or contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+       cout << endl << "For further assistance please refer to the Mothur manual on our wiki at http://schloss.micro.umass.edu/mothur/, or contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
         return 0;
  }
  
diff --git a/treemap.cpp b/treemap.cpp

index bee0d11ed21323ee9dff1bc38c860a3042231150..6314eb04d04006ba5c57808f6927bddec89d6a00 100644 (file)
--- a/treemap.cpp
+++ b/treemap.cpp
@@ -100,7 +100,24 @@ void TreeMap::setNamesOfGroups(string seqGroup) {
                                 namesOfGroups.push_back(seqGroup); //new group
                         }
  }
-
+/************************************************************/
+bool TreeMap::isValidGroup(string groupname) {  //returns true when groupname matches an entry of namesOfGroups
+       try {
+               bool found = false;
+               for (int pos = 0; (pos < namesOfGroups.size()) && (!found); pos++) {  //stop scanning at the first match
+                       found = (namesOfGroups[pos] == groupname);
+               }
+               return found;
+       }
+       catch(exception& e) {
+               cout << "Standard Error: " << e.what() << " has occurred in the TreeMap class Function isValidGroup. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+               exit(1);
+       }
+       catch(...) {
+               cout << "An unknown error has occurred in the TreeMap class function isValidGroup. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+               exit(1);
+       }
+}
  /***********************************************************************/
  
  void TreeMap::print(ostream& output){
diff --git a/treemap.h b/treemap.h

index 60f75b388571aff503ac95b96df5946e6fcfa89f..60fb924278c8df36a405ca363c2584d5ae2fa42a 100644 (file)
--- a/treemap.h
+++ b/treemap.h
@@ -34,11 +34,12 @@ public:
         int getNumSeqs();
         void setIndex(string, int);  //sequencename, index
         int getIndex(string);           //returns vector index of sequence
+       bool isValidGroup(string);  //return true if string is a valid group
         string getGroup(string);
         vector<string> namesOfGroups;
         vector<string> namesOfSeqs;
      map<string,int> seqsPerGroup;      //groupname, number of seqs in that group.
-       map<string, GroupIndex> treemap; //sequence name and groupname
+       map<string, GroupIndex> treemap; //sequence name and <groupname, vector index>
         void print(ostream&);
         
  private:
diff --git a/unifracunweightedcommand.cpp b/unifracunweightedcommand.cpp

index 8adff2d896f811d46e80b806acf45261d759c69b..77069443c2fd26a0cebbabf4dd661e1d37288030 100644 (file)
--- a/unifracunweightedcommand.cpp
+++ b/unifracunweightedcommand.cpp
@@ -23,6 +23,23 @@ UnifracUnweightedCommand::UnifracUnweightedCommand() {
                 distFile = globaldata->getTreeFile() + ".uwdistrib";
                 openOutputFile(distFile, outDist);
  
+               //if the user entered specific groups to analyze, keep only the ones that are valid
+               if (globaldata->Groups.size() != 0) {
+                       //check that groups are valid
+                       for (int i = 0; i < globaldata->Groups.size(); i++) {
+                               if (tmap->isValidGroup(globaldata->Groups[i]) != true) {
+                                       cout << globaldata->Groups[i] << " is not a valid group, and will be disregarded." << endl;
+                                       // erase the invalid group; the next name slides into slot i, so step back to check it too
+                                       globaldata->Groups.erase (globaldata->Groups.begin()+i); i--;
+                               }
+                       }
+                       
+                       //if the user only entered invalid groups, Groups is now empty
+                       if (globaldata->Groups.size() == 0) { 
+                               cout << "When using the groups parameter you must have at least 1 valid group. I will run the command using all the groups in your groupfile." << endl; 
+                       }               
+               }
+
                 convert(globaldata->getIters(), iters);  //how many random trees to generate
                 unweighted = new Unweighted(tmap);
  
@@ -93,6 +110,8 @@ int UnifracUnweightedCommand::execute() {
                                 outDist << i+1 << '\t' << '\t'<< j+1 << '\t' << '\t' << randomData[0] << endl;
                         }
                         
+                       saveRandomScores(); //save all random scores for unweighted file
+                       
                         //find the signifigance of the score
                         float rcumul = 0.0000;
                         for (it = rscoreFreq.begin(); it != rscoreFreq.end(); it++) { 
@@ -105,8 +124,7 @@ int UnifracUnweightedCommand::execute() {
                         //save the signifigance of the users score for printing later
                         UWScoreSig.push_back(rCumul[userData[0]]);
                         
-                       saveRandomScores(); //save all random scores for unweighted file
-               
+                       
                         //clear random data
                         rscoreFreq.clear();  //you clear this because in the summary file you want the unweighted signifinance to be relative to these 1000 trees.
                         rCumul.clear();
@@ -207,15 +225,14 @@ void UnifracUnweightedCommand::printUWSummaryFile() {
  /***********************************************************/
  void UnifracUnweightedCommand::saveRandomScores() {
         try {
-               //update total map with new random scores
                 for (it = rscoreFreq.begin(); it != rscoreFreq.end(); it++) { 
                         //does this score already exist in the total map
                         it2 = totalrscoreFreq.find(it->first);
                         //if yes then add them
                         if (it2 != totalrscoreFreq.end()) { 
-                               it2->second += it->second;
+                               totalrscoreFreq[it->first] += rscoreFreq[it->first];
                         }else{ //its a new score
-                               totalrscoreFreq[it->first] = 1;
+                               totalrscoreFreq[it->first] = rscoreFreq[it->first];
                         }
                 }
         }
diff --git a/unifracweightedcommand.cpp b/unifracweightedcommand.cpp

index ff2c2450bdd35c005c1f29c3be03741a26da834c..4a8325afda1cf2ea95d3aa19ce228e9f4451cc96 100644 (file)
--- a/unifracweightedcommand.cpp
+++ b/unifracweightedcommand.cpp
@@ -22,8 +22,30 @@ UnifracWeightedCommand::UnifracWeightedCommand() {
                 openOutputFile(sumFile, outSum);
                 distFile = globaldata->getTreeFile() + ".wdistrib";
                 openOutputFile(distFile, outDist);
-
-               numGroups = tmap->getNumGroups();
+               
+               //if the user has not entered specific groups to analyze then do them all
+               if (globaldata->Groups.size() == 0) {
+                       numGroups = tmap->getNumGroups();
+               }else {
+                       //check that groups are valid
+                       for (int i = 0; i < globaldata->Groups.size(); i++) {
+                               if (tmap->isValidGroup(globaldata->Groups[i]) != true) {
+                                       cout << globaldata->Groups[i] << " is not a valid group, and will be disregarded." << endl;
+                                       // erase the invalid group; the next name slides into slot i, so step back to check it too
+                                       globaldata->Groups.erase (globaldata->Groups.begin()+i); i--;
+                               }
+                       }
+                       
+                       //a comparison needs 2 groups, so with fewer valid groups fall back to every group in the groupfile
+                       if (globaldata->Groups.size() == 0) { 
+                               numGroups = tmap->getNumGroups();
+                               cout << "When using the groups parameter you must have at least 2 valid groups. I will run the command using all the groups in your groupfile." << endl; 
+                       }else if (globaldata->Groups.size() == 1) { 
+                               cout << "When using the groups parameter you must have at least 2 valid groups. I will run the command using all the groups in your groupfile." << endl;
+                               numGroups = tmap->getNumGroups();
+                               globaldata->Groups.clear();  //drop the lone group so an empty Groups again means all groups
+                       }else { numGroups = globaldata->Groups.size(); }
+               }
                 
                 //calculate number of comparisons i.e. with groups A,B,C = AB, AC, BC = 3;
                 numComp = 0;
@@ -32,7 +54,11 @@ UnifracWeightedCommand::UnifracWeightedCommand() {
                         numComp += i; 
                         for (int l = n; l < numGroups; l++) {
                                 //set group comparison labels
-                               groupComb.push_back(tmap->namesOfGroups[i-1]+tmap->namesOfGroups[l]);
+                               if (globaldata->Groups.size() != 0) {
+                                       groupComb.push_back(globaldata->Groups[i-1]+globaldata->Groups[l]);
+                               }else {
+                                       groupComb.push_back(tmap->namesOfGroups[i-1]+tmap->namesOfGroups[l]);
+                               }
                         }
                         n++;
                 }
@@ -174,6 +200,8 @@ int UnifracWeightedCommand::execute() {
                 
                 //reset randomTree parameter to 0
                 globaldata->setRandomTree("0");
+               //clear out users groups
+               globaldata->Groups.clear();
                 
                 delete randT;
                 
diff --git a/unweighted.cpp b/unweighted.cpp

index a7cf9c9092e6b8565f538d38b2f86ae4a75b5944..4416e79afd680059b8958cab6c28e035b3633d1c 100644 (file)
--- a/unweighted.cpp
+++ b/unweighted.cpp
@@ -13,7 +13,8 @@
  
  EstOutput Unweighted::getValues(Tree* t) {
         try {
-       
+               globaldata = GlobalData::getInstance();
+               
                 //clear out old values
                 data.resize(1,0); 
                 penalty.resize(t->getNumLeaves(), 0);
@@ -60,7 +61,7 @@ EstOutput Unweighted::getValues(Tree* t) {
      
                 map<string,double>::iterator pos;
                 for(pos=unique.begin();pos!=unique.end();pos++){
-                       if(pos->first!="xxx"){      
+                       if((pos->first!="xxx") && (inUsersGroups(pos->first))){     
                                 UW += unique[pos->first];
                         }
                 }
@@ -85,4 +86,20 @@ EstOutput Unweighted::getValues(Tree* t) {
  
  }
  
-/**************************************************************************************************/
-\ No newline at end of file
+/**************************************************************************************************/
+bool Unweighted::inUsersGroups(string groupname) {  //returns true if groupname is one of the groups being analyzed
+       try {
+               for (int i = 0; i < globaldata->Groups.size(); i++) {
+                       if (groupname == globaldata->Groups[i]) { return true; }
+               }
+               return (globaldata->Groups.size() == 0);  //an empty Groups means no groups were chosen, so every group is analyzed
+       }
+       catch(exception& e) {
+               cout << "Standard Error: " << e.what() << " has occurred in the Unweighted class Function inUsersGroups. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+               exit(1);
+       }
+       catch(...) {
+               cout << "An unknown error has occurred in the Unweighted class function inUsersGroups. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+               exit(1);
+       }
+}
+\ No newline at end of file
diff --git a/unweighted.h b/unweighted.h

index d39b5e7e71f97a543e92cac087cebbe3d9b41b43..e3bf3a8fc240648e4a38f48ced539845d3648706 100644 (file)
--- a/unweighted.h
+++ b/unweighted.h
@@ -24,9 +24,11 @@ class Unweighted : public TreeCalculator  {
                 EstOutput getValues(Tree*);
                 
         private:
+               GlobalData* globaldata;
                 EstOutput data;
                 vector<int> penalty;
                 TreeMap* tmap;
+               bool inUsersGroups(string);
  
  };
  
diff --git a/validcommands.cpp b/validcommands.cpp

index 8f06fefee54330386e9fed5109603e1a2335d1e9..53ee7431b49fecc06002e5b9330259371bd35729 100644 (file)
--- a/validcommands.cpp
+++ b/validcommands.cpp
@@ -55,7 +55,7 @@ bool ValidCommands::isValidCommand(string command) {
                 if ((commands.find(command)) != (commands.end())) {
                         return true;
                 }else{
-                       cout << command << " is not a valid command in Mothur.  Valid commands are read.dist(), read.otu(), cluster(), collect.single(), collect.shared(), rarefaction.single(), rarefaction.shared(), summary.single(), summary.shared(), quit(), help()." << endl;
+                       cout << command << " is not a valid command in Mothur.  Valid commands are read.dist(), read.otu(), read.tree(), cluster(), deconvolute(), collect.single(), collect.shared(), rarefaction.single(), rarefaction.shared(), summary.single(), summary.shared(), parsimony(), unifrac.weighted(), unifrac.unweighted(), quit(), help()." << endl;
                         return false;
                 }
                 
diff --git a/validparameter.cpp b/validparameter.cpp

index 7072825c69a9186af91f893834f62a0eb18e5acb..fbb368ed2a81ff413805b8deb20f4a79149dd53f 100644 (file)
--- a/validparameter.cpp
+++ b/validparameter.cpp
@@ -23,7 +23,7 @@ ValidParameters::ValidParameters() {
                 parameters["group"]                     = "group"; 
                 parameters["order"]                     = "order"; 
                 parameters["fasta"]                     = "fasta"; 
-               parameters["treefile"]                  = "treefile";
+               parameters["tree"]                      = "tree";
                 parameters["fileroot"]                  = "fileroot";
                 parameters["cutoff"]                    = "cutoff"; 
                 parameters["method"]                    = "method";
diff --git a/weighted.cpp b/weighted.cpp

index 481b34e04f582d11480b14e47f5a27e0290400db..bcdee111a4763db3dae42d5750066e7ab47417cd 100644 (file)
--- a/weighted.cpp
+++ b/weighted.cpp
@@ -13,15 +13,26 @@
  
  EstOutput Weighted::getValues(Tree* t) {
      try {
-       
-               int numGroups = tmap->getNumGroups();
+               globaldata = GlobalData::getInstance();
+               int numGroups;
+               
+               //if the user has not entered specific groups to analyze then do them all
+               if (globaldata->Groups.size() == 0) {
+                       numGroups = tmap->getNumGroups();
+               }else {
+                       numGroups = globaldata->Groups.size();
+               }
                 
                 //calculate number of comparisons i.e. with groups A,B,C = AB, AC, BC = 3;
                 int n = 1;
                 for (int i=1; i<numGroups; i++) { 
                         for (int l = n; l < numGroups; l++) {
                                 //initialize weighted scores
-                               WScore[tmap->namesOfGroups[i-1]+tmap->namesOfGroups[l]] = 0.0;
+                               if (globaldata->Groups.size() == 0) {
+                                       WScore[tmap->namesOfGroups[i-1]+tmap->namesOfGroups[l]] = 0.0;
+                               }else {
+                                       WScore[globaldata->Groups[i-1]+globaldata->Groups[l]] = 0.0;
+                               }
                         }
                 }
  
@@ -70,25 +81,48 @@ EstOutput Weighted::getValues(Tree* t) {
                         for (int b=1; b<numGroups; b++) { 
                                 for (int l = n; l < numGroups; l++) {
                                         double u;
-                                       //does this node have descendants from group b-1
-                                       it = t->tree[i].pcount.find(tmap->namesOfGroups[b-1]);
-                                       //if it does u = # of its descendants with a certain group / total number in tree with a certain group
-                                       if (it != t->tree[i].pcount.end()) {
-                                               u = (double) t->tree[i].pcount[tmap->namesOfGroups[b-1]] / (double) tmap->seqsPerGroup[tmap->namesOfGroups[b-1]];
-                                       }else { u = 0.00; }
+                                       //the user has not entered specific groups
+                                       if (globaldata->Groups.size() == 0) {
+                                               //does this node have descendants from group b-1
+                                               it = t->tree[i].pcount.find(tmap->namesOfGroups[b-1]);
+                                               //if it does u = # of its descendants with a certain group / total number in tree with a certain group
+                                               if (it != t->tree[i].pcount.end()) {
+                                                       u = (double) t->tree[i].pcount[tmap->namesOfGroups[b-1]] / (double) tmap->seqsPerGroup[tmap->namesOfGroups[b-1]];
+                                               }else { u = 0.00; }
                 
-                                       //does this node have descendants from group l
-                                       it = t->tree[i].pcount.find(tmap->namesOfGroups[l]);
-                                       //if it does subtract their percentage from u
-                                       if (it != t->tree[i].pcount.end()) {
-                                               u -= (double) t->tree[i].pcount[tmap->namesOfGroups[l]] / (double) tmap->seqsPerGroup[tmap->namesOfGroups[l]];
-                                       }
+                                               //does this node have descendants from group l
+                                               it = t->tree[i].pcount.find(tmap->namesOfGroups[l]);
+                                               //if it does subtract their percentage from u
+                                               if (it != t->tree[i].pcount.end()) {
+                                                       u -= (double) t->tree[i].pcount[tmap->namesOfGroups[l]] / (double) tmap->seqsPerGroup[tmap->namesOfGroups[l]];
+                                               }
                                                 
-                                       u = abs(u) * t->tree[i].getBranchLength();
+                                               u = abs(u) * t->tree[i].getBranchLength();
                                         
-                                       //save groupcombs u value
-                                       WScore[tmap->namesOfGroups[b-1]+tmap->namesOfGroups[l]] += u;
-
+                                               //save groupcombs u value
+                                               WScore[tmap->namesOfGroups[b-1]+tmap->namesOfGroups[l]] += u;
+                                               
+                                       //the user has entered specific groups  
+                                       }else {
+                                               //does this node have descendants from group b-1
+                                               it = t->tree[i].pcount.find(globaldata->Groups[b-1]);
+                                               //if it does u = # of its descendants with a certain group / total number in tree with a certain group
+                                               if (it != t->tree[i].pcount.end()) {
+                                                       u = (double) t->tree[i].pcount[globaldata->Groups[b-1]] / (double) tmap->seqsPerGroup[globaldata->Groups[b-1]];
+                                               }else { u = 0.00; }
+               
+                                               //does this node have descendants from group l
+                                               it = t->tree[i].pcount.find(globaldata->Groups[l]);
+                                               //if it does subtract their percentage from u
+                                               if (it != t->tree[i].pcount.end()) {
+                                                       u -= (double) t->tree[i].pcount[globaldata->Groups[l]] / (double) tmap->seqsPerGroup[globaldata->Groups[l]];
+                                               }
+                                               
+                                               u = abs(u) * t->tree[i].getBranchLength();
+                                       
+                                               //save groupcombs u value
+                                               WScore[globaldata->Groups[b-1]+globaldata->Groups[l]] += u;
+                                       }
                                 }
                                 n++;
                         }
@@ -99,7 +133,12 @@ EstOutput Weighted::getValues(Tree* t) {
                 n = 1;
                 for (int i=1; i<numGroups; i++) { 
                         for (int l = n; l < numGroups; l++) {
-                               UN = (WScore[tmap->namesOfGroups[i-1]+tmap->namesOfGroups[l]] / D);
+                               //the user has not entered specific groups
+                               if (globaldata->Groups.size() == 0) {
+                                       UN = (WScore[tmap->namesOfGroups[i-1]+tmap->namesOfGroups[l]] / D);
+                               }else {//they have entered specific groups
+                                       UN = (WScore[globaldata->Groups[i-1]+globaldata->Groups[l]] / D);
+                               }
                                 if (isnan(UN) || isinf(UN)) { UN = 0; } 
                                 data.push_back(UN);
                         }
diff --git a/weighted.h b/weighted.h

index b0d443333d230b410d6a4f64c88c2ee0b18f2a61..7e4be7c6d0f4ebc95c7d3a224ba3c5e71a4e6d06 100644 (file)
--- a/weighted.h
+++ b/weighted.h
@@ -24,6 +24,7 @@ class Weighted : public TreeCalculator  {
                 EstOutput getValues(Tree*);
                 
         private:
+               GlobalData* globaldata;
                 EstOutput data;
                 TreeMap* tmap;
                 map<string, int>::iterator it;
author	westcott <westcott>
	Wed, 11 Feb 2009 18:14:23 +0000 (18:14 +0000)
committer	westcott <westcott>
	Wed, 11 Feb 2009 18:14:23 +0000 (18:14 +0000)
errorchecking.cpp		patch \| blob \| history
globaldata.cpp		patch \| blob \| history
helpcommand.cpp		patch \| blob \| history
treemap.cpp		patch \| blob \| history
treemap.h		patch \| blob \| history
unifracunweightedcommand.cpp		patch \| blob \| history
unifracweightedcommand.cpp		patch \| blob \| history
unweighted.cpp		patch \| blob \| history
unweighted.h		patch \| blob \| history
validcommands.cpp		patch \| blob \| history
validparameter.cpp		patch \| blob \| history
weighted.cpp		patch \| blob \| history
weighted.h		patch \| blob \| history