X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;f=mothur.h;h=fdaa06362db6ecda7054fe4ff9b21442487c19d4;hb=6777912b79eb6d011163da47f3ada09d1a9293c1;hp=c1d93ed197fe2990c24ca2ba0d89f52f8fe8320e;hpb=dc08123b7f14e2305e5bb2b3a8fcef96fc829b07;p=mothur.git diff --git a/mothur.h b/mothur.h index c1d93ed..fdaa063 100644 --- a/mothur.h +++ b/mothur.h @@ -1,7 +1,6 @@ #ifndef MOTHUR_H #define MOTHUR_H -using namespace std; /* @@ -22,6 +21,8 @@ using namespace std; #include #include #include +#include + //exception #include @@ -41,7 +42,39 @@ using namespace std; #include #include -typedef unsigned long long ull; +//misc +#include +#include +#include + +/***********************************************************************/ + +#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) + #include + #include + + #ifdef USE_READLINE + #include + #include + #endif + + //#include + //#include +#else + #include //allows unbuffered screen capture from stdin + #include //get cwd +#endif + +using namespace std; + +#define exp(x) (exp((double) x)) +#define sqrt(x) (sqrt((double) x)) +#define log10(x) (log10((double) x)) +#define log2(x) (log10(x)/log10(2)) +#define isnan(x) ((x) != (x)) +#define isinf(x) (fabs(x) == std::numeric_limits::infinity()) + +typedef unsigned long ull; struct IntNode { int lvalue; @@ -50,8 +83,38 @@ struct IntNode { int rcoef; IntNode* left; IntNode* right; -}; + IntNode(int lv, int rv, IntNode* l, IntNode* r) : lvalue(lv), rvalue(rv), left(l), right(r) {}; + IntNode() {}; +}; + +struct ThreadNode { + int* pid; + IntNode* left; + IntNode* right; +}; + +/************************************************************/ +struct clusterNode { + int numSeq; + int parent; + int smallChild; //used to make linkTable work with list and rabund. represents bin number of this cluster node + clusterNode(int num, int par, int kid) : numSeq(num), parent(par), smallChild(kid) {}; +}; +/************************************************************/ +struct seqDist { + int seq1; + int seq2; + float dist; + seqDist() {} + seqDist(int s1, int s2, float d) : seq1(s1), seq2(s2), dist(d) {} + ~seqDist() {} +}; +//******************************************************************************************************************** +//sorts lowest to highest +inline bool compareSequenceDistance(seqDist left, seqDist right){ + return (left.dist < right.dist); +} /***********************************************************************/ // snagged from http://www.parashift.com/c++-faq-lite/misc-technical-issues.html#faq-39.2 @@ -71,6 +134,20 @@ inline void convert(const string& s, T& x, bool failIfLeftoverChars = true){ if (!(i >> x) || (failIfLeftoverChars && i.get(c))) throw BadConversion(s); } + +//********************************************************************************************************************** + +template +inline bool convertTestFloat(const string& s, T& x, bool failIfLeftoverChars = true){ + istringstream i(s); + char c; + if (!(i >> x) || (failIfLeftoverChars && i.get(c))) + { + return false; + } + return true; +} + //********************************************************************************************************************** template @@ -79,7 +156,7 @@ inline bool convertTest(const string& s, T& x, bool failIfLeftoverChars = true){ char c; if (!(i >> x) || (failIfLeftoverChars && i.get(c))) { - cout << "'" << s << "' is unable to be converted into an integer.\n"; + cout << "unable to be converted into an integer.\n" << endl; return false; } return true; @@ -115,8 +192,20 @@ string toString(const T&x, int i){ return output.str(); } +/***********************************************************************/ +inline int openOutputFileAppend(string fileName, ofstream& fileHandle){ + + fileHandle.open(fileName.c_str(), ios::app); + if(!fileHandle) { + cout << "Error: Could not open " << fileName << endl; + return 1; + } + else { + return 0; + } +} /***********************************************************************/ inline void gobble(istream& f){ @@ -126,6 +215,106 @@ inline void gobble(istream& f){ f.putback(d); } +/***********************************************************************/ + +inline string getline(ifstream& fileHandle) { + try { + + string line = ""; + + while (!fileHandle.eof()) { + //get next character + char c = fileHandle.get(); + + //are you at the end of the line + if ((c == '\n') || (c == '\r') || (c == '\f')){ break; } + else { line += c; } + } + + return line; + + } + catch(exception& e) { + cout << "Error in mothur function getline" << endl; + exit(1); + } +} + +/**************************************************************************************************/ + +inline void mothurOut(string message) { + try{ + ofstream out; + string logFileName = "mothur.logFile"; + openOutputFileAppend(logFileName, out); + + cout << message; + out << message; + + out.close(); + } + catch(exception& e) { + cout << "Error in mothur class mothurOut" << endl; + exit(1); + } +} +/**************************************************************************************************/ + +inline void mothurOut(string message, string precision) { + try{ + ofstream out; + string logFileName = "mothur.logFile"; + openOutputFileAppend(logFileName, out); + + cout << precision << message; + out << precision << message; + + out.close(); + } + catch(exception& e) { + cout << "Error in mothur class mothurOut" << endl; + exit(1); + } +} + +/**************************************************************************************************/ + +inline void mothurOutEndLine() { + try { + ofstream out; + string logFileName = "mothur.logFile"; + openOutputFileAppend(logFileName, out); + + cout << endl; + out << endl; + + out.close(); + } + catch(exception& e) { + cout << "error in mothur mothurOutEndLine" << endl; + exit(1); + } +} + + +/**************************************************************************************************/ + +inline void errorOut(exception& e, string object, string function) { + + mothurOut("Error: "); + mothurOut(toString(e.what())); + mothurOut(" has occurred in the " + object + " class function " + function + ". Please contact Pat Schloss at mothur.bugs@gmail.com, and be sure to include the mothur.logFile with your inquiry."); + mothurOutEndLine(); + +} + +/***********************************************************************/ + +inline bool isTrue(string f){ + + if ((f == "TRUE") || (f == "T") || (f == "true") || (f == "t")) { return true; } + else { return false; } +} /***********************************************************************/ @@ -204,13 +393,21 @@ inline string getSimpleName(string longName){ string simpleName = longName; - if(longName.find_last_of("/") != longName.npos){ - int pos = longName.find_last_of('/')+1; - simpleName = longName.substr(pos, longName.length()); - } + size_t found; + found=longName.find_last_of("/\\"); + if(found != longName.npos){ + simpleName = longName.substr(found+1); + } + + //if(longName.find_last_of("/") != longName.npos){ + // int pos = longName.find_last_of('/')+1; + // simpleName = longName.substr(pos, longName.length()); + //} + return simpleName; } + /***********************************************************************/ inline int factorial(int num){ @@ -222,6 +419,13 @@ inline int factorial(int num){ return total; } +/************************************************************************************************** + +double min(double x, double y) +{ + if(x 0) { simpleCWD = cwd.substr(1); } + + //break apart the current working directory + vector dirs; + while (simpleCWD.find_first_of('/') != -1) { + string dir = simpleCWD.substr(0,simpleCWD.find_first_of('/')); + simpleCWD = simpleCWD.substr(simpleCWD.find_first_of('/')+1, simpleCWD.length()); + dirs.push_back(dir); + } + //get last one // ex. ../../../filename = /user/work/desktop/filename + dirs.push_back(simpleCWD); //ex. dirs[0] = user, dirs[1] = work, dirs[2] = desktop + + int index = dirs.size()-1; + + while((pos = path.rfind("./")) != -1) { //while you don't have a complete path + if (path[(pos-1)] == '.') { //you want your parent directory ../ + path = path.substr(0, pos-1); + index--; + if (index == 0) { break; } + }else if (path[(pos-1)] == '/') { //you want the current working dir ./ + path = path.substr(0, pos); + }else if (pos == 1) { break; + }else { mothurOut("cannot resolve path for " + fileName); mothurOutEndLine(); return fileName; } + } + + for (int i = index; i >= 0; i--) { + newFileName = dirs[i] + "/" + newFileName; + } + + newFileName = "/" + newFileName; + return newFileName; + + #else + if (path.rfind(".\\") == -1) { return fileName; } //already complete name + else { newFileName = fileName.substr(fileName.rfind(".\\")+2); } //save the complete part of the name + + char *cwdpath = NULL; + cwdpath = getcwd(NULL, 0); // or _getcwd + if ( cwdpath != NULL) { cwd = cwdpath; } + else { cwd = ""; } + + //break apart the current working directory + vector dirs; + while (cwd.find_first_of('\\') != -1) { + string dir = cwd.substr(0,cwd.find_first_of('\\')); + cwd = cwd.substr(cwd.find_first_of('\\')+1, cwd.length()); + dirs.push_back(dir); + + } + //get last one + dirs.push_back(cwd); //ex. dirs[0] = user, dirs[1] = work, dirs[2] = desktop + + int index = dirs.size()-1; + + while((pos = path.rfind(".\\")) != -1) { //while you don't have a complete path + if (path[(pos-1)] == '.') { //you want your parent directory ../ + path = path.substr(0, pos-1); + index--; + if (index == 0) { break; } + }else if (path[(pos-1)] == '\\') { //you want the current working dir ./ + path = path.substr(0, pos); + }else if (pos == 1) { break; + }else { mothurOut("cannot resolve path for " + fileName); mothurOutEndLine(); return fileName; } + } + + for (int i = index; i >= 0; i--) { + newFileName = dirs[i] + "\\" + newFileName; + } + + return newFileName; + + #endif + } + +} +/***********************************************************************/ + +inline int openInputFile(string fileName, ifstream& fileHandle, string m){ + + //get full path name + string completeFileName = getFullPathName(fileName); + + fileHandle.open(completeFileName.c_str()); + if(!fileHandle) { + return 1; + }else { + //check for blank file + gobble(fileHandle); + return 0; + } +} +/***********************************************************************/ + +inline int openInputFile(string fileName, ifstream& fileHandle){ + //get full path name + string completeFileName = getFullPathName(fileName); + + fileHandle.open(completeFileName.c_str()); + if(!fileHandle) { + mothurOut("Error: Could not open " + completeFileName); mothurOutEndLine(); return 1; } else { + //check for blank file + gobble(fileHandle); + if (fileHandle.eof()) { mothurOut(completeFileName + " is blank. Please correct."); mothurOutEndLine(); return 1; } + return 0; } } +/***********************************************************************/ + +inline int renameFile(string oldName, string newName){ + + ifstream inTest; + int exist = openInputFile(newName, inTest, ""); + +#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) + if (exist == 0) { //you could open it so you want to delete it + inTest.close(); + string command = "rm " + newName; + system(command.c_str()); + } + + string command = "mv " + oldName + " " + newName; + system(command.c_str()); +#else + remove(newName.c_str()); + renameOk = rename(oldName.c_str(), newName.c_str()); +#endif + return 0; +} /***********************************************************************/ inline int openOutputFile(string fileName, ofstream& fileHandle){ + + string completeFileName = getFullPathName(fileName); - fileHandle.open(fileName.c_str(), ios::trunc); + fileHandle.open(completeFileName.c_str(), ios::trunc); if(!fileHandle) { - cerr << "Error: Could not open " << fileName << endl; + mothurOut("Error: Could not open " + completeFileName); mothurOutEndLine(); return 1; } else { @@ -269,6 +663,25 @@ inline int openOutputFile(string fileName, ofstream& fileHandle){ /***********************************************************************/ +inline int getNumSeqs(ifstream& file){ + + int numSeqs = count(istreambuf_iterator(file),istreambuf_iterator(), '>'); + file.seekg(0); + return numSeqs; + +} +/***********************************************************************/ + +inline bool inVector(string member, vector group){ + + for (int i = 0; i < group.size(); i++) { + if (group[i] == member) { return true; } + } + + return false; +} +/***********************************************************************/ + //This function parses the estimator options and puts them in a vector inline void splitAtDash(string& estim, vector& container) { try { @@ -285,14 +698,9 @@ inline void splitAtDash(string& estim, vector& container) { container.push_back(estim); } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function splitAtDash. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; - exit(1); - } - catch(...) { - cout << "An unknown error has occurred in the mothur class function splitAtDash. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "splitAtDash"); exit(1); } - } /***********************************************************************/ @@ -312,14 +720,9 @@ inline void splitAtDash(string& estim, set& container) { container.insert(estim); } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function splitAtDash. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "splitAtDash"); exit(1); } - catch(...) { - cout << "An unknown error has occurred in the mothur class function splitAtDash. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; - exit(1); - } - } /***********************************************************************/ //This function parses the line options and puts them in a set @@ -341,14 +744,9 @@ inline void splitAtDash(string& estim, set& container) { container.insert(lineNum); } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function splitAtDash. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "splitAtDash"); exit(1); } - catch(...) { - cout << "An unknown error has occurred in the mothur class function splitAtDash. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; - exit(1); - } - } /***********************************************************************/ //This function parses the a string and puts peices in a vector @@ -367,11 +765,7 @@ inline void splitAtComma(string& estim, vector& container) { container.push_back(estim); } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function splitAtComma. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; - exit(1); - } - catch(...) { - cout << "An unknown error has occurred in the mothur class function splitAtComma. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "splitAtComma"); exit(1); } } @@ -390,14 +784,9 @@ inline void splitAtComma(string& prefix, string& suffix){ } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function splitAtComma. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "splitAtComma"); exit(1); } - catch(...) { - cout << "An unknown error has occurred in the mothur class function splitAtComma. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; - exit(1); - } - } /***********************************************************************/ @@ -415,14 +804,9 @@ inline void splitAtEquals(string& key, string& value){ } } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function splitAtEquals. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; - exit(1); - } - catch(...) { - cout << "An unknown error has occurred in the mothur class function splitAtEquals. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "splitAtEquals"); exit(1); } - } /**************************************************************************************************/ @@ -434,17 +818,228 @@ inline bool inUsersGroups(string groupname, vector Groups) { return false; } catch(exception& e) { - cout << "Standard Error: " << e.what() << " has occurred in the mothur class Function inUsersGroups. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; + errorOut(e, "mothur", "inUsersGroups"); exit(1); } - catch(...) { - cout << "An unknown error has occurred in the mothur class function inUsersGroups. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n"; +} + +/**************************************************************************************************/ + +inline void mothurOutJustToLog(string message) { + try { + ofstream out; + string logFileName = "mothur.logFile"; + openOutputFileAppend(logFileName, out); + + out << message; + + out.close(); + } + catch(exception& e) { + errorOut(e, "mothur", "mothurOutJustToLog"); + exit(1); + } +} + + +/**************************************************************************************************/ + +inline void mothurOut(float num) { + try { + ofstream out; + string logFileName = "mothur.logFile"; + openOutputFileAppend(logFileName, out); + + cout << num; + out << num; + + out.close(); + } + catch(exception& e) { + cout << "Error in mothur class mothurOut float" << endl; + exit(1); + } +} +/***********************************************************************/ +inline void mothurOut(double value) { + try { + ofstream out; + string logFileName = "mothur.logFile"; + openOutputFileAppend(logFileName, out); + + cout << value; + out << value; + + out.close(); + } + catch(exception& e) { + cout << "Error in mothur class mothurOut double" << endl; + exit(1); + } +} + +/***********************************************************************/ +//this function determines if the user has given us labels that are smaller than the given label. +//if so then it returns true so that the calling function can run the previous valid distance. +//it's a "smart" distance function. It also checks for invalid labels. +inline bool anyLabelsToProcess(string label, set& userLabels, string errorOff) { + try { + set::iterator it; + vector orderFloat; + map userMap; //the conversion process removes trailing 0's which we need to put back + map::iterator it2; + float labelFloat; + bool smaller = false; + + //unique is the smallest line + if (label == "unique") { return false; } + else { convert(label, labelFloat); } + + //go through users set and make them floats + for(it = userLabels.begin(); it != userLabels.end(); ++it) { + + float temp; + if ((*it != "unique") && (convertTestFloat(*it, temp) == true)){ + convert(*it, temp); + orderFloat.push_back(temp); + userMap[*it] = temp; + }else if (*it == "unique") { + orderFloat.push_back(-1.0); + userMap["unique"] = -1.0; + }else { + if (errorOff == "") { mothurOut(*it + " is not a valid label."); mothurOutEndLine(); } + userLabels.erase(*it); + it--; + } + } + + //sort order + sort(orderFloat.begin(), orderFloat.end()); + + /*************************************************/ + //is this label bigger than any of the users labels + /*************************************************/ + + //loop through order until you find a label greater than label + for (int i = 0; i < orderFloat.size(); i++) { + if (orderFloat[i] < labelFloat) { + smaller = true; + if (orderFloat[i] == -1) { + if (errorOff == "") { mothurOut("Your file does not include the label unique."); mothurOutEndLine(); } + userLabels.erase("unique"); + } + else { + if (errorOff == "") { mothurOut("Your file does not include the label "); mothurOutEndLine(); } + string s = ""; + for (it2 = userMap.begin(); it2!= userMap.end(); it2++) { + if (it2->second == orderFloat[i]) { + s = it2->first; + //remove small labels + userLabels.erase(s); + break; + } + } + if (errorOff == "") { mothurOut(s + ". I will use the next smallest distance. "); mothurOutEndLine(); } + } + //since they are sorted once you find a bigger one stop looking + }else { break; } + } + + return smaller; + + } + catch(exception& e) { + errorOut(e, "mothur", "anyLabelsToProcess"); exit(1); } } /**************************************************************************************************/ +inline void appendFiles(string temp, string filename) { + try{ + ofstream output; + ifstream input; + + //open output file in append mode + openOutputFileAppend(filename, output); + openInputFile(temp, input); + + while(char c = input.get()){ + if(input.eof()) { break; } + else { output << c; } + } + + input.close(); + output.close(); + } + catch(exception& e) { + errorOut(e, "mothur", "appendFiles"); + exit(1); + } +} +/**************************************************************************************************/ +inline string sortFile(string distFile){ + try { + string outfile = getRootName(distFile) + "sorted.dist"; + + //if you can, use the unix sort since its been optimized for years + #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) + string command = "sort -n -k +3 " + distFile + " -o " + outfile; + system(command.c_str()); + #else //you are stuck with my best attempt... + //windows sort does not have a way to specify a column, only a character in the line + //since we cannot assume that the distance will always be at the the same character location on each line + //due to variable sequence name lengths, I chose to force the distance into first position, then sort and then put it back. + + //read in file line by file and put distance first + string tempDistFile = distFile + ".temp"; + ifstream input; + ofstream output; + openInputFile(distFile, input); + openOutputFile(tempDistFile, output); + string firstName, secondName; + float dist; + while (input) { + input >> firstName >> secondName >> dist; + output << dist << '\t' << firstName << '\t' << secondName << endl; + gobble(input); + } + input.close(); + output.close(); + + + //sort using windows sort + string tempOutfile = outfile + ".temp"; + string command = "sort " + tempDistFile + " /O " + tempOutfile; + system(command.c_str()); + + //read in sorted file and put distance at end again + ifstream input2; + openInputFile(tempOutfile, input2); + openOutputFile(outfile, output); + + while (input2) { + input2 >> dist >> firstName >> secondName; + output << firstName << '\t' << secondName << '\t' << dist << endl; + gobble(input2); + } + input2.close(); + output.close(); + + //remove temp files + remove(tempDistFile.c_str()); + remove(tempOutfile.c_str()); + #endif + + return outfile; + } + catch(exception& e) { + errorOut(e, "mothur", "sortFile"); + exit(1); + } +} +/**************************************************************************************************/ #endif