5 * Created by westcott on 2/25/10.
6 * Copyright 2010 Schloss Lab. All rights reserved.
10 #include "mothurout.h"
13 /******************************************************/
14 MothurOut* MothurOut::getInstance() {
15 if( _uniqueInstance == 0) {
16 _uniqueInstance = new MothurOut();
18 return _uniqueInstance;
20 /*********************************************************************************************/
21 set<string> MothurOut::getCurrentTypes() {
25 types.insert("fasta");
26 types.insert("accnos");
27 types.insert("column");
28 types.insert("design");
29 types.insert("group");
32 types.insert("oligos");
33 types.insert("order");
34 types.insert("ordergroup");
35 types.insert("phylip");
36 types.insert("qfile");
37 types.insert("relabund");
38 types.insert("sabund");
39 types.insert("rabund");
41 types.insert("shared");
42 types.insert("taxonomy");
46 types.insert("counttable");
47 types.insert("processors");
52 errorOut(e, "MothurOut", "getCurrentTypes");
56 /*********************************************************************************************/
57 void MothurOut::printCurrentFiles() {
61 if (accnosfile != "") { mothurOut("accnos=" + accnosfile); mothurOutEndLine(); }
62 if (columnfile != "") { mothurOut("column=" + columnfile); mothurOutEndLine(); }
63 if (designfile != "") { mothurOut("design=" + designfile); mothurOutEndLine(); }
64 if (fastafile != "") { mothurOut("fasta=" + fastafile); mothurOutEndLine(); }
65 if (groupfile != "") { mothurOut("group=" + groupfile); mothurOutEndLine(); }
66 if (listfile != "") { mothurOut("list=" + listfile); mothurOutEndLine(); }
67 if (namefile != "") { mothurOut("name=" + namefile); mothurOutEndLine(); }
68 if (oligosfile != "") { mothurOut("oligos=" + oligosfile); mothurOutEndLine(); }
69 if (orderfile != "") { mothurOut("order=" + orderfile); mothurOutEndLine(); }
70 if (ordergroupfile != "") { mothurOut("ordergroup=" + ordergroupfile); mothurOutEndLine(); }
71 if (phylipfile != "") { mothurOut("phylip=" + phylipfile); mothurOutEndLine(); }
72 if (qualfile != "") { mothurOut("qfile=" + qualfile); mothurOutEndLine(); }
73 if (rabundfile != "") { mothurOut("rabund=" + rabundfile); mothurOutEndLine(); }
74 if (relabundfile != "") { mothurOut("relabund=" + relabundfile); mothurOutEndLine(); }
75 if (sabundfile != "") { mothurOut("sabund=" + sabundfile); mothurOutEndLine(); }
76 if (sfffile != "") { mothurOut("sff=" + sfffile); mothurOutEndLine(); }
77 if (sharedfile != "") { mothurOut("shared=" + sharedfile); mothurOutEndLine(); }
78 if (taxonomyfile != "") { mothurOut("taxonomy=" + taxonomyfile); mothurOutEndLine(); }
79 if (treefile != "") { mothurOut("tree=" + treefile); mothurOutEndLine(); }
80 if (flowfile != "") { mothurOut("flow=" + flowfile); mothurOutEndLine(); }
81 if (biomfile != "") { mothurOut("biom=" + biomfile); mothurOutEndLine(); }
82 if (counttablefile != "") { mothurOut("counttable=" + counttablefile); mothurOutEndLine(); }
83 if (processors != "1") { mothurOut("processors=" + processors); mothurOutEndLine(); }
87 errorOut(e, "MothurOut", "printCurrentFiles");
91 /*********************************************************************************************/
92 bool MothurOut::hasCurrentFiles() {
94 bool hasCurrent = false;
96 if (accnosfile != "") { return true; }
97 if (columnfile != "") { return true; }
98 if (designfile != "") { return true; }
99 if (fastafile != "") { return true; }
100 if (groupfile != "") { return true; }
101 if (listfile != "") { return true; }
102 if (namefile != "") { return true; }
103 if (oligosfile != "") { return true; }
104 if (orderfile != "") { return true; }
105 if (ordergroupfile != "") { return true; }
106 if (phylipfile != "") { return true; }
107 if (qualfile != "") { return true; }
108 if (rabundfile != "") { return true; }
109 if (relabundfile != "") { return true; }
110 if (sabundfile != "") { return true; }
111 if (sfffile != "") { return true; }
112 if (sharedfile != "") { return true; }
113 if (taxonomyfile != "") { return true; }
114 if (treefile != "") { return true; }
115 if (flowfile != "") { return true; }
116 if (biomfile != "") { return true; }
117 if (counttablefile != "") { return true; }
118 if (processors != "1") { return true; }
123 catch(exception& e) {
124 errorOut(e, "MothurOut", "hasCurrentFiles");
129 /*********************************************************************************************/
130 void MothurOut::clearCurrentFiles() {
156 catch(exception& e) {
157 errorOut(e, "MothurOut", "clearCurrentFiles");
161 /***********************************************************************/
162 string MothurOut::findProgramPath(string programName){
165 string envPath = getenv("PATH");
168 //delimiting path char
170 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
176 //break apart path variable by ':'
178 splitAtChar(envPath, dirs, delim);
180 if (debug) { mothurOut("[DEBUG]: dir's in path: \n"); }
182 //get path related to mothur
183 for (int i = 0; i < dirs.size(); i++) {
185 if (debug) { mothurOut("[DEBUG]: " + dirs[i] + "\n"); }
187 //to lower so we can find it
188 string tempLower = "";
189 for (int j = 0; j < dirs[i].length(); j++) { tempLower += tolower(dirs[i][j]); }
191 //is this mothurs path?
192 if (tempLower.find(programName) != -1) { pPath = dirs[i]; break; }
195 if (debug) { mothurOut("[DEBUG]: programPath = " + pPath + "\n"); }
198 //add programName so it looks like what argv would look like
199 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
200 pPath += "/" + programName;
202 pPath += "\\" + programName;
205 //okay programName is not in the path, so the folder programName is in must be in the path
206 //lets find out which one
208 //get path related to the program
209 for (int i = 0; i < dirs.size(); i++) {
211 if (debug) { mothurOut("[DEBUG]: looking in " + dirs[i] + " for " + programName + " \n"); }
213 //is this the programs path?
215 string tempIn = dirs[i];
216 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
217 tempIn += "/" + programName;
219 tempIn += "\\" + programName;
221 openInputFile(tempIn, in, "");
223 //if this file exists
224 if (in) { in.close(); pPath = tempIn; if (debug) { mothurOut("[DEBUG]: found it, programPath = " + pPath + "\n"); } break; }
231 catch(exception& e) {
232 errorOut(e, "MothurOut", "findProgramPath");
236 /*********************************************************************************************/
237 void MothurOut::setFileName(string filename) {
239 logFileName = filename;
243 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
245 if (pid == 0) { //only one process should output to screen
248 openOutputFile(filename, out);
254 catch(exception& e) {
255 errorOut(e, "MothurOut", "setFileName");
259 /*********************************************************************************************/
260 void MothurOut::setDefaultPath(string pathname) {
263 //add / to name if needed
264 string lastChar = pathname.substr(pathname.length()-1);
265 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
266 if (lastChar != "/") { pathname += "/"; }
268 if (lastChar != "\\") { pathname += "\\"; }
271 defaultPath = pathname;
274 catch(exception& e) {
275 errorOut(e, "MothurOut", "setDefaultPath");
279 /*********************************************************************************************/
280 void MothurOut::setOutputDir(string pathname) {
282 outputDir = pathname;
284 catch(exception& e) {
285 errorOut(e, "MothurOut", "setOutputDir");
289 /*********************************************************************************************/
290 void MothurOut::closeLog() {
295 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
297 if (pid == 0) { //only one process should output to screen
306 catch(exception& e) {
307 errorOut(e, "MothurOut", "closeLog");
312 /*********************************************************************************************/
313 MothurOut::~MothurOut() {
318 catch(exception& e) {
319 errorOut(e, "MothurOut", "MothurOut");
323 /*********************************************************************************************/
324 void MothurOut::mothurOut(string output) {
329 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
331 if (pid == 0) { //only one process should output to screen
341 catch(exception& e) {
342 errorOut(e, "MothurOut", "MothurOut");
346 /*********************************************************************************************/
347 void MothurOut::mothurOutEndLine() {
351 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
353 if (pid == 0) { //only one process should output to screen
363 catch(exception& e) {
364 errorOut(e, "MothurOut", "MothurOutEndLine");
368 /*********************************************************************************************/
369 void MothurOut::mothurOut(string output, ofstream& outputFile) {
374 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
376 if (pid == 0) { //only one process should output to screen
381 outputFile << output;
389 catch(exception& e) {
390 errorOut(e, "MothurOut", "MothurOut");
394 /*********************************************************************************************/
395 void MothurOut::mothurOutEndLine(ofstream& outputFile) {
399 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
401 if (pid == 0) { //only one process should output to screen
412 catch(exception& e) {
413 errorOut(e, "MothurOut", "MothurOutEndLine");
417 /*********************************************************************************************/
418 void MothurOut::mothurOutJustToLog(string output) {
422 MPI_Comm_rank(MPI_COMM_WORLD, &pid);
424 if (pid == 0) { //only one process should output to screen
433 catch(exception& e) {
434 errorOut(e, "MothurOut", "MothurOutJustToLog");
438 /*********************************************************************************************/
439 void MothurOut::errorOut(exception& e, string object, string function) {
441 //mem_usage(vm, rss);
443 mothurOut("[ERROR]: ");
444 mothurOut(toString(e.what()));
445 mothurOut(" has occurred in the " + object + " class function " + function + ". Please contact Pat Schloss at mothur.bugs@gmail.com, and be sure to include the mothur.logFile with your inquiry.");
448 /*********************************************************************************************/
449 //The following was originally from http://stackoverflow.com/questions/669438/how-to-get-memory-usage-at-run-time-in-c
450 // process_mem_usage(double &, double &) - takes two doubles by reference,
451 // attempts to read the system-dependent data for a process' virtual memory
452 // size and resident set size, and return the results in KB.
454 // On failure, returns 0.0, 0.0
455 int MothurOut::mem_usage(double& vm_usage, double& resident_set) {
456 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
461 // 'file' stat seems to give the most reliable results
463 ifstream stat_stream("/proc/self/stat",ios_base::in);
465 // dummy vars for leading entries in stat that we don't care about
467 string pid, comm, state, ppid, pgrp, session, tty_nr;
468 string tpgid, flags, minflt, cminflt, majflt, cmajflt;
469 string utime, stime, cutime, cstime, priority, nice;
470 string O, itrealvalue, starttime;
472 // the two fields we want
477 stat_stream >> pid >> comm >> state >> ppid >> pgrp >> session >> tty_nr
478 >> tpgid >> flags >> minflt >> cminflt >> majflt >> cmajflt
479 >> utime >> stime >> cutime >> cstime >> priority >> nice
480 >> O >> itrealvalue >> starttime >> vsize >> rss; // don't care about the rest
482 long page_size_kb = sysconf(_SC_PAGE_SIZE) / 1024; // in case x86-64 is configured to use 2MB pages
483 vm_usage = vsize / 1024.0;
484 resident_set = rss * page_size_kb;
486 mothurOut("Memory Usage: vm = " + toString(vm_usage) + " rss = " + toString(resident_set) + "\n");
490 /* //windows memory usage
491 // Get the list of process identifiers.
492 DWORD aProcesses[1024], cbNeeded, cProcesses;
494 if ( !EnumProcesses( aProcesses, sizeof(aProcesses), &cbNeeded ) ){ return 1; }
496 // Calculate how many process identifiers were returned.
497 cProcesses = cbNeeded / sizeof(DWORD);
499 // Print the memory usage for each process
500 for (int i = 0; i < cProcesses; i++ ) {
501 DWORD processID = aProcesses[i];
503 PROCESS_MEMORY_COUNTERS pmc;
505 HANDLE hProcess = OpenProcess((PROCESS_QUERY_INFORMATION | PROCESS_VM_READ), FALSE, processID);
507 // Print the process identifier.
508 printf( "\nProcess ID: %u\n", processID);
510 if (NULL != hProcess) {
512 if ( GetProcessMemoryInfo( hProcess, &pmc, sizeof(pmc)) ) {
513 printf( "\tPageFaultCount: 0x%08X\n", pmc.PageFaultCount );
514 printf( "\tPeakWorkingSetSize: 0x%08X\n", pmc.PeakWorkingSetSize );
515 printf( "\tWorkingSetSize: 0x%08X\n", pmc.WorkingSetSize );
516 printf( "\tQuotaPeakPagedPoolUsage: 0x%08X\n", pmc.QuotaPeakPagedPoolUsage );
517 printf( "\tQuotaPagedPoolUsage: 0x%08X\n", pmc.QuotaPagedPoolUsage );
518 printf( "\tQuotaPeakNonPagedPoolUsage: 0x%08X\n", pmc.QuotaPeakNonPagedPoolUsage );
519 printf( "\tQuotaNonPagedPoolUsage: 0x%08X\n", pmc.QuotaNonPagedPoolUsage );
520 printf( "\tPagefileUsage: 0x%08X\n", pmc.PagefileUsage );
521 printf( "\tPeakPagefileUsage: 0x%08X\n", pmc.PeakPagefileUsage );
523 CloseHandle(hProcess);
533 /***********************************************************************/
534 int MothurOut::openOutputFileAppend(string fileName, ofstream& fileHandle){
536 fileName = getFullPathName(fileName);
538 fileHandle.open(fileName.c_str(), ios::app);
540 mothurOut("[ERROR]: Could not open " + fileName); mothurOutEndLine();
547 catch(exception& e) {
548 errorOut(e, "MothurOut", "openOutputFileAppend");
552 /***********************************************************************/
553 void MothurOut::gobble(istream& f){
557 while(isspace(d=f.get())) { ;}
558 if(!f.eof()) { f.putback(d); }
560 catch(exception& e) {
561 errorOut(e, "MothurOut", "gobble");
565 /***********************************************************************/
566 void MothurOut::gobble(istringstream& f){
569 while(isspace(d=f.get())) {;}
570 if(!f.eof()) { f.putback(d); }
572 catch(exception& e) {
573 errorOut(e, "MothurOut", "gobble");
578 /***********************************************************************/
580 string MothurOut::getline(istringstream& fileHandle) {
585 while (!fileHandle.eof()) {
587 char c = fileHandle.get();
589 //are you at the end of the line
590 if ((c == '\n') || (c == '\r') || (c == '\f')){ break; }
597 catch(exception& e) {
598 errorOut(e, "MothurOut", "getline");
602 /***********************************************************************/
604 string MothurOut::getline(ifstream& fileHandle) {
611 char c = fileHandle.get();
613 //are you at the end of the line
614 if ((c == '\n') || (c == '\r') || (c == '\f') || (c == EOF)){ break; }
621 catch(exception& e) {
622 errorOut(e, "MothurOut", "getline");
626 /***********************************************************************/
628 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
629 #ifdef USE_COMPRESSION
630 inline bool endsWith(string s, const char * suffix){
631 size_t suffixLength = strlen(suffix);
632 return s.size() >= suffixLength && s.substr(s.size() - suffixLength, suffixLength).compare(suffix) == 0;
637 string MothurOut::getRootName(string longName){
640 string rootName = longName;
642 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
643 #ifdef USE_COMPRESSION
644 if (endsWith(rootName, ".gz") || endsWith(rootName, ".bz2")) {
645 int pos = rootName.find_last_of('.');
646 rootName = rootName.substr(0, pos);
647 cerr << "shortening " << longName << " to " << rootName << "\n";
651 if(rootName.find_last_of(".") != rootName.npos){
652 int pos = rootName.find_last_of('.')+1;
653 rootName = rootName.substr(0, pos);
658 catch(exception& e) {
659 errorOut(e, "MothurOut", "getRootName");
663 /***********************************************************************/
665 string MothurOut::getSimpleName(string longName){
667 string simpleName = longName;
670 found=longName.find_last_of("/\\");
672 if(found != longName.npos){
673 simpleName = longName.substr(found+1);
678 catch(exception& e) {
679 errorOut(e, "MothurOut", "getSimpleName");
684 /***********************************************************************/
686 int MothurOut::getRandomIndex(int highest){
689 int random = (int) ((float)(highest+1) * (float)(rand()) / ((float)RAND_MAX+1.0));
693 catch(exception& e) {
694 errorOut(e, "MothurOut", "getRandomIndex");
699 /**********************************************************************/
701 string MothurOut::getPathName(string longName){
703 string rootPathName = longName;
705 if(longName.find_last_of("/\\") != longName.npos){
706 int pos = longName.find_last_of("/\\")+1;
707 rootPathName = longName.substr(0, pos);
712 catch(exception& e) {
713 errorOut(e, "MothurOut", "getPathName");
718 /***********************************************************************/
720 bool MothurOut::dirCheck(string& dirName){
726 MPI_Comm_rank(MPI_COMM_WORLD, &pid); //find out who we are
731 //add / to name if needed
732 string lastChar = dirName.substr(dirName.length()-1);
733 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
734 if (lastChar != "/") { dirName += "/"; }
736 if (lastChar != "\\") { dirName += "\\"; }
739 //test to make sure directory exists
740 dirName = getFullPathName(dirName);
741 string outTemp = dirName + tag + "temp";
743 out.open(outTemp.c_str(), ios::trunc);
745 mothurOut(dirName + " directory does not exist or is not writable."); mothurOutEndLine();
748 mothurRemove(outTemp);
754 catch(exception& e) {
755 errorOut(e, "MothurOut", "dirCheck");
760 /***********************************************************************/
762 string MothurOut::hasPath(string longName){
767 found=longName.find_last_of("~/\\");
769 if(found != longName.npos){
770 path = longName.substr(0, found+1);
775 catch(exception& e) {
776 errorOut(e, "MothurOut", "hasPath");
781 /***********************************************************************/
783 string MothurOut::getExtension(string longName){
785 string extension = "";
787 if(longName.find_last_of('.') != longName.npos){
788 int pos = longName.find_last_of('.');
789 extension = longName.substr(pos, longName.length());
794 catch(exception& e) {
795 errorOut(e, "MothurOut", "getExtension");
799 /***********************************************************************/
800 bool MothurOut::isBlank(string fileName){
803 fileName = getFullPathName(fileName);
806 fileHandle.open(fileName.c_str());
808 mothurOut("[ERROR]: Could not open " + fileName); mothurOutEndLine();
811 //check for blank file
813 if (fileHandle.eof()) { fileHandle.close(); return true; }
818 catch(exception& e) {
819 errorOut(e, "MothurOut", "isBlank");
823 /***********************************************************************/
825 string MothurOut::getFullPathName(string fileName){
828 string path = hasPath(fileName);
832 if (path == "") { return fileName; } //its a simple name
833 else { //we need to complete the pathname
834 // ex. ../../../filename
835 // cwd = /user/work/desktop
838 //get current working directory
839 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
841 if (path.find("~") != -1) { //go to home directory
844 char *homepath = NULL;
845 homepath = getenv ("HOME");
846 if ( homepath != NULL) { homeDir = homepath; }
847 else { homeDir = ""; }
849 newFileName = homeDir + fileName.substr(fileName.find("~")+1);
852 if (path.rfind("./") == string::npos) { return fileName; } //already complete name
853 else { newFileName = fileName.substr(fileName.rfind("./")+2); } //save the complete part of the name
855 //char* cwdpath = new char[1024];
857 //cwdpath=getcwd(cwdpath,size);
860 char *cwdpath = NULL;
861 cwdpath = getcwd(NULL, 0); // or _getcwd
862 if ( cwdpath != NULL) { cwd = cwdpath; }
868 if (cwd.length() > 0) { simpleCWD = cwd.substr(1); }
870 //break apart the current working directory
872 while (simpleCWD.find_first_of('/') != string::npos) {
873 string dir = simpleCWD.substr(0,simpleCWD.find_first_of('/'));
874 simpleCWD = simpleCWD.substr(simpleCWD.find_first_of('/')+1, simpleCWD.length());
877 //get last one // ex. ../../../filename = /user/work/desktop/filename
878 dirs.push_back(simpleCWD); //ex. dirs[0] = user, dirs[1] = work, dirs[2] = desktop
881 int index = dirs.size()-1;
883 while((pos = path.rfind("./")) != string::npos) { //while you don't have a complete path
884 if (pos == 0) { break; //you are at the end
885 }else if (path[(pos-1)] == '.') { //you want your parent directory ../
886 path = path.substr(0, pos-1);
888 if (index == 0) { break; }
889 }else if (path[(pos-1)] == '/') { //you want the current working dir ./
890 path = path.substr(0, pos);
891 }else if (pos == 1) { break; //you are at the end
892 }else { mothurOut("cannot resolve path for " + fileName + "\n"); return fileName; }
895 for (int i = index; i >= 0; i--) {
896 newFileName = dirs[i] + "/" + newFileName;
899 newFileName = "/" + newFileName;
903 if (path.find("~") != string::npos) { //go to home directory
904 string homeDir = getenv ("HOMEPATH");
905 newFileName = homeDir + fileName.substr(fileName.find("~")+1);
908 if (path.rfind(".\\") == string::npos) { return fileName; } //already complete name
909 else { newFileName = fileName.substr(fileName.rfind(".\\")+2); } //save the complete part of the name
911 char *cwdpath = NULL;
912 cwdpath = getcwd(NULL, 0); // or _getcwd
913 if ( cwdpath != NULL) { cwd = cwdpath; }
916 //break apart the current working directory
918 while (cwd.find_first_of('\\') != -1) {
919 string dir = cwd.substr(0,cwd.find_first_of('\\'));
920 cwd = cwd.substr(cwd.find_first_of('\\')+1, cwd.length());
925 dirs.push_back(cwd); //ex. dirs[0] = user, dirs[1] = work, dirs[2] = desktop
927 int index = dirs.size()-1;
929 while((pos = path.rfind(".\\")) != string::npos) { //while you don't have a complete path
930 if (pos == 0) { break; //you are at the end
931 }else if (path[(pos-1)] == '.') { //you want your parent directory ../
932 path = path.substr(0, pos-1);
934 if (index == 0) { break; }
935 }else if (path[(pos-1)] == '\\') { //you want the current working dir ./
936 path = path.substr(0, pos);
937 }else if (pos == 1) { break; //you are at the end
938 }else { mothurOut("cannot resolve path for " + fileName + "\n"); return fileName; }
941 for (int i = index; i >= 0; i--) {
942 newFileName = dirs[i] + "\\" + newFileName;
951 catch(exception& e) {
952 errorOut(e, "MothurOut", "getFullPathName");
956 /***********************************************************************/
958 int MothurOut::openInputFile(string fileName, ifstream& fileHandle, string m){
961 string completeFileName = getFullPathName(fileName);
962 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
963 #ifdef USE_COMPRESSION
964 // check for gzipped or bzipped file
965 if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
966 string tempName = string(tmpnam(0));
967 mkfifo(tempName.c_str(), 0666);
968 int fork_result = fork();
969 if (fork_result < 0) {
970 cerr << "Error forking.\n";
972 } else if (fork_result == 0) {
973 string command = (endsWith(completeFileName, ".gz") ? "zcat " : "bzcat ") + completeFileName + string(" > ") + tempName;
974 cerr << "Decompressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
975 system(command.c_str());
976 cerr << "Done decompressing " << completeFileName << "\n";
977 mothurRemove(tempName);
980 cerr << "waiting on child process " << fork_result << "\n";
981 completeFileName = tempName;
986 fileHandle.open(completeFileName.c_str());
988 //mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
991 //check for blank file
996 catch(exception& e) {
997 errorOut(e, "MothurOut", "openInputFile - no Error");
1001 /***********************************************************************/
1003 int MothurOut::openInputFile(string fileName, ifstream& fileHandle){
1006 //get full path name
1007 string completeFileName = getFullPathName(fileName);
1008 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
1009 #ifdef USE_COMPRESSION
1010 // check for gzipped or bzipped file
1011 if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
1012 string tempName = string(tmpnam(0));
1013 mkfifo(tempName.c_str(), 0666);
1014 int fork_result = fork();
1015 if (fork_result < 0) {
1016 cerr << "Error forking.\n";
1018 } else if (fork_result == 0) {
1019 string command = (endsWith(completeFileName, ".gz") ? "zcat " : "bzcat ") + completeFileName + string(" > ") + tempName;
1020 cerr << "Decompressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
1021 system(command.c_str());
1022 cerr << "Done decompressing " << completeFileName << "\n";
1023 mothurRemove(tempName);
1026 cerr << "waiting on child process " << fork_result << "\n";
1027 completeFileName = tempName;
1033 fileHandle.open(completeFileName.c_str());
1035 mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
1039 //check for blank file
1041 if (fileHandle.eof()) { mothurOut("[ERROR]: " + completeFileName + " is blank. Please correct."); mothurOutEndLine(); }
1046 catch(exception& e) {
1047 errorOut(e, "MothurOut", "openInputFile");
1051 /***********************************************************************/
1053 int MothurOut::renameFile(string oldName, string newName){
1056 int exist = openInputFile(newName, inTest, "");
1059 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
1060 if (exist == 0) { //you could open it so you want to delete it
1061 string command = "rm " + newName;
1062 system(command.c_str());
1065 string command = "mv " + oldName + " " + newName;
1066 system(command.c_str());
1068 mothurRemove(newName);
1069 int renameOk = rename(oldName.c_str(), newName.c_str());
1074 catch(exception& e) {
1075 errorOut(e, "MothurOut", "renameFile");
1080 /***********************************************************************/
1082 int MothurOut::openOutputFile(string fileName, ofstream& fileHandle){
1085 string completeFileName = getFullPathName(fileName);
1086 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
1087 #ifdef USE_COMPRESSION
1088 // check for gzipped file
1089 if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
1090 string tempName = string(tmpnam(0));
1091 mkfifo(tempName.c_str(), 0666);
1092 cerr << "Compressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
1093 int fork_result = fork();
1094 if (fork_result < 0) {
1095 cerr << "Error forking.\n";
1097 } else if (fork_result == 0) {
1098 string command = string(endsWith(completeFileName, ".gz") ? "gzip" : "bzip2") + " -v > " + completeFileName + string(" < ") + tempName;
1099 system(command.c_str());
1102 completeFileName = tempName;
1107 fileHandle.open(completeFileName.c_str(), ios::trunc);
1109 mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
1116 catch(exception& e) {
1117 errorOut(e, "MothurOut", "openOutputFile");
1123 /**************************************************************************************************/
1124 int MothurOut::appendFiles(string temp, string filename) {
1129 //open output file in append mode
1130 openOutputFileAppend(filename, output);
1131 int ableToOpen = openInputFile(temp, input, "no error");
1132 //int ableToOpen = openInputFile(temp, input);
1135 if (ableToOpen == 0) { //you opened it
1138 while (!input.eof()) {
1139 input.read(buffer, 4096);
1140 output.write(buffer, input.gcount());
1141 //count number of lines
1142 for (int i = 0; i < input.gcount(); i++) { if (buffer[i] == '\n') {numLines++;} }
1151 catch(exception& e) {
1152 errorOut(e, "MothurOut", "appendFiles");
1157 /**************************************************************************************************/
1158 string MothurOut::sortFile(string distFile, string outputDir){
1161 //if (outputDir == "") { outputDir += hasPath(distFile); }
1162 string outfile = getRootName(distFile) + "sorted.dist";
1165 //if you can, use the unix sort since its been optimized for years
1166 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
1167 string command = "sort -n -k +3 " + distFile + " -o " + outfile;
1168 system(command.c_str());
1169 #else //you are stuck with my best attempt...
1170 //windows sort does not have a way to specify a column, only a character in the line
1171 //since we cannot assume that the distance will always be at the the same character location on each line
1172 //due to variable sequence name lengths, I chose to force the distance into first position, then sort and then put it back.
1174 //read in file line by file and put distance first
1175 string tempDistFile = distFile + ".temp";
1178 openInputFile(distFile, input);
1179 openOutputFile(tempDistFile, output);
1181 string firstName, secondName;
1184 input >> firstName >> secondName >> dist;
1185 output << dist << '\t' << firstName << '\t' << secondName << endl;
1192 //sort using windows sort
1193 string tempOutfile = outfile + ".temp";
1194 string command = "sort " + tempDistFile + " /O " + tempOutfile;
1195 system(command.c_str());
1197 //read in sorted file and put distance at end again
1199 openInputFile(tempOutfile, input2);
1200 openOutputFile(outfile, output);
1203 input2 >> dist >> firstName >> secondName;
1204 output << firstName << '\t' << secondName << '\t' << dist << endl;
1211 mothurRemove(tempDistFile);
1212 mothurRemove(tempOutfile);
1217 catch(exception& e) {
1218 errorOut(e, "MothurOut", "sortFile");
1222 /**************************************************************************************************/
1223 vector<unsigned long long> MothurOut::setFilePosFasta(string filename, int& num) {
1225 vector<unsigned long long> positions;
1227 //openInputFile(filename, inFASTA);
1228 inFASTA.open(filename.c_str(), ios::binary);
1231 unsigned long long count = 0;
1232 while(!inFASTA.eof()){
1233 //input = getline(inFASTA);
1234 //cout << input << '\t' << inFASTA.tellg() << endl;
1235 //if (input.length() != 0) {
1236 // if(input[0] == '>'){ unsigned long int pos = inFASTA.tellg(); positions.push_back(pos - input.length() - 1); cout << (pos - input.length() - 1) << endl; }
1238 //gobble(inFASTA); //has to be here since windows line endings are 2 characters and mess up the positions
1239 char c = inFASTA.get(); count++;
1241 positions.push_back(count-1);
1242 //cout << count << endl;
1247 num = positions.size();
1252 //get num bytes in file
1253 pFile = fopen (filename.c_str(),"rb");
1254 if (pFile==NULL) perror ("Error opening file");
1256 fseek (pFile, 0, SEEK_END);
1261 unsigned long long size = positions[(positions.size()-1)];
1263 openInputFile(filename, in);
1268 if(in.eof()) { break; }
1273 positions.push_back(size);
1278 catch(exception& e) {
1279 errorOut(e, "MothurOut", "setFilePosFasta");
1283 /**************************************************************************************************/
1284 vector<unsigned long long> MothurOut::setFilePosEachLine(string filename, int& num) {
1286 filename = getFullPathName(filename);
1288 vector<unsigned long long> positions;
1290 //openInputFile(filename, in);
1291 in.open(filename.c_str(), ios::binary);
1294 unsigned long long count = 0;
1295 positions.push_back(0);
1298 //getline counting reads
1299 char d = in.get(); count++;
1300 while ((d != '\n') && (d != '\r') && (d != '\f') && (d != in.eof())) {
1301 //get next character
1307 d=in.get(); count++;
1308 while(isspace(d) && (d != in.eof())) { d=in.get(); count++;}
1310 positions.push_back(count-1);
1311 //cout << count-1 << endl;
1315 num = positions.size()-1;
1318 unsigned long long size;
1320 //get num bytes in file
1321 pFile = fopen (filename.c_str(),"rb");
1322 if (pFile==NULL) perror ("Error opening file");
1324 fseek (pFile, 0, SEEK_END);
1329 positions[(positions.size()-1)] = size;
1333 catch(exception& e) {
1334 errorOut(e, "MothurOut", "setFilePosEachLine");
1338 /**************************************************************************************************/
1340 vector<unsigned long long> MothurOut::divideFile(string filename, int& proc) {
1342 vector<unsigned long long> filePos;
1343 filePos.push_back(0);
1346 unsigned long long size;
1348 filename = getFullPathName(filename);
1350 //get num bytes in file
1351 pFile = fopen (filename.c_str(),"rb");
1352 if (pFile==NULL) perror ("Error opening file");
1354 fseek (pFile, 0, SEEK_END);
1359 #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix)
1361 //estimate file breaks
1362 unsigned long long chunkSize = 0;
1363 chunkSize = size / proc;
1365 //file to small to divide by processors
1366 if (chunkSize == 0) { proc = 1; filePos.push_back(size); return filePos; }
1368 //for each process seekg to closest file break and search for next '>' char. make that the filebreak
1369 for (int i = 0; i < proc; i++) {
1370 unsigned long long spot = (i+1) * chunkSize;
1373 openInputFile(filename, in);
1377 unsigned long long newSpot = spot;
1381 if (c == '>') { in.putback(c); newSpot = in.tellg(); break; }
1382 else if (int(c) == -1) { break; }
1386 //there was not another sequence before the end of the file
1387 unsigned long long sanityPos = in.tellg();
1389 if (sanityPos == -1) { break; }
1390 else { filePos.push_back(newSpot); }
1396 filePos.push_back(size);
1398 //sanity check filePos
1399 for (int i = 0; i < (filePos.size()-1); i++) {
1400 if (filePos[(i+1)] <= filePos[i]) { filePos.erase(filePos.begin()+(i+1)); i--; }
1403 proc = (filePos.size() - 1);
1405 mothurOut("[ERROR]: Windows version should not be calling the divideFile function."); mothurOutEndLine();
1407 filePos.push_back(size);
1411 catch(exception& e) {
1412 errorOut(e, "MothurOut", "divideFile");
1416 /**************************************************************************************************/
1417 int MothurOut::divideFile(string filename, int& proc, vector<string>& files) {
1420 vector<unsigned long long> filePos = divideFile(filename, proc);
1422 for (int i = 0; i < (filePos.size()-1); i++) {
1426 openInputFile(filename, in);
1427 in.seekg(filePos[i]);
1428 unsigned long long size = filePos[(i+1)] - filePos[i];
1429 char* chunk = new char[size];
1430 in.read(chunk, size);
1434 string fileChunkName = filename + "." + toString(i) + ".tmp";
1436 openOutputFile(fileChunkName, out);
1438 out << chunk << endl;
1443 files.push_back(fileChunkName);
1448 catch(exception& e) {
1449 errorOut(e, "MothurOut", "divideFile");
1453 /***********************************************************************/
1455 bool MothurOut::isTrue(string f){
1458 for (int i = 0; i < f.length(); i++) { f[i] = toupper(f[i]); }
1460 if ((f == "TRUE") || (f == "T")) { return true; }
1461 else { return false; }
1463 catch(exception& e) {
1464 errorOut(e, "MothurOut", "isTrue");
1469 /***********************************************************************/
1471 float MothurOut::roundDist(float dist, int precision){
1473 return int(dist * precision + 0.5)/float(precision);
1475 catch(exception& e) {
1476 errorOut(e, "MothurOut", "roundDist");
1480 /***********************************************************************/
1482 float MothurOut::ceilDist(float dist, int precision){
1484 return int(ceil(dist * precision))/float(precision);
1486 catch(exception& e) {
1487 errorOut(e, "MothurOut", "ceilDist");
1491 /***********************************************************************/
1493 vector<string> MothurOut::splitWhiteSpace(string& rest, char buffer[], int size){
1495 vector<string> pieces;
1497 for (int i = 0; i < size; i++) {
1498 if (!isspace(buffer[i])) { rest += buffer[i]; }
1500 if (rest != "") { pieces.push_back(rest); rest = ""; }
1501 while (i < size) { //gobble white space
1502 if (isspace(buffer[i])) { i++; }
1503 else { rest = buffer[i]; break; } //cout << "next piece buffer = " << nextPiece << endl;
1510 catch(exception& e) {
1511 errorOut(e, "MothurOut", "splitWhiteSpace");
1515 /***********************************************************************/
1516 vector<string> MothurOut::splitWhiteSpace(string input){
1518 vector<string> pieces;
1521 for (int i = 0; i < input.length(); i++) {
1522 if (!isspace(input[i])) { rest += input[i]; }
1524 if (rest != "") { pieces.push_back(rest); rest = ""; }
1525 while (i < input.length()) { //gobble white space
1526 if (isspace(input[i])) { i++; }
1527 else { rest = input[i]; break; } //cout << "next piece buffer = " << nextPiece << endl;
1532 if (rest != "") { pieces.push_back(rest); }
1536 catch(exception& e) {
1537 errorOut(e, "MothurOut", "splitWhiteSpace");
1541 //**********************************************************************************************************************
1542 int MothurOut::readTax(string namefile, map<string, string>& taxMap) {
1547 openInputFile(namefile, in);
1551 bool pairDone = false;
1552 bool columnOne = true;
1553 string firstCol, secondCol;
1556 if (control_pressed) { break; }
1558 in.read(buffer, 4096);
1559 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1561 for (int i = 0; i < pieces.size(); i++) {
1562 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1563 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1566 //are there confidence scores, if so remove them
1567 if (secondCol.find_first_of('(') != -1) { removeConfidences(secondCol); }
1568 taxMap[firstCol] = secondCol;
1569 if (debug) { mothurOut("[DEBUG]: name = '" + firstCol + "' tax = '" + secondCol + "'\n"); }
1576 return taxMap.size();
1579 catch(exception& e) {
1580 errorOut(e, "MothurOut", "readTax");
1584 /**********************************************************************************************************************/
1585 int MothurOut::readNames(string namefile, map<string, string>& nameMap, bool redund) {
1590 openInputFile(namefile, in);
1594 bool pairDone = false;
1595 bool columnOne = true;
1596 string firstCol, secondCol;
1599 if (control_pressed) { break; }
1601 in.read(buffer, 4096);
1602 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1604 for (int i = 0; i < pieces.size(); i++) {
1605 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1606 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1609 //parse names into vector
1610 vector<string> theseNames;
1611 splitAtComma(secondCol, theseNames);
1612 for (int i = 0; i < theseNames.size(); i++) { nameMap[theseNames[i]] = firstCol; }
1619 return nameMap.size();
1622 catch(exception& e) {
1623 errorOut(e, "MothurOut", "readNames");
1627 /**********************************************************************************************************************/
1628 int MothurOut::readNames(string namefile, map<string, string>& nameMap, int flip) {
1633 openInputFile(namefile, in);
1637 bool pairDone = false;
1638 bool columnOne = true;
1639 string firstCol, secondCol;
1642 if (control_pressed) { break; }
1644 in.read(buffer, 4096);
1645 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1647 for (int i = 0; i < pieces.size(); i++) {
1648 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1649 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1652 nameMap[secondCol] = firstCol;
1659 return nameMap.size();
1662 catch(exception& e) {
1663 errorOut(e, "MothurOut", "readNames");
1667 /**********************************************************************************************************************/
1668 int MothurOut::readNames(string namefile, map<string, string>& nameMap, map<string, int>& nameCount) {
1670 nameMap.clear(); nameCount.clear();
1673 openInputFile(namefile, in);
1677 bool pairDone = false;
1678 bool columnOne = true;
1679 string firstCol, secondCol;
1682 if (control_pressed) { break; }
1684 in.read(buffer, 4096);
1685 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1687 for (int i = 0; i < pieces.size(); i++) {
1688 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1689 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1692 //parse names into vector
1693 vector<string> theseNames;
1694 splitAtComma(secondCol, theseNames);
1695 for (int i = 0; i < theseNames.size(); i++) { nameMap[theseNames[i]] = firstCol; }
1696 nameCount[firstCol] = theseNames.size();
1703 return nameMap.size();
1706 catch(exception& e) {
1707 errorOut(e, "MothurOut", "readNames");
1711 /**********************************************************************************************************************/
1712 int MothurOut::readNames(string namefile, map<string, string>& nameMap) {
1717 openInputFile(namefile, in);
1721 bool pairDone = false;
1722 bool columnOne = true;
1723 string firstCol, secondCol;
1726 if (control_pressed) { break; }
1728 in.read(buffer, 4096);
1729 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1731 for (int i = 0; i < pieces.size(); i++) {
1732 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1733 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1735 if (pairDone) { nameMap[firstCol] = secondCol; pairDone = false; }
1740 return nameMap.size();
1743 catch(exception& e) {
1744 errorOut(e, "MothurOut", "readNames");
1748 /**********************************************************************************************************************/
1749 int MothurOut::readNames(string namefile, map<string, vector<string> >& nameMap) {
1754 openInputFile(namefile, in);
1758 bool pairDone = false;
1759 bool columnOne = true;
1760 string firstCol, secondCol;
1763 if (control_pressed) { break; }
1765 in.read(buffer, 4096);
1766 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1768 for (int i = 0; i < pieces.size(); i++) {
1769 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1770 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1773 vector<string> temp;
1774 splitAtComma(secondCol, temp);
1775 nameMap[firstCol] = temp;
1782 return nameMap.size();
1784 catch(exception& e) {
1785 errorOut(e, "MothurOut", "readNames");
1789 /**********************************************************************************************************************/
1790 map<string, int> MothurOut::readNames(string namefile) {
1793 map<string, int> nameMap;
1797 openInputFile(namefile, in);
1801 bool pairDone = false;
1802 bool columnOne = true;
1803 string firstCol, secondCol;
1806 if (control_pressed) { break; }
1808 in.read(buffer, 4096);
1809 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1811 for (int i = 0; i < pieces.size(); i++) {
1812 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1813 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1816 int num = getNumNames(secondCol);
1817 nameMap[firstCol] = num;
1827 catch(exception& e) {
1828 errorOut(e, "MothurOut", "readNames");
1832 /**********************************************************************************************************************/
1833 int MothurOut::readNames(string namefile, vector<seqPriorityNode>& nameVector, map<string, string>& fastamap) {
1839 openInputFile(namefile, in);
1843 bool pairDone = false;
1844 bool columnOne = true;
1845 string firstCol, secondCol;
1848 if (control_pressed) { break; }
1850 in.read(buffer, 4096);
1851 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1853 for (int i = 0; i < pieces.size(); i++) {
1854 if (columnOne) { firstCol = pieces[i]; columnOne=false; }
1855 else { secondCol = pieces[i]; pairDone = true; columnOne=true; }
1858 int num = getNumNames(secondCol);
1860 map<string, string>::iterator it = fastamap.find(firstCol);
1861 if (it == fastamap.end()) {
1863 mothurOut("[ERROR]: " + firstCol + " is not in your fastafile, but is in your namesfile, please correct."); mothurOutEndLine();
1865 seqPriorityNode temp(num, it->second, firstCol);
1866 nameVector.push_back(temp);
1877 catch(exception& e) {
1878 errorOut(e, "MothurOut", "readNames");
1882 //**********************************************************************************************************************
1883 set<string> MothurOut::readAccnos(string accnosfile){
1887 openInputFile(accnosfile, in);
1894 if (control_pressed) { break; }
1896 in.read(buffer, 4096);
1897 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1899 for (int i = 0; i < pieces.size(); i++) { names.insert(pieces[i]); }
1905 catch(exception& e) {
1906 errorOut(e, "MothurOut", "readAccnos");
1910 //**********************************************************************************************************************
1911 int MothurOut::readAccnos(string accnosfile, vector<string>& names){
1915 openInputFile(accnosfile, in);
1922 if (control_pressed) { break; }
1924 in.read(buffer, 4096);
1925 vector<string> pieces = splitWhiteSpace(rest, buffer, in.gcount());
1927 for (int i = 0; i < pieces.size(); i++) { names.push_back(pieces[i]); }
1933 catch(exception& e) {
1934 errorOut(e, "MothurOut", "readAccnos");
1938 /***********************************************************************/
1940 int MothurOut::getNumNames(string names){
1946 for(int i=0;i<names.size();i++){
1947 if(names[i] == ','){
1955 catch(exception& e) {
1956 errorOut(e, "MothurOut", "getNumNames");
1960 /***********************************************************************/
1962 int MothurOut::getNumChar(string line, char c){
1967 for(int i=0;i<line.size();i++){
1976 catch(exception& e) {
1977 errorOut(e, "MothurOut", "getNumChar");
1981 /***********************************************************************/
1982 int MothurOut::mothurRemove(string filename){
1984 filename = getFullPathName(filename);
1985 int error = remove(filename.c_str());
1987 // if (errno != ENOENT) { //ENOENT == file does not exist
1988 // string message = "Error deleting file " + filename;
1989 // perror(message.c_str());
1994 catch(exception& e) {
1995 errorOut(e, "MothurOut", "mothurRemove");
1999 /***********************************************************************/
2000 bool MothurOut::mothurConvert(string item, int& num){
2004 if (isNumeric1(item)) {
2009 mothurOut("[ERROR]: cannot convert " + item + " to an integer."); mothurOutEndLine();
2010 commandInputsConvertError = true;
2015 catch(exception& e) {
2016 errorOut(e, "MothurOut", "mothurConvert");
2020 /***********************************************************************/
2021 bool MothurOut::isNumeric1(string stringToCheck){
2023 bool numeric = false;
2025 if(stringToCheck.find_first_not_of("0123456789.-") == string::npos) { numeric = true; }
2029 catch(exception& e) {
2030 errorOut(e, "MothurOut", "isNumeric1");
2035 /***********************************************************************/
2036 bool MothurOut::mothurConvert(string item, float& num){
2040 if (isNumeric1(item)) {
2045 mothurOut("[ERROR]: cannot convert " + item + " to a float."); mothurOutEndLine();
2046 commandInputsConvertError = true;
2051 catch(exception& e) {
2052 errorOut(e, "MothurOut", "mothurConvert");
2056 /***********************************************************************/
2057 bool MothurOut::mothurConvert(string item, double& num){
2061 if (isNumeric1(item)) {
2066 mothurOut("[ERROR]: cannot convert " + item + " to a double."); mothurOutEndLine();
2067 commandInputsConvertError = true;
2072 catch(exception& e) {
2073 errorOut(e, "MothurOut", "mothurConvert");
2077 /**************************************************************************************************/
2079 vector<vector<double> > MothurOut::binomial(int maxOrder){
2081 vector<vector<double> > binomial(maxOrder+1);
2083 for(int i=0;i<=maxOrder;i++){
2084 binomial[i].resize(maxOrder+1);
2093 for(int i=2;i<=maxOrder;i++){
2097 for(int i=2;i<=maxOrder;i++){
2098 for(int j=1;j<=maxOrder;j++){
2099 if(i==j){ binomial[i][j]=1; }
2100 if(j>i) { binomial[i][j]=0; }
2101 else { binomial[i][j]=binomial[i-1][j-1]+binomial[i-1][j]; }
2108 catch(exception& e) {
2109 errorOut(e, "MothurOut", "binomial");
2113 /**************************************************************************************************/
2114 unsigned int MothurOut::fromBase36(string base36){
2116 unsigned int num = 0;
2118 map<char, int> converts;
2183 while (i < base36.length()) {
2185 num = 36 * num + converts[c];
2192 catch(exception& e) {
2193 errorOut(e, "MothurOut", "fromBase36");
2197 /***********************************************************************/
2199 int MothurOut::factorial(int num){
2203 for (int i = 1; i <= num; i++) {
2209 catch(exception& e) {
2210 errorOut(e, "MothurOut", "factorial");
2214 /***********************************************************************/
2216 int MothurOut::getNumSeqs(ifstream& file){
2218 int numSeqs = count(istreambuf_iterator<char>(file),istreambuf_iterator<char>(), '>');
2222 catch(exception& e) {
2223 errorOut(e, "MothurOut", "getNumSeqs");
2227 /***********************************************************************/
2228 void MothurOut::getNumSeqs(ifstream& file, int& numSeqs){
2233 input = getline(file);
2234 if (input.length() != 0) {
2235 if(input[0] == '>'){ numSeqs++; }
2239 catch(exception& e) {
2240 errorOut(e, "MothurOut", "getNumSeqs");
2244 /***********************************************************************/
2246 //This function parses the estimator options and puts them in a vector
2247 void MothurOut::splitAtChar(string& estim, vector<string>& container, char symbol) {
2249 string individual = "";
2250 int estimLength = estim.size();
2251 for(int i=0;i<estimLength;i++){
2252 if(estim[i] == symbol){
2253 container.push_back(individual);
2257 individual += estim[i];
2260 container.push_back(individual);
2263 catch(exception& e) {
2264 errorOut(e, "MothurOut", "splitAtChar");
2269 /***********************************************************************/
2271 //This function parses the estimator options and puts them in a vector
2272 void MothurOut::splitAtDash(string& estim, vector<string>& container) {
2274 string individual = "";
2275 int estimLength = estim.size();
2276 for(int i=0;i<estimLength;i++){
2277 if(estim[i] == '-'){
2278 container.push_back(individual);
2282 individual += estim[i];
2285 container.push_back(individual);
2288 /* string individual;
2290 while (estim.find_first_of('-') != -1) {
2291 individual = estim.substr(0,estim.find_first_of('-'));
2292 if ((estim.find_first_of('-')+1) <= estim.length()) { //checks to make sure you don't have dash at end of string
2293 estim = estim.substr(estim.find_first_of('-')+1, estim.length());
2294 container.push_back(individual);
2298 container.push_back(estim); */
2300 catch(exception& e) {
2301 errorOut(e, "MothurOut", "splitAtDash");
2306 /***********************************************************************/
2307 //This function parses the label options and puts them in a set
2308 void MothurOut::splitAtDash(string& estim, set<string>& container) {
2310 string individual = "";
2311 int estimLength = estim.size();
2312 for(int i=0;i<estimLength;i++){
2313 if(estim[i] == '-'){
2314 container.insert(individual);
2318 individual += estim[i];
2321 container.insert(individual);
2323 // string individual;
2325 // while (estim.find_first_of('-') != -1) {
2326 // individual = estim.substr(0,estim.find_first_of('-'));
2327 // if ((estim.find_first_of('-')+1) <= estim.length()) { //checks to make sure you don't have dash at end of string
2328 // estim = estim.substr(estim.find_first_of('-')+1, estim.length());
2329 // container.insert(individual);
2333 // container.insert(estim);
2336 catch(exception& e) {
2337 errorOut(e, "MothurOut", "splitAtDash");
2341 /***********************************************************************/
2342 //This function parses the line options and puts them in a set
2343 void MothurOut::splitAtDash(string& estim, set<int>& container) {
2348 while (estim.find_first_of('-') != -1) {
2349 individual = estim.substr(0,estim.find_first_of('-'));
2350 if ((estim.find_first_of('-')+1) <= estim.length()) { //checks to make sure you don't have dash at end of string
2351 estim = estim.substr(estim.find_first_of('-')+1, estim.length());
2352 convert(individual, lineNum); //convert the string to int
2353 container.insert(lineNum);
2357 convert(estim, lineNum); //convert the string to int
2358 container.insert(lineNum);
2360 catch(exception& e) {
2361 errorOut(e, "MothurOut", "splitAtDash");
2365 /***********************************************************************/
2366 string MothurOut::makeList(vector<string>& names) {
2370 if (names.size() == 0) { return list; }
2372 for (int i = 0; i < names.size()-1; i++) { list += names[i] + ","; }
2375 list += names[names.size()-1];
2379 catch(exception& e) {
2380 errorOut(e, "MothurOut", "makeList");
2385 /***********************************************************************/
2386 //This function parses the a string and puts peices in a vector
2387 void MothurOut::splitAtComma(string& estim, vector<string>& container) {
2389 string individual = "";
2390 int estimLength = estim.size();
2391 for(int i=0;i<estimLength;i++){
2392 if(estim[i] == ','){
2393 container.push_back(individual);
2397 individual += estim[i];
2400 container.push_back(individual);
2405 // string individual;
2407 // while (estim.find_first_of(',') != -1) {
2408 // individual = estim.substr(0,estim.find_first_of(','));
2409 // if ((estim.find_first_of(',')+1) <= estim.length()) { //checks to make sure you don't have comma at end of string
2410 // estim = estim.substr(estim.find_first_of(',')+1, estim.length());
2411 // container.push_back(individual);
2415 // container.push_back(estim);
2417 catch(exception& e) {
2418 errorOut(e, "MothurOut", "splitAtComma");
2422 /***********************************************************************/
2423 //This function splits up the various option parameters
2424 void MothurOut::splitAtChar(string& prefix, string& suffix, char c){
2426 prefix = suffix.substr(0,suffix.find_first_of(c));
2427 if ((suffix.find_first_of(c)+2) <= suffix.length()) { //checks to make sure you don't have comma at end of string
2428 suffix = suffix.substr(suffix.find_first_of(c)+1, suffix.length());
2430 while(suffix.at(0) == ' ')
2431 suffix = suffix.substr(1, suffix.length());
2435 catch(exception& e) {
2436 errorOut(e, "MothurOut", "splitAtComma");
2441 /***********************************************************************/
2443 //This function splits up the various option parameters
2444 void MothurOut::splitAtComma(string& prefix, string& suffix){
2446 prefix = suffix.substr(0,suffix.find_first_of(','));
2447 if ((suffix.find_first_of(',')+2) <= suffix.length()) { //checks to make sure you don't have comma at end of string
2448 suffix = suffix.substr(suffix.find_first_of(',')+1, suffix.length());
2450 while(suffix.at(0) == ' ')
2451 suffix = suffix.substr(1, suffix.length());
2455 catch(exception& e) {
2456 errorOut(e, "MothurOut", "splitAtComma");
2460 /***********************************************************************/
2462 //This function separates the key value from the option value i.e. dist=96_...
2463 void MothurOut::splitAtEquals(string& key, string& value){
2465 if(value.find_first_of('=') != -1){
2466 key = value.substr(0,value.find_first_of('='));
2467 if ((value.find_first_of('=')+1) <= value.length()) {
2468 value = value.substr(value.find_first_of('=')+1, value.length());
2475 catch(exception& e) {
2476 errorOut(e, "MothurOut", "splitAtEquals");
2481 /**************************************************************************************************/
2483 bool MothurOut::inUsersGroups(string groupname, vector<string> Groups) {
2485 for (int i = 0; i < Groups.size(); i++) {
2486 if (groupname == Groups[i]) { return true; }
2490 catch(exception& e) {
2491 errorOut(e, "MothurOut", "inUsersGroups");
2495 /**************************************************************************************************/
2496 //returns true if any of the strings in first vector are in second vector
2497 bool MothurOut::inUsersGroups(vector<string> groupnames, vector<string> Groups) {
2500 for (int i = 0; i < groupnames.size(); i++) {
2501 if (inUsersGroups(groupnames[i], Groups)) { return true; }
2505 catch(exception& e) {
2506 errorOut(e, "MothurOut", "inUsersGroups");
2510 /***********************************************************************/
2511 //this function determines if the user has given us labels that are smaller than the given label.
2512 //if so then it returns true so that the calling function can run the previous valid distance.
2513 //it's a "smart" distance function. It also checks for invalid labels.
2514 bool MothurOut::anyLabelsToProcess(string label, set<string>& userLabels, string errorOff) {
2517 set<string>::iterator it;
2518 vector<float> orderFloat;
2519 map<string, float> userMap; //the conversion process removes trailing 0's which we need to put back
2520 map<string, float>::iterator it2;
2522 bool smaller = false;
2524 //unique is the smallest line
2525 if (label == "unique") { return false; }
2527 if (convertTestFloat(label, labelFloat)) {
2528 convert(label, labelFloat);
2529 }else { //cant convert
2534 //go through users set and make them floats
2535 for(it = userLabels.begin(); it != userLabels.end();) {
2538 if ((*it != "unique") && (convertTestFloat(*it, temp) == true)){
2540 orderFloat.push_back(temp);
2541 userMap[*it] = temp;
2543 }else if (*it == "unique") {
2544 orderFloat.push_back(-1.0);
2545 userMap["unique"] = -1.0;
2548 if (errorOff == "") { mothurOut(*it + " is not a valid label."); mothurOutEndLine(); }
2549 userLabels.erase(it++);
2554 sort(orderFloat.begin(), orderFloat.end());
2556 /*************************************************/
2557 //is this label bigger than any of the users labels
2558 /*************************************************/
2560 //loop through order until you find a label greater than label
2561 for (int i = 0; i < orderFloat.size(); i++) {
2562 if (orderFloat[i] < labelFloat) {
2564 if (orderFloat[i] == -1) {
2565 if (errorOff == "") { mothurOut("Your file does not include the label unique."); mothurOutEndLine(); }
2566 userLabels.erase("unique");
2569 if (errorOff == "") { mothurOut("Your file does not include the label "); mothurOutEndLine(); }
2571 for (it2 = userMap.begin(); it2!= userMap.end(); it2++) {
2572 if (it2->second == orderFloat[i]) {
2574 //remove small labels
2575 userLabels.erase(s);
2579 if (errorOff == "") {mothurOut( s + ". I will use the next smallest distance. "); mothurOutEndLine(); }
2581 //since they are sorted once you find a bigger one stop looking
2588 catch(exception& e) {
2589 errorOut(e, "MothurOut", "anyLabelsToProcess");
2594 /**************************************************************************************************/
2595 bool MothurOut::checkReleaseVersion(ifstream& file, string version) {
2600 string line = getline(file);
2602 //before we added this check
2603 if (line[0] != '#') { good = false; }
2606 line = line.substr(1);
2608 vector<string> versionVector;
2609 splitAtChar(version, versionVector, '.');
2611 //check file version
2612 vector<string> linesVector;
2613 splitAtChar(line, linesVector, '.');
2615 if (versionVector.size() != linesVector.size()) { good = false; }
2617 for (int j = 0; j < versionVector.size(); j++) {
2619 convert(versionVector[j], num1);
2620 convert(linesVector[j], num2);
2622 //if mothurs version is newer than this files version, then we want to remake it
2623 if (num1 > num2) { good = false; break; }
2629 if (!good) { file.close(); }
2630 else { file.seekg(0); }
2634 catch(exception& e) {
2635 errorOut(e, "MothurOut", "checkReleaseVersion");
2639 /**************************************************************************************************/
2640 bool MothurOut::isContainingOnlyDigits(string input) {
2643 //are you a digit in ascii code
2644 for (int i = 0;i < input.length(); i++){
2645 if( input[i]>47 && input[i]<58){}
2646 else { return false; }
2651 catch(exception& e) {
2652 errorOut(e, "MothurOut", "isContainingOnlyDigits");
2656 /**************************************************************************************************/
2657 int MothurOut::removeConfidences(string& tax) {
2663 while (tax.find_first_of(';') != -1) {
2665 if (control_pressed) { return 0; }
2668 taxon = tax.substr(0,tax.find_first_of(';'));
2670 int pos = taxon.find_last_of('(');
2673 int pos2 = taxon.find_last_of(')');
2675 string confidenceScore = taxon.substr(pos+1, (pos2-(pos+1)));
2676 if (isNumeric1(confidenceScore)) {
2677 taxon = taxon.substr(0, pos); //rip off confidence
2683 tax = tax.substr(tax.find_first_of(';')+1, tax.length());
2691 catch(exception& e) {
2692 errorOut(e, "MothurOut", "removeConfidences");
2696 /**************************************************************************************************/