]> git.donarmstrong.com Git - mothur.git/blobdiff - mothurout.cpp
fixes while testing
[mothur.git] / mothurout.cpp
index f6b2a1d6312421da8405626b7aea19e71cd2b985..cd9e3212bfb3e4759ed798895fcfb004784e31c5 100644 (file)
@@ -60,6 +60,16 @@ void MothurOut::setDefaultPath(string pathname)  {
        }
 }
 /*********************************************************************************************/
+void MothurOut::setOutputDir(string pathname)  {
+       try {
+               outputDir = pathname;
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "setOutputDir");
+               exit(1);
+       }
+}
+/*********************************************************************************************/
 void MothurOut::closeLog()  {
        try {
                
@@ -276,8 +286,9 @@ int MothurOut::openOutputFileAppend(string fileName, ofstream& fileHandle){
 /***********************************************************************/
 void MothurOut::gobble(istream& f){
        try {
+               
                char d;
-               while(isspace(d=f.get()))               {;}
+               while(isspace(d=f.get()))               { ;}
                f.putback(d);
        }
        catch(exception& e) {
@@ -348,14 +359,29 @@ string MothurOut::getline(ifstream& fileHandle) {
 }
 /***********************************************************************/
 
+#ifdef USE_COMPRESSION
+inline bool endsWith(string s, const char * suffix){
+  size_t suffixLength = strlen(suffix);
+  return s.size() >= suffixLength && s.substr(s.size() - suffixLength, suffixLength).compare(suffix) == 0;
+}
+#endif
+
 string MothurOut::getRootName(string longName){
        try {
        
                string rootName = longName;
-               
-               if(longName.find_last_of(".") != longName.npos){
-                       int pos = longName.find_last_of('.')+1;
-                       rootName = longName.substr(0, pos);
+
+#ifdef USE_COMPRESSION
+    if (endsWith(rootName, ".gz") || endsWith(rootName, ".bz2")) {
+      int pos = rootName.find_last_of('.');
+      rootName = rootName.substr(0, pos);
+      cerr << "shortening " << longName << " to " << rootName << "\n";
+    }
+#endif
+
+               if(rootName.find_last_of(".") != rootName.npos){
+                       int pos = rootName.find_last_of('.')+1;
+                       rootName = rootName.substr(0, pos);
                }
 
                return rootName;
@@ -486,7 +512,13 @@ string MothurOut::getFullPathName(string fileName){
                #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)   
                        
                        if (path.find("~") != -1) { //go to home directory
-                               string homeDir = getenv ("HOME");
+                               string homeDir;
+                       
+                               char *homepath = NULL;
+                               homepath = getenv ("HOME");
+                               if ( homepath != NULL) { homeDir = homepath; }
+                               else { homeDir = "";  }
+
                                newFileName = homeDir + fileName.substr(fileName.find("~")+1);
                                return newFileName;
                        }else { //find path
@@ -494,7 +526,6 @@ string MothurOut::getFullPathName(string fileName){
                                else { newFileName = fileName.substr(fileName.rfind("./")+2); } //save the complete part of the name
                                
                                //char* cwdpath = new char[1024];
-
                                //size_t size;
                                //cwdpath=getcwd(cwdpath,size);
                                //cwd = cwdpath;
@@ -503,6 +534,7 @@ string MothurOut::getFullPathName(string fileName){
                                cwdpath = getcwd(NULL, 0); // or _getcwd
                                if ( cwdpath != NULL) { cwd = cwdpath; }
                                else { cwd = "";  }
+
                                
                                //rip off first '/'
                                string simpleCWD;
@@ -539,7 +571,6 @@ string MothurOut::getFullPathName(string fileName){
                                
                                newFileName =  "/" +  newFileName;
                                return newFileName;
-               
                        }       
                #else
                        if (path.find("~") != -1) { //go to home directory
@@ -596,12 +627,35 @@ string MothurOut::getFullPathName(string fileName){
        }       
 }
 /***********************************************************************/
-//no error open
+
 int MothurOut::openInputFile(string fileName, ifstream& fileHandle, string m){
        try {
                        //get full path name
                        string completeFileName = getFullPathName(fileName);
 
+#ifdef USE_COMPRESSION
+      // check for gzipped or bzipped file
+      if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
+        string tempName = string(tmpnam(0));
+        mkfifo(tempName.c_str(), 0666);
+        int fork_result = fork();
+        if (fork_result < 0) {
+          cerr << "Error forking.\n";
+          exit(1);
+        } else if (fork_result == 0) {
+          string command = (endsWith(completeFileName, ".gz") ? "zcat " : "bzcat ") + completeFileName + string(" > ") + tempName;
+          cerr << "Decompressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
+          system(command.c_str());
+          cerr << "Done decompressing " << completeFileName << "\n";
+          remove(tempName.c_str());
+          exit(EXIT_SUCCESS);
+        } else {
+          cerr << "waiting on child process " << fork_result << "\n";
+          completeFileName = tempName;
+        }
+      }
+#endif
+
                        fileHandle.open(completeFileName.c_str());
                        if(!fileHandle) {
                                return 1;
@@ -620,9 +674,34 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle, string m){
 
 int MothurOut::openInputFile(string fileName, ifstream& fileHandle){
        try {
+
                //get full path name
                string completeFileName = getFullPathName(fileName);
 
+#ifdef USE_COMPRESSION
+  // check for gzipped or bzipped file
+  if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
+    string tempName = string(tmpnam(0));
+    mkfifo(tempName.c_str(), 0666);
+    int fork_result = fork();
+    if (fork_result < 0) {
+      cerr << "Error forking.\n";
+      exit(1);
+    } else if (fork_result == 0) {
+      string command = (endsWith(completeFileName, ".gz") ? "zcat " : "bzcat ") + completeFileName + string(" > ") + tempName;
+      cerr << "Decompressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
+      system(command.c_str());
+      cerr << "Done decompressing " << completeFileName << "\n";
+      remove(tempName.c_str());
+      exit(EXIT_SUCCESS);
+    } else {
+      cerr << "waiting on child process " << fork_result << "\n";
+      completeFileName = tempName;
+    }
+  }
+#endif
+
+
                fileHandle.open(completeFileName.c_str());
                if(!fileHandle) {
                        mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
@@ -676,7 +755,27 @@ int MothurOut::openOutputFile(string fileName, ofstream& fileHandle){
        try { 
        
                string completeFileName = getFullPathName(fileName);
-               
+
+#ifdef USE_COMPRESSION
+    // check for gzipped file
+    if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
+      string tempName = string(tmpnam(0));
+      mkfifo(tempName.c_str(), 0666);
+      cerr << "Compressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
+      int fork_result = fork();
+      if (fork_result < 0) {
+        cerr << "Error forking.\n";
+        exit(1);
+      } else if (fork_result == 0) {
+        string command = string(endsWith(completeFileName, ".gz") ?  "gzip" : "bzip2") + " -v > " + completeFileName + string(" < ") + tempName;
+        system(command.c_str());
+        exit(0);
+      } else {
+        completeFileName = tempName;
+      }
+    }
+#endif
+
                fileHandle.open(completeFileName.c_str(), ios::trunc);
                if(!fileHandle) {
                        mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
@@ -906,7 +1005,7 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
                //estimate file breaks
                unsigned long int chunkSize = 0;
                chunkSize = size / proc;
-       
+
                //file to small to divide by processors
                if (chunkSize == 0)  {  proc = 1;       filePos.push_back(size); return filePos;        }
        
@@ -924,7 +1023,7 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
                           char c = in.get();
                           if (c == '>') {   in.putback(c); newSpot = in.tellg(); break;  }
                        }
-                       
+               
                        //there was not another sequence before the end of the file
                        unsigned long int sanityPos = in.tellg();
 
@@ -939,7 +1038,7 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
 
                //sanity check filePos
                for (int i = 0; i < (filePos.size()-1); i++) {
-                       if (filePos[(i+1)] <= filePos[i]) {  filePos.erase(filePos.begin()+(i+1)); i--; }
+                       if (filePos[(i+1)] <= filePos[i]) {  cout << "erasing " << (i+1) << endl; filePos.erase(filePos.begin()+(i+1)); i--; }
                }
 
                proc = (filePos.size() - 1);
@@ -1103,7 +1202,20 @@ void MothurOut::getNumSeqs(ifstream& file, int& numSeqs){
 //This function parses the estimator options and puts them in a vector
 void MothurOut::splitAtChar(string& estim, vector<string>& container, char symbol) {
        try {
-               string individual;
+               string individual = "";
+               int estimLength = estim.size();
+               for(int i=0;i<estimLength;i++){
+                       if(estim[i] == symbol){
+                               container.push_back(individual);
+                               individual = "";                                
+                       }
+                       else{
+                               individual += estim[i];
+                       }
+               }
+               container.push_back(individual);
+
+               /*
                
                while (estim.find_first_of(symbol) != -1) {
                        individual = estim.substr(0,estim.find_first_of(symbol));
@@ -1113,7 +1225,7 @@ void MothurOut::splitAtChar(string& estim, vector<string>& container, char symbo
                        }
                }
                //get last one
-               container.push_back(estim);
+               container.push_back(estim); */
        }
        catch(exception& e) {
                errorOut(e, "MothurOut", "splitAtChar");