]> git.donarmstrong.com Git - mothur.git/blobdiff - mothurout.cpp
metastats in progress
[mothur.git] / mothurout.cpp
index 67c62c1bed469a387462f5decac8252971dda43e..001e8c48a8932374d7266b4e6097036c5b2ed9ac 100644 (file)
@@ -9,6 +9,7 @@
 
 #include "mothurout.h"
 
+
 /******************************************************/
 MothurOut* MothurOut::getInstance() {
        if( _uniqueInstance == 0) {
@@ -17,6 +18,103 @@ MothurOut* MothurOut::getInstance() {
        return _uniqueInstance;
 }
 /*********************************************************************************************/
+void MothurOut::printCurrentFiles()  { //writes one "tag=value" line per current-file member that is set
+       try { //each member is a string; "" means "not set" and produces no output
+               if (accnosfile != "")           {  mothurOut("accnos=" + accnosfile); mothurOutEndLine();                       }
+               if (columnfile != "")           {  mothurOut("column=" + columnfile); mothurOutEndLine();                       }
+               if (designfile != "")           {  mothurOut("design=" + designfile); mothurOutEndLine();                       }
+               if (fastafile != "")            {  mothurOut("fasta=" + fastafile); mothurOutEndLine();                         }
+               if (groupfile != "")            {  mothurOut("group=" + groupfile); mothurOutEndLine();                         }
+               if (listfile != "")                     {  mothurOut("list=" + listfile); mothurOutEndLine();                           }
+               if (namefile != "")                     {  mothurOut("name=" + namefile); mothurOutEndLine();                           }
+               if (oligosfile != "")           {  mothurOut("oligos=" + oligosfile); mothurOutEndLine();                       }
+               if (orderfile != "")            {  mothurOut("order=" + orderfile); mothurOutEndLine();                         }
+               if (ordergroupfile != "")       {  mothurOut("ordergroup=" + ordergroupfile); mothurOutEndLine();       }
+               if (phylipfile != "")           {  mothurOut("phylip=" + phylipfile); mothurOutEndLine();                       }
+               if (qualfile != "")                     {  mothurOut("qfile=" + qualfile); mothurOutEndLine();                          } //tag printed is "qfile", not "qual"
+               if (rabundfile != "")           {  mothurOut("rabund=" + rabundfile); mothurOutEndLine();                       }
+               if (relabundfile != "")         {  mothurOut("relabund=" + relabundfile); mothurOutEndLine();           }
+               if (sabundfile != "")           {  mothurOut("sabund=" + sabundfile); mothurOutEndLine();                       }
+               if (sfffile != "")                      {  mothurOut("sff=" + sfffile); mothurOutEndLine();                                     }
+               if (sharedfile != "")           {  mothurOut("shared=" + sharedfile); mothurOutEndLine();                       }
+               if (taxonomyfile != "")         {  mothurOut("taxonomy=" + taxonomyfile); mothurOutEndLine();           }
+               if (treefile != "")                     {  mothurOut("tree=" + treefile); mothurOutEndLine();                           }
+               if (flowfile != "")                     {  mothurOut("flow=" + flowfile); mothurOutEndLine();                           }
+               if (processors != "1")          {  mothurOut("processors=" + processors); mothurOutEndLine();           }
+               //processors is a string too; it is printed only when it differs from "1", the value clearCurrentFiles() assigns
+       }
+       catch(exception& e) { //report through errorOut, then terminate the program
+               errorOut(e, "MothurOut", "printCurrentFiles");
+               exit(1);
+       }
+}
+/*********************************************************************************************/
+bool MothurOut::hasCurrentFiles()  { //true if any current-file member is set or processors is not "1"
+       try {
+               bool hasCurrent = false; //never reassigned below; it is only the fall-through result
+               //return as soon as one member is found that is not the empty string
+               if (accnosfile != "")           {  return true;                 }
+               if (columnfile != "")           {  return true;                 }
+               if (designfile != "")           {  return true;                 }
+               if (fastafile != "")            {  return true;                 }
+               if (groupfile != "")            {  return true;                 }
+               if (listfile != "")                     {  return true;                 }
+               if (namefile != "")                     {  return true;                 }
+               if (oligosfile != "")           {  return true;                 }
+               if (orderfile != "")            {  return true;                 }
+               if (ordergroupfile != "")       {  return true;                 }
+               if (phylipfile != "")           {  return true;                 }
+               if (qualfile != "")                     {  return true;                 }
+               if (rabundfile != "")           {  return true;                 }
+               if (relabundfile != "")         {  return true;                 }
+               if (sabundfile != "")           {  return true;                 }
+               if (sfffile != "")                      {  return true;                 }
+               if (sharedfile != "")           {  return true;                 }
+               if (taxonomyfile != "")         {  return true;                 }
+               if (treefile != "")                     {  return true;                 }
+               if (flowfile != "")                     {  return true;                 }
+               if (processors != "1")          {  return true;                 } //a processors value other than "1" also counts
+               //nothing matched: every member is "" and processors is "1"
+               return hasCurrent;
+               
+       }
+       catch(exception& e) { //report through errorOut, then terminate the program
+               errorOut(e, "MothurOut", "hasCurrentFiles");
+               exit(1);
+       }
+}
+
+/*********************************************************************************************/
+void MothurOut::clearCurrentFiles()  { //resets every current-file member to "" and processors to "1"
+       try {
+               phylipfile = ""; //"" is the value printCurrentFiles() and hasCurrentFiles() treat as not set
+               columnfile = "";
+               listfile = "";
+               rabundfile = "";
+               sabundfile = "";
+               namefile = "";
+               groupfile = "";
+               designfile = "";
+               orderfile = "";
+               treefile = "";
+               sharedfile = "";
+               ordergroupfile = "";
+               relabundfile = "";
+               fastafile = "";
+               qualfile = "";
+               sfffile = "";
+               oligosfile = "";
+               accnosfile = "";
+               taxonomyfile = "";      
+               flowfile = "";
+               processors = "1"; //kept as a string; "1" is the value the other two functions compare against
+       }
+       catch(exception& e) { //report through errorOut, then terminate the program
+               errorOut(e, "MothurOut", "clearCurrentFiles");
+               exit(1);
+       }
+}
+/*********************************************************************************************/
 void MothurOut::setFileName(string filename)  {
        try {
                logFileName = filename;
@@ -60,6 +158,16 @@ void MothurOut::setDefaultPath(string pathname)  {
        }
 }
 /*********************************************************************************************/
+void MothurOut::setOutputDir(string pathname)  { //stores pathname in the outputDir member
+       try {
+               outputDir = pathname; //stored exactly as given; nothing is validated or normalized here
+       }
+       catch(exception& e) { //report through errorOut, then terminate the program
+               errorOut(e, "MothurOut", "setOutputDir");
+               exit(1);
+       }
+}
+/*********************************************************************************************/
 void MothurOut::closeLog()  {
        try {
                
@@ -139,6 +247,53 @@ void MothurOut::mothurOutEndLine() {
        }
 }
 /*********************************************************************************************/
+void MothurOut::mothurOut(string output, ofstream& outputFile) { //writes output to cout, to out and to outputFile
+       try {
+               //when built with USE_MPI the three writes below run only in the process whose rank is 0
+#ifdef USE_MPI
+               int pid;
+               MPI_Comm_rank(MPI_COMM_WORLD, &pid); 
+               
+               if (pid == 0) { //only one process should output to screen
+#endif
+                       //no newline is appended here; mothurOutEndLine(outputFile) writes the line ending
+                       cout << output;
+                       out << output; //out is a member stream declared outside this view - presumably the log file, confirm in mothurout.h
+                       outputFile << output;
+                       
+#ifdef USE_MPI
+               }
+#endif
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "MothurOut"); //NOTE(review): label says "MothurOut" but this function is mothurOut - confirm whether that is intended
+               exit(1);
+       }
+}
+/*********************************************************************************************/
+void MothurOut::mothurOutEndLine(ofstream& outputFile) { //writes endl to cout, to out and to outputFile
+       try {
+#ifdef USE_MPI
+               int pid;
+               MPI_Comm_rank(MPI_COMM_WORLD, &pid); 
+               
+               if (pid == 0) { //only one process should output to screen
+#endif
+                       //endl ends the line and also flushes each of the three streams
+                       cout << endl;
+                       out << endl; //out is a member stream declared outside this view - presumably the log file, confirm in mothurout.h
+                       outputFile << endl;
+                       
+#ifdef USE_MPI
+               }
+#endif
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "MothurOutEndLine"); //NOTE(review): label capitalisation differs from the function name mothurOutEndLine - confirm
+               exit(1);
+       }
+}
+/*********************************************************************************************/
 void MothurOut::mothurOutJustToLog(string output) {
        try {
                #ifdef USE_MPI
@@ -279,7 +434,7 @@ void MothurOut::gobble(istream& f){
                
                char d;
                while(isspace(d=f.get()))               { ;}
-               f.putback(d);
+               if(!f.eof()) { f.putback(d); }
        }
        catch(exception& e) {
                errorOut(e, "MothurOut", "gobble");
@@ -291,7 +446,7 @@ void MothurOut::gobble(istringstream& f){
        try {
                char d;
                while(isspace(d=f.get()))               {;}
-               f.putback(d);
+               if(!f.eof()) { f.putback(d); }
        }
        catch(exception& e) {
                errorOut(e, "MothurOut", "gobble");
@@ -330,12 +485,12 @@ string MothurOut::getline(ifstream& fileHandle) {
        
                string line = "";
                
-               while (!fileHandle.eof())       {
+               while (fileHandle)      {
                        //get next character
                        char c = fileHandle.get(); 
                        
                        //are you at the end of the line
-                       if ((c == '\n') || (c == '\r') || (c == '\f')){  break; }       
+                       if ((c == '\n') || (c == '\r') || (c == '\f') || (c == EOF)){  break;   }       
                        else {          line += c;              }
                }
                
@@ -349,18 +504,21 @@ string MothurOut::getline(ifstream& fileHandle) {
 }
 /***********************************************************************/
 
+#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)
 #ifdef USE_COMPRESSION
 inline bool endsWith(string s, const char * suffix){
   size_t suffixLength = strlen(suffix);
   return s.size() >= suffixLength && s.substr(s.size() - suffixLength, suffixLength).compare(suffix) == 0;
 }
 #endif
+#endif
 
 string MothurOut::getRootName(string longName){
        try {
        
                string rootName = longName;
 
+#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)
 #ifdef USE_COMPRESSION
     if (endsWith(rootName, ".gz") || endsWith(rootName, ".bz2")) {
       int pos = rootName.find_last_of('.');
@@ -368,7 +526,7 @@ string MothurOut::getRootName(string longName){
       cerr << "shortening " << longName << " to " << rootName << "\n";
     }
 #endif
-
+#endif
                if(rootName.find_last_of(".") != rootName.npos){
                        int pos = rootName.find_last_of('.')+1;
                        rootName = rootName.substr(0, pos);
@@ -404,6 +562,21 @@ string MothurOut::getSimpleName(string longName){
 
 /***********************************************************************/
 
+int MothurOut::getRandomIndex(int highest){
+       try {
+               
+               int random = (int) ((float)(highest+1) * (float)(rand()) / ((float)RAND_MAX+1.0));
+               
+               return random;
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "getRandomIndex");
+               exit(1);
+       }       
+       
+}
+/**********************************************************************/
+
 string MothurOut::getPathName(string longName){
        try {
                string rootPathName = longName;
@@ -475,6 +648,7 @@ bool MothurOut::isBlank(string fileName){
                        //check for blank file
                        gobble(fileHandle);
                        if (fileHandle.eof()) { fileHandle.close(); return true;  }
+                       fileHandle.close();
                }
                return false;
        }
@@ -512,7 +686,7 @@ string MothurOut::getFullPathName(string fileName){
                                newFileName = homeDir + fileName.substr(fileName.find("~")+1);
                                return newFileName;
                        }else { //find path
-                               if (path.rfind("./") == -1) { return fileName; } //already complete name
+                               if (path.rfind("./") == string::npos) { return fileName; } //already complete name
                                else { newFileName = fileName.substr(fileName.rfind("./")+2); } //save the complete part of the name
                                
                                //char* cwdpath = new char[1024];
@@ -532,7 +706,7 @@ string MothurOut::getFullPathName(string fileName){
                                
                                //break apart the current working directory
                                vector<string> dirs;
-                               while (simpleCWD.find_first_of('/') != -1) {
+                               while (simpleCWD.find_first_of('/') != string::npos) {
                                        string dir = simpleCWD.substr(0,simpleCWD.find_first_of('/'));
                                        simpleCWD = simpleCWD.substr(simpleCWD.find_first_of('/')+1, simpleCWD.length());
                                        dirs.push_back(dir);
@@ -543,7 +717,7 @@ string MothurOut::getFullPathName(string fileName){
                        
                                int index = dirs.size()-1;
                
-                               while((pos = path.rfind("./")) != -1) { //while you don't have a complete path
+                               while((pos = path.rfind("./")) != string::npos) { //while you don't have a complete path
                                        if (pos == 0) { break;  //you are at the end
                                        }else if (path[(pos-1)] == '.') { //you want your parent directory ../
                                                path = path.substr(0, pos-1);
@@ -563,12 +737,12 @@ string MothurOut::getFullPathName(string fileName){
                                return newFileName;
                        }       
                #else
-                       if (path.find("~") != -1) { //go to home directory
+                       if (path.find("~") != string::npos) { //go to home directory
                                string homeDir = getenv ("HOMEPATH");
                                newFileName = homeDir + fileName.substr(fileName.find("~")+1);
                                return newFileName;
                        }else { //find path
-                               if (path.rfind(".\\") == -1) { return fileName; } //already complete name
+                               if (path.rfind(".\\") == string::npos) { return fileName; } //already complete name
                                else { newFileName = fileName.substr(fileName.rfind(".\\")+2); } //save the complete part of the name
                                                        
                                char *cwdpath = NULL;
@@ -589,7 +763,7 @@ string MothurOut::getFullPathName(string fileName){
                                        
                                int index = dirs.size()-1;
                                        
-                               while((pos = path.rfind(".\\")) != -1) { //while you don't have a complete path
+                               while((pos = path.rfind(".\\")) != string::npos) { //while you don't have a complete path
                                        if (pos == 0) { break;  //you are at the end
                                        }else if (path[(pos-1)] == '.') { //you want your parent directory ../
                                                path = path.substr(0, pos-1);
@@ -622,7 +796,7 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle, string m){
        try {
                        //get full path name
                        string completeFileName = getFullPathName(fileName);
-
+#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)
 #ifdef USE_COMPRESSION
       // check for gzipped or bzipped file
       if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
@@ -637,7 +811,7 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle, string m){
           cerr << "Decompressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
           system(command.c_str());
           cerr << "Done decompressing " << completeFileName << "\n";
-          remove(tempName.c_str());
+          mothurRemove(tempName);
           exit(EXIT_SUCCESS);
         } else {
           cerr << "waiting on child process " << fork_result << "\n";
@@ -645,9 +819,10 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle, string m){
         }
       }
 #endif
-
+#endif
                        fileHandle.open(completeFileName.c_str());
                        if(!fileHandle) {
+                               //mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
                                return 1;
                        }else {
                                //check for blank file
@@ -667,7 +842,7 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle){
 
                //get full path name
                string completeFileName = getFullPathName(fileName);
-
+#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)
 #ifdef USE_COMPRESSION
   // check for gzipped or bzipped file
   if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
@@ -682,7 +857,7 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle){
       cerr << "Decompressing " << completeFileName << " via temporary named pipe " << tempName << "\n";
       system(command.c_str());
       cerr << "Done decompressing " << completeFileName << "\n";
-      remove(tempName.c_str());
+      mothurRemove(tempName);
       exit(EXIT_SUCCESS);
     } else {
       cerr << "waiting on child process " << fork_result << "\n";
@@ -690,7 +865,7 @@ int MothurOut::openInputFile(string fileName, ifstream& fileHandle){
     }
   }
 #endif
-
+#endif
 
                fileHandle.open(completeFileName.c_str());
                if(!fileHandle) {
@@ -716,10 +891,10 @@ int MothurOut::renameFile(string oldName, string newName){
        try {
                ifstream inTest;
                int exist = openInputFile(newName, inTest, "");
+               inTest.close();
                
        #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)           
                if (exist == 0) { //you could open it so you want to delete it
-                       inTest.close();
                        string command = "rm " + newName;
                        system(command.c_str());
                }
@@ -727,7 +902,7 @@ int MothurOut::renameFile(string oldName, string newName){
                string command = "mv " + oldName + " " + newName;
                system(command.c_str());
        #else
-               remove(newName.c_str());
+               mothurRemove(newName);
                int renameOk = rename(oldName.c_str(), newName.c_str());
        #endif
                return 0;
@@ -745,7 +920,7 @@ int MothurOut::openOutputFile(string fileName, ofstream& fileHandle){
        try { 
        
                string completeFileName = getFullPathName(fileName);
-
+#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)
 #ifdef USE_COMPRESSION
     // check for gzipped file
     if (endsWith(completeFileName, ".gz") || endsWith(completeFileName, ".bz2")) {
@@ -765,7 +940,7 @@ int MothurOut::openOutputFile(string fileName, ofstream& fileHandle){
       }
     }
 #endif
-
+#endif
                fileHandle.open(completeFileName.c_str(), ios::trunc);
                if(!fileHandle) {
                        mothurOut("[ERROR]: Could not open " + completeFileName); mothurOutEndLine();
@@ -783,7 +958,7 @@ int MothurOut::openOutputFile(string fileName, ofstream& fileHandle){
 }
 
 /**************************************************************************************************/
-void MothurOut::appendFiles(string temp, string filename) {
+int MothurOut::appendFiles(string temp, string filename) {
        try{
                ofstream output;
                ifstream input;
@@ -791,16 +966,20 @@ void MothurOut::appendFiles(string temp, string filename) {
                //open output file in append mode
                openOutputFileAppend(filename, output);
                int ableToOpen = openInputFile(temp, input, "no error");
+               //int ableToOpen = openInputFile(temp, input);
                
+               int numLines = 0;
                if (ableToOpen == 0) { //you opened it
                        while(char c = input.get()){
                                if(input.eof())         {       break;                  }
-                               else                            {       output << c;    }
+                               else                            {       output << c;    if (c == '\n') {numLines++;} }
                        }
                        input.close();
                }
                
                output.close();
+               
+               return numLines;
        }
        catch(exception& e) {
                errorOut(e, "MothurOut", "appendFiles");
@@ -862,8 +1041,8 @@ string MothurOut::sortFile(string distFile, string outputDir){
                        output.close();
                
                        //remove temp files
-                       remove(tempDistFile.c_str());
-                       remove(tempOutfile.c_str());
+                       mothurRemove(tempDistFile);
+                       mothurRemove(tempOutfile);
                #endif
                
                return outfile;
@@ -874,19 +1053,27 @@ string MothurOut::sortFile(string distFile, string outputDir){
        }       
 }
 /**************************************************************************************************/
-vector<unsigned long int> MothurOut::setFilePosFasta(string filename, int& num) {
+vector<unsigned long long> MothurOut::setFilePosFasta(string filename, int& num) {
        try {
-                       vector<unsigned long int> positions;
+                       vector<unsigned long long> positions;
                        ifstream inFASTA;
-                       openInputFile(filename, inFASTA);
+                       //openInputFile(filename, inFASTA);
+                       inFASTA.open(filename.c_str(), ios::binary);
                                                
                        string input;
+                       unsigned long long count = 0;
                        while(!inFASTA.eof()){
-                               input = getline(inFASTA); 
-                               if (input.length() != 0) {
-                                       if(input[0] == '>'){    unsigned long int pos = inFASTA.tellg(); positions.push_back(pos - input.length() - 1); }
+                               //input = getline(inFASTA); 
+                               //cout << input << '\t' << inFASTA.tellg() << endl;
+                               //if (input.length() != 0) {
+                               //      if(input[0] == '>'){    unsigned long int pos = inFASTA.tellg(); positions.push_back(pos - input.length() - 1);  cout << (pos - input.length() - 1) << endl; }
+                               //}
+                               //gobble(inFASTA); //has to be here since windows line endings are 2 characters and mess up the positions
+                               char c = inFASTA.get(); count++;
+                               if (c == '>') {
+                                       positions.push_back(count-1);
+                                       //cout << count << endl;
                                }
-                               gobble(inFASTA); //has to be here since windows line endings are 2 characters and mess up the positions
                        }
                        inFASTA.close();
                
@@ -904,19 +1091,20 @@ vector<unsigned long int> MothurOut::setFilePosFasta(string filename, int& num)
                                fclose (pFile);
                        }*/
                        
-                       unsigned long int size = positions[(positions.size()-1)];
+                       unsigned long long size = positions[(positions.size()-1)];
                        ifstream in;
                        openInputFile(filename, in);
                        
                        in.seekg(size);
                
-                       while(char c = in.get()){
+                       while(in.get()){
                                if(in.eof())            {       break;  }
                                else                            {       size++; }
                        }
                        in.close();
                
                        positions.push_back(size);
+                       positions[0] = 0;
                
                        return positions;
        }
@@ -926,31 +1114,51 @@ vector<unsigned long int> MothurOut::setFilePosFasta(string filename, int& num)
        }
 }
 /**************************************************************************************************/
-vector<unsigned long int> MothurOut::setFilePosEachLine(string filename, int& num) {
+vector<unsigned long long> MothurOut::setFilePosEachLine(string filename, int& num) {
        try {
                        filename = getFullPathName(filename);
                        
-                       vector<unsigned long int> positions;
+                       vector<unsigned long long> positions;
                        ifstream in;
-                       openInputFile(filename, in);
-                               
+                       //openInputFile(filename, in);
+                       in.open(filename.c_str(), ios::binary);
+               
                        string input;
+                       unsigned long long count = 0;
+                       positions.push_back(0);
+               
                        while(!in.eof()){
-                               unsigned long int lastpos = in.tellg();
-                               input = getline(in); 
-                               if (input.length() != 0) {
-                                       unsigned long int pos = in.tellg(); 
-                                       if (pos != -1) { positions.push_back(pos - input.length() - 1); }
-                                       else {  positions.push_back(lastpos);  }
+                               //unsigned long long lastpos = in.tellg();
+                               //input = getline(in); 
+                               //if (input.length() != 0) {
+                                       //unsigned long long pos = in.tellg(); 
+                                       //if (pos != -1) { positions.push_back(pos - input.length() - 1);       }
+                                       //else {  positions.push_back(lastpos);  }
+                               //}
+                               //gobble(in); //has to be here since windows line endings are 2 characters and mess up the positions
+                               
+                               
+                               //getline counting reads
+                               char d = in.get(); count++;
+                               while ((d != '\n') && (d != '\r') && (d != '\f') && (d != in.eof()))    {
+                                       //get next character
+                                       d = in.get(); 
+                                       count++;
+                               }
+                               
+                               if (!in.eof()) {
+                                       d=in.get(); count++;
+                                       while(isspace(d) && (d != in.eof()))            { d=in.get(); count++;}
                                }
-                               gobble(in); //has to be here since windows line endings are 2 characters and mess up the positions
+                               positions.push_back(count-1);
+                               cout << count-1 << endl;
                        }
                        in.close();
                
-                       num = positions.size();
+                       num = positions.size()-1;
                
                        FILE * pFile;
-                       unsigned long int size;
+                       unsigned long long size;
                        
                        //get num bytes in file
                        pFile = fopen (filename.c_str(),"rb");
@@ -961,7 +1169,7 @@ vector<unsigned long int> MothurOut::setFilePosEachLine(string filename, int& nu
                                fclose (pFile);
                        }
                
-                       positions.push_back(size);
+                       positions[(positions.size()-1)] = size;
                
                        return positions;
        }
@@ -972,17 +1180,16 @@ vector<unsigned long int> MothurOut::setFilePosEachLine(string filename, int& nu
 }
 /**************************************************************************************************/
 
-vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
+vector<unsigned long long> MothurOut::divideFile(string filename, int& proc) {
        try{
-       
-               vector<unsigned long int> filePos;
+               vector<unsigned long long> filePos;
                filePos.push_back(0);
                
                FILE * pFile;
-               unsigned long int size;
+               unsigned long long size;
                
                filename = getFullPathName(filename);
-               
+       
                //get num bytes in file
                pFile = fopen (filename.c_str(),"rb");
                if (pFile==NULL) perror ("Error opening file");
@@ -991,9 +1198,11 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
                        size=ftell (pFile);
                        fclose (pFile);
                }
-       
+               
+       #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux)
+                               
                //estimate file breaks
-               unsigned long int chunkSize = 0;
+               unsigned long long chunkSize = 0;
                chunkSize = size / proc;
 
                //file to small to divide by processors
@@ -1001,21 +1210,24 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
        
                //for each process seekg to closest file break and search for next '>' char. make that the filebreak
                for (int i = 0; i < proc; i++) {
-                       unsigned long int spot = (i+1) * chunkSize;
+                       unsigned long long spot = (i+1) * chunkSize;
                        
                        ifstream in;
                        openInputFile(filename, in);
                        in.seekg(spot);
                        
                        //look for next '>'
-                       unsigned long int newSpot = spot;
+                       unsigned long long newSpot = spot;
                        while (!in.eof()) {
                           char c = in.get();
+                               
                           if (c == '>') {   in.putback(c); newSpot = in.tellg(); break;  }
+                          else if (int(c) == -1) { break; }
+                               
                        }
                
                        //there was not another sequence before the end of the file
-                       unsigned long int sanityPos = in.tellg();
+                       unsigned long long sanityPos = in.tellg();
 
                        if (sanityPos == -1) {  break;  }
                        else {  filePos.push_back(newSpot);  }
@@ -1025,14 +1237,18 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
                
                //save end pos
                filePos.push_back(size);
-
+               
                //sanity check filePos
                for (int i = 0; i < (filePos.size()-1); i++) {
-                       if (filePos[(i+1)] <= filePos[i]) {  cout << "erasing " << (i+1) << endl; filePos.erase(filePos.begin()+(i+1)); i--; }
+                       if (filePos[(i+1)] <= filePos[i]) {  filePos.erase(filePos.begin()+(i+1)); i--; }
                }
 
                proc = (filePos.size() - 1);
-               
+#else
+               mothurOut("[ERROR]: Windows version should not be calling the divideFile function."); mothurOutEndLine();
+               proc=1;
+               filePos.push_back(size);
+#endif
                return filePos;
        }
        catch(exception& e) {
@@ -1040,7 +1256,43 @@ vector<unsigned long int> MothurOut::divideFile(string filename, int& proc) {
                exit(1);
        }
 }
-
+/**************************************************************************************************/
+// Splits filename into one temporary file per chunk reported by
+// divideFile(filename, proc) and records the name of every file written.
+//   filename - file to split; chunk i is written to filename + "." + i + ".tmp"
+//   proc     - passed by reference to divideFile(filename, proc)
+//   files    - receives the chunk file names, appended in chunk order
+// Returns 0. Exceptions are reported through errorOut and the program exits.
+int MothurOut::divideFile(string filename, int& proc, vector<string>& files) {
+       try{
+
+               vector<unsigned long long> filePos = divideFile(filename, proc);
+
+               for (int i = 0; i < (filePos.size()-1); i++) {
+
+                       //read file chunk
+                       ifstream in;
+                       openInputFile(filename, in);
+                       in.seekg(filePos[i]);
+                       unsigned long long size = filePos[(i+1)] - filePos[i];
+
+                       //vector owns the buffer, so it is released even if something below throws
+                       vector<char> chunk(size);
+                       streamsize numRead = 0;
+                       if (size != 0) {
+                               in.read(&chunk[0], size);
+                               numRead = in.gcount(); //may be short if the file ended early
+                       }
+                       in.close();
+
+                       //open new file
+                       string fileChunkName = filename + "." + toString(i) + ".tmp";
+                       ofstream out;
+                       openOutputFile(fileChunkName, out);
+
+                       //the buffer is raw bytes with no terminating '\0', so it must not be
+                       //streamed as a C string; write exactly the bytes that were read
+                       if (numRead > 0) { out.write(&chunk[0], numRead); }
+                       out << endl;
+                       out.close();
+
+                       //save name
+                       files.push_back(fileChunkName);
+               }
+
+               return 0;
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "divideFile");
+               exit(1);
+       }
+}
 /***********************************************************************/
 
 bool MothurOut::isTrue(string f){
@@ -1079,6 +1331,127 @@ float MothurOut::ceilDist(float dist, int precision){
                exit(1);
        }
 }
+/**********************************************************************************************************************/
+// Loads a names file into nameMap.
+// Each record is two whitespace-delimited tokens; the first token becomes the
+// key and the second token is stored unchanged as the value. A key that occurs
+// more than once keeps the value read last.
+//   namefile - file to read (opened with openInputFile)
+//   nameMap  - receives one entry per record; existing entries are kept
+// Reading stops early when control_pressed is set. Returns 0.
+// Exceptions are reported through errorOut and the program exits.
+int MothurOut::readNames(string namefile, map<string, string>& nameMap) { 
+       try {
+
+               //open input file
+               ifstream in;
+               openInputFile(namefile, in);
+
+               while (!in.eof()) {
+                       if (control_pressed) { break; }
+
+                       string firstCol, secondCol;
+                       in >> firstCol >> secondCol; gobble(in);
+
+                       //no first token means nothing was extracted (empty file or a stream
+                       //in a failed state); stop rather than store a "" entry or spin forever
+                       if (firstCol.empty()) { break; }
+
+                       nameMap[firstCol] = secondCol;
+               }
+               in.close();
+
+               return 0;
+
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "readNames");
+               exit(1);
+       }
+}
+/**********************************************************************************************************************/
+// Loads a names file into nameMap, storing the second column as a list.
+// Each record is two whitespace-delimited tokens; the first token becomes the
+// key and the second token is passed to splitAtComma to build the value
+// (presumably one element per comma-separated name - confirm in splitAtComma).
+//   namefile - file to read (opened with openInputFile)
+//   nameMap  - receives one entry per record; existing entries are kept
+// Reading stops early when control_pressed is set. Returns 0.
+// Exceptions are reported through errorOut and the program exits.
+int MothurOut::readNames(string namefile, map<string, vector<string> >& nameMap) { 
+       try {
+
+               //open input file
+               ifstream in;
+               openInputFile(namefile, in);
+
+               while (!in.eof()) {
+                       if (control_pressed) { break; }
+
+                       string firstCol, secondCol;
+                       in >> firstCol >> secondCol; gobble(in);
+
+                       //no first token means nothing was extracted (empty file or a stream
+                       //in a failed state); stop rather than store a "" entry or spin forever
+                       if (firstCol.empty()) { break; }
+
+                       vector<string> temp;
+                       splitAtComma(secondCol, temp);
+
+                       nameMap[firstCol] = temp;
+               }
+               in.close();
+
+               return 0;
+
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "readNames");
+               exit(1);
+       }
+}
+/**********************************************************************************************************************/
+// Loads a names file and returns, for each first-column name, the value
+// getNumNames reports for the record's second column.
+// Each record is two whitespace-delimited tokens. A first-column name that
+// occurs more than once keeps the value computed last.
+//   namefile - file to read (opened with openInputFile)
+// Reading stops early when control_pressed is set; whatever was read up to
+// that point is returned.
+// Exceptions are reported through errorOut and the program exits.
+map<string, int> MothurOut::readNames(string namefile) { 
+       try {
+
+               map<string, int> nameMap;
+
+               //open input file
+               ifstream in;
+               openInputFile(namefile, in);
+
+               while (!in.eof()) {
+                       if (control_pressed) { break; }
+
+                       string firstCol, secondCol;
+                       in >> firstCol >> secondCol; gobble(in);
+
+                       //no first token means nothing was extracted (empty file or a stream
+                       //in a failed state); stop rather than store a "" entry or spin forever
+                       if (firstCol.empty()) { break; }
+
+                       int num = getNumNames(secondCol);
+
+                       nameMap[firstCol] = num;
+               }
+               in.close();
+
+               return nameMap;
+
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "readNames");
+               exit(1);
+       }
+}
+/**********************************************************************************************************************/
+// Loads a names file and, for every record whose first-column name is a key of
+// fastamap, appends a seqPriorityNode built from (getNumNames(second column),
+// the fastamap value for that name, the name itself) to nameVector.
+// Each record is two whitespace-delimited tokens.
+//   namefile   - file to read (opened with openInputFile)
+//   nameVector - receives one node per matched record, in file order
+//   fastamap   - lookup keyed by name; only read, never modified here
+// Returns 0 when every name was found in fastamap, 1 if at least one was
+// missing (an [ERROR] line is printed for each missing name).
+// Reading stops early when control_pressed is set.
+// Exceptions are reported through errorOut and the program exits.
+int MothurOut::readNames(string namefile, vector<seqPriorityNode>& nameVector, map<string, string>& fastamap) { 
+       try {
+               int error = 0;
+
+               //open input file
+               ifstream in;
+               openInputFile(namefile, in);
+
+               while (!in.eof()) {
+                       if (control_pressed) { break; }
+
+                       string firstCol, secondCol;
+                       in >> firstCol >> secondCol; gobble(in);
+
+                       //no first token means nothing was extracted (empty file or a stream
+                       //in a failed state); stop rather than report a bogus missing name
+                       //or spin forever
+                       if (firstCol.empty()) { break; }
+
+                       int num = getNumNames(secondCol);
+
+                       map<string, string>::iterator it = fastamap.find(firstCol);
+                       if (it == fastamap.end()) {
+                               error = 1;
+                               mothurOut("[ERROR]: " + firstCol + " is not in your fastafile, but is in your namesfile, please correct."); mothurOutEndLine();
+                       }else {
+                               seqPriorityNode temp(num, it->second, firstCol);
+                               nameVector.push_back(temp);
+                       }
+               }
+               in.close();
+
+               return error;
+
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "readNames");
+               exit(1);
+       }
+}
 
 /***********************************************************************/
 
@@ -1102,7 +1475,25 @@ int MothurOut::getNumNames(string names){
                exit(1);
        }
 }
+/***********************************************************************/
 
+// Deletes a file from disk.
+//   filename - file to delete; it is expanded with getFullPathName first
+// Returns whatever remove() returns for the expanded path. Nothing is printed
+// when the deletion fails; the caller decides what to do with the result.
+// Exceptions are reported through errorOut and the program exits.
+int MothurOut::mothurRemove(string filename){
+       try {
+               const string fullPath = getFullPathName(filename);
+               return remove(fullPath.c_str());
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "mothurRemove");
+               exit(1);
+       }
+}
 /**************************************************************************************************/
 
 vector<vector<double> > MothurOut::binomial(int maxOrder){
@@ -1139,7 +1530,90 @@ vector<vector<double> > MothurOut::binomial(int maxOrder){
                exit(1);
        }
 }
-
+/**************************************************************************************************/
+// Converts a base-36 string to an unsigned integer, most significant
+// character first.
+// Digit values used by this encoding (letters come BEFORE numerals):
+//   'A'-'Z' and 'a'-'z' -> 0..25   (case-insensitive)
+//   '0'-'9'             -> 26..35
+//   any other character -> 0
+//   base36 - text to convert; an empty string yields 0
+// Returns the accumulated value; unsigned arithmetic wraps on overflow.
+// Exceptions are reported through errorOut and the program exits.
+unsigned int MothurOut::fromBase36(string base36){
+       try {
+               unsigned int num = 0;
+
+               for (string::size_type i = 0; i < base36.length(); i++) {
+                       const char c = base36[i];
+
+                       //range checks replace a lookup table that was rebuilt on every call;
+                       //assumes letters and numerals are contiguous in the character set
+                       unsigned int digit = 0;
+                       if ((c >= 'A') && (c <= 'Z'))      { digit = c - 'A';        }
+                       else if ((c >= 'a') && (c <= 'z')) { digit = c - 'a';        }
+                       else if ((c >= '0') && (c <= '9')) { digit = 26 + (c - '0'); }
+
+                       num = 36 * num + digit;
+               }
+
+               return num;
+
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "fromBase36");
+               exit(1);
+       }
+}
 /***********************************************************************/
 
 int MothurOut::factorial(int num){
@@ -1205,17 +1679,6 @@ void MothurOut::splitAtChar(string& estim, vector<string>& container, char symbo
                }
                container.push_back(individual);
 
-               /*
-               
-               while (estim.find_first_of(symbol) != -1) {
-                       individual = estim.substr(0,estim.find_first_of(symbol));
-                       if ((estim.find_first_of(symbol)+1) <= estim.length()) { //checks to make sure you don't have dash at end of string
-                               estim = estim.substr(estim.find_first_of(symbol)+1, estim.length());
-                               container.push_back(individual);
-                       }
-               }
-               //get last one
-               container.push_back(estim); */
        }
        catch(exception& e) {
                errorOut(e, "MothurOut", "splitAtChar");
@@ -1450,20 +1913,21 @@ bool MothurOut::anyLabelsToProcess(string label, set<string>& userLabels, string
                }
                
                //go through users set and make them floats
-               for(it = userLabels.begin(); it != userLabels.end(); ++it) {
+               for(it = userLabels.begin(); it != userLabels.end();) {
                        
                        float temp;
                        if ((*it != "unique") && (convertTestFloat(*it, temp) == true)){
                                convert(*it, temp);
                                orderFloat.push_back(temp);
                                userMap[*it] = temp;
+                               it++;
                        }else if (*it == "unique") { 
                                orderFloat.push_back(-1.0);
                                userMap["unique"] = -1.0;
+                               it++;
                        }else {
-                               if (errorOff == "") {  cout << *it << " is not a valid label." << endl;  }
-                               userLabels.erase(*it); 
-                               it--;
+                               if (errorOff == "") {  mothurOut(*it + " is not a valid label."); mothurOutEndLine();  }
+                               userLabels.erase(it++); 
                        }
                }
                
@@ -1479,11 +1943,11 @@ bool MothurOut::anyLabelsToProcess(string label, set<string>& userLabels, string
                        if (orderFloat[i] < labelFloat) {
                                smaller = true;
                                if (orderFloat[i] == -1) { 
-                                       if (errorOff == "") { cout << "Your file does not include the label unique." << endl; }
+                                       if (errorOff == "") { mothurOut("Your file does not include the label unique."); mothurOutEndLine(); }
                                        userLabels.erase("unique");
                                }
                                else {  
-                                       if (errorOff == "") { cout << "Your file does not include the label " << endl; }
+                                       if (errorOff == "") { mothurOut("Your file does not include the label "); mothurOutEndLine(); }
                                        string s = "";
                                        for (it2 = userMap.begin(); it2!= userMap.end(); it2++) {  
                                                if (it2->second == orderFloat[i]) {  
@@ -1493,7 +1957,7 @@ bool MothurOut::anyLabelsToProcess(string label, set<string>& userLabels, string
                                                        break;
                                                }
                                        }
-                                       if (errorOff == "") {cout << s <<  ". I will use the next smallest distance. " << endl; }
+                                       if (errorOff == "") {mothurOut( s +  ". I will use the next smallest distance. "); mothurOutEndLine(); }
                                }
                        //since they are sorted once you find a bigger one stop looking
                        }else { break; }
@@ -1554,6 +2018,63 @@ bool MothurOut::checkReleaseVersion(ifstream& file, string version) {
        }
 }
 /**************************************************************************************************/
+// Reports whether input is made up solely of decimal digit characters.
+//   input - text to inspect
+// Returns false as soon as a character outside codes 48..57 is found,
+// true otherwise. An empty string therefore returns true.
+// Exceptions are reported through errorOut and the program exits.
+bool MothurOut::isContainingOnlyDigits(string input) {
+       try{
+
+               string::size_type idx = 0;
+               while (idx < input.length()) {
+                       //character codes 48..57 are '0'..'9' in ascii
+                       const char ch = input[idx];
+                       if ((ch <= 47) || (ch >= 58)) { return false; }
+                       ++idx;
+               }
+
+               return true;
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "isContainingOnlyDigits");             
+               exit(1);
+       }
+}
+/**************************************************************************************************/
+// Strips numeric confidence scores from a ';'-delimited taxonomy string.
+// tax is consumed one ';'-terminated taxon at a time. If a taxon contains both
+// '(' and ')', and the text between the LAST '(' and the LAST ')' passes
+// isContainingOnlyDigits, everything from that '(' onward is dropped. Each
+// taxon is then re-emitted followed by ';'.
+//   tax - in/out; replaced by the rebuilt string. Any text after the final
+//         ';' is discarded.
+// Returns 0. If control_pressed is set part-way through, returns 0 at once
+// and tax is left holding only the portion that had not been processed yet.
+// Exceptions are reported through errorOut and the program exits.
+int MothurOut::removeConfidences(string& tax) {
+       try {
+
+               string rebuilt = "";
+
+               for (;;) {
+                       const string::size_type semi = tax.find_first_of(';');
+                       if (semi == string::npos) { break; }
+
+                       if (control_pressed) { return 0; }
+
+                       //text of the current taxon, without its ';'
+                       string taxon = tax.substr(0, semi);
+
+                       const string::size_type openParen = taxon.find_last_of('(');
+                       const string::size_type closeParen = taxon.find_last_of(')');
+                       if ((openParen != string::npos) && (closeParen != string::npos)) {
+                               //is it a number?
+                               const string confidenceScore = taxon.substr(openParen+1, (closeParen-(openParen+1)));
+                               if (isContainingOnlyDigits(confidenceScore)) {
+                                       taxon = taxon.substr(0, openParen); //rip off confidence
+                               }
+                       }
+
+                       rebuilt += taxon;
+                       rebuilt += ";";
+
+                       //drop the taxon just handled from the front of tax
+                       tax = tax.substr(semi+1, tax.length());
+               }
+
+               tax = rebuilt;
+
+               return 0;
+       }
+       catch(exception& e) {
+               errorOut(e, "MothurOut", "removeConfidences");
+               exit(1);
+       }
+}
+/**************************************************************************************************/