X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;f=rarefactcommand.cpp;h=8d1cfc864d35d12d2127672f68af60802cd8b02d;hb=1b0bddfbf4ac5df7e2dad03c8a5350e71b052f78;hp=8d883aa64ae03c4e0619b0669f3b29fafd752435;hpb=55386dddad84cc1140d736cabaf4dd0ae16f2e01;p=mothur.git diff --git a/rarefactcommand.cpp b/rarefactcommand.cpp index 8d883aa..8d1cfc8 100644 --- a/rarefactcommand.cpp +++ b/rarefactcommand.cpp @@ -38,6 +38,7 @@ vector RareFactCommand::setParameters(){ CommandParameter pcalc("calc", "Multiple", "sobs-chao-nseqs-coverage-ace-jack-shannon-shannoneven-npshannon-heip-smithwilson-simpson-simpsoneven-invsimpson-bootstrap", "sobs", "", "", "",true,false); parameters.push_back(pcalc); CommandParameter pabund("abund", "Number", "", "10", "", "", "",false,false); parameters.push_back(pabund); CommandParameter pprocessors("processors", "Number", "", "1", "", "", "",false,false); parameters.push_back(pprocessors); + CommandParameter pgroupmode("groupmode", "Boolean", "", "T", "", "", "",false,false); parameters.push_back(pgroupmode); CommandParameter pinputdir("inputdir", "String", "", "", "", "", "",false,false); parameters.push_back(pinputdir); CommandParameter poutputdir("outputdir", "String", "", "", "", "", "",false,false); parameters.push_back(poutputdir); @@ -63,6 +64,7 @@ string RareFactCommand::getHelpString(){ helpString += "Example rarefaction.single(label=unique-.01-.03, iters=10000, freq=10, calc=sobs-rchao-race-rjack-rbootstrap-rshannon-rnpshannon-rsimpson).\n"; helpString += "The default values for iters is 1000, freq is 100, and calc is rarefaction which calculates the rarefaction curve for the observed richness.\n"; validCalculator.printCalc("rarefaction"); + helpString += "If you are running rarefaction.single with a shared file and would like your results collated in one file, set groupmode=t. (Default=true).\n"; helpString += "The label parameter is used to analyze specific labels in your input.\n"; helpString += "Note: No spaces between parameter labels (i.e. freq), '=' and parameters (i.e.yourFreq).\n"; return helpString; @@ -262,6 +264,9 @@ RareFactCommand::RareFactCommand(string option) { temp = validParameter.validFile(parameters, "processors", false); if (temp == "not found"){ temp = m->getProcessors(); } m->setProcessors(temp); convert(temp, processors); + + temp = validParameter.validFile(parameters, "groupmode", false); if (temp == "not found") { temp = "T"; } + groupMode = m->isTrue(temp); } } @@ -282,6 +287,7 @@ int RareFactCommand::execute(){ if (m->control_pressed) { return 0; } + map nameMap; for (int p = 0; p < inputFileNames.size(); p++) { string fileNameRoot = outputDir + m->getRootName(m->getSimpleName(inputFileNames[p])); @@ -290,6 +296,7 @@ int RareFactCommand::execute(){ if (inputFileNames.size() > 1) { m->mothurOutEndLine(); m->mothurOut("Processing group " + groups[p]); m->mothurOutEndLine(); m->mothurOutEndLine(); + nameMap[fileNameRoot] = groups[p]; } int i; ValidCalculators validCalculator; @@ -440,6 +447,11 @@ int RareFactCommand::execute(){ } + if (m->control_pressed) { for (int i = 0; i < outputNames.size(); i++) { m->mothurRemove(outputNames[i]); } return 0; } + + //create summary file containing all the groups data for each label - this function just combines the info from the files already created. + if ((sharedfile != "") && (groupMode)) { outputNames = createGroupFile(outputNames, nameMap); } + if (m->control_pressed) { for (int i = 0; i < outputNames.size(); i++) { m->mothurRemove(outputNames[i]); } return 0; } m->mothurOutEndLine(); @@ -455,6 +467,136 @@ int RareFactCommand::execute(){ } } //********************************************************************************************************************** +vector RareFactCommand::createGroupFile(vector& outputNames, map nameMap) { + try { + + vector newFileNames; + + //find different types of files + map > typesFiles; + for (int i = 0; i < outputNames.size(); i++) { + string extension = m->getExtension(outputNames[i]); + + ifstream in; + m->openInputFile(outputNames[i], in); + + string labels = m->getline(in); + string newLine = labels.substr(0, labels.find_first_of('\t')); + + newLine += "\tGroup" + labels.substr(labels.find_first_of('\t')); + + typesFiles[extension].push_back(outputNames[i]); + + string combineFileName = outputDir + m->getRootName(m->getSimpleName(sharedfile)) + "groups" + extension; + + //print headers + ofstream out; + m->openOutputFile(combineFileName, out); + out << newLine << endl; + out.close(); + + } + + //for each type create a combo file + map lineToNumber; + for (map >::iterator it = typesFiles.begin(); it != typesFiles.end(); it++) { + + ofstream out; + string combineFileName = outputDir + m->getRootName(m->getSimpleName(sharedfile)) + "groups" + it->first; + m->openOutputFileAppend(combineFileName, out); + newFileNames.push_back(combineFileName); + + vector thisTypesFiles = it->second; + + //open each type summary file + map > files; //maps file name to lines in file + int maxLines = 0; + int numColumns = 0; + for (int i=0; iopenInputFile(thisTypesFiles[i], temp); + + //read through first line - labels + m->getline(temp); m->gobble(temp); + + vector thisFilesLines; + string fileNameRoot = m->getRootName(thisTypesFiles[i]); + map::iterator itName = nameMap.find(fileNameRoot); + string group = ""; + if (itName != nameMap.end()) { + group = itName->second; + }else { + group = "not found" + i; + m->mothurOut("[ERROR]: can't parse filename."); m->mothurOutEndLine(); + } + + thisFilesLines.push_back(group); + int count = 1; + while (!temp.eof()){ + + string thisLine = m->getline(temp); + + string numSampled = thisLine.substr(0, thisLine.find_first_of('\t')); + int num = 0; + convert(numSampled, num); + numColumns = m->getNumChar(thisLine, '\t'); + lineToNumber[count] = num; + count++; + + thisFilesLines.push_back(thisLine); + + m->gobble(temp); + } + + files[thisTypesFiles[i]] = thisFilesLines; + + //save longest file for below + if (maxLines < thisFilesLines.size()) { maxLines = thisFilesLines.size(); } + + temp.close(); + m->mothurRemove(thisTypesFiles[i]); + } + + + //for each label + for (int k = 1; k < maxLines; k++) { + + //grab data for each group + for (int i=0; i::iterator itLine = lineToNumber.find(k); + if (itLine != lineToNumber.end()) { + string output = toString(itLine->second); + if (k < files[thisTypesFiles[i]].size()) { + string line = files[thisTypesFiles[i]][k]; + output = line.substr(0, line.find_first_of('\t')); + output += '\t' + files[thisTypesFiles[i]][0] + '\t' + line.substr(line.find_first_of('\t')); + }else{ + output += '\t' + files[thisTypesFiles[i]][0] + '\t'; + for (int h = 0; h < numColumns; h++) { + output += "NA\t"; + } + } + out << output << endl; + }else { m->mothurOut("[ERROR]: parsing results, cant find " + toString(k)); m->mothurOutEndLine(); } + } + } + + out.close(); + + } + + //return combine file name + return newFileNames; + + } + catch(exception& e) { + m->errorOut(e, "RareFactCommand", "createGroupFile"); + exit(1); + } +} +//********************************************************************************************************************** vector RareFactCommand::parseSharedFile(string filename) { try { vector filenames;