temp = validParameter.validFile(parameters, "dereplicate", false);
- if (temp == "not found") {
- if (groupfile != "") { temp = "false"; }
- else { temp = "true"; }
- }
+ if (temp == "not found") { temp = "false"; }
dups = m->isTrue(temp);
int error;
if (hasCount) {
CountTable ct;
- ct.readTable(nameFile);
+ ct.readTable(nameFile, true);
for(map<string, string>::iterator it = seqs.begin(); it != seqs.end(); it++) {
int num = ct.getNumSeqs(it->first);
if (num == 0) { error = 1; }
if(processors == 1) { totalSeqs = driverGroups(outputFileName, newFasta, accnosFileName, alnsFileName, newCountFile, 0, groups.size(), groups);
- //read my own
- if (hasCount && !dups) {
- CountTable newCount; newCount.readTable(nameFile);
-
+ if (hasCount && dups) {
+ CountTable c; c.readTable(nameFile, true);
if (!m->isBlank(newCountFile)) {
ifstream in2;
m->openInputFile(newCountFile, in2);
string name, group;
while (!in2.eof()) {
in2 >> name >> group; m->gobble(in2);
- newCount.setAbund(name, group, 0);
+ c.setAbund(name, group, 0);
}
in2.close();
}
m->mothurRemove(newCountFile);
- newCount.printTable(newCountFile);
+ c.printTable(newCountFile);
}
}else { totalSeqs = createProcessesGroups(outputFileName, newFasta, accnosFileName, alnsFileName, newCountFile, groups, nameFile, groupFile, fastaFileNames[s]); }
m->mothurOutEndLine(); m->mothurOut("It took " + toString(time(NULL) - start) + " secs to check " + toString(totalSeqs) + " sequences. " + toString(totalChimeras) + " chimeras were found."); m->mothurOutEndLine();
m->mothurOut("The number of sequences checked may be larger than the number of unique sequences because some sequences are found in several samples."); m->mothurOutEndLine();
}else {
- /*if (hasCount) { //removed empty seqs
+
+ if (hasCount) {
+ set<string> doNotRemove;
+ CountTable c; c.readTable(newCountFile, true);
+ vector<string> namesInTable = c.getNamesOfSeqs();
+ for (int i = 0; i < namesInTable.size(); i++) {
+ int temp = c.getNumSeqs(namesInTable[i]);
+ if (temp == 0) { c.remove(namesInTable[i]); }
+ else { doNotRemove.insert((namesInTable[i])); }
+ }
+ //remove names we want to keep from accnos file.
+ set<string> accnosNames = m->readAccnos(accnosFileName);
ofstream out2;
m->openOutputFile(accnosFileName, out2);
-
- CountTable c; c.readTable(newCountFile);
- vector<string> nseqs = c.getNamesOfSeqs();
- vector<string> ngroups = c.getNamesOfGroups();
- for (int l = 0; l < nseqs.size(); l++) {
- if (c.getNumSeqs(nseqs[l]) == 0) {
- c.remove(nseqs[l]);
- out2 << nseqs[l] << endl;
- }
- }
- for (int l = 0; l < ngroups.size(); l++) {
- if (c.getGroupCount(ngroups[l]) == 0) { c.removeGroup(ngroups[l]); }
+ for (set<string>::iterator it = accnosNames.begin(); it != accnosNames.end(); it++) {
+ if (doNotRemove.count(*it) == 0) { out2 << (*it) << endl; }
}
out2.close();
c.printTable(newCountFile);
- }*/
+ outputNames.push_back(newCountFile); outputTypes["count"].push_back(newCountFile);
+ }
}
if (hasCount) { delete cparser; }
if (itTypes != outputTypes.end()) {
if ((itTypes->second).size() != 0) { current = (itTypes->second)[0]; m->setAccnosFile(current); }
}
+
+ itTypes = outputTypes.find("count");
+ if (itTypes != outputTypes.end()) {
+ if ((itTypes->second).size() != 0) { current = (itTypes->second)[0]; m->setCountTableFile(current); }
+ }
m->mothurOutEndLine();
m->mothurOut("Output File Names: "); m->mothurOutEndLine();
map<string, string>::iterator itUnique;
int total = 0;
- //edit accnos file
- ifstream in2;
- m->openInputFile(accnosFileName, in2);
-
ofstream out2;
m->openOutputFile(accnosFileName+".temp", out2);
set<string> chimerasInFile;
set<string>::iterator itChimeras;
-
- while (!in2.eof()) {
- if (m->control_pressed) { in2.close(); out2.close(); m->mothurRemove(outputFileName); m->mothurRemove((accnosFileName+".temp")); return 0; }
-
- in2 >> name; m->gobble(in2);
-
- //find unique name
- itUnique = uniqueNames.find(name);
-
- if (itUnique == uniqueNames.end()) { m->mothurOut("[ERROR]: trouble parsing accnos results. Cannot find " + name + "."); m->mothurOutEndLine(); m->control_pressed = true; }
- else {
- itChimeras = chimerasInFile.find((itUnique->second));
-
- if (itChimeras == chimerasInFile.end()) {
- out2 << itUnique->second << endl;
- chimerasInFile.insert((itUnique->second));
- total++;
- }
- }
- }
- in2.close();
+ if (!m->isBlank(accnosFileName)) {
+ //edit accnos file
+ ifstream in2;
+ m->openInputFile(accnosFileName, in2);
+
+ while (!in2.eof()) {
+ if (m->control_pressed) { in2.close(); out2.close(); m->mothurRemove(outputFileName); m->mothurRemove((accnosFileName+".temp")); return 0; }
+
+ in2 >> name; m->gobble(in2);
+
+ //find unique name
+ itUnique = uniqueNames.find(name);
+
+ if (itUnique == uniqueNames.end()) { m->mothurOut("[ERROR]: trouble parsing accnos results. Cannot find " + name + "."); m->mothurOutEndLine(); m->control_pressed = true; }
+ else {
+ itChimeras = chimerasInFile.find((itUnique->second));
+
+ if (itChimeras == chimerasInFile.end()) {
+ out2 << itUnique->second << endl;
+ chimerasInFile.insert((itUnique->second));
+ total++;
+ }
+ }
+ }
+ in2.close();
+ }
out2.close();
m->mothurRemove(accnosFileName);
int totalSeqs = 0;
int numChimeras = 0;
+
ofstream outCountList;
if (hasCount && dups) { m->openOutputFile(countlist, outCountList); }
int num = 0;
CountTable newCount;
- if (hasCount && dups) { newCount.readTable(nameFile); }
+ if (hasCount && dups) { newCount.readTable(nameFile, true); }
//sanity check
if (groups.size() < processors) { processors = groups.size(); }
#endif
-
+
//read my own
if (hasCount && dups) {
if (!m->isBlank(accnos + ".byCount")) {
}
m->mothurRemove(accnos + ".byCount");
}
-
+
//append output files
for(int i=0;i<processIDS.size();i++){
m->appendFiles((outputFName + toString(processIDS[i]) + ".temp"), outputFName);
}
//print new *.pick.count_table
- if (hasCount && dups) { newCount.printTable(newCountFile); }
-
+ if (hasCount && dups) { newCount.printTable(newCountFile); }
+
return num;
}