X-Git-Url: https://git.donarmstrong.com/?p=mothur.git;a=blobdiff_plain;f=treemap.cpp;h=47b7cf343635e2d104db75114aa77fbe8007c466;hp=e472570895414a4ec535e10c5f02bee10dfea982;hb=1a20e24ee786195ab0e1cccd4f5aede7a88f3f4e;hpb=219104a887d4725af80487729f4c34a030fe4358 diff --git a/treemap.cpp b/treemap.cpp index e472570..47b7cf3 100644 --- a/treemap.cpp +++ b/treemap.cpp @@ -12,36 +12,194 @@ /************************************************************/ TreeMap::TreeMap(string filename) { + m = MothurOut::getInstance(); + ofstream out2; + m->openOutputFileAppend(filename, out2); + out2 << endl; out2.close(); groupFileName = filename; - openInputFile(filename, fileHandle); + m->openInputFile(filename, fileHandle); } /************************************************************/ TreeMap::~TreeMap(){} +/************************************************************/ +int TreeMap::readMap(string gf) { + try { + ofstream out2; + m->openOutputFileAppend(gf, out2); + out2 << endl; out2.close(); + + groupFileName = gf; + m->openInputFile(gf, fileHandle); + + string seqName, seqGroup; + int error = 0; + string rest = ""; + char buffer[4096]; + bool pairDone = false; + bool columnOne = true; + + while (!fileHandle.eof()) { + if (m->control_pressed) { fileHandle.close(); return 1; } + + fileHandle.read(buffer, 4096); + vector pieces = m->splitWhiteSpace(rest, buffer, fileHandle.gcount()); + + for (int i = 0; i < pieces.size(); i++) { + if (columnOne) { seqName = pieces[i]; columnOne=false; } + else { seqGroup = pieces[i]; pairDone = true; columnOne=true; } + + if (pairDone) { + setNamesOfGroups(seqGroup); + + map::iterator itCheck = treemap.find(seqName); + if (itCheck != treemap.end()) { error = 1; m->mothurOut("[WARNING]: Your groupfile contains more than 1 sequence named " + seqName + ", sequence names must be unique. Please correct."); m->mothurOutEndLine(); } + else { + namesOfSeqs.push_back(seqName); + treemap[seqName].groupname = seqGroup; //store data in map + + it2 = seqsPerGroup.find(seqGroup); + if (it2 == seqsPerGroup.end()) { //if it's a new group + seqsPerGroup[seqGroup] = 1; + }else {//it's a group we already have + seqsPerGroup[seqGroup]++; + } + } + pairDone = false; + } + } + } + fileHandle.close(); + + if (rest != "") { + vector pieces = m->splitWhiteSpace(rest); + + for (int i = 0; i < pieces.size(); i++) { + if (columnOne) { seqName = pieces[i]; columnOne=false; } + else { seqGroup = pieces[i]; pairDone = true; columnOne=true; } + + if (pairDone) { + setNamesOfGroups(seqGroup); + + map::iterator itCheck = treemap.find(seqName); + if (itCheck != treemap.end()) { error = 1; m->mothurOut("[WARNING]: Your groupfile contains more than 1 sequence named " + seqName + ", sequence names must be unique. Please correct."); m->mothurOutEndLine(); } + else { + namesOfSeqs.push_back(seqName); + treemap[seqName].groupname = seqGroup; //store data in map + + it2 = seqsPerGroup.find(seqGroup); + if (it2 == seqsPerGroup.end()) { //if it's a new group + seqsPerGroup[seqGroup] = 1; + }else {//it's a group we already have + seqsPerGroup[seqGroup]++; + } + } + pairDone = false; + } + } + } + + return error; + } + catch(exception& e) { + m->errorOut(e, "TreeMap", "readMap"); + exit(1); + } +} + +/************************************************************/ +int TreeMap::readMap() { + try { + string seqName, seqGroup; + int error = 0; + + string rest = ""; + char buffer[4096]; + bool pairDone = false; + bool columnOne = true; + + while (!fileHandle.eof()) { + if (m->control_pressed) { fileHandle.close(); return 1; } + + fileHandle.read(buffer, 4096); + vector pieces = m->splitWhiteSpace(rest, buffer, fileHandle.gcount()); + + for (int i = 0; i < pieces.size(); i++) { + if (columnOne) { seqName = pieces[i]; columnOne=false; } + else { seqGroup = pieces[i]; pairDone = true; columnOne=true; } + + if (pairDone) { + setNamesOfGroups(seqGroup); + + map::iterator itCheck = treemap.find(seqName); + if (itCheck != treemap.end()) { error = 1; m->mothurOut("[WARNING]: Your groupfile contains more than 1 sequence named " + seqName + ", sequence names must be unique. Please correct."); m->mothurOutEndLine(); } + else { + namesOfSeqs.push_back(seqName); + treemap[seqName].groupname = seqGroup; //store data in map + + it2 = seqsPerGroup.find(seqGroup); + if (it2 == seqsPerGroup.end()) { //if it's a new group + seqsPerGroup[seqGroup] = 1; + }else {//it's a group we already have + seqsPerGroup[seqGroup]++; + } + } + pairDone = false; + } + } + } + fileHandle.close(); + + if (rest != "") { + vector pieces = m->splitWhiteSpace(rest); + + for (int i = 0; i < pieces.size(); i++) { + if (columnOne) { seqName = pieces[i]; columnOne=false; } + else { seqGroup = pieces[i]; pairDone = true; columnOne=true; } + + if (pairDone) { + setNamesOfGroups(seqGroup); + + map::iterator itCheck = treemap.find(seqName); + if (itCheck != treemap.end()) { error = 1; m->mothurOut("[WARNING]: Your groupfile contains more than 1 sequence named " + seqName + ", sequence names must be unique. Please correct."); m->mothurOutEndLine(); } + else { + namesOfSeqs.push_back(seqName); + treemap[seqName].groupname = seqGroup; //store data in map + + it2 = seqsPerGroup.find(seqGroup); + if (it2 == seqsPerGroup.end()) { //if it's a new group + seqsPerGroup[seqGroup] = 1; + }else {//it's a group we already have + seqsPerGroup[seqGroup]++; + } + } + pairDone = false; + } + } + } + + return error; + } + catch(exception& e) { + m->errorOut(e, "TreeMap", "readMap"); + exit(1); + } +} /************************************************************/ -void TreeMap::readMap() { - string seqName, seqGroup; +void TreeMap::addSeq(string seqName, string seqGroup) { - while(fileHandle){ - fileHandle >> seqName; //read from first column - fileHandle >> seqGroup; //read from second column + namesOfSeqs.push_back(seqName); + setNamesOfGroups(seqGroup); + + treemap[seqName].groupname = seqGroup; //store data in map - namesOfSeqs.push_back(seqName); - setNamesOfGroups(seqGroup); - - treemap[seqName].groupname = seqGroup; //store data in map - - it2 = seqsPerGroup.find(seqGroup); - if (it2 == seqsPerGroup.end()) { //if it's a new group - seqsPerGroup[seqGroup] = 1; - }else {//it's a group we already have - seqsPerGroup[seqGroup]++; - } - - gobble(fileHandle); + it2 = seqsPerGroup.find(seqGroup); + if (it2 == seqsPerGroup.end()) { //if it's a new group + seqsPerGroup[seqGroup] = 1; + }else {//it's a group we already have + seqsPerGroup[seqGroup]++; } - fileHandle.close(); } /************************************************************/ void TreeMap::removeSeq(string seqName) { @@ -49,7 +207,7 @@ void TreeMap::removeSeq(string seqName) { //erase name from namesOfSeqs for (int i = 0; i < namesOfSeqs.size(); i++) { if (namesOfSeqs[i] == seqName) { - namesOfSeqs.erase (namesOfSeqs.begin()+i); + namesOfSeqs.erase(namesOfSeqs.begin()+i); break; } } @@ -61,8 +219,6 @@ void TreeMap::removeSeq(string seqName) { //remove seq from treemap it = treemap.find(seqName); treemap.erase(it); - - } /************************************************************/ @@ -90,26 +246,6 @@ string TreeMap::getGroup(string sequenceName) { return "not found"; } -} -/************************************************************/ -void TreeMap::setIndex(string seq, int index) { - it = treemap.find(seq); - if (it != treemap.end()) { //sequence name was in group file - treemap[seq].vectorIndex = index; - }else { - treemap[seq].vectorIndex = index; - treemap[seq].groupname = "not found"; - } -} -/************************************************************/ -int TreeMap::getIndex(string seq) { - - it = treemap.find(seq); - // if it is a valid sequence name then return index - if (it != treemap.end()) { return treemap[seq].vectorIndex; } - // if not return error code - else { return -1; } - } /************************************************************/ @@ -137,7 +273,7 @@ bool TreeMap::isValidGroup(string groupname) { return false; } catch(exception& e) { - errorOut(e, "TreeMap", "isValidGroup"); + m->errorOut(e, "TreeMap", "isValidGroup"); exit(1); } } @@ -151,19 +287,19 @@ void TreeMap::print(ostream& output){ } } catch(exception& e) { - errorOut(e, "TreeMap", "print"); + m->errorOut(e, "TreeMap", "print"); exit(1); } } /************************************************************/ -void TreeMap::makeSim(GroupMap* groupmap) { +void TreeMap::makeSim(vector ThisnamesOfGroups) { try { //set names of groups - namesOfGroups = groupmap->namesOfGroups; + namesOfGroups = ThisnamesOfGroups; //set names of seqs to names of groups - namesOfSeqs = groupmap->namesOfGroups; + namesOfSeqs = ThisnamesOfGroups; // make map where key and value are both the group name since that what the tree.shared command wants for (int i = 0; i < namesOfGroups.size(); i++) { @@ -175,7 +311,7 @@ void TreeMap::makeSim(GroupMap* groupmap) { } catch(exception& e) { - errorOut(e, "TreeMap", "makeSim"); + m->errorOut(e, "TreeMap", "makeSim"); exit(1); } } @@ -201,7 +337,61 @@ void TreeMap::makeSim(ListVector* list) { } catch(exception& e) { - errorOut(e, "TreeMap", "makeSim"); + m->errorOut(e, "TreeMap", "makeSim"); + exit(1); + } +} +/************************************************************/ +int TreeMap::getCopy(TreeMap& copy){ + try { + + namesOfGroups = copy.getNamesOfGroups(); + numGroups = copy.getNumGroups(); + namesOfSeqs = copy.namesOfSeqs; + seqsPerGroup = copy.seqsPerGroup; + treemap = copy.treemap; + + return 0; + } + catch(exception& e) { + m->errorOut(e, "TreeMap", "getCopy"); + exit(1); + } +} +/************************************************************/ +vector TreeMap::getNamesSeqs(){ + try { + + vector names; + + for(it = treemap.begin(); it != treemap.end(); it++){ + names.push_back(it->first); + } + + return names; + } + catch(exception& e) { + m->errorOut(e, "TreeMap", "getNamesSeqs"); + exit(1); + } +} +/************************************************************/ +vector TreeMap::getNamesSeqs(vector picked){ + try { + + vector names; + + for(it = treemap.begin(); it != treemap.end(); it++){ + //if you are belong to one the the groups in the picked vector add you + if (m->inUsersGroups(it->second.groupname, picked)) { + names.push_back(it->first); + } + } + + return names; + } + catch(exception& e) { + m->errorOut(e, "TreeMap", "getNamesSeqs"); exit(1); } }