X-Git-Url: https://git.donarmstrong.com/?p=mothur.git;a=blobdiff_plain;f=treegroupscommand.cpp;h=80698f1b4b0317719421dbe9c4af3c0583bd9d97;hp=0d014599fa794217233694f8a28ed707b99c86eb;hb=df7e3ff9f68ef157b0328a2d353c3258c5d45d89;hpb=4458418562cc9dfc9a29ed4f8f6cfc7bfb927d40 diff --git a/treegroupscommand.cpp b/treegroupscommand.cpp index 0d01459..80698f1 100644 --- a/treegroupscommand.cpp +++ b/treegroupscommand.cpp @@ -458,7 +458,7 @@ int TreeGroupCommand::execute(){ readMatrix->read(nameMap); }else if (countfile != "") { ct = new CountTable(); - ct->readTable(countfile); + ct->readTable(countfile, true); readMatrix->read(ct); }else { readMatrix->read(nameMap); @@ -644,6 +644,7 @@ int TreeGroupCommand::makeSimsShared() { }else { m->clearGroups(); Groups.clear(); + m->Treenames.clear(); vector temp; for (int i = 0; i < lookup.size(); i++) { if (lookup[i]->getNumSeqs() < subsampleSize) { @@ -652,6 +653,7 @@ int TreeGroupCommand::makeSimsShared() { }else { Groups.push_back(lookup[i]->getGroup()); temp.push_back(lookup[i]); + m->Treenames.push_back(lookup[i]->getGroup()); } } lookup = temp; @@ -660,8 +662,18 @@ int TreeGroupCommand::makeSimsShared() { if (lookup.size() < 2) { m->mothurOut("You have not provided enough valid groups. I cannot run the command."); m->mothurOutEndLine(); m->control_pressed = true; return 0; } } - numGroups = lookup.size(); + + //sanity check to make sure processors < numComparisions + int numDists = 0; + for(int i=0;i processors) { break; } + } + } + if (numDists < processors) { processors = numDists; } + lines.resize(processors); for (int i = 0; i < processors; i++) { lines[i].start = int (sqrt(float(i)/float(processors)) * numGroups); @@ -890,6 +902,9 @@ int TreeGroupCommand::process(vector thisLookup) { //Close all thread handles and free memory allocations. for(int i=0; i < pDataArray.size(); i++){ + if (pDataArray[i]->count != (pDataArray[i]->end-pDataArray[i]->start)) { + m->mothurOut("[ERROR]: process " + toString(i) + " only processed " + toString(pDataArray[i]->count) + " of " + toString(pDataArray[i]->end-pDataArray[i]->start) + " groups assigned to it, quitting. \n"); m->control_pressed = true; + } for (int j = 0; j < pDataArray[i]->thisLookup.size(); j++) { delete pDataArray[i]->thisLookup[j]; } for (int k = 0; k < calcDists.size(); k++) { @@ -913,35 +928,17 @@ int TreeGroupCommand::process(vector thisLookup) { thisItersLookup.clear(); for (int i = 0; i < calcDists.size(); i++) { calcDists[i].clear(); } } + + if (m->debug) { m->mothurOut("[DEBUG]: iter = " + toString(thisIter) + ".\n"); } } - + + if (m->debug) { m->mothurOut("[DEBUG]: done with iters.\n"); } + if (iters != 1) { //we need to find the average distance and standard deviation for each groups distance + vector< vector > calcAverages = m->getAverages(calcDistsTotals); - vector< vector > calcAverages; calcAverages.resize(treeCalculators.size()); - for (int i = 0; i < calcAverages.size(); i++) { //initialize sums to zero. - calcAverages[i].resize(calcDistsTotals[0][i].size()); - - for (int j = 0; j < calcAverages[i].size(); j++) { - calcAverages[i][j].seq1 = calcDists[i][j].seq1; - calcAverages[i][j].seq2 = calcDists[i][j].seq2; - calcAverages[i][j].dist = 0.0; - } - } - - for (int thisIter = 0; thisIter < iters; thisIter++) { //sum all groups dists for each calculator - for (int i = 0; i < calcAverages.size(); i++) { //initialize sums to zero. - for (int j = 0; j < calcAverages[i].size(); j++) { - calcAverages[i][j].dist += calcDistsTotals[thisIter][i][j].dist; - } - } - } - - for (int i = 0; i < calcAverages.size(); i++) { //finds average. - for (int j = 0; j < calcAverages[i].size(); j++) { - calcAverages[i][j].dist /= (float) iters; - } - } + if (m->debug) { m->mothurOut("[DEBUG]: found averages.\n"); } //create average tree for each calc for (int i = 0; i < calcDists.size(); i++) { @@ -972,6 +969,8 @@ int TreeGroupCommand::process(vector thisLookup) { if (newTree != NULL) { writeTree(outputFile, newTree); } } + if (m->debug) { m->mothurOut("[DEBUG]: done averages trees.\n"); } + //create all trees for each calc and find their consensus tree for (int i = 0; i < calcDists.size(); i++) { if (m->control_pressed) { break; } @@ -1003,7 +1002,7 @@ int TreeGroupCommand::process(vector thisLookup) { int row = calcDistsTotals[myIter][i][j].seq1; int column = calcDistsTotals[myIter][i][j].seq2; double dist = calcDistsTotals[myIter][i][j].dist; - + matrix[row][column] = dist; matrix[column][row] = dist; } @@ -1018,11 +1017,15 @@ int TreeGroupCommand::process(vector thisLookup) { outAll.close(); if (m->control_pressed) { for (int k = 0; k < trees.size(); k++) { delete trees[k]; } } + if (m->debug) { m->mothurOut("[DEBUG]: done all trees.\n"); } + Consensus consensus; //clear old tree names if any m->Treenames.clear(); m->Treenames = m->getGroups(); //may have changed if subsample eliminated groups Tree* conTree = consensus.getTree(trees); + if (m->debug) { m->mothurOut("[DEBUG]: done cons tree.\n"); } + //create a new filename variables["[tag]"] = "cons"; string conFile = getOutputFileName("tree",variables);