X-Git-Url: https://git.donarmstrong.com/?p=mothur.git;a=blobdiff_plain;f=parsimony.cpp;h=6a0485c133b2868670e49e5873186e5d10df474d;hp=efc7d3a4dfcdcb9db47dc24de5a7a412953a7aba;hb=1a20e24ee786195ab0e1cccd4f5aede7a88f3f4e;hpb=4ad32478c7b1bbb464c839a6e133f5b517a3efec diff --git a/parsimony.cpp b/parsimony.cpp index efc7d3a..6a0485c 100644 --- a/parsimony.cpp +++ b/parsimony.cpp @@ -11,106 +11,201 @@ /**************************************************************************************************/ -EstOutput Parsimony::getValues(Tree* t) { +EstOutput Parsimony::getValues(Tree* t, int p, string o) { try { - globaldata = GlobalData::getInstance(); - vector groups; - - copyTree = new Tree(); + processors = p; + outputDir = o; + CountTable* ct = t->getCountTable(); //if the users enters no groups then give them the score of all groups - int numGroups = globaldata->Groups.size(); + vector mGroups = m->getGroups(); + int numGroups = mGroups.size(); //calculate number of comparsions int numComp = 0; + vector< vector > namesOfGroupCombos; for (int r=0; r groups; groups.push_back(mGroups[r]); groups.push_back(mGroups[l]); + //cout << globaldata->Groups[r] << '\t' << globaldata->Groups[l] << endl; + namesOfGroupCombos.push_back(groups); } } //numComp+1 for AB, AC, BC, ABC - data.resize(numComp+1,0); + if (numComp != 1) { + vector groups; + if (numGroups == 0) { + //get score for all users groups + vector tGroups = ct->getNamesOfGroups(); + for (int i = 0; i < tGroups.size(); i++) { + if (tGroups[i] != "xxx") { + groups.push_back(tGroups[i]); + //cout << tmap->namesOfGroups[i] << endl; + } + } + namesOfGroupCombos.push_back(groups); + }else { + for (int i = 0; i < mGroups.size(); i++) { + groups.push_back(mGroups[i]); + //cout << globaldata->Groups[i] << endl; + } + namesOfGroupCombos.push_back(groups); + } + } - int count = 0; - for (int a=0; aGroups[a]); groups.push_back(globaldata->Groups[l]); + #if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix) + if(processors == 1){ + data = driver(t, namesOfGroupCombos, 0, namesOfGroupCombos.size(), ct); + }else{ + lines.clear(); + int numPairs = namesOfGroupCombos.size(); + + int numPairsPerProcessor = numPairs / processors; + + for (int i = 0; i < processors; i++) { + int startPos = i * numPairsPerProcessor; - //copy users tree so that you can redo pgroups - copyTree->getCopy(t); - - //create pgroups that reflect the groups the user want to use - for(int i=copyTree->getNumLeaves();igetNumNodes();i++){ - copyTree->tree[i].pGroups = (copyTree->mergeUserGroups(i, groups)); + if(i == processors - 1){ + numPairsPerProcessor = numPairs - i * numPairsPerProcessor; } - - for(int i=copyTree->getNumLeaves();igetNumNodes();i++){ - if (m->control_pressed) { return data; } - - int lc = copyTree->tree[i].getLChild(); - int rc = copyTree->tree[i].getRChild(); + lines.push_back(linePair(startPos, numPairsPerProcessor)); + } - int iSize = copyTree->tree[i].pGroups.size(); - int rcSize = copyTree->tree[rc].pGroups.size(); - int lcSize = copyTree->tree[lc].pGroups.size(); + data = createProcesses(t, namesOfGroupCombos, ct); + } + #else + data = driver(t, namesOfGroupCombos, 0, namesOfGroupCombos.size(), ct); + #endif - //if isize are 0 then that branch is to be ignored - if (iSize == 0) { } - else if ((rcSize == 0) || (lcSize == 0)) { } - //if you have more groups than either of your kids then theres been a change. - else if(iSize > rcSize || iSize > lcSize){ - score++; - } - } + return data; + + } + catch(exception& e) { + m->errorOut(e, "Parsimony", "getValues"); + exit(1); + } +} +/**************************************************************************************************/ + +EstOutput Parsimony::createProcesses(Tree* t, vector< vector > namesOfGroupCombos, CountTable* ct) { + try { +#if defined (__APPLE__) || (__MACH__) || (linux) || (__linux) || (__linux__) || (__unix__) || (__unix) + int process = 1; + vector processIDS; + + EstOutput results; + + //loop through and create all the processes you want + while (process != processors) { + int pid = fork(); + + if (pid > 0) { + processIDS.push_back(pid); //create map from line number to pid so you can append files in correct order later + process++; + }else if (pid == 0){ + EstOutput myresults; + myresults = driver(t, namesOfGroupCombos, lines[process].start, lines[process].num, ct); + + if (m->control_pressed) { exit(0); } - data[count] = score; - count++; - groups.clear(); + //pass numSeqs to parent + ofstream out; + string tempFile = outputDir + toString(getpid()) + ".pars.results.temp"; + m->openOutputFile(tempFile, out); + out << myresults.size() << endl; + for (int i = 0; i < myresults.size(); i++) { out << myresults[i] << '\t'; } out << endl; + out.close(); + + exit(0); + }else { + m->mothurOut("[ERROR]: unable to spawn the necessary processes."); m->mothurOutEndLine(); + for (int i = 0; i < processIDS.size(); i++) { kill (processIDS[i], SIGINT); } + exit(0); } } - if (numComp != 1) { - if (numGroups == 0) { - //get score for all users groups - for (int i = 0; i < tmap->namesOfGroups.size(); i++) { - if (tmap->namesOfGroups[i] != "xxx") { - groups.push_back(tmap->namesOfGroups[i]); - } - } - }else { - for (int i = 0; i < globaldata->Groups.size(); i++) { - groups.push_back(globaldata->Groups[i]); + results = driver(t, namesOfGroupCombos, lines[0].start, lines[0].num, ct); + + //force parent to wait until all the processes are done + for (int i=0;icontrol_pressed) { return results; } + + //get data created by processes + for (int i=0;iopenInputFile(s, in); + + //get scores + if (!in.eof()) { + int num; + in >> num; m->gobble(in); + + if (m->control_pressed) { break; } + + double w; + for (int j = 0; j < num; j++) { + in >> w; + results.push_back(w); } + m->gobble(in); } + in.close(); + m->mothurRemove(s); + } + + return results; +#endif + } + catch(exception& e) { + m->errorOut(e, "Parsimony", "createProcesses"); + exit(1); + } +} +/**************************************************************************************************/ +EstOutput Parsimony::driver(Tree* t, vector< vector > namesOfGroupCombos, int start, int num, CountTable* ct) { + try { + + EstOutput results; results.resize(num); + + Tree* copyTree = new Tree(ct); + int count = 0; + + for (int h = start; h < (start+num); h++) { + + if (m->control_pressed) { delete copyTree; return results; } + + int score = 0; + + //groups in this combo + vector groups = namesOfGroupCombos[h]; //copy users tree so that you can redo pgroups copyTree->getCopy(t); - int score = 0; - + //create pgroups that reflect the groups the user want to use for(int i=copyTree->getNumLeaves();igetNumNodes();i++){ copyTree->tree[i].pGroups = (copyTree->mergeUserGroups(i, groups)); } - -// map::iterator it; for(int i=copyTree->getNumLeaves();igetNumNodes();i++){ - + if (m->control_pressed) { return data; } int lc = copyTree->tree[i].getLChild(); int rc = copyTree->tree[i].getRChild(); - + int iSize = copyTree->tree[i].pGroups.size(); int rcSize = copyTree->tree[rc].pGroups.size(); int lcSize = copyTree->tree[lc].pGroups.size(); - //if isize are 0 then that branch is to be ignored if (iSize == 0) { } else if ((rcSize == 0) || (lcSize == 0)) { } @@ -119,17 +214,17 @@ EstOutput Parsimony::getValues(Tree* t) { score++; } } - - data[count] = score; - + + results[count] = score; + count++; } - + delete copyTree; - - return data; + + return results; } catch(exception& e) { - m->errorOut(e, "Parsimony", "getValues"); + m->errorOut(e, "Parsimony", "driver"); exit(1); } }