X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;f=nmdscommand.cpp;h=946aa68ab24ed5a10800d6d5c9e2ca32f4fd2ade;hb=7bf9a81bba76538ecaf351ae208de3da4bf1b6dd;hp=0661f24b09d4494d658a6044fdce1fafe0b5582f;hpb=6d12ed0ba66fb35e9e2781fe3ca361e2293f2476;p=mothur.git diff --git a/nmdscommand.cpp b/nmdscommand.cpp index 0661f24..946aa68 100644 --- a/nmdscommand.cpp +++ b/nmdscommand.cpp @@ -11,52 +11,61 @@ #include "readphylipvector.h" //********************************************************************************************************************** -vector NMDSCommand::getValidParameters(){ +vector NMDSCommand::setParameters(){ try { - string Array[] = {"phylip","axes","mindim","maxdim","iters","maxiters","epsilon","outputdir","inputdir"}; - vector myArray (Array, Array+(sizeof(Array)/sizeof(string))); + CommandParameter paxes("axes", "InputTypes", "", "", "none", "none", "none",false,false); parameters.push_back(paxes); + CommandParameter pphylip("phylip", "InputTypes", "", "", "none", "none", "none",false,true); parameters.push_back(pphylip); + CommandParameter pmaxdim("maxdim", "Number", "", "2", "", "", "",false,false); parameters.push_back(pmaxdim); + CommandParameter pmindim("mindim", "Number", "", "2", "", "", "",false,false); parameters.push_back(pmindim); + CommandParameter piters("iters", "Number", "", "10", "", "", "",false,false); parameters.push_back(piters); + CommandParameter pmaxiters("maxiters", "Number", "", "500", "", "", "",false,false); parameters.push_back(pmaxiters); + CommandParameter pepsilon("epsilon", "Number", "", "0.000000000001", "", "", "",false,false); parameters.push_back(pepsilon); + CommandParameter pinputdir("inputdir", "String", "", "", "", "", "",false,false); parameters.push_back(pinputdir); + CommandParameter poutputdir("outputdir", "String", "", "", "", "", "",false,false); parameters.push_back(poutputdir); + + vector myArray; + for (int i = 0; i < parameters.size(); i++) { myArray.push_back(parameters[i].name); } return myArray; } catch(exception& e) { - m->errorOut(e, "NMDSCommand", "getValidParameters"); + m->errorOut(e, "NMDSCommand", "setParameters"); exit(1); } } //********************************************************************************************************************** -NMDSCommand::NMDSCommand(){ +string NMDSCommand::getHelpString(){ try { - abort = true; - //initialize outputTypes - vector tempOutNames; - outputTypes["nmds"] = tempOutNames; - outputTypes["stress"] = tempOutNames; - outputTypes["iters"] = tempOutNames; + string helpString = ""; + helpString += "The nmds command is modelled after the nmds code written in R by Sarah Goslee, using Non-metric multidimensional scaling function using the majorization algorithm from Borg & Groenen 1997, Modern Multidimensional Scaling.\n"; + helpString += "The nmds command parameters are phylip, axes, mindim, maxdim, maxiters, iters and epsilon.\n"; + helpString += "The phylip parameter allows you to enter your distance file.\n"; + helpString += "The axes parameter allows you to enter a file containing a starting configuration.\n"; + helpString += "The maxdim parameter allows you to select the maximum dimensions to use. Default=2\n"; + helpString += "The mindim parameter allows you to select the minimum dimensions to use. Default=2\n"; + helpString += "The maxiters parameter allows you to select the maximum number of iters to try with each random configuration. Default=500\n"; + helpString += "The iters parameter allows you to select the number of random configuration to try. Default=10\n"; + helpString += "The epsilon parameter allows you to select set an acceptable stopping point. Default=1e-12.\n"; + helpString += "Example nmds(phylip=yourDistanceFile).\n"; + helpString += "Note: No spaces between parameter labels (i.e. phylip), '=' and parameters (i.e.yourDistanceFile).\n"; + return helpString; } catch(exception& e) { - m->errorOut(e, "NMDSCommand", "NMDSCommand"); + m->errorOut(e, "NMDSCommand", "getHelpString"); exit(1); } } //********************************************************************************************************************** -vector NMDSCommand::getRequiredParameters(){ - try { - string Array[] = {"phylip"}; - vector myArray (Array, Array+(sizeof(Array)/sizeof(string))); - return myArray; - } - catch(exception& e) { - m->errorOut(e, "NMDSCommand", "getRequiredParameters"); - exit(1); - } -} -//********************************************************************************************************************** -vector NMDSCommand::getRequiredFiles(){ +NMDSCommand::NMDSCommand(){ try { - vector myArray; - return myArray; + abort = true; calledHelp = true; + setParameters(); + vector tempOutNames; + outputTypes["nmds"] = tempOutNames; + outputTypes["stress"] = tempOutNames; + outputTypes["iters"] = tempOutNames; } catch(exception& e) { - m->errorOut(e, "NMDSCommand", "getRequiredFiles"); + m->errorOut(e, "NMDSCommand", "NMDSCommand"); exit(1); } } @@ -64,15 +73,14 @@ vector NMDSCommand::getRequiredFiles(){ NMDSCommand::NMDSCommand(string option) { try { - abort = false; + abort = false; calledHelp = false; //allow user to run help - if(option == "help") { help(); abort = true; } + if(option == "help") { help(); abort = true; calledHelp = true; } + else if(option == "citation") { citation(); abort = true; calledHelp = true;} else { - //valid paramters for this command - string Array[] = {"phylip","axes","mindim","maxdim","iters","maxiters","epsilon","outputdir", "inputdir"}; - vector myArray (Array, Array+(sizeof(Array)/sizeof(string))); + vector myArray = setParameters(); OptionParser parser(option); map parameters = parser. getParameters(); @@ -115,7 +123,12 @@ NMDSCommand::NMDSCommand(string option) { //required parameters phylipfile = validParameter.validFile(parameters, "phylip", true); if (phylipfile == "not open") { phylipfile = ""; abort = true; } - else if (phylipfile == "not found") { phylipfile = ""; m->mothurOut("You must provide a distance file before running the nmds command."); m->mothurOutEndLine(); abort = true; } + else if (phylipfile == "not found") { + //if there is a current phylip file, use it + phylipfile = m->getPhylipFile(); + if (phylipfile != "") { m->mothurOut("Using " + phylipfile + " as input file for the phylip parameter."); m->mothurOutEndLine(); } + else { m->mothurOut("You have no current phylip file and the phylip parameter is required."); m->mothurOutEndLine(); abort = true; } + }else { m->setPhylipFile(phylipfile); } axesfile = validParameter.validFile(parameters, "axes", true); if (axesfile == "not open") { axesfile = ""; abort = true; } @@ -153,32 +166,10 @@ NMDSCommand::NMDSCommand(string option) { } } //********************************************************************************************************************** -void NMDSCommand::help(){ - try { - m->mothurOut("The nmds command is modelled after the nmds code written in R by Sarah Goslee, using Non-metric multidimensional scaling function using the majorization algorithm from Borg & Groenen 1997, Modern Multidimensional Scaling."); m->mothurOutEndLine(); - m->mothurOut("The nmds command parameters are phylip, axes, mindim, maxdim, maxiters, iters and epsilon."); m->mothurOutEndLine(); - m->mothurOut("The phylip parameter allows you to enter your distance file."); m->mothurOutEndLine(); - m->mothurOut("The axes parameter allows you to enter a file containing a starting configuration."); m->mothurOutEndLine(); - m->mothurOut("The maxdim parameter allows you to select how maximum dimensions to use. Default=2"); m->mothurOutEndLine(); - m->mothurOut("The mindim parameter allows you to select how minimum dimensions to use. Default=2"); m->mothurOutEndLine(); - m->mothurOut("The maxiters parameter allows you to select the maximum number of iters to try with each random configuration. Default=500"); m->mothurOutEndLine(); - m->mothurOut("The iters parameter allows you to select the number of random configuration to try. Default=10"); m->mothurOutEndLine(); - m->mothurOut("The epsilon parameter allows you to select set an acceptable stopping point. Default=1e-12."); m->mothurOutEndLine(); - m->mothurOut("Example nmds(phylip=yourDistanceFile).\n"); - m->mothurOut("Note: No spaces between parameter labels (i.e. phylip), '=' and parameters (i.e.yourDistanceFile).\n\n"); - } - catch(exception& e) { - m->errorOut(e, "NMDSCommand", "help"); - exit(1); - } -} -//********************************************************************************************************************** -NMDSCommand::~NMDSCommand(){} -//********************************************************************************************************************** int NMDSCommand::execute(){ try { - if (abort == true) { return 0; } + if (abort == true) { if (calledHelp) { return 0; } return 2; } cout.setf(ios::fixed, ios::floatfield); cout.setf(ios::showpoint); @@ -196,7 +187,7 @@ int NMDSCommand::execute(){ if (axesfile != "") { axes = readAxes(names); } string outputFileName = outputDir + m->getRootName(m->getSimpleName(phylipfile)) + "nmds.iters"; - string stressFileName = outputDir + m->getRootName(m->getSimpleName(phylipfile)) + "stress.nmds"; + string stressFileName = outputDir + m->getRootName(m->getSimpleName(phylipfile)) + "nmds.stress"; outputNames.push_back(outputFileName); outputTypes["iters"].push_back(outputFileName); outputNames.push_back(stressFileName); outputTypes["stress"].push_back(stressFileName); @@ -209,10 +200,12 @@ int NMDSCommand::execute(){ out.setf(ios::fixed, ios::floatfield); out.setf(ios::showpoint); - out2 << "Dimension\tIter\tStress\tCorr" << endl; + out2 << "Dimension\tIter\tStress\tRsq" << endl; double bestStress = 10000000; + double bestR2 = 10000000; vector< vector > bestConfig; + int bestDim = 0; for (int i = mindim; i <= maxdim; i++) { m->mothurOut("Processing Dimension: " + toString(i)); m->mothurOutEndLine(); @@ -236,21 +229,23 @@ int NMDSCommand::execute(){ if (m->control_pressed) { out.close(); out2.close(); for (int k = 0; k < outputNames.size(); k++) { remove(outputNames[k].c_str()); } return 0; } //calc correlation between original distances and euclidean distances from this config - double corr = linearCalc.calcPearson(newEuclid, matrix); - corr *= corr; + double rsquared = linearCalc.calcPearson(newEuclid, matrix); + rsquared *= rsquared; if (m->control_pressed) { out.close(); out2.close(); for (int k = 0; k < outputNames.size(); k++) { remove(outputNames[k].c_str()); } return 0; } //output results out << "Config" << (j+1) << '\t'; for (int k = 0; k < i; k++) { out << "axis" << (k+1) << '\t'; } out << endl; - out2 << i << '\t' << (j+1) << '\t' << stress << '\t' << corr << endl; + out2 << i << '\t' << (j+1) << '\t' << stress << '\t' << rsquared << endl; output(endConfig, names, out); //save best if (stress < bestStress) { + bestDim = i; bestStress = stress; + bestR2 = rsquared; bestConfig = endConfig; } @@ -264,6 +259,10 @@ int NMDSCommand::execute(){ string BestFileName = outputDir + m->getRootName(m->getSimpleName(phylipfile)) + "nmds.axes"; outputNames.push_back(BestFileName); outputTypes["nmds"].push_back(BestFileName); + m->mothurOut("\nNumber of dimensions:\t" + toString(bestDim) + "\n"); + m->mothurOut("Lowest stress :\t" + toString(bestStress) + "\n"); + m->mothurOut("R-squared for configuration:\t" + toString(bestR2) + "\n"); + ofstream outBest; m->openOutputFile(BestFileName, outBest); outBest.setf(ios::fixed, ios::floatfield);