X-Git-Url: https://git.donarmstrong.com/?a=blobdiff_plain;ds=sidebyside;f=classifyseqscommand.h;h=f075b41495afc9002e2a695d47972d4d947eafc9;hb=62c36830aae6dd6151898ec6e07df59c8aed79fe;hp=3294118343bbf763fa93dc56b6a05a3f8043c5ca;hpb=956cdff34f2d609a7736838b1631cd7957580b8b;p=mothur.git diff --git a/classifyseqscommand.h b/classifyseqscommand.h index 3294118..f075b41 100644 --- a/classifyseqscommand.h +++ b/classifyseqscommand.h @@ -12,7 +12,6 @@ #include "mothur.h" #include "command.hpp" -//#include "alignment.hpp" #include "classify.h" //KNN and Bayesian methods modeled from algorithms in @@ -29,21 +28,34 @@ class ClassifySeqsCommand : public Command { public: ClassifySeqsCommand(string); + ClassifySeqsCommand(); ~ClassifySeqsCommand(); + + vector setParameters(); + string getCommandName() { return "classify.seqs"; } + string getCommandCategory() { return "Phylotype Analysis"; } + string getHelpString(); + string getCitation() { return "Wang Q, Garrity GM, Tiedje JM, Cole JR (2007). Naive Bayesian classifier for rapid assignment of rRNA sequences into the new bacterial taxonomy. Appl Environ Microbiol 73: 5261-7. [ for Bayesian classifier ] \nAltschul SF, Madden TL, Schaffer AA, Zhang J, Zhang Z, Miller W, Lipman DJ (1997). Gapped BLAST and PSI-BLAST: a new generation of protein database search programs. Nucleic Acids Res 25: 3389-402. [ for BLAST ] \nDeSantis TZ, Hugenholtz P, Larsen N, Rojas M, Brodie EL, Keller K, Huber T, Dalevi D, Hu P, Andersen GL (2006). Greengenes, a chimera-checked 16S rRNA gene database and workbench compatible with ARB. Appl Environ Microbiol 72: 5069-72. [ for kmer ] \nhttp://www.mothur.org/wiki/Classify.seqs"; } + + int execute(); - void help(); + void help() { m->mothurOut(getHelpString()); } + + private: struct linePair { unsigned long int start; - int numSeqs; - linePair(unsigned long int i, int j) : start(i), numSeqs(j) {} + unsigned long int end; + linePair(unsigned long int i, unsigned long int j) : start(i), end(j) {} }; + vector processIDS; //processid vector lines; vector fastaFileNames; vector namefileNames; vector groupfileNames; + vector outputNames; map > nameMap; map >::iterator itNames; @@ -56,12 +68,12 @@ private: int driver(linePair*, string, string, string); void appendTaxFiles(string, string); - void createProcesses(string, string, string); + int createProcesses(string, string, string); string addUnclassifieds(string, int); int MPIReadNamesFile(string); #ifdef USE_MPI - int driverMPI(int, int, MPI_File&, MPI_File&, MPI_File&, vector&); + int driverMPI(int, int, MPI_File&, MPI_File&, MPI_File&, vector&); #endif };