]> git.donarmstrong.com Git - mothur.git/blob - getoturepcommand.h
removed read.dist, read.otu, read.tree and globaldata. added current to defaults...
[mothur.git] / getoturepcommand.h
1 #ifndef GETOTUREPCOMMAND_H
2 #define GETOTUREPCOMMAND_H
3 /*
4  *  getoturepcommand.h
5  *  Mothur
6  *
7  *  Created by Sarah Westcott on 4/6/09.
8  *  Copyright 2009 Schloss Lab UMASS Amherst. All rights reserved.
9  *
10  */
11  
12  /* The get.oturep command outputs a .fastarep file for each distance you specify, selecting one OTU representative for each bin. */
13
14 #include "command.hpp"
15 #include "listvector.hpp"
16 #include "inputdata.h"
17 #include "fastamap.h"
18 #include "groupmap.h"
19 #include "readmatrix.hpp"
20 #include "formatmatrix.h"
21
22 typedef list<PCell>::iterator MatData;
23 typedef map<int, float> SeqMap;
24
/*
 * Plain record bundling a name, a bin number, a size and a group label.
 * NOTE(review): presumably describes the representative sequence picked for
 * one OTU bin by get.oturep -- confirm against the users in the .cpp file.
 */
struct repStruct {
	std::string name;
	int bin;
	int size;
	std::string group;

	// The numeric fields are zeroed explicitly: without this a default-constructed
	// record would carry indeterminate values in bin and size.
	repStruct() : bin(0), size(0) {}

	// Builds a fully populated record from name (n), bin (b), size (s) and group (g).
	repStruct(std::string n, int b, int s, std::string g) : name(n), bin(b), size(s), group(g) {}

	// No user-declared destructor: every member cleans up after itself.
};
35
36 class GetOTURepCommand : public Command {
37
38 public:
39         GetOTURepCommand(string);
40         GetOTURepCommand();
41         ~GetOTURepCommand(){}
42         
43         vector<string> setParameters();
44         string getCommandName()                 { return "get.oturep";                          }
45         string getCommandCategory()             { return "OTU-Based Approaches";        }
46         string getHelpString(); 
47         
48         int execute(); 
49         void help() { m->mothurOut(getHelpString()); }  
50         
51         
52 private:
53         ListVector* list;
54         InputData* input;
55         FastaMap* fasta;
56         GroupMap* groupMap;
57         ReadMatrix* readMatrix;
58         FormatMatrix* formatMatrix;
59         NameAssignment* nameMap;
60         string filename, fastafile, listfile, namefile, groupfile, label, sorted, phylipfile, columnfile, distFile, format, outputDir, groups;
61         ofstream out;
62         ifstream in, inNames, inRow;
63         bool abort, allLines, groupError, large, weighted;
64         set<string> labels; //holds labels to be used
65         map<string, int> nameToIndex;  //maps sequence name to index in sparsematrix
66         map<string, string> nameFileMap;
67         vector<string> outputNames, Groups;
68         map<string, string> outputNameFiles;
69         float cutoff;
70         int precision;
71         vector<SeqMap> seqVec;                  // contains maps with sequence index and distance
72                                                                         // for all distances related to a certain sequence
73         vector<int> rowPositions;
74
75         void readNamesFile();
76         void readNamesFile(bool);
77         int process(ListVector*);
78         SeqMap getMap(int);
79         string findRep(vector<string>);         // returns the name of the "representative" sequence of given bin or subset of a bin, for groups
80         int processNames(string, string);
81 };
82
83 #endif
84