]> git.donarmstrong.com Git - mothur.git/blob - pintail.h
chimeras, fix to sabundvector and sharedsabundvector that caused getRabundVector...
[mothur.git] / pintail.h
1 #ifndef PINTAIL_H
2 #define PINTAIL_H
3
4 /*
5  *  pintail.h
6  *  Mothur
7  *
8  *  Created by Sarah Westcott on 7/9/09.
9  *  Copyright 2009 Schloss Lab UMASS Amherst. All rights reserved.
10  *
11  */
12
13 #include "chimera.h"
14 #include "dist.h"
15 #include "decalc.h"
16
17 /***********************************************************/
18 //This class was created using the algorithms described in the 
19 // "At Least 1 in 20 16S rRNA Sequence Records Currently Held in the Public Repositories is Estimated To Contain Substantial Anomalies" paper 
20 //by Kevin E. Ashelford 1, Nadia A. Chuzhanova 3, John C. Fry 1, Antonia J. Jones 2 and Andrew J. Weightman 1.
21
22 /***********************************************************/
23
24 class Pintail : public Chimera {
25         // Chimera subclass for the Pintail check; only the two setters are defined inline, everything else is defined outside this header.
26         public:
27                 Pintail(string, string);        //NOTE(review): the meaning of the two string arguments is not visible in this header -- see the definition
28                 ~Pintail();
29                 
30                 int getChimeras(Sequence*);     //presumably runs the check for one query sequence; meaning of the int result is not visible here -- TODO confirm
31                 void print(ostream&);           //presumably writes the results to the given stream -- TODO confirm format in the implementation
32                 
33                 void setCons(string c)          { consfile = c;  }   //stores c in consfile
34                 void setQuantiles(string q) { quanfile = q;  }   //stores q in quanfile; quanfile is not declared in this class, so it is presumably inherited from Chimera
35                 
36                 
37         private:
38         
39                 Dist* distcalculator;   //NOTE(review): ownership of this pointer is not visible here -- check the destructor
40                 DeCalculator* decalc;   //NOTE(review): ownership of this pointer is not visible here -- check the destructor
41                 int iters;              //NOTE(review): purpose not documented in this header
42                 string fastafile, consfile;   //consfile is set through setCons()
43                 
44                 vector<linePair*> templateLines;
45                 Sequence*querySeq;
46                                 
47                 Sequence* bestfit;  //closest match to query in template
48                 
49                 vector<float>  obsDistance;  //obsDistance is the vector of observed distances for query 
50                 vector<float>  expectedDistance;  //expectedDistance is the vector of expected distances for query
51                 float deviation;  //deviation is the percentage of mismatched pairs over the whole seq between query and its best match.
52                 vector<int>  windowsForeachQuery;  // windowsForeachQuery is a vector containing the starting spot in query aligned sequence for each window.
53                                                                                 //this is needed so you can move by bases and not just spots in the alignment
54                                                                                 
55                 int windowSizes;                        //windowSizes = window size of query
56                 vector<int> windowSizesTemplate;    //windowSizesTemplate[0] = window size of templateSeqs[0] (templateSeqs is not declared in this class; presumably inherited from Chimera)
57                 
58                 map<int, int> trimmed;    //trimmed = start and stop of trimmed sequences for query
59                 map<int, int>::iterator it;   //iterator over a map<int, int>; presumably used with trimmed -- TODO confirm
60                 
61                 vector<float>  Qav;     //Qav is the vector of average variability for query
62                 float  seqCoef;         //seqCoef is the coeff for query
63                 float DE;                       //DE is the deviation for query
64                 vector<float> probabilityProfile;
65                 vector< vector<float> > quantiles;  //quantiles[0] is the vector of deviations with ceiling score of 1, quantiles[1] is the vector of deviations with ceiling score of 2...
66                 vector< vector<quanMember> > quantilesMembers;  //same outer layout as quantiles but holding quanMember entries; presumably quantilesMembers[0] corresponds to ceiling score 1, quantilesMembers[1] to ceiling score 2... -- TODO confirm
67                 set<int>  h;   //NOTE(review): purpose not documented in this header
68                 string mergedFilterString;
69                 
70                 
71                 vector<float> readFreq();
72                 Sequence* findPairs(Sequence*);
73                         
74                 void createProcessesQuan();
75                 void doPrep();
76                 
77 };
78
79 /***********************************************************/
80
81 #endif
82