]> git.donarmstrong.com Git - mothur.git/blobdiff - heatmap.cpp
removed "shared" from some of the calculator names and classes
[mothur.git] / heatmap.cpp
index fb070567da4bb6f05c95111d067a7795d45b2239..523662ece3dae73f4ff48461621ba6b92ae9d8cc 100644 (file)
@@ -14,6 +14,8 @@ HeatMap::HeatMap(){
        try {
                globaldata = GlobalData::getInstance();
                format = globaldata->getFormat();
+               sorted = globaldata->getSorted();
+               util = new SharedUtil();
                
        }
        catch(exception& e) {
@@ -32,41 +34,96 @@ void HeatMap::getPic(OrderVector* order) {
                
                rabund = order->getRAbundVector();
                
+               //get users scaling method
+               scaler = globaldata->getScaler();
+               
+               float maxbin = 0.0;
                for (int i = 0; i < rabund.size(); i++) {
-                       colorScale[rabund.get(i)] = "";
+                       if (rabund.get(i) != 0) { //don't want log value of 0.
+                                       if (scaler == "log10") {
+                                               colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))] = "";  
+                                               if (maxbin < (log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))) { maxbin = (log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100)); }
+                                       }else if (scaler == "log2") {
+                                               colorScale[(log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))] = "";  
+                                               if (maxbin < (log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))) { maxbin = (log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100)); }
+                                       }else if (scaler == "linear") {
+                                               colorScale[rabund.get(i)] = "";
+                                               if (maxbin < rabund.get(i)) { maxbin = rabund.get(i); }
+                                       }else {  //if user enters invalid scaler option.
+                                               cout << scaler << " is not a valid scaler option. I will use log10." << endl;
+                                               colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))] = ""; 
+                                               if (maxbin < (log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))) { maxbin = (log10((rabund.get(i)) / (float)rabund.getNumSeqs()) * 100); }  
+                                       } 
+                       }else { colorScale[0] = "00";  }
                }
                
-               float scaler = 255 / (float) colorScale.size();
+               float scalers = 255 / (float) maxbin;
                
                //go through map and give each score a color value
                for (it = colorScale.begin(); it != colorScale.end(); it++) {
-                       it->second = toHex(int(float(it->first) * scaler));
+                       it->second = toHex(int(float(it->first) * scalers));
                        if(it->second.length() == 1) {  it->second = "0" + it->second;  }
                }
 
-               string filenamesvg = globaldata->inputFileName + ".heatmap." + order->getLabel() + ".svg";
-               
+               string filenamesvg = getRootName(globaldata->inputFileName) + order->getLabel() + ".heatmap.svg";
                openOutputFile(filenamesvg, outsvg);
                
-               //scale max rank so the maxrank = bright red
-                       
                //svg image
-               outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 300 " + toString((rabund.getNumBins()*5 + 15))  + "\">\n";
+               outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 300 " + toString((rabund.getNumBins()*5 + 120))  + "\">\n";
                outsvg << "<g>\n";
                
-               int x = 15;
-               int y = 15;
+               //white backround
+               outsvg << "<rect fill=\"white\" stroke=\"white\" x=\"0\" y=\"0\" width=\"300\" height=\"" + toString((rabund.getNumBins()*5 + 120))  + "\"/>"; 
+               outsvg << "<text fill=\"black\" class=\"seri\" x=\"100\" y=\"25\">Heatmap at distance " + order->getLabel() + "</text>\n";
+               
+               //output legend and color labels
+               //go through map and give each score a color value
                string color;
+               int x = 0;
+               int y = 103 + (rabund.getNumBins()*5);
+               if (maxbin != 0) {
+                       //convert maxbin to relative abundance again
+                       if (scaler == "log10") {
+                               maxbin = pow(10, maxbin) / 100;
+                       }else if (scaler == "log2") {
+                               maxbin = pow(2, maxbin) / 100;
+                       }else {  maxbin = pow(10, maxbin) / 100;        } 
+               }else { maxbin = 0.00; }
+               
+               //5 is the number of boxes in the legend
+               float maxbinScaler = maxbin / 10;
+               float colorScaler = 255 / 10;
+                                       
+               for (int i = 0; i < 10; i++) {
+                       string label = toString(((i+1) * maxbinScaler));
+                       //set precision of relative abundance to 3
+                       int pos = label.find_first_of('.');
+                       label = label.substr(0,pos+4);
+                       color = toHex(int((float)(i+1) * colorScaler));
 
+                       outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"30\" height=\"10\"/>\n";
+                       outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\">" + label + "</text>\n";
+                       x += 30;
+               }
+       
+               x = 0;
+               y = 70;
                for (int i = 0; i <= rabund.getNumBins(); i++) {
-               
-                       color = colorScale[rabund.get(i)];
+                       if (rabund.get(i) != 0) { //don't want log value of 0.
+                               if (scaler == "log10") {
+                                       color = colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))];  
+                               }else if (scaler == "log2") {
+                                       color = colorScale[(log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))];  
+                               }else if (scaler == "linear") {
+                                       color = colorScale[rabund.get(i)]; 
+                               }else {  color = colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))];       } 
+                       }else { color = "OO";  }
                        
                        outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"300\" height=\"5\"/>\n";
                        y += 5;
                }
-               outsvg << "</g>\n</svg>\n";
                
+               outsvg << "</g>\n</svg>\n";
                outsvg.close();
                
        }
@@ -85,52 +142,119 @@ void HeatMap::getPic(SharedOrderVector* sharedorder) {
                colorScale.clear();
                
                //fills vector of sharedsabunds - lookup
-               getSharedVectors(sharedorder);
+               util->getSharedVectors(globaldata->Groups, lookup, sharedorder);  //fills group vectors from order vector.
+               
+               //sort lookup so shared bins are on top
+               if (sorted == "1") {  sortSharedVectors();  }
+               
+               //get users scaling method
+               scaler = globaldata->getScaler();
                
-               //get maxBin
+               float maxbin = 0.0;
                for (int i = 0; i < lookup.size(); i++) {
                        for (int j = 0; j < lookup[i]->size(); j++) {
-                               colorScale[lookup[i]->getAbundance(j)] = "";
+                               if (lookup[i]->getAbundance(j) != 0) { //don't want log value of 0.
+                                       if (scaler == "log10") {
+                                               colorScale[(log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))] = "";  
+                                               if (maxbin < (log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))) { maxbin = (log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100)); }
+                                       }else if (scaler == "log2") {
+                                               colorScale[(log2((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))] = "";  
+                                               if (maxbin < (log2((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))) { maxbin = (log2((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100)); }
+                                       }else if (scaler == "linear") {
+                                               colorScale[lookup[i]->getAbundance(j)] = "";
+                                               if (maxbin < lookup[i]->getAbundance(j)) { maxbin = lookup[i]->getAbundance(j); }
+                                       }else {  //if user enters invalid scaler option.
+                                               cout << scaler << " is not a valid scaler option. I will use log10." << endl;
+                                               colorScale[(log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))] = ""; 
+                                               if (maxbin < (log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))) { maxbin = (log10((lookup[i]->getAbundance(j)) / (float)lookup[i]->getNumSeqs()) * 100); }  
+                                       } 
+                               }else { colorScale[0] = "00";  }
                        }
                }
                
                //get scaler
-               float scaler = 255 / (float) colorScale.size();
+               float scalers = 255 / (float) maxbin;
+               
                
                //go through map and give each score a color value
                for (it = colorScale.begin(); it != colorScale.end(); it++) {
-                       it->second = toHex(int(float(it->first) * scaler));
+                       it->second = toHex(int(float(it->first) * scalers));
                        if(it->second.length() == 1) {  it->second = "0" + it->second;  }
                }
                
-               string filenamesvg = globaldata->inputFileName + ".heatmap." + sharedorder->getLabel() + "." + groupComb + ".svg";
+               string filenamesvg = getRootName(globaldata->inputFileName) + sharedorder->getLabel() + ".heatmap.svg";
                openOutputFile(filenamesvg, outsvg);
                
                //svg image
-               outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 " + toString(lookup.size() * 300) + " " + toString((lookup[0]->getNumBins()*5 + 15))  + "\">\n";
+               outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 " + toString(lookup.size() * 300) + " " + toString((lookup[0]->getNumBins()*5 + 120))  + "\">\n";
                outsvg << "<g>\n";
                
-               int x = 15;
-               int y = 15;
+               //white backround
+               outsvg << "<rect fill=\"white\" stroke=\"white\" x=\"0\" y=\"0\" width=\"" + toString(lookup.size() * 300) + "\" height=\"" + toString((lookup[0]->getNumBins()*5 + 120))  + "\"/>"; 
+               outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString((lookup.size() * 150) - 40) + "\" y=\"25\">Heatmap at distance " + sharedorder->getLabel() + "</text>\n";
+               
+               //column labels
+               for (int h = 0; h < lookup.size(); h++) {
+                       outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString(((300 * (h+1)) - 150) - ((int)lookup[h]->getGroup().length() / 2)) + "\" y=\"50\">" + lookup[h]->getGroup() + "</text>\n"; 
+               }
+               
+               //output legend and color labels
+               //go through map and give each score a color value
                string color;
+               int x = 0;
+               int y = 103 + (lookup[0]->getNumBins()*5);
+               if (maxbin != 0) {
+                       //convert maxbin to relative abundance again
+                       if (scaler == "log10") {
+                               maxbin = pow(10, maxbin) / 100;
+                       }else if (scaler == "log2") {
+                               maxbin = pow(2, maxbin) / 100;
+                       }else {  maxbin = pow(10, maxbin) / 100;        } 
+               }else { maxbin = 0.00; }
+               
+               //((lookup.size() * 300) / 60) is the number of boxes in the legend
+               float maxbinScaler = maxbin / ((lookup.size() * 300) / 60);
+               float colorScaler = 255 / ((lookup.size() * 300) / 60);
+                                       
+               for (int i = 0; i < ((lookup.size() * 300) / 60); i++) {
+                       string label = toString(((i+1) * maxbinScaler));
+                       //set precision of relative abundance to 3
+                       int pos = label.find_first_of('.');
+                       label = label.substr(0,pos+4);
 
-               for (int i = 0; i <= lookup[0]->getNumBins(); i++) {
+                       color = toHex(int(((i+1) * colorScaler) + 15));
+                       outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"30\" height=\"10\"/>\n";
+                       outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\">" + label + "</text>\n";
+                       x += 30;
+               }
                
+               x = 0;
+               y = 70;
+               
+               for (int i = 0; i <= lookup[0]->getNumBins(); i++) {
                        for (int j = 0; j < lookup.size(); j++) {
-                       
-                               color = colorScale[lookup[j]->getAbundance(i)]; 
-                                               
+                               
+                               if (lookup[j]->getAbundance(i) != 0) { //don't want log value of 0.
+                                       if (scaler == "log10") {
+                                               color = colorScale[(log10((lookup[j]->getAbundance(i) / (float)lookup[j]->getNumSeqs()) * 100))];  
+                                       }else if (scaler == "log2") {
+                                               color = colorScale[(log2((lookup[j]->getAbundance(i) / (float)lookup[j]->getNumSeqs()) * 100))];  
+                                       }else if (scaler == "linear") {
+                                               color = colorScale[lookup[j]->getAbundance(i)]; 
+                                       }else {  color = colorScale[(log10((lookup[j]->getAbundance(i) / (float)lookup[j]->getNumSeqs()) * 100))];      } 
+                               }else { color = "OO";  }
+
+                               
                                outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"300\" height=\"5\"/>\n";
                                x += 300;
                        }
-                       x = 15;
+                       x = 0;
                        y += 5;
                }
-               outsvg << "</g>\n</svg>\n";
                
-               outsvg.close();
-
                
+               outsvg << "</g>\n</svg>\n";
+               outsvg.close();
                
        }
        catch(exception& e) {
@@ -142,46 +266,84 @@ void HeatMap::getPic(SharedOrderVector* sharedorder) {
                exit(1);
        }
 }
+
 //**********************************************************************************************************************
-void HeatMap::getSharedVectors(SharedOrderVector* order){
+void HeatMap::sortSharedVectors(){
        try {
-               lookup.clear();
+               //copy lookup and then clear it to refill with sorted.
+               //loop though lookup and determine if they are shared
+               //if they are then insert in the front
+               //if not push to back
                
-               groupComb = "";
+               vector<SharedRAbundVector*> looktemp;
+               map<int, int> place; //spot in lookup where you insert shared by, ie, 3 -> 2 if they are shared by 3 inset into location 2.
+               map<int, int>::iterator it;
+               int count;
                
-               //create and initialize vector of sharedvectors, one for each group
-               for (int i = 0; i < globaldata->Groups.size(); i++) { 
-                       SharedRAbundVector* temp = new SharedRAbundVector(order->getNumBins());
-                       temp->setLabel(order->getLabel());
-                       temp->setGroup(globaldata->Groups[i]);
-                       groupComb += globaldata->Groups[i];
-                       lookup.push_back(temp);
+               //create and initialize looktemp as a copy of lookup
+               for (int i = 0; i < lookup.size(); i++) { 
+                       SharedRAbundVector* temp = new SharedRAbundVector(lookup[i]->getNumBins());
+                       temp->setLabel(lookup[i]->getLabel());
+                       temp->setGroup(lookup[i]->getGroup());
+                       //copy lookup i's info
+                       for (int j = 0; j < lookup[i]->size(); j++) {
+                               temp->set(j, lookup[i]->getAbundance(j), lookup[i]->getGroup());
+                       }
+                       looktemp.push_back(temp);
                }
                
-               int numSeqs = order->size();
-               //sample all the members
-               for(int i=0;i<numSeqs;i++){
-                       //get first sample
-                       individual chosen = order->get(i);
-                       int abundance; 
-                                       
-                       //set info for sharedvector in chosens group
-                       for (int j = 0; j < lookup.size(); j++) { 
-                               if (chosen.group == lookup[j]->getGroup()) {
-                                        abundance = lookup[j]->getAbundance(chosen.bin);
-                                        lookup[j]->set(chosen.bin, (abundance + 1), chosen.group);
-                                        break;
+               //clear out lookup to create sorted lookup
+               lookup.clear();
+               
+               //create and initialize lookup to empty vectors
+               for (int i = 0; i < looktemp.size(); i++) { 
+                       SharedRAbundVector* temp = new SharedRAbundVector();
+                       temp->setLabel(looktemp[i]->getLabel());
+                       temp->setGroup(looktemp[i]->getGroup());
+                       lookup.push_back(temp); 
+                       
+                       //initialize place map
+                       place[i] = 0;
+               }
+               
+               
+               //for each bin
+               for (int i = 0; i < looktemp[0]->size(); i++) {
+                       count = 0;
+                       bool updatePlace = false;
+                       //for each group
+                       for (int j = 0; j < looktemp.size(); j++) {
+                               if (looktemp[j]->getAbundance(i) != 0) { count++; }
+                       }
+                       
+                       //fill lookup
+                       for (int j = 0; j < looktemp.size(); j++) {
+                               //if they are not shared then push to back, if they are not insert in front
+                               if (count < 2)  { lookup[j]->push_back(looktemp[j]->getAbundance(i), i, looktemp[j]->getGroup()); }
+                               //they are shared by some
+                               else {  lookup[j]->insert(looktemp[j]->getAbundance(i), place[count], looktemp[j]->getGroup());   updatePlace = true; }
+                       }
+                       
+                       if (updatePlace == true) {
+                               //move place holders below where you entered up to "make space" for you entry
+                               for (it = place.begin(); it!= place.end(); it++) {  
+                                       if (it->first < count) { it->second++; }
                                }
                        }
                }
                
+               //delete looktemp
+               for (int j = 0; j < looktemp.size(); j++) {
+                       delete looktemp[j];
+               }
+               
        }
        catch(exception& e) {
-               cout << "Standard Error: " << e.what() << " has occurred in the HeatMap class Function getSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+               cout << "Standard Error: " << e.what() << " has occurred in the HeatMap class Function sortSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
                exit(1);
        }
        catch(...) {
-               cout << "An unknown error has occurred in the HeatMap class function getSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+               cout << "An unknown error has occurred in the HeatMap class function sortSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
                exit(1);
        }
 
@@ -191,3 +353,5 @@ void HeatMap::getSharedVectors(SharedOrderVector* order){
 
 
 
+
+