try {
globaldata = GlobalData::getInstance();
format = globaldata->getFormat();
+ sorted = globaldata->getSorted();
+ util = new SharedUtil();
}
catch(exception& e) {
rabund = order->getRAbundVector();
+ //Build colorScale for this sample: one entry per distinct score, where a score is the
+ //log of the percent relative abundance ("log10"/"log2") or the raw abundance ("linear").
+ //Each score is then mapped onto a two digit hex value used as the red channel.
+ //get users scaling method
+ scaler = globaldata->getScaler();
+
+ //validate the scaler once, up front, so the warning is printed a single time
+ //instead of once for every non-empty bin. An invalid option falls back to log10.
+ if ((scaler != "log10") && (scaler != "log2") && (scaler != "linear")) {
+ cout << scaler << " is not a valid scaler option. I will use log10." << endl;
+ scaler = "log10";
+ }
+
+ //largest score seen; it is the score that gets the brightest red
+ float maxbin = 0.0;
for (int i = 0; i < rabund.size(); i++) {
- colorScale[rabund.get(i)] = "";
+ if (rabund.get(i) != 0) { //don't want log value of 0.
+ if (scaler == "log10") {
+ colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))] = "";
+ if (maxbin < (log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))) { maxbin = (log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100)); }
+ }else if (scaler == "log2") {
+ colorScale[(log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))] = "";
+ if (maxbin < (log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))) { maxbin = (log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100)); }
+ }else if (scaler == "linear") {
+ colorScale[rabund.get(i)] = "";
+ if (maxbin < rabund.get(i)) { maxbin = rabund.get(i); }
+ }
+ }else { colorScale[0] = "00"; }
}
- float scaler = 255 / (float) colorScale.size();
+ //factor that stretches the scores over 0-255. With no positive score there is
+ //nothing to stretch, so leave it at 0 rather than dividing by zero.
+ float scalers = 0.0;
+ if (maxbin > 0) { scalers = 255 / (float) maxbin; }
//go through map and give each score a color value
for (it = colorScale.begin(); it != colorScale.end(); it++) {
- it->second = toHex(int(float(it->first) * scaler));
+ //log scores are negative for bins below 1% relative abundance; clamp to 0-255 so
+ //every entry is a valid two digit hex value.
+ int shade = int(float(it->first) * scalers);
+ if (shade < 0) { shade = 0; }
+ if (shade > 255) { shade = 255; }
+ it->second = toHex(shade);
if(it->second.length() == 1) { it->second = "0" + it->second; }
}
- string filenamesvg = globaldata->inputFileName + ".heatmap." + order->getLabel() + ".svg";
-
+ string filenamesvg = getRootName(globaldata->inputFileName) + order->getLabel() + ".heatmap.svg"; //output name: getRootName() of the input file name, then the label, then ".heatmap.svg"
openOutputFile(filenamesvg, outsvg);
- //scale max rank so the maxrank = bright red
-
//svg image
- outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 300 " + toString((rabund.getNumBins()*5 + 15)) + "\">\n";
+ outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 300 " + toString((rabund.getNumBins()*5 + 120)) + "\">\n"; //300 wide; height is 5 per bin plus 120 for the title, spacing and legend
outsvg << "<g>\n";
- int x = 15;
- int y = 15;
+ //white background: a rectangle covering the whole viewBox
+ outsvg << "<rect fill=\"white\" stroke=\"white\" x=\"0\" y=\"0\" width=\"300\" height=\"" + toString((rabund.getNumBins()*5 + 120)) + "\"/>";
+ outsvg << "<text fill=\"black\" class=\"seri\" x=\"100\" y=\"25\">Heatmap at distance " + order->getLabel() + "</text>\n"; //title line, carries the label of this vector
+
+ //output legend and color labels
+ //Draws a row of 10 boxes below the heat map, running from dark to bright red. Each box
+ //is labelled with the value it stands for: one tenth, two tenths, ... of the largest value.
string color;
+ int x = 0;
+ int y = 103 + (rabund.getNumBins()*5);
+ if (maxbin != 0) {
+ //convert maxbin to relative abundance again
+ if (scaler == "log10") {
+ maxbin = pow(10, maxbin) / 100;
+ }else if (scaler == "log2") {
+ maxbin = pow(2, maxbin) / 100;
+ }else if (scaler != "linear") { maxbin = pow(10, maxbin) / 100; } //an invalid scaler was scored with log10
+ //"linear" scores are raw abundances: there is no log transform to undo, so in that
+ //case the legend is labelled with abundance counts.
+ }else { maxbin = 0.00; }
+
+ //10 is the number of boxes in the legend
+ float maxbinScaler = maxbin / 10;
+ float colorScaler = 255 / (float) 10; //floating point division, so the last box is full red (255)
+
+ for (int i = 0; i < 10; i++) {
+ string label = toString(((i+1) * maxbinScaler));
+ //keep 3 digits after the decimal point; a label without a decimal point is left whole
+ string::size_type pos = label.find_first_of('.');
+ if (pos != string::npos) { label = label.substr(0,pos+4); }
+ color = toHex(int((float)(i+1) * colorScaler));
+ outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"30\" height=\"10\"/>\n";
+ outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\">" + label + "</text>\n";
+ x += 30;
+ }
+
+ //Draw the heat map itself: one 300 x 5 rectangle per bin, stacked downwards from y = 70.
+ //The red channel of each rectangle is the color stored in colorScale for the bin's score.
+ x = 0;
+ y = 70;
+ //NOTE(review): this loop runs to i == getNumBins() inclusive while the scale was built
+ //with i < size(); confirm the last index is valid for rabund.
for (int i = 0; i <= rabund.getNumBins(); i++) {
-
- color = colorScale[rabund.get(i)];
+ if (rabund.get(i) != 0) { //don't want log value of 0.
+ if (scaler == "log10") {
+ color = colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))];
+ }else if (scaler == "log2") {
+ color = colorScale[(log2((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))];
+ }else if (scaler == "linear") {
+ color = colorScale[rabund.get(i)];
+ }else { color = colorScale[(log10((rabund.get(i) / (float)rabund.getNumSeqs()) * 100))]; }
+ }else { color = "00"; } //empty bin is black; must be the digits 00, not the letters OO, to form a valid #rrggbb color
outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"300\" height=\"5\"/>\n";
y += 5;
}
- outsvg << "</g>\n</svg>\n";
+ outsvg << "</g>\n</svg>\n";
outsvg.close();
}
+ //Build colorScale for all groups: one entry per distinct score, where a score is the
+ //log of the percent relative abundance within its group ("log10"/"log2") or the raw
+ //abundance ("linear"). Each score is then mapped onto a two digit hex red value.
colorScale.clear();
//fills vector of sharedsabunds - lookup
- getSharedVectors(sharedorder);
+ util->getSharedVectors(globaldata->Groups, lookup, sharedorder); //fills group vectors from order vector.
+
+ //sort lookup so shared bins are on top
+ if (sorted == "1") { sortSharedVectors(); }
+
+ //get users scaling method
+ scaler = globaldata->getScaler();
+
+ //validate the scaler once, up front, so the warning is printed a single time
+ //instead of once for every non-empty bin of every group. An invalid option falls back to log10.
+ if ((scaler != "log10") && (scaler != "log2") && (scaler != "linear")) {
+ cout << scaler << " is not a valid scaler option. I will use log10." << endl;
+ scaler = "log10";
+ }
+
- //get maxBin
+ //largest score seen in any group; it is the score that gets the brightest red
+ float maxbin = 0.0;
for (int i = 0; i < lookup.size(); i++) {
for (int j = 0; j < lookup[i]->size(); j++) {
- colorScale[lookup[i]->getAbundance(j)] = "";
+ if (lookup[i]->getAbundance(j) != 0) { //don't want log value of 0.
+ if (scaler == "log10") {
+ colorScale[(log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))] = "";
+ if (maxbin < (log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))) { maxbin = (log10((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100)); }
+ }else if (scaler == "log2") {
+ colorScale[(log2((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))] = "";
+ if (maxbin < (log2((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100))) { maxbin = (log2((lookup[i]->getAbundance(j) / (float)lookup[i]->getNumSeqs()) * 100)); }
+ }else if (scaler == "linear") {
+ colorScale[lookup[i]->getAbundance(j)] = "";
+ if (maxbin < lookup[i]->getAbundance(j)) { maxbin = lookup[i]->getAbundance(j); }
+ }
+ }else { colorScale[0] = "00"; }
}
}
//get scaler
- float scaler = 255 / (float) colorScale.size();
+ //factor that stretches the scores over 0-255. With no positive score there is
+ //nothing to stretch, so leave it at 0 rather than dividing by zero.
+ float scalers = 0.0;
+ if (maxbin > 0) { scalers = 255 / (float) maxbin; }
+
//go through map and give each score a color value
for (it = colorScale.begin(); it != colorScale.end(); it++) {
- it->second = toHex(int(float(it->first) * scaler));
+ //log scores are negative for bins below 1% relative abundance; clamp to 0-255 so
+ //every entry is a valid two digit hex value.
+ int shade = int(float(it->first) * scalers);
+ if (shade < 0) { shade = 0; }
+ if (shade > 255) { shade = 255; }
+ it->second = toHex(shade);
if(it->second.length() == 1) { it->second = "0" + it->second; }
}
- string filenamesvg = globaldata->inputFileName + ".heatmap." + sharedorder->getLabel() + "." + groupComb + ".svg";
+ string filenamesvg = getRootName(globaldata->inputFileName) + sharedorder->getLabel() + ".heatmap.svg"; //output name: getRootName() of the input file name, then the label, then ".heatmap.svg"
openOutputFile(filenamesvg, outsvg);
//svg image
- outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 " + toString(lookup.size() * 300) + " " + toString((lookup[0]->getNumBins()*5 + 15)) + "\">\n";
+ outsvg << "<svg width=\"100%\" height=\"100%\" viewBox=\"0 0 " + toString(lookup.size() * 300) + " " + toString((lookup[0]->getNumBins()*5 + 120)) + "\">\n"; //300 wide per group; height is 5 per bin plus 120 for the title, labels, spacing and legend
outsvg << "<g>\n";
- int x = 15;
- int y = 15;
+ //white background: a rectangle covering the whole viewBox
+ outsvg << "<rect fill=\"white\" stroke=\"white\" x=\"0\" y=\"0\" width=\"" + toString(lookup.size() * 300) + "\" height=\"" + toString((lookup[0]->getNumBins()*5 + 120)) + "\"/>";
+ outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString((lookup.size() * 150) - 40) + "\" y=\"25\">Heatmap at distance " + sharedorder->getLabel() + "</text>\n"; //title, placed 40 units left of the horizontal middle
+
+ //column labels: one group name per 300 wide column, placed near the middle of its column
+ for (int h = 0; h < lookup.size(); h++) {
+ outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString(((300 * (h+1)) - 150) - ((int)lookup[h]->getGroup().length() / 2)) + "\" y=\"50\">" + lookup[h]->getGroup() + "</text>\n";
+ }
+
+ //output legend and color labels
+ //Draws a row of boxes below the heat map (5 boxes per group), running from dark to
+ //bright red. Each box is labelled with the value it stands for, in equal steps up to
+ //the largest value.
string color;
+ int x = 0;
+ int y = 103 + (lookup[0]->getNumBins()*5);
+ if (maxbin != 0) {
+ //convert maxbin to relative abundance again
+ if (scaler == "log10") {
+ maxbin = pow(10, maxbin) / 100;
+ }else if (scaler == "log2") {
+ maxbin = pow(2, maxbin) / 100;
+ }else if (scaler != "linear") { maxbin = pow(10, maxbin) / 100; } //an invalid scaler was scored with log10
+ //"linear" scores are raw abundances: there is no log transform to undo, so in that
+ //case the legend is labelled with abundance counts.
+ }else { maxbin = 0.00; }
+
+ //((lookup.size() * 300) / 60) is the number of boxes in the legend
+ int numBoxes = (lookup.size() * 300) / 60;
+ float maxbinScaler = maxbin / numBoxes;
+ float colorScaler = 255 / (float) numBoxes; //floating point division, so the steps are not rounded down
+
+ for (int i = 0; i < numBoxes; i++) {
+ string label = toString(((i+1) * maxbinScaler));
+ //keep 3 digits after the decimal point; a label without a decimal point is left whole
+ string::size_type pos = label.find_first_of('.');
+ if (pos != string::npos) { label = label.substr(0,pos+4); }
- for (int i = 0; i <= lookup[0]->getNumBins(); i++) {
+ //the +15 offset would push the brightest boxes past 255, which gives a three digit
+ //hex value and an invalid color; cap at full red.
+ int shade = int(((i+1) * colorScaler) + 15);
+ if (shade > 255) { shade = 255; }
+ color = toHex(shade);
+ outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"30\" height=\"10\"/>\n";
+ outsvg << "<text fill=\"black\" class=\"seri\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\">" + label + "</text>\n";
+ x += 30;
+ }
+ //Draw the heat map itself: one row per bin, one 300 x 5 rectangle per group in each row,
+ //starting at y = 70. The red channel of each rectangle is the color stored in
+ //colorScale for that group's score in the bin.
+ x = 0;
+ y = 70;
+
+ //NOTE(review): this loop runs to i == getNumBins() inclusive while the scale was built
+ //with j < size(); confirm the last index is valid for the vectors in lookup.
+ for (int i = 0; i <= lookup[0]->getNumBins(); i++) {
for (int j = 0; j < lookup.size(); j++) {
-
- color = colorScale[lookup[j]->getAbundance(i)];
-
+
+ if (lookup[j]->getAbundance(i) != 0) { //don't want log value of 0.
+ if (scaler == "log10") {
+ color = colorScale[(log10((lookup[j]->getAbundance(i) / (float)lookup[j]->getNumSeqs()) * 100))];
+ }else if (scaler == "log2") {
+ color = colorScale[(log2((lookup[j]->getAbundance(i) / (float)lookup[j]->getNumSeqs()) * 100))];
+ }else if (scaler == "linear") {
+ color = colorScale[lookup[j]->getAbundance(i)];
+ }else { color = colorScale[(log10((lookup[j]->getAbundance(i) / (float)lookup[j]->getNumSeqs()) * 100))]; }
+ }else { color = "00"; } //empty bin is black; must be the digits 00, not the letters OO, to form a valid #rrggbb color
+
+
outsvg << "<rect fill=\"#" + color + "0000\" stroke=\"#" + color + "0000\" x=\"" + toString(x) + "\" y=\"" + toString(y) + "\" width=\"300\" height=\"5\"/>\n";
x += 300;
}
- x = 15;
+ x = 0;
y += 5;
}
- outsvg << "</g>\n</svg>\n";
- outsvg.close();
-
+ outsvg << "</g>\n</svg>\n";
+ outsvg.close();
}
catch(exception& e) {
exit(1);
}
}
+
//**********************************************************************************************************************
-void HeatMap::getSharedVectors(SharedOrderVector* order){
+void HeatMap::sortSharedVectors(){
try {
+ //Reorders the bins of every vector in lookup, using the same new order for all groups:
+ //bins present (abundance != 0) in two or more groups are moved to the front, and the
+ //more groups share a bin the nearer the top it goes; all other bins follow in their
+ //original order. On an exception a message is printed and the program exits.
- lookup.clear();
+ //copy lookup and then clear it to refill with sorted.
+ //loop through lookup and determine if they are shared
+ //if they are then insert in the front
+ //if not push to back
- groupComb = "";
+ vector<SharedRAbundVector*> looktemp;
+ map<int, int> place; //spot in lookup where you insert shared by, ie, 3 -> 2 if they are shared by 3 insert into location 2.
+ map<int, int>::iterator it;
+ int count;
- //create and initialize vector of sharedvectors, one for each group
- for (int i = 0; i < globaldata->Groups.size(); i++) {
- SharedRAbundVector* temp = new SharedRAbundVector(order->getNumBins());
- temp->setLabel(order->getLabel());
- temp->setGroup(globaldata->Groups[i]);
- groupComb += globaldata->Groups[i];
- lookup.push_back(temp);
+ //create and initialize looktemp as a copy of lookup
+ for (int i = 0; i < lookup.size(); i++) {
+ SharedRAbundVector* temp = new SharedRAbundVector(lookup[i]->getNumBins());
+ temp->setLabel(lookup[i]->getLabel());
+ temp->setGroup(lookup[i]->getGroup());
+ //copy lookup i's info
+ for (int j = 0; j < lookup[i]->size(); j++) {
+ temp->set(j, lookup[i]->getAbundance(j), lookup[i]->getGroup());
+ }
+ looktemp.push_back(temp);
}
- int numSeqs = order->size();
- //sample all the members
- for(int i=0;i<numSeqs;i++){
- //get first sample
- individual chosen = order->get(i);
- int abundance;
-
- //set info for sharedvector in chosens group
- for (int j = 0; j < lookup.size(); j++) {
- if (chosen.group == lookup[j]->getGroup()) {
- abundance = lookup[j]->getAbundance(chosen.bin);
- lookup[j]->set(chosen.bin, (abundance + 1), chosen.group);
- break;
+ //clear out lookup to create sorted lookup
+ //free the unsorted vectors first: looktemp holds copies of their label, group and
+ //abundances, so nothing below refers to them and a plain clear() would leak them.
+ //NOTE(review): assumes lookup is the only owner of these vectors - confirm.
+ for (int i = 0; i < lookup.size(); i++) { delete lookup[i]; }
+ lookup.clear();
+
+ //create and initialize lookup to empty vectors
+ for (int i = 0; i < looktemp.size(); i++) {
+ SharedRAbundVector* temp = new SharedRAbundVector();
+ temp->setLabel(looktemp[i]->getLabel());
+ temp->setGroup(looktemp[i]->getGroup());
+ lookup.push_back(temp);
+
+ //initialize place map
+ place[i] = 0;
+ }
+
+
+ //number of bins to place; 0 when there are no groups, so looktemp[0] is never touched then
+ int binsToPlace = 0;
+ if (looktemp.size() != 0) { binsToPlace = looktemp[0]->size(); }
+
+ //for each bin
+ for (int i = 0; i < binsToPlace; i++) {
+ count = 0;
+ bool updatePlace = false;
+ //for each group: count how many groups have this bin
+ for (int j = 0; j < looktemp.size(); j++) {
+ if (looktemp[j]->getAbundance(i) != 0) { count++; }
+ }
+
+ //fill lookup
+ for (int j = 0; j < looktemp.size(); j++) {
+ //if they are not shared then push to back, if they are shared insert in front
+ if (count < 2) { lookup[j]->push_back(looktemp[j]->getAbundance(i), i, looktemp[j]->getGroup()); }
+ //they are shared by some
+ else { lookup[j]->insert(looktemp[j]->getAbundance(i), place[count], looktemp[j]->getGroup()); updatePlace = true; }
+ }
+
+ if (updatePlace == true) {
+ //move place holders below where you entered up to "make space" for you entry
+ //only the spots for bins shared by fewer groups shift; the spot for this count stays,
+ //so a later bin with the same count lands above this one.
+ for (it = place.begin(); it!= place.end(); it++) {
+ if (it->first < count) { it->second++; }
}
}
}
+ //delete looktemp
+ for (int j = 0; j < looktemp.size(); j++) {
+ delete looktemp[j];
+ }
+
}
catch(exception& e) {
- cout << "Standard Error: " << e.what() << " has occurred in the HeatMap class Function getSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+ cout << "Standard Error: " << e.what() << " has occurred in the HeatMap class Function sortSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
exit(1);
}
catch(...) {
- cout << "An unknown error has occurred in the HeatMap class function getSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
+ cout << "An unknown error has occurred in the HeatMap class function sortSharedVectors. Please contact Pat Schloss at pschloss@microbio.umass.edu." << "\n";
exit(1);
}
+
+