fix from Pierre Legendre

author paradis <paradis@6e262413-ae40-0410-9e79-b911bd7a66b7>

Wed, 13 Feb 2013 06:52:04 +0000 (06:52 +0000)

committer paradis <paradis@6e262413-ae40-0410-9e79-b911bd7a66b7>

Wed, 13 Feb 2013 06:52:04 +0000 (06:52 +0000)
author paradis <paradis@6e262413-ae40-0410-9e79-b911bd7a66b7>
Wed, 13 Feb 2013 06:52:04 +0000 (06:52 +0000)
committer paradis <paradis@6e262413-ae40-0410-9e79-b911bd7a66b7>
Wed, 13 Feb 2013 06:52:04 +0000 (06:52 +0000)
diff --git a/CADM.global.R b/CADM.global.R

new file mode 100644 (file)

index 0000000..5644ca5
--- /dev/null
+++ b/CADM.global.R
@@ -0,0 +1,216 @@
+`CADM.global` <-
+       function(Dmat, nmat, n, nperm=99, make.sym=TRUE, weights=NULL, silent=FALSE)
+{
+### Function to test the overall significance of the congruence among 
+### a group of distance matrices using Kendall's coefficient of concordance W.
+###
+### copyleft - Pierre Legendre, December 2008
+###
+### Reference -
+### Legendre, P. and F.-J. Lapointe. 2004. Assessing congruence among distance 
+### matrices: single malt Scotch whiskies revisited. Australian and New Zealand 
+### Journal of Statistics 46: 615-629.
+###
+### Parameters of the function --
+###
+### Dmat = A text file listing the distance matrices one after the other, with
+###        or without blank lines.
+###        Each matrix is in the form of a square distance matrix with 0's 
+###        on the diagonal.
+###
+### nmat = number of distance matrices in file Dmat.
+###
+### n = number of objects in each distance matrix. All matrices have same n.
+###
+### nperm = number of permutations for the tests.
+###
+### make.sym = TRUE: turn asymmetric matrices into symmetric matrices by 
+###            averaging the two triangular portions.
+###          = FALSE: analyse asymmetric matrices as they are.
+###
+### weights = a vector of positive weights for the distance matrices. 
+###           Example: weights = c(1,2,3)
+###         = NULL (default): all matrices have same weight in calculation of W.
+###
+### silent = TRUE: informative messages will not be printed, except stopping 
+###          messages. Option useful for simulation work.
+###        = FALSE: informative messages will be printed.
+###
+################################################################################
+       
+       if(nmat < 2) 
+               stop("Analysis requested for a single D matrix: CADM is useless")
+       
+       a <- system.time({
+
+    ## Check the input file
+    if(ncol(Dmat) != n) 
+       stop("Error in the value of 'n' or in the D matrices themselves")
+    nmat2 <- nrow(Dmat)/n
+    if(nmat2 < nmat)  # OK if 'nmat' < number of matrices in the input file
+       stop("Number of input D matrices = ",nmat2,"; this value is < nmat")
+
+    nd <- n*(n-1)/2
+    if(is.null(weights)) {
+       w <- rep(1,nmat)
+       } else {
+       if(length(weights) != nmat) 
+               stop("Incorrect number of values in vector 'weights'")
+       if(length(which(weights < 0)) > 0) 
+               stop("Negative weights are not permitted")
+       w <- weights*nmat/sum(weights)
+       if(!silent) cat("Normalized weights =",w,'\n')
+       }
+    
+    ## Are asymmetric D matrices present?
+    asy <- rep(FALSE, nmat)
+       asymm <- FALSE
+    end <- 0
+    for(k in 1:nmat) {
+        begin <- end+1
+        end <- end+n
+        D.temp <- Dmat[begin:end,]
+        if(sum(abs(diag(as.matrix(D.temp)))) > 0) 
+               stop("Diagonal not 0: matrix #",k," is not a distance matrix")
+        vec1 <- as.vector(as.dist(D.temp))
+        vec2 <- as.vector(as.dist(t(D.temp)))
+        if(sum(abs((vec1-vec2))) > 0) {
+               if(!silent) cat("Matrix #",k," is asymmetric",'\n')
+               asy[k] <- TRUE
+               asymm <- TRUE
+               }
+        }
+    D1 <- as.list(1:nmat)
+    if(asymm) {
+       if(make.sym) {
+               if(!silent) cat("\nAsymmetric matrices were transformed to be symmetric",'\n')
+               } else {
+               nd <- nd*2
+               if(!silent) cat("\nAnalysis carried out on asymmetric matrices",'\n')
+               D2 <- as.list(1:nmat)
+               }
+       } else {
+       if(!silent) cat("Analysis of symmetric matrices",'\n')
+       }
+    Y <- rep(NA,nd)
+    
+    ## String out the distance matrices (vec) and assemble them as columns into matrix 'Y'
+    ## Construct also matrices of ranked distances D1[[k]] and D2[[k]] for permutation test
+    end <- 0
+    for(k in 1:nmat) {
+        begin <- end+1
+        end <- end+n
+        D.temp <- as.matrix(Dmat[begin:end,])
+        vec <- as.vector(as.dist(D.temp))
+        if(asymm) {
+               if(!make.sym) {
+                       ## Analysis carried out on asymmetric matrices: 
+                       ## The ranks are computed on the whole matrix except the diagonal values.
+                       ## The two halves are stored as symmetric matrices in D1[[k]] and D2[[k]]
+                       vec <- c(vec, as.vector(as.dist(t(D.temp))))
+                       diag(D.temp) <- NA
+                       D.temp2 <- rank(D.temp)
+                       diag(D.temp2) <- 0
+                       # cat("nrow =",nrow(D.temp2)," ncol =",ncol(D.temp2),'\n')
+                               # cat("Matrix ",k," min =",min(D.temp2)," max =",max(D.temp2),'\n')
+                               # cat("Matrix ",k," max values #",which(D.temp2 == max(D.temp2)),'\n')
+                       D1[[k]] <- as.matrix(as.dist(D.temp2))
+                       D2[[k]] <- as.matrix(as.dist(t(D.temp2)))
+                       } else {
+                       ## Asymmetric matrices transformed to be symmetric, stored in D1[[k]]
+                       vec <- (vec + as.vector(as.dist(t(D.temp)))) / 2
+                               D.temp2 <- (D.temp + t(D.temp)) / 2
+                               D.temp2 <- as.dist(D.temp2)
+                       D.temp2[] <- rank(D.temp2)
+                               D.temp2 <- as.matrix(D.temp2)
+                       D1[[k]] <- D.temp2
+                       }
+               } else {
+               ## Symmetric matrices are stored in D1[[k]]
+               D.temp2 <- as.dist(D.temp)
+               D.temp2[] <- rank(D.temp2)
+               D1[[k]] <- as.matrix(D.temp2)
+               }
+        Y <- cbind(Y, vec)
+        }
+    Y <- as.matrix(Y[,-1])
+    colnames(Y) <- colnames(Y,do.NULL = FALSE, prefix = "Dmat.")
+    
+    ## Begin calculations for global test
+    
+    ## Compute the reference values of the statistics: W and Chi2
+       ## Transform the distances to ranks, by column
+       Rmat <- apply(Y,2,rank)
+
+       ## Correction factors for tied ranks (eq. 3.3)
+       t.ranks <- apply(Rmat, 2, function(x) summary(as.factor(x), maxsum=nd))
+       TT <- sum(unlist(lapply(t.ranks, function(x) sum((x^3)-x))))
+       # if(!silent) cat("TT = ",TT,'\n')
+       
+       ## Compute the S = Sum-of-Squares of the row-marginal sums of ranks (eq. 1a)
+       ## The ranks are weighted during the sum by the vector of matrix weights 'w'
+       ## Eq. 1b cannot be used with weights; see formula for W below
+       sumRanks <- as.vector(Rmat%*%w)
+       S <- (nd-1)*var(sumRanks)
+       
+       ## Compute Kendall's W (eq. 2a)
+       ## Eq. 2b cannot be used with weights 
+       ## because the sum of all ranks is not equal to m*n*(n+1)/2 in that case
+       W <- (12*S)/(((nmat^2)*((nd^3)-nd))-(nmat*TT))
+               
+       ## Calculate Friedman's Chi-square (Kendall W paper, 2005, eq. 3.4)
+       Chi2 <- nmat*(nd-1)*W
+
+       ## Test the Chi2 statistic by permutation
+       counter <- 1
+       for(j in 1:nperm) {   # Each matrix is permuted independently
+                             # There is no need to permute the last matrix
+               Rmat.perm <- rep(NA,nd)
+               ##
+               if(asymm & !make.sym) {
+                       ## For asymmetric matrices: permute the values within each triangular 
+                       ## portion, stored as square matrices in D1[[]] and D2[[]]
+                       for(k in 1:(nmat-1)) {
+                               order <- sample(n)
+                               vec <- as.vector(as.dist(D1[[k]][order,order]))
+                           vec <- c(vec, as.vector(as.dist(D2[[k]][order,order])))
+                               Rmat.perm <- cbind(Rmat.perm, vec)
+                               }
+                               vec <- as.vector(as.dist(D1[[nmat]]))
+                           vec <- c(vec, as.vector(as.dist(D2[[nmat]])))
+                               Rmat.perm <- cbind(Rmat.perm, vec)
+                       } else {
+                       for(k in 1:(nmat-1)) {
+                               order <- sample(n)
+                               vec <- as.vector(as.dist(D1[[k]][order,order]))
+                               Rmat.perm <- cbind(Rmat.perm, vec)
+                               }
+                               vec <- as.vector(as.dist(D1[[nmat]]))
+                               Rmat.perm <- cbind(Rmat.perm, vec)
+                       }
+               # Remove the first column of Rmat.perm containing NA
+               # The test is based on the comparison of S and S.perm instead of the comparison of 
+               # Chi2 and Chi2.perm: it is faster that way. 
+               # S, W, and Chi2 are equivalent statistics for permutation tests.
+               Rmat.perm <- as.matrix(Rmat.perm[,-1])
+               S.perm <- (nd-1)*var(as.vector(Rmat.perm%*%w))
+               if(S.perm >= S) counter <- counter+1
+       }
+       prob.perm.gr <- counter/(nperm+1)
+
+       table <- rbind(W, Chi2, prob.perm.gr)
+       colnames(table) <- "Statistics"
+       rownames(table) <- c("W", "Chi2", "Prob.perm")
+       })
+       a[3] <- sprintf("%2f",a[3])
+       if(!silent) cat("\nTime to compute global test =",a[3]," sec",'\n')
+#
+       # if(asymm & !make.sym) { out <- list(congruence_analysis=table, D1=D1, D2=D2)
+       # } else {
+          out <- list(congruence_analysis=table)
+       #    }
+#
+       out$nperm <- nperm
+       class(out) <- "CADM.global"
+       out
+}
diff --git a/CADM.post.R b/CADM.post.R

new file mode 100644 (file)

index 0000000..8530cd3
--- /dev/null
+++ b/CADM.post.R
@@ -0,0 +1,276 @@
+`CADM.post` <-
+       function(Dmat, nmat, n, nperm=99, make.sym=TRUE, weights=NULL, mult="holm", mantel=FALSE, silent=FALSE)
+{
+### Function to carry out a posteriori tests of the contribution of individual 
+### matrices to the congruence of a group of distance matrices.
+###
+### copyleft - Pierre Legendre, December 2008
+###
+### Reference -
+### Legendre, P. and F.-J. Lapointe. 2004. Assessing congruence among distance 
+### matrices: single malt Scotch whiskies revisited. Australian and New Zealand 
+### Journal of Statistics 46: 615-629.
+###
+### Parameters of the function --
+###
+### Dmat = A text file listing the distance matrices one after the other, with
+###        or without blank lines.
+###        Each matrix is in the form of a square distance matrix with 0's 
+###        on the diagonal.
+###
+### nmat = number of distance matrices in file Dmat.
+###
+### n = number of objects in each distance matrix. All matrices have same n.
+###
+### nperm = number of permutations for the tests.
+###
+### make.sym = TRUE: turn asymmetric matrices into symmetric matrices by 
+###            averaging the two triangular portions.
+###          = FALSE: analyse asymmetric matrices as they are.
+###
+### weights = a vector of positive weights for the distance matrices. 
+###           Example: weights = c(1,2,3)
+###         = NULL (default): all matrices have same weight in calculation of W.
+###
+### mult = method for correcting P-values due to multiple testing. The methods 
+###        are "holm" (default), "sidak", and "bonferroni". The Bonferroni 
+###        correction is overly conservative; it is not recommended. It is 
+###        included to allow comparisons with the other methods.
+###
+### mantel = TRUE: Mantel statistics are computed from ranked distances,
+###          as well as permutational P-values.
+###        = FALSE (default): Mantel statistics and tests are not computed.
+###
+### silent = TRUE: informative messages will not be printed, except stopping 
+###          messages. Option useful for simulation work.
+###        = FALSE: informative messages will be printed.
+###
+################################################################################
+       
+       mult <- match.arg(mult, c("sidak", "holm", "bonferroni"))
+       if(nmat < 2) 
+               stop("Analysis requested for a single D matrix: CADM is useless")
+       
+       a <- system.time({
+
+    ## Check the input file
+    if(ncol(Dmat) != n) 
+       stop("Error in the value of 'n' or in the D matrices themselves")
+    nmat2 <- nrow(Dmat)/n
+    if(nmat2 < nmat)  # OK if 'nmat' < number of matrices in the input file
+       stop("Number of input D matrices = ",nmat2,"; this value is < nmat")
+
+    nd <- n*(n-1)/2
+    if(is.null(weights)) {
+       w <- rep(1,nmat)
+       } else {
+       if(length(weights) != nmat) 
+               stop("Incorrect number of values in vector 'weights'")
+       if(length(which(weights < 0)) > 0) 
+               stop("Negative weights are not permitted")
+       w <- weights*nmat/sum(weights)
+       if(!silent) cat("Normalized weights =",w,'\n')
+       }
+    
+    ## Are asymmetric D matrices present?
+    asy <- rep(FALSE, nmat)
+       asymm <- FALSE
+    end <- 0
+    for(k in 1:nmat) {
+        begin <- end+1
+        end <- end+n
+        D.temp <- Dmat[begin:end,]
+        if(sum(abs(diag(as.matrix(D.temp)))) > 0) 
+               stop("Diagonal not 0: matrix #",k," is not a distance matrix")
+        vec1 <- as.vector(as.dist(D.temp))
+        vec2 <- as.vector(as.dist(t(D.temp)))
+        if(sum(abs((vec1-vec2))) > 0) {
+               if(!silent) cat("Matrix #",k," is asymmetric",'\n')
+               asy[k] <- TRUE
+               asymm <- TRUE
+               }
+        }
+    D1 <- as.list(1:nmat)
+    if(asymm) {
+       if(make.sym) {
+               if(!silent) cat("\nAsymmetric matrices were transformed to be symmetric",'\n')
+               } else {
+               nd <- nd*2
+               if(!silent) cat("\nAnalysis carried out on asymmetric matrices",'\n')
+               D2 <- as.list(1:nmat)
+               }
+       } else {
+       if(!silent) cat("Analysis of symmetric matrices",'\n')
+       }
+    Y <- rep(NA,nd)
+    
+    ## String out the distance matrices (vec) and assemble them as columns into matrix 'Y'
+    ## Construct also matrices of ranked distances D1[[k]] and D2[[k]] for permutation test
+    end <- 0
+    for(k in 1:nmat) {
+        begin <- end+1
+        end <- end+n
+        D.temp <- as.matrix(Dmat[begin:end,])
+        vec <- as.vector(as.dist(D.temp))
+        if(asymm) {
+               if(!make.sym) {
+                       ## Analysis carried out on asymmetric matrices: 
+                       ## The ranks are computed on the whole matrix except the diagonal values.
+                       ## The two halves are stored as symmetric matrices in D1[[k]] and D2[[k]]
+                       vec <- c(vec, as.vector(as.dist(t(D.temp))))
+                       diag(D.temp) <- NA
+                       D.temp2 <- rank(D.temp)
+                       diag(D.temp2) <- 0
+                       # cat("nrow =",nrow(D.temp2)," ncol =",ncol(D.temp2),'\n')
+                               # cat("Matrix ",k," min =",min(D.temp2)," max =",max(D.temp2),'\n')
+                               # cat("Matrix ",k," max values #",which(D.temp2 == max(D.temp2)),'\n')
+                       D1[[k]] <- as.matrix(as.dist(D.temp2))
+                       D2[[k]] <- as.matrix(as.dist(t(D.temp2)))
+                       } else {
+                       ## Asymmetric matrices transformed to be symmetric, stored in D1[[k]]
+                       vec <- (vec + as.vector(as.dist(t(D.temp)))) / 2
+                               D.temp2 <- (D.temp + t(D.temp)) / 2
+                               D.temp2 <- as.dist(D.temp2)
+                       D.temp2[] <- rank(D.temp2)
+                               D.temp2 <- as.matrix(D.temp2)
+                       D1[[k]] <- D.temp2
+                       }
+               } else {
+               ## Symmetric matrices are stored in D1[[k]]
+               D.temp2 <- as.dist(D.temp)
+               D.temp2[] <- rank(D.temp2)
+               D1[[k]] <- as.matrix(D.temp2)
+               }
+        Y <- cbind(Y, vec)
+        }
+    Y <- as.matrix(Y[,-1])
+    colnames(Y) <- colnames(Y,do.NULL = FALSE, prefix = "Dmat.")
+    
+    ## Begin calculations: compute reference value of S
+
+               ## Transform the distances to ranks, by column
+               Rmat <- apply(Y,2,rank)
+
+               ## Compute the S = Sum-of-Squares of the row-marginal sums of ranks (eq. 1a)
+               ## The ranks are weighted during the sum by the vector of matrix weights 'w'
+               sumRanks <- as.vector(Rmat%*%w)
+               S <- (nd-1)*var(sumRanks)
+
+    ## Begin a posteriori tests of individual matrices
+
+    ## Statistics displayed for each matrix: "Mantel.mean" and "W.per.matrix"
+       ## Calculate the mean of the Mantel correlations on ranks for each matrix
+       Mantel.cor <- cor(Rmat)
+       diag(Mantel.cor) <- 0
+       spear.mean <- as.vector(Mantel.cor%*%w)/(nmat-1)
+       ## Calculate Kendall's W for each variable
+       ## W.var <- ((nmat-1)*spear.mean+1)/nmat
+
+       ## P-value for each matrix: test of S, permuting values in matrix[[k]] only
+       ## as in program CADM.f (2004)
+       ## Initialize the counters
+       counter <- rep(1,nmat)
+
+       ## Test each matrix 'k' in turn
+       for(k in 1:nmat) {
+               ## Create a new Rmat table where the permuted column has been removed
+               Rmat.mod <- Rmat[,-k]
+                               
+               ## Permutation loop: string out permuted matrix 'k' only
+               for(j in 1:nperm) {
+                       order <- sample(n)
+                       if(asymm & !make.sym) {
+                               ## For asymmetric matrices: permute the values within each triangular 
+                               ## portion, stored as square matrices in D1[[]] and D2[[]]
+                               vec <- as.vector(as.dist(D1[[k]][order,order]))
+                           vec <- c(vec, as.vector(as.dist(D2[[k]][order,order])))
+                               } else {
+                               vec <- as.vector(as.dist(D1[[k]][order,order]))
+                               }
+                       Rmat.perm <- cbind(Rmat.mod, vec)
+                       S.perm <- (nd-1)*var(as.vector(Rmat.perm%*%w))
+                       if(S.perm >= S) counter[k] <- counter[k]+1
+               }
+       }
+
+       ## Calculate P-values
+       counter <- counter/(nperm+1)
+       
+       ## Correction to P-values for multiple testing
+               if(mult == "sidak") {
+                       vec.corr = NA
+                       for(i in 1:p) vec.corr = c(vec.corr, (1-(1-counter[i])^p))
+                       vec.corr <- vec.corr[-1]
+                       }
+               if(mult == "holm") vec.corr <- p.adjust(counter, method="holm")
+               if(mult == "bonferroni") vec.corr <- p.adjust(counter, method="bonferroni")
+
+       ## Create a data frame containing the results
+               # table <- rbind(spear.mean, W.var, counter, vec.corr)
+               # rownames(table) <- c("Mantel.mean", "W.per.matrix", "Prob", "Corrected prob")
+               table <- rbind(spear.mean, counter, vec.corr)
+               rownames(table) <- c("Mantel.mean", "Prob", "Corrected.prob")
+               colnames(table) <- colnames(table,do.NULL = FALSE, prefix = "Dmat.")
+       
+       ## Mantel tests
+       if(mantel) {
+               diag(Mantel.cor) <- 1
+               rownames(Mantel.cor) <- colnames(table)
+               colnames(Mantel.cor) <- colnames(table)
+               Mantel.prob <- matrix(1,nmat,nmat)
+               rownames(Mantel.prob) <- colnames(table)
+               colnames(Mantel.prob) <- colnames(table)
+               
+               for(j in 1:nperm) {   # Each matrix is permuted independently
+                                 # There is no need to permute the last matrix
+                       Rmat.perm <- rep(NA,nd)
+                       ##
+                       if(asymm & !make.sym) {
+                               ## For asymmetric matrices: permute the values within each triangular 
+                               ## portion, stored as square matrices in D1[[]] and D2[[]]
+                               for(k in 1:(nmat-1)) {
+                                       order <- sample(n)
+                                       vec <- as.vector(as.dist(D1[[k]][order,order]))
+                               vec <- c(vec, as.vector(as.dist(D2[[k]][order,order])))
+                                       Rmat.perm <- cbind(Rmat.perm, vec)
+                                       }
+                                       vec <- as.vector(as.dist(D1[[nmat]]))
+                               vec <- c(vec, as.vector(as.dist(D2[[nmat]])))
+                                       Rmat.perm <- cbind(Rmat.perm, vec)
+                               } else {
+                               for(k in 1:(nmat-1)) {
+                                       order <- sample(n)
+                                       vec <- as.vector(as.dist(D1[[k]][order,order]))
+                                       Rmat.perm <- cbind(Rmat.perm, vec)
+                                       }
+                                       vec <- as.vector(as.dist(D1[[nmat]]))
+                                       Rmat.perm <- cbind(Rmat.perm, vec)
+                               }
+                       # Remove the first column of Rmat.perm containing NA
+                       Rmat.perm <- as.matrix(Rmat.perm[,-1])
+                       # Compute Mantel correlations on ranks under permutation
+                       Mantel.cor.perm <- cor(Rmat.perm)
+                       for(j2 in 1:(nmat-1)) { # Compute prob in the upper tail
+                               for(j1 in (j2+1):nmat) {
+                                       if(Mantel.cor.perm[j1,j2] >= Mantel.cor[j1,j2]) Mantel.prob[j1,j2] <- Mantel.prob[j1,j2]+1
+                                       }
+                               }
+                       }
+               Mantel.prob <- as.matrix(as.dist(Mantel.prob/(nperm+1)))
+               diag(Mantel.prob) <- NA # Corrected 08feb13
+               }
+       
+       })
+       a[3] <- sprintf("%2f",a[3])
+       if(!silent) cat("Time to compute a posteriori tests (per matrix) =",a[3]," sec",'\n')
+
+       out <- list(A_posteriori_tests=table, Correction.type=mult)
+
+       if(mantel) {
+               out$Mantel.cor  <- Mantel.cor
+               out$Mantel.prob <- Mantel.prob
+               }
+       out$nperm <- nperm
+       class(out) <- "CADM.post"
+       out
+}
diff --git a/NEWS b/NEWS

index 59c6fede8764018d71cbc24b60051792ce803041..9bc3f6c8c56effb85d22da07d4d5fed2f086ee8d 100644 (file)
--- a/NEWS
+++ b/NEWS
@@ -15,6 +15,11 @@ BUG FIXES
        'phy' are not in the same order than the list of trees (thanks
        to Rupert Collins for the report).
  
        'phy' are not in the same order than the list of trees (thanks
        to Rupert Collins for the report).
  
+    o CADM.post() displayed "1" on the diagonal of the matrix of
+      Mantel p-values. It now displays "NA" on the diagonal,
+      indicating that no test of significance is computed between a
+      distance matrix and itself.
+
  
  
                 CHANGES IN APE VERSION 3.0-7
  
  
                 CHANGES IN APE VERSION 3.0-7
diff --git a/R/CDAM.global.R b/R/CDAM.global.R

deleted file mode 100644 (file)

index 5644ca5..0000000
--- a/R/CDAM.global.R
+++ /dev/null
@@ -1,216 +0,0 @@
-`CADM.global` <-
-       function(Dmat, nmat, n, nperm=99, make.sym=TRUE, weights=NULL, silent=FALSE)
-{
-### Function to test the overall significance of the congruence among 
-### a group of distance matrices using Kendall's coefficient of concordance W.
-###
-### copyleft - Pierre Legendre, December 2008
-###
-### Reference -
-### Legendre, P. and F.-J. Lapointe. 2004. Assessing congruence among distance 
-### matrices: single malt Scotch whiskies revisited. Australian and New Zealand 
-### Journal of Statistics 46: 615-629.
-###
-### Parameters of the function --
-###
-### Dmat = A text file listing the distance matrices one after the other, with
-###        or without blank lines.
-###        Each matrix is in the form of a square distance matrix with 0's 
-###        on the diagonal.
-###
-### nmat = number of distance matrices in file Dmat.
-###
-### n = number of objects in each distance matrix. All matrices have same n.
-###
-### nperm = number of permutations for the tests.
-###
-### make.sym = TRUE: turn asymmetric matrices into symmetric matrices by 
-###            averaging the two triangular portions.
-###          = FALSE: analyse asymmetric matrices as they are.
-###
-### weights = a vector of positive weights for the distance matrices. 
-###           Example: weights = c(1,2,3)
-###         = NULL (default): all matrices have same weight in calculation of W.
-###
-### silent = TRUE: informative messages will not be printed, except stopping 
-###          messages. Option useful for simulation work.
-###        = FALSE: informative messages will be printed.
-###
-################################################################################
-       
-       if(nmat < 2) 
-               stop("Analysis requested for a single D matrix: CADM is useless")
-       
-       a <- system.time({
-
-    ## Check the input file
-    if(ncol(Dmat) != n) 
-       stop("Error in the value of 'n' or in the D matrices themselves")
-    nmat2 <- nrow(Dmat)/n
-    if(nmat2 < nmat)  # OK if 'nmat' < number of matrices in the input file
-       stop("Number of input D matrices = ",nmat2,"; this value is < nmat")
-
-    nd <- n*(n-1)/2
-    if(is.null(weights)) {
-       w <- rep(1,nmat)
-       } else {
-       if(length(weights) != nmat) 
-               stop("Incorrect number of values in vector 'weights'")
-       if(length(which(weights < 0)) > 0) 
-               stop("Negative weights are not permitted")
-       w <- weights*nmat/sum(weights)
-       if(!silent) cat("Normalized weights =",w,'\n')
-       }
-    
-    ## Are asymmetric D matrices present?
-    asy <- rep(FALSE, nmat)
-       asymm <- FALSE
-    end <- 0
-    for(k in 1:nmat) {
-        begin <- end+1
-        end <- end+n
-        D.temp <- Dmat[begin:end,]
-        if(sum(abs(diag(as.matrix(D.temp)))) > 0) 
-               stop("Diagonal not 0: matrix #",k," is not a distance matrix")
-        vec1 <- as.vector(as.dist(D.temp))
-        vec2 <- as.vector(as.dist(t(D.temp)))
-        if(sum(abs((vec1-vec2))) > 0) {
-               if(!silent) cat("Matrix #",k," is asymmetric",'\n')
-               asy[k] <- TRUE
-               asymm <- TRUE
-               }
-        }
-    D1 <- as.list(1:nmat)
-    if(asymm) {
-       if(make.sym) {
-               if(!silent) cat("\nAsymmetric matrices were transformed to be symmetric",'\n')
-               } else {
-               nd <- nd*2
-               if(!silent) cat("\nAnalysis carried out on asymmetric matrices",'\n')
-               D2 <- as.list(1:nmat)
-               }
-       } else {
-       if(!silent) cat("Analysis of symmetric matrices",'\n')
-       }
-    Y <- rep(NA,nd)
-    
-    ## String out the distance matrices (vec) and assemble them as columns into matrix 'Y'
-    ## Construct also matrices of ranked distances D1[[k]] and D2[[k]] for permutation test
-    end <- 0
-    for(k in 1:nmat) {
-        begin <- end+1
-        end <- end+n
-        D.temp <- as.matrix(Dmat[begin:end,])
-        vec <- as.vector(as.dist(D.temp))
-        if(asymm) {
-               if(!make.sym) {
-                       ## Analysis carried out on asymmetric matrices: 
-                       ## The ranks are computed on the whole matrix except the diagonal values.
-                       ## The two halves are stored as symmetric matrices in D1[[k]] and D2[[k]]
-                       vec <- c(vec, as.vector(as.dist(t(D.temp))))
-                       diag(D.temp) <- NA
-                       D.temp2 <- rank(D.temp)
-                       diag(D.temp2) <- 0
-                       # cat("nrow =",nrow(D.temp2)," ncol =",ncol(D.temp2),'\n')
-                               # cat("Matrix ",k," min =",min(D.temp2)," max =",max(D.temp2),'\n')
-                               # cat("Matrix ",k," max values #",which(D.temp2 == max(D.temp2)),'\n')
-                       D1[[k]] <- as.matrix(as.dist(D.temp2))
-                       D2[[k]] <- as.matrix(as.dist(t(D.temp2)))
-                       } else {
-                       ## Asymmetric matrices transformed to be symmetric, stored in D1[[k]]
-                       vec <- (vec + as.vector(as.dist(t(D.temp)))) / 2
-                               D.temp2 <- (D.temp + t(D.temp)) / 2
-                               D.temp2 <- as.dist(D.temp2)
-                       D.temp2[] <- rank(D.temp2)
-                               D.temp2 <- as.matrix(D.temp2)
-                       D1[[k]] <- D.temp2
-                       }
-               } else {
-               ## Symmetric matrices are stored in D1[[k]]
-               D.temp2 <- as.dist(D.temp)
-               D.temp2[] <- rank(D.temp2)
-               D1[[k]] <- as.matrix(D.temp2)
-               }
-        Y <- cbind(Y, vec)
-        }
-    Y <- as.matrix(Y[,-1])
-    colnames(Y) <- colnames(Y,do.NULL = FALSE, prefix = "Dmat.")
-    
-    ## Begin calculations for global test
-    
-    ## Compute the reference values of the statistics: W and Chi2
-       ## Transform the distances to ranks, by column
-       Rmat <- apply(Y,2,rank)
-
-       ## Correction factors for tied ranks (eq. 3.3)
-       t.ranks <- apply(Rmat, 2, function(x) summary(as.factor(x), maxsum=nd))
-       TT <- sum(unlist(lapply(t.ranks, function(x) sum((x^3)-x))))
-       # if(!silent) cat("TT = ",TT,'\n')
-       
-       ## Compute the S = Sum-of-Squares of the row-marginal sums of ranks (eq. 1a)
-       ## The ranks are weighted during the sum by the vector of matrix weights 'w'
-       ## Eq. 1b cannot be used with weights; see formula for W below
-       sumRanks <- as.vector(Rmat%*%w)
-       S <- (nd-1)*var(sumRanks)
-       
-       ## Compute Kendall's W (eq. 2a)
-       ## Eq. 2b cannot be used with weights 
-       ## because the sum of all ranks is not equal to m*n*(n+1)/2 in that case
-       W <- (12*S)/(((nmat^2)*((nd^3)-nd))-(nmat*TT))
-               
-       ## Calculate Friedman's Chi-square (Kendall W paper, 2005, eq. 3.4)
-       Chi2 <- nmat*(nd-1)*W
-
-       ## Test the Chi2 statistic by permutation
-       counter <- 1
-       for(j in 1:nperm) {   # Each matrix is permuted independently
-                             # There is no need to permute the last matrix
-               Rmat.perm <- rep(NA,nd)
-               ##
-               if(asymm & !make.sym) {
-                       ## For asymmetric matrices: permute the values within each triangular 
-                       ## portion, stored as square matrices in D1[[]] and D2[[]]
-                       for(k in 1:(nmat-1)) {
-                               order <- sample(n)
-                               vec <- as.vector(as.dist(D1[[k]][order,order]))
-                           vec <- c(vec, as.vector(as.dist(D2[[k]][order,order])))
-                               Rmat.perm <- cbind(Rmat.perm, vec)
-                               }
-                               vec <- as.vector(as.dist(D1[[nmat]]))
-                           vec <- c(vec, as.vector(as.dist(D2[[nmat]])))
-                               Rmat.perm <- cbind(Rmat.perm, vec)
-                       } else {
-                       for(k in 1:(nmat-1)) {
-                               order <- sample(n)
-                               vec <- as.vector(as.dist(D1[[k]][order,order]))
-                               Rmat.perm <- cbind(Rmat.perm, vec)
-                               }
-                               vec <- as.vector(as.dist(D1[[nmat]]))
-                               Rmat.perm <- cbind(Rmat.perm, vec)
-                       }
-               # Remove the first column of Rmat.perm containing NA
-               # The test is based on the comparison of S and S.perm instead of the comparison of 
-               # Chi2 and Chi2.perm: it is faster that way. 
-               # S, W, and Chi2 are equivalent statistics for permutation tests.
-               Rmat.perm <- as.matrix(Rmat.perm[,-1])
-               S.perm <- (nd-1)*var(as.vector(Rmat.perm%*%w))
-               if(S.perm >= S) counter <- counter+1
-       }
-       prob.perm.gr <- counter/(nperm+1)
-
-       table <- rbind(W, Chi2, prob.perm.gr)
-       colnames(table) <- "Statistics"
-       rownames(table) <- c("W", "Chi2", "Prob.perm")
-       })
-       a[3] <- sprintf("%2f",a[3])
-       if(!silent) cat("\nTime to compute global test =",a[3]," sec",'\n')
-#
-       # if(asymm & !make.sym) { out <- list(congruence_analysis=table, D1=D1, D2=D2)
-       # } else {
-          out <- list(congruence_analysis=table)
-       #    }
-#
-       out$nperm <- nperm
-       class(out) <- "CADM.global"
-       out
-}
diff --git a/R/CDAM.post.R b/R/CDAM.post.R

deleted file mode 100644 (file)

index 00b3d76..0000000
--- a/R/CDAM.post.R
+++ /dev/null
@@ -1,276 +0,0 @@
-`CADM.post` <-
-       function(Dmat, nmat, n, nperm=99, make.sym=TRUE, weights=NULL, mult="holm", mantel=FALSE, silent=FALSE)
-{
-### Function to carry out a posteriori tests of the contribution of individual 
-### matrices to the congruence of a group of distance matrices.
-###
-### copyleft - Pierre Legendre, December 2008
-###
-### Reference -
-### Legendre, P. and F.-J. Lapointe. 2004. Assessing congruence among distance 
-### matrices: single malt Scotch whiskies revisited. Australian and New Zealand 
-### Journal of Statistics 46: 615-629.
-###
-### Parameters of the function --
-###
-### Dmat = A text file listing the distance matrices one after the other, with
-###        or without blank lines.
-###        Each matrix is in the form of a square distance matrix with 0's 
-###        on the diagonal.
-###
-### nmat = number of distance matrices in file Dmat.
-###
-### n = number of objects in each distance matrix. All matrices have same n.
-###
-### nperm = number of permutations for the tests.
-###
-### make.sym = TRUE: turn asymmetric matrices into symmetric matrices by 
-###            averaging the two triangular portions.
-###          = FALSE: analyse asymmetric matrices as they are.
-###
-### weights = a vector of positive weights for the distance matrices. 
-###           Example: weights = c(1,2,3)
-###         = NULL (default): all matrices have same weight in calculation of W.
-###
-### mult = method for correcting P-values due to multiple testing. The methods 
-###        are "holm" (default), "sidak", and "bonferroni". The Bonferroni 
-###        correction is overly conservative; it is not recommended. It is 
-###        included to allow comparisons with the other methods.
-###
-### mantel = TRUE: Mantel statistics are computed from ranked distances,
-###          as well as permutational P-values.
-###        = FALSE (default): Mantel statistics and tests are not computed.
-###
-### silent = TRUE: informative messages will not be printed, except stopping 
-###          messages. Option useful for simulation work.
-###        = FALSE: informative messages will be printed.
-###
-################################################################################
-       
-       mult <- match.arg(mult, c("sidak", "holm", "bonferroni"))
-       if(nmat < 2) 
-               stop("Analysis requested for a single D matrix: CADM is useless")
-       
-       a <- system.time({
-
-    ## Check the input file
-    if(ncol(Dmat) != n) 
-       stop("Error in the value of 'n' or in the D matrices themselves")
-    nmat2 <- nrow(Dmat)/n
-    if(nmat2 < nmat)  # OK if 'nmat' < number of matrices in the input file
-       stop("Number of input D matrices = ",nmat2,"; this value is < nmat")
-
-    nd <- n*(n-1)/2
-    if(is.null(weights)) {
-       w <- rep(1,nmat)
-       } else {
-       if(length(weights) != nmat) 
-               stop("Incorrect number of values in vector 'weights'")
-       if(length(which(weights < 0)) > 0) 
-               stop("Negative weights are not permitted")
-       w <- weights*nmat/sum(weights)
-       if(!silent) cat("Normalized weights =",w,'\n')
-       }
-    
-    ## Are asymmetric D matrices present?
-    asy <- rep(FALSE, nmat)
-       asymm <- FALSE
-    end <- 0
-    for(k in 1:nmat) {
-        begin <- end+1
-        end <- end+n
-        D.temp <- Dmat[begin:end,]
-        if(sum(abs(diag(as.matrix(D.temp)))) > 0) 
-               stop("Diagonal not 0: matrix #",k," is not a distance matrix")
-        vec1 <- as.vector(as.dist(D.temp))
-        vec2 <- as.vector(as.dist(t(D.temp)))
-        if(sum(abs((vec1-vec2))) > 0) {
-               if(!silent) cat("Matrix #",k," is asymmetric",'\n')
-               asy[k] <- TRUE
-               asymm <- TRUE
-               }
-        }
-    D1 <- as.list(1:nmat)
-    if(asymm) {
-       if(make.sym) {
-               if(!silent) cat("\nAsymmetric matrices were transformed to be symmetric",'\n')
-               } else {
-               nd <- nd*2
-               if(!silent) cat("\nAnalysis carried out on asymmetric matrices",'\n')
-               D2 <- as.list(1:nmat)
-               }
-       } else {
-       if(!silent) cat("Analysis of symmetric matrices",'\n')
-       }
-    Y <- rep(NA,nd)
-    
-    ## String out the distance matrices (vec) and assemble them as columns into matrix 'Y'
-    ## Construct also matrices of ranked distances D1[[k]] and D2[[k]] for permutation test
-    end <- 0
-    for(k in 1:nmat) {
-        begin <- end+1
-        end <- end+n
-        D.temp <- as.matrix(Dmat[begin:end,])
-        vec <- as.vector(as.dist(D.temp))
-        if(asymm) {
-               if(!make.sym) {
-                       ## Analysis carried out on asymmetric matrices: 
-                       ## The ranks are computed on the whole matrix except the diagonal values.
-                       ## The two halves are stored as symmetric matrices in D1[[k]] and D2[[k]]
-                       vec <- c(vec, as.vector(as.dist(t(D.temp))))
-                       diag(D.temp) <- NA
-                       D.temp2 <- rank(D.temp)
-                       diag(D.temp2) <- 0
-                       # cat("nrow =",nrow(D.temp2)," ncol =",ncol(D.temp2),'\n')
-                               # cat("Matrix ",k," min =",min(D.temp2)," max =",max(D.temp2),'\n')
-                               # cat("Matrix ",k," max values #",which(D.temp2 == max(D.temp2)),'\n')
-                       D1[[k]] <- as.matrix(as.dist(D.temp2))
-                       D2[[k]] <- as.matrix(as.dist(t(D.temp2)))
-                       } else {
-                       ## Asymmetric matrices transformed to be symmetric, stored in D1[[k]]
-                       vec <- (vec + as.vector(as.dist(t(D.temp)))) / 2
-                               D.temp2 <- (D.temp + t(D.temp)) / 2
-                               D.temp2 <- as.dist(D.temp2)
-                       D.temp2[] <- rank(D.temp2)
-                               D.temp2 <- as.matrix(D.temp2)
-                       D1[[k]] <- D.temp2
-                       }
-               } else {
-               ## Symmetric matrices are stored in D1[[k]]
-               D.temp2 <- as.dist(D.temp)
-               D.temp2[] <- rank(D.temp2)
-               D1[[k]] <- as.matrix(D.temp2)
-               }
-        Y <- cbind(Y, vec)
-        }
-    Y <- as.matrix(Y[,-1])
-    colnames(Y) <- colnames(Y,do.NULL = FALSE, prefix = "Dmat.")
-    
-    ## Begin calculations: compute reference value of S
-
-               ## Transform the distances to ranks, by column
-               Rmat <- apply(Y,2,rank)
-
-               ## Compute the S = Sum-of-Squares of the row-marginal sums of ranks (eq. 1a)
-               ## The ranks are weighted during the sum by the vector of matrix weights 'w'
-               sumRanks <- as.vector(Rmat%*%w)
-               S <- (nd-1)*var(sumRanks)
-
-    ## Begin a posteriori tests of individual matrices
-
-    ## Statistics displayed for each matrix: "Mantel.mean" and "W.per.matrix"
-       ## Calculate the mean of the Mantel correlations on ranks for each matrix
-       Mantel.cor <- cor(Rmat)
-       diag(Mantel.cor) <- 0
-       spear.mean <- as.vector(Mantel.cor%*%w)/(nmat-1)
-       ## Calculate Kendall's W for each variable
-       ## W.var <- ((nmat-1)*spear.mean+1)/nmat
-
-       ## P-value for each matrix: test of S, permuting values in matrix[[k]] only
-       ## as in program CADM.f (2004)
-       ## Initialize the counters
-       counter <- rep(1,nmat)
-
-       ## Test each matrix 'k' in turn
-       for(k in 1:nmat) {
-               ## Create a new Rmat table where the permuted column has been removed
-               Rmat.mod <- Rmat[,-k]
-                               
-               ## Permutation loop: string out permuted matrix 'k' only
-               for(j in 1:nperm) {
-                       order <- sample(n)
-                       if(asymm & !make.sym) {
-                               ## For asymmetric matrices: permute the values within each triangular 
-                               ## portion, stored as square matrices in D1[[]] and D2[[]]
-                               vec <- as.vector(as.dist(D1[[k]][order,order]))
-                           vec <- c(vec, as.vector(as.dist(D2[[k]][order,order])))
-                               } else {
-                               vec <- as.vector(as.dist(D1[[k]][order,order]))
-                               }
-                       Rmat.perm <- cbind(Rmat.mod, vec)
-                       S.perm <- (nd-1)*var(as.vector(Rmat.perm%*%w))
-                       if(S.perm >= S) counter[k] <- counter[k]+1
-               }
-       }
-
-       ## Calculate P-values
-       counter <- counter/(nperm+1)
-       
-       ## Correction to P-values for multiple testing
-               if(mult == "sidak") {
-                       vec.corr = NA
-                       for(i in 1:p) vec.corr = c(vec.corr, (1-(1-counter[i])^p))
-                       vec.corr <- vec.corr[-1]
-                       }
-               if(mult == "holm") vec.corr <- p.adjust(counter, method="holm")
-               if(mult == "bonferroni") vec.corr <- p.adjust(counter, method="bonferroni")
-
-       ## Create a data frame containing the results
-               # table <- rbind(spear.mean, W.var, counter, vec.corr)
-               # rownames(table) <- c("Mantel.mean", "W.per.matrix", "Prob", "Corrected prob")
-               table <- rbind(spear.mean, counter, vec.corr)
-               rownames(table) <- c("Mantel.mean", "Prob", "Corrected.prob")
-               colnames(table) <- colnames(table,do.NULL = FALSE, prefix = "Dmat.")
-       
-       ## Mantel tests
-       if(mantel) {
-               diag(Mantel.cor) <- 1
-               rownames(Mantel.cor) <- colnames(table)
-               colnames(Mantel.cor) <- colnames(table)
-               Mantel.prob <- matrix(1,nmat,nmat)
-               rownames(Mantel.prob) <- colnames(table)
-               colnames(Mantel.prob) <- colnames(table)
-               
-               for(j in 1:nperm) {   # Each matrix is permuted independently
-                                 # There is no need to permute the last matrix
-                       Rmat.perm <- rep(NA,nd)
-                       ##
-                       if(asymm & !make.sym) {
-                               ## For asymmetric matrices: permute the values within each triangular 
-                               ## portion, stored as square matrices in D1[[]] and D2[[]]
-                               for(k in 1:(nmat-1)) {
-                                       order <- sample(n)
-                                       vec <- as.vector(as.dist(D1[[k]][order,order]))
-                               vec <- c(vec, as.vector(as.dist(D2[[k]][order,order])))
-                                       Rmat.perm <- cbind(Rmat.perm, vec)
-                                       }
-                                       vec <- as.vector(as.dist(D1[[nmat]]))
-                               vec <- c(vec, as.vector(as.dist(D2[[nmat]])))
-                                       Rmat.perm <- cbind(Rmat.perm, vec)
-                               } else {
-                               for(k in 1:(nmat-1)) {
-                                       order <- sample(n)
-                                       vec <- as.vector(as.dist(D1[[k]][order,order]))
-                                       Rmat.perm <- cbind(Rmat.perm, vec)
-                                       }
-                                       vec <- as.vector(as.dist(D1[[nmat]]))
-                                       Rmat.perm <- cbind(Rmat.perm, vec)
-                               }
-                       # Remove the first column of Rmat.perm containing NA
-                       Rmat.perm <- as.matrix(Rmat.perm[,-1])
-                       # Compute Mantel correlations on ranks under permutation
-                       Mantel.cor.perm <- cor(Rmat.perm)
-                       for(j2 in 1:(nmat-1)) { # Compute prob in the upper tail
-                               for(j1 in (j2+1):nmat) {
-                                       if(Mantel.cor.perm[j1,j2] >= Mantel.cor[j1,j2]) Mantel.prob[j1,j2] <- Mantel.prob[j1,j2]+1
-                                       }
-                               }
-                       }
-               Mantel.prob <- as.matrix(as.dist(Mantel.prob/(nperm+1)))
-               diag(Mantel.prob) <- 1
-               }
-       
-       })
-       a[3] <- sprintf("%2f",a[3])
-       if(!silent) cat("Time to compute a posteriori tests (per matrix) =",a[3]," sec",'\n')
-
-       out <- list(A_posteriori_tests=table, Correction.type=mult)
-
-       if(mantel) {
-               out$Mantel.cor  <- Mantel.cor
-               out$Mantel.prob <- Mantel.prob
-               }
-       out$nperm <- nperm
-       class(out) <- "CADM.post"
-       out
-}
diff --git a/man/chronos.Rd b/man/chronos.Rd

index 22c15f145ee663f3bc9ef7fc86c49dde966ff35b..d85f5f7e1c2a0a3d0ed3b3b38cf4de7b512a8ef8 100644 (file)
--- a/man/chronos.Rd
+++ b/man/chronos.Rd
@@ -102,9 +102,9 @@ chronos.control(...)
    inference: bridging the parsimony-likelihood gap. \emph{Systematic
      Biology}, \bold{57}, 665--674.
  
    inference: bridging the parsimony-likelihood gap. \emph{Systematic
      Biology}, \bold{57}, 665--674.
  
-  Paradis, E. (2012) Molecular dating of phylogenies by likelihood
+  Paradis, E. (2013) Molecular dating of phylogenies by likelihood
    methods: a comparison of models and a new information
    methods: a comparison of models and a new information
-  criterion. \emph{Manuscript}.
+  criterion. \emph{Molecular Phylogenetics and Evolution}, in press.
  
    Sanderson, M. J. (2002) Estimating absolute rates of molecular
    evolution and divergence times: a penalized likelihood
  
    Sanderson, M. J. (2002) Estimating absolute rates of molecular
    evolution and divergence times: a penalized likelihood
author	paradis <paradis@6e262413-ae40-0410-9e79-b911bd7a66b7>
	Wed, 13 Feb 2013 06:52:04 +0000 (06:52 +0000)
committer	paradis <paradis@6e262413-ae40-0410-9e79-b911bd7a66b7>
	Wed, 13 Feb 2013 06:52:04 +0000 (06:52 +0000)
CADM.global.R	[new file with mode: 0644]	patch \| blob
CADM.post.R	[new file with mode: 0644]	patch \| blob
NEWS		patch \| blob \| history
R/CDAM.global.R	[deleted file]	patch \| blob \| history
R/CDAM.post.R	[deleted file]	patch \| blob \| history
man/chronos.Rd		patch \| blob \| history