-
Notifications
You must be signed in to change notification settings - Fork 1
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Fixed opts bug and polished build/check - Thanks for pointing this ou…
…t ! - This closes #2
- Loading branch information
Showing
131 changed files
with
1,015 additions
and
1,358 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,28 @@ | ||
#' @title Add ellipse to an existing plot | ||
#' @description Calculates and plots ellipse corresponding to specified confidence interval in 2-dimensional plot | ||
#' @usage add.ellipse(centroid, covmat, confidence = 0.95, npoints = 100, col = | ||
#' "black", ...) | ||
#' @param centroid Vector with two elements defining the ellipse centroid. | ||
#' @param covmat Covariance matrix for the investigated data. Only diagonal | ||
#' covariances supported. | ||
#' @param confidence Confidence level determining the ellipse borders based on | ||
#' the covariance matrix. | ||
#' @param npoints Number of plotting points. | ||
#' @param col Color. | ||
#' @param ... Other arguments to be passed. | ||
#' @return Used for plotting side effects. | ||
#' @author Leo Lahti \email{leo.lahti@@iki.fi} | ||
#' @keywords utilities | ||
#' @export | ||
#' @examples #add.ellipse(centroid = c(0, 0), covmat = diag(c(1,2))) | ||
add.ellipse <- function (centroid, covmat, confidence = 0.95, npoints = 100, col = "black", ...) { | ||
|
||
# add ellipse to a plot | ||
el <- ellipse(centroid, covmat, confidence, npoints) | ||
points(el, type = "l", col = col, ...) | ||
|
||
el | ||
} | ||
|
||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,27 @@ | ||
#' @title BIC mixture | ||
#' @description Latent class analysis based on (infinite) Gaussian mixture model. If the input is data matrix, a multivariate model is fitted; if the input is a vector, a univariate model is fitted | ||
#' @param x samples x features matrix for multivariate analysis, or a vector for univariate analysis | ||
#' @param max.modes Maximum number of modes to be checked for mixture model selection | ||
#' @param bic.threshold BIC threshold which needs to be exceeded before a new mode is added to the mixture. | ||
#' @param min.modes minimum number of modes | ||
#' @param ... Further optional arguments to be passed | ||
#' @return Fitted latent class model (parameters and free energy) | ||
#' @export | ||
#' @references See citation("netresponse") | ||
#' @author Contact: Leo Lahti \email{leo.lahti@@iki.fi} | ||
#' @keywords utilities | ||
bic.mixture <- function (x, max.modes, bic.threshold = 0, min.modes = 1, ...) { | ||
|
||
# x; max.modes = max.responses; bic.threshold = bic.threshold; min.modes = min.responses | ||
|
||
if (!is.vector(x) && ncol(x) == 1) {x <- x[,1]} | ||
|
||
if (is.vector(x)) { | ||
bic.mixture.univariate(x, max.modes, bic.threshold, min.modes = min.modes, ...) | ||
} else { | ||
bic.mixture.multivariate(x, max.modes, bic.threshold, min.modes = min.modes, ...) | ||
} | ||
|
||
} | ||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,42 @@ | ||
#' @title Multivariate BIC mixture | ||
#' @description Latent class analysis based on (infinite) Gaussian mixture model. If the input (dat) is data matrix, a multivariate model is fitted. | ||
#' @param x matrix (for multivariate analysis) | ||
#' @param max.modes Maximum number of modes to be checked for mixture model selection | ||
#' @param bic.threshold BIC threshold which needs to be exceeded before a new mode is added to the mixture. | ||
#' @param min.modes Minimum number of modes to be checked for mixture model selection | ||
#' @param ... Further optional arguments to be passed | ||
#' @return Fitted latent class model (parameters and free energy) | ||
#' @export | ||
#' @references See citation("netresponse") | ||
#' @author Contact: Leo Lahti \email{leo.lahti@@iki.fi} | ||
#' @keywords utilities | ||
bic.mixture.multivariate <- function (x, max.modes, bic.threshold = 0, min.modes = 1, ...) { | ||
|
||
# x <- mat; max.modes = params$max.responses; bic.threshold = params$bic.threshold | ||
|
||
best.mode <- bic.select.best.mode(x, max.modes, bic.threshold, min.modes) | ||
|
||
mcl <- Mclust(x, G = best.mode) | ||
|
||
bic <- try(-mclustBIC(x, G = best.mode)[, "VVV"]) | ||
if ( is.na(bic) ) { bic <- Inf } # infinitely bad = Inf | ||
|
||
means <- t(mcl$parameters$mean) | ||
vars <- t(apply(mcl$parameters$variance$sigma, 3, function(x){diag(x)})) | ||
sds <- sqrt(vars) | ||
ws <- as.vector(mcl$parameters$pro) | ||
if (is.null(ws)) {ws <- 1} | ||
|
||
Nparams <- prod(dim(means)) + prod(dim(sds)) + length(ws) | ||
|
||
# Determine the most likely mode for each sample (-> hard clusters) | ||
qofz <- P.r.s(t(x), list(mu = means, sd = sds, w = ws), log = FALSE) | ||
rownames(qofz) <- rownames(x) | ||
colnames(qofz) <- paste("Mode", 1:ncol(qofz), sep = "-") | ||
|
||
rownames(means) <- rownames(sds) <- names(ws) <- paste("Mode", 1:length(ws), sep = "-") | ||
colnames(means) <- colnames(sds) <- colnames(x) | ||
|
||
list(means = means, sds = sds, ws = ws, Nparams = Nparams, free.energy = -mcl$loglik, qofz = qofz, bic = bic) | ||
|
||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,47 @@ | ||
#' @title Univariate BIC mixture | ||
#' @description Latent class analysis based on (infinite) Gaussian mixture | ||
#' model. If the input (dat) is data matrix, a multivariate model is fitted. If | ||
#' the input is a vector or a 1-dimensional matrix, a univariate model is | ||
#' fitted. | ||
#' @param x dat vector (for univariate analysis) or a matrix (for multivariate analysis) | ||
#' @param max.modes Maximum number of modes to be checked for mixture model selection | ||
#' @param bic.threshold BIC threshold which needs to be exceeded before a new mode is added to the mixture. | ||
#' @param min.modes minimum number of modes | ||
#' @param ... Further optional arguments to be passed | ||
#' @return Fitted latent class model (parameters and free energy) | ||
#' @author Contact: Leo Lahti \email{leo.lahti@@iki.fi} | ||
#' @references See citation("netresponse") | ||
#' @export | ||
#' @keywords utilities | ||
bic.mixture.univariate <- function (x, max.modes, bic.threshold = 0, min.modes = 1, ...) { | ||
|
||
# x <- datamatrix[, node]; max.modes = params$max.responses; bic.threshold = params$bic.threshold | ||
|
||
best.mode <- bic.select.best.mode(x, max.modes, bic.threshold, min.modes = min.modes) | ||
mcl <- Mclust(x, G = best.mode) | ||
|
||
means <- as.vector(mcl$parameters$mean) | ||
sds <- as.vector(sqrt(mcl$parameters$variance$sigmasq)) | ||
if (length(sds) == 1) {sds <- rep(sds, length(means))} | ||
ws <- as.vector(mcl$parameters$pro) | ||
|
||
if (is.null(ws)) {warning("NULL weights, replacing with 1"); ws <- 1} | ||
if (is.null(means)) {warning("NULL means, replacing with 1"); means <- 1} | ||
if (is.null(sds)) {warning("NULL sds, replacing with 1"); sds <- 1} | ||
|
||
Nparams <- length(means) + length(sds) + length(ws) | ||
|
||
means <- matrix(means, nrow = length(ws)) | ||
sds <- matrix(sds, nrow = length(ws)) | ||
|
||
# Determine the most likely mode for each sample (-> hard clusters) | ||
# save(means, sds, ws, x, file = "~/tmp/tmp.RData") | ||
qofz <- P.r.s(matrix(x, nrow = 1), list(mu = means, sd = sds, w = ws), log = FALSE) | ||
rownames(qofz) <- names(x) | ||
|
||
names(means) <- names(sds) <- names(ws) <- paste("Mode", 1:length(ws), sep = "-") | ||
|
||
list(means = means, sds = sds, ws = ws, Nparams = Nparams, free.energy = -mcl$loglik, qofz = qofz) | ||
|
||
} | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,65 @@ | ||
#' @title Select best mode with BIC | ||
#' @description Select optimal number of mixture components by adding components until | ||
#' the increase in objective function is below threshold. | ||
#' @param x dat vector (for univariate analysis) or a matrix (for multivariate analysis) | ||
#' @param max.modes Maximum number of modes to be checked for mixture model selection | ||
#' @param bic.threshold BIC threshold which needs to be exceeded before a new mode is added to the mixture. | ||
#' @param min.modes Optiomal. Minimum number of modes. | ||
#' @return Fitted latent class model (parameters and free energy) | ||
#' @author Contact: Leo Lahti \email{leo.lahti@@iki.fi} | ||
#' @references See citation("netresponse") | ||
#' @export | ||
#' @keywords utilities | ||
bic.select.best.mode <- function (x, max.modes, bic.threshold, min.modes = 1) { | ||
|
||
# Cost for single mode | ||
# BIC : smaller is better | ||
# mclustBIC returns the value for -BIC, to be exact | ||
nc <- min.modes | ||
if (is.vector(x)) { # univariate | ||
m <- -mclustBIC(x, G = nc)[, "V"] | ||
} else { # multivariate | ||
m <- -mclustBIC(x, G = nc)[, "VVV"] # BIC : smaller is better | ||
} | ||
|
||
# ---------------------------------------------------------------- | ||
|
||
add.component <- TRUE | ||
best.mode <- min.modes | ||
if (max.modes == min.modes) { | ||
add.component <- FALSE | ||
} | ||
|
||
while (add.component && nc < max.modes) { | ||
|
||
nc <- nc + 1 | ||
|
||
# BIC : smaller is better | ||
if (is.vector(x)) { # univariate | ||
m.new <- try(-mclustBIC(x, G = nc)[, "V"]) | ||
} else { # multivariate | ||
m.new <- try(-mclustBIC(x, G = nc)[, "VVV"]) | ||
} | ||
if ( is.na(m.new) ) { m.new <- Inf } # infinitely bad = Inf | ||
|
||
# FIXME: compressing data with PCA after dimensionality gets otherwise too high? | ||
# with around ncol(x) = 30 the mclustBIC is starting to produce NAs | ||
|
||
# FIXME: remove this when code works ok | ||
# if (is.na(m.new)) {save(x, nc, file = "m.new.RData")} | ||
|
||
bic.delta <- m.new - m | ||
|
||
if (bic.delta < -bic.threshold) { | ||
best.mode <- nc | ||
m <- m.new | ||
} else { | ||
add.component <- FALSE | ||
} | ||
} | ||
|
||
best.mode | ||
|
||
} | ||
|
||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.