#' @title Estimate Cyclic Trend of Gene Expression Using Trendfiltering
#'
#' @details We applied quadratic (second-order) trend filtering using
#' the trendfilter function in the \code{genlasso} package. The
#' trendfilter function implements a nonparametric smoothing method
#' which chooses the smoothing parameter by cross-validation and fits
#' a piecewise polynomial regression.
#'
#' @details The trendfilter method determines the folds in
#' cross-validation in a non-random manner: every k-th data point in
#' the ordered sample is placed in the k-th fold, so the folds contain
#' ordered subsamples. We applied five-fold cross-validation and chose
#' the smoothing penalty using the option lambda.1se; among all
#' possible values of the penalty term, the largest value such that
#' the cross-validation standard error is within one standard error of
#' the minimum. Furthermore, we desired that the estimated expression
#' trend be cyclical. To encourage this, we concatenated the ordered
#' gene expression data three times, with one added after another. The
#' quadratic trend filtering was applied to the concatenated data
#' series of each gene.
#'
#' @param yy A vector of gene expression values for a single
#' gene. They must be ordered by cell cycle phase. Also, the
#' expression values should be normalized and transformed to standard
#' normal distribution.
#'
#' @param polyorder Degree of polynomials used in nonparamtric trend
#' filtering.
#'
#' @return A list with two elements: \code{trend.yy}, the estimated
#' cyclic trend; \code{pve}, proportion of variance in gene expression
#' levels explained by the cyclic trend.
#'
#' @examples
#' library(SingleCellExperiment)
#' data(sce_top101genes)
#'
#' # select top 10 cyclic genes
#' sce_top10 <- sce_top101genes[order(rowData(sce_top101genes)$pve_fucci,
#' decreasing=TRUE)[1:10],]
#' coldata <- colData(sce_top10)
#'
#' # cell cycle phase based on FUCCI scores
#' theta <- coldata$theta
#' names(theta) <- rownames(coldata)
#'
#' # normalize expression counts
#' sce_top10 <- data_transform_quantile(sce_top10, ncores=2)
#' exprs_quant <- assay(sce_top10, "cpm_quantNormed")
#'
#' # order FUCCI phase and expression
#' theta_ordered <- theta[order(theta)]
#' yy_ordered <- exprs_quant[1, names(theta_ordered)]
#'
#' fit <- fit_trendfilter(yy_ordered)
#'
#' plot(x=theta_ordered, y=yy_ordered, pch=16, cex=.7, axes=FALSE,
#' ylab="quantile-normalized expression values", xlab="FUCCI phase",
#' main = "trendfilter fit")
#' points(x=theta_ordered, y=fit$trend.yy, col="blue", pch=16, cex=.7)
#' axis(2)
#' axis(1,at=c(0,pi/2, pi, 3*pi/2, 2*pi),
#' labels=c(0,expression(pi/2), expression(pi), expression(3*pi/2),
#' expression(2*pi)))
#' abline(h=0, lty=1, col="black", lwd=.7)
#'
#' @author Joyce Hsiao
#'
#' @importFrom genlasso trendfilter
#' @importFrom genlasso cv.trendfilter
#' @importFrom stats var
#' @importFrom stats predict
#'
#' @export
#'
fit_trendfilter <- function(yy, polyorder=2) {
yy.rep <- rep(yy,3)
include <- rep(c(FALSE, TRUE, FALSE), each = length(yy))
fit.trend <- trendfilter(yy.rep, ord=polyorder, approx=FALSE,
maxsteps = 1000)
cv.trend <- cv.trendfilter(fit.trend)
which.lambda <- cv.trend$i.1se
yy.trend.pred <- predict(fit.trend, lambda=cv.trend$lambda.1se,
df=fit.trend$df[which.lambda])$fit
trend.yy <- yy.trend.pred
pve <- 1 - var(yy - trend.yy)/var(yy)
return(list(trend.yy=trend.yy[include],
pve=pve))
}
#' @title Estimate Cyclic Trends in Gene Expression Levels Using B-splines
#'
#' @param yy A vector of gene expression values for one gene. The
#' expression values are assumed to have been normalized and
#' transformed to standard normal distribution.
#'
#' @param time A vector of angles (cell cycle phase).
#'
#' @return A list with two elements: \code{pred.yy}, the estimated
#' cyclic trend; \code{pve}, proportion of variance in gene expression
#' levels explained by the cyclic trend.
#'
#' @author Joyce Hsiao
#'
#' @examples
#' library(SingleCellExperiment)
#' data(sce_top101genes)
#'
#' # Select top 10 cyclic genes.
#' sce_top10 <- sce_top101genes[order(rowData(sce_top101genes)$pve_fucci,
#' decreasing=TRUE)[1:10],]
#' coldata <- colData(sce_top10)
#'
#' # Get ccell cycle phase based on FUCCI scores.
#' theta <- coldata$theta
#' names(theta) <- rownames(coldata)
#'
#' # Normalize expression counts.
#' sce_top10 <- data_transform_quantile(sce_top10, ncores=2)
#' exprs_quant <- assay(sce_top10, "cpm_quantNormed")
#'
#' # Order FUCCI phase and expression.
#' theta_ordered <- theta[order(theta)]
#' yy_ordered <- exprs_quant[1, names(theta_ordered)]
#'
#' fit <- fit_trendfilter(yy_ordered)
#'
#' plot(x=theta_ordered, y=yy_ordered, pch=16, cex=0.7, axes=FALSE,
#' ylab="quantile-normalized expression values", xlab="FUCCI phase",
#' main = "trendfilter fit")
#' points(x=theta_ordered, y=fit$trend.yy, col="orangered", pch=16, cex=0.7)
#' axis(2)
#' axis(1,at=seq(0,2*pi,pi/2),
#' labels=c(0,expression(pi/2), expression(pi), expression(3*pi/2),
#' expression(2*pi)))
#'
#' @importFrom stats var
#' @importFrom stats predict
#' @importFrom stats smooth.spline
#'
#' @export
#'
fit_bspline <- function(yy, time) {
yy.rep <- rep(yy,3)
time.rep <- c(time, time + (2*pi), time + (4*pi))
include <- rep(c(FALSE, TRUE, FALSE), each = length(yy))
fit <- smooth.spline(x=time.rep, y=yy.rep)
pred.yy <- predict(fit, time.rep)$y[include]
pve <- 1-var(yy-pred.yy)/var(yy)
return(list(pred.yy=pred.yy,
pve=pve))
}
#' @title Estimate Cyclic Trends of Expression Values Using Loess
#'
#' @param yy A vector of gene expression values for a single gene. The
#' expression values are assumed to have been normalized and
#' transformed to standard normal distribution.
#'
#' @param time A vector of angles (cell cycle phase).
#'
#' @return A list with two elements: \code{pred.yy}, the estimated
#' cyclic trend; \code{pve}, proportion of variance in gene expression
#' levels explained by the cyclic trend.
#'
#' @author Joyce Hsiao
#'
#' @examples
#' library(SingleCellExperiment)
#' data(sce_top101genes)
#'
#' # Select top 10 cyclic genes.
#' sce_top10 <- sce_top101genes[order(rowData(sce_top101genes)$pve_fucci,
#' decreasing=TRUE)[1:10],]
#' coldata <- colData(sce_top10)
#'
#' # Get cell cycle phase based on FUCCI scores.
#' theta <- coldata$theta
#' names(theta) <- rownames(coldata)
#'
#' # Normalize expression counts.
#' sce_top10 <- data_transform_quantile(sce_top10, ncores=2)
#' exprs_quant <- assay(sce_top10, "cpm_quantNormed")
#'
#' # Order FUCCI phase and expression.
#' theta_ordered <- theta[order(theta)]
#' yy_ordered <- exprs_quant[1, names(theta_ordered)]
#'
#' fit <- fit_loess(yy_ordered, time=theta_ordered)
#'
#' plot(x=theta_ordered, y=yy_ordered, pch=16, cex=0.7, axes=FALSE,
#' ylab="quantile-normalized expression values", xlab="FUCCI phase",
#' main="loess fit")
#' points(x=theta_ordered, y=fit$pred.yy, col="orangered", pch=16, cex=0.7)
#' axis(2)
#' axis(1,at=seq(0,2*pi,pi/2),
#' labels=c(0,expression(pi/2), expression(pi), expression(3*pi/2),
#' expression(2*pi)))
#' abline(h=0, lty="dashed", col="dodgerblue", lwd=2)
#'
#' @importFrom stats loess
#' @importFrom stats var
#' @importFrom stats predict
#'
#' @export
#'
fit_loess <- function(yy, time) {
yy.rep <- rep(yy,3)
time.rep <- c(time, time + (2*pi), time + (4*pi))
include <- rep(c(FALSE, TRUE, FALSE), each = length(yy))
fit <- loess(yy.rep ~ time.rep)
pred.yy <- fit$fitted[include]
pve <- 1 - var(yy - pred.yy)/var(yy)
return(list(pred.yy=pred.yy,pve=pve))
}
Add the following code to your website.
For more information on customizing the embed code, read Embedding Snippets.