Correlates categorical and numeric variables with Module Eigengenes or hub-gene scores.
Usage
ModuleTraitCorrelation(
seurat_obj,
traits,
group.by = NULL,
features = "hMEs",
cor_method = "pearson",
subset_by = NULL,
subset_groups = NULL,
wgcna_name = NULL,
...
)
Arguments
- seurat_obj
A list of column names in the Seurat object's metadata that you wish to correlate with each module. Traits must be a categorical variable (not a character vector), or a numeric variable.
- features
Which features to use to summarize each modules? Valid choices are hMEs, MEs, or scores
- wgcna_name
The name of the hdWGCNA experiment in the seurat_obj@misc slot
- cor_meth
Which method to use for correlation? Valid choices are pearson, spearman, kendall.
Examples
ModuleTraitCorrelation
#> function (seurat_obj, traits, group.by = NULL, features = "hMEs",
#> cor_method = "pearson", subset_by = NULL, subset_groups = NULL,
#> wgcna_name = NULL, ...)
#> {
#> if (is.null(wgcna_name)) {
#> wgcna_name <- seurat_obj@misc$active_wgcna
#> }
#> CheckWGCNAName(seurat_obj, wgcna_name)
#> if (features == "hMEs") {
#> MEs <- GetMEs(seurat_obj, TRUE, wgcna_name)
#> }
#> else if (features == "MEs") {
#> MEs <- GetMEs(seurat_obj, FALSE, wgcna_name)
#> }
#> else if (features == "scores") {
#> MEs <- GetModuleScores(seurat_obj, wgcna_name)
#> }
#> else {
#> stop("Invalid feature selection. Valid choices: hMEs, MEs, scores, average")
#> }
#> if (!is.null(subset_by)) {
#> print("subsetting")
#> seurat_full <- seurat_obj
#> MEs <- MEs[seurat_obj@meta.data[[subset_by]] %in% subset_groups,
#> ]
#> seurat_obj <- seurat_obj[, seurat_obj@meta.data[[subset_by]] %in%
#> subset_groups]
#> }
#> if (sum(traits %in% colnames(seurat_obj@meta.data)) != length(traits)) {
#> stop(paste("Some of the provided traits were not found in the Seurat obj:",
#> paste(traits[!(traits %in% colnames(seurat_obj@meta.data))],
#> collapse = ", ")))
#> }
#> if (is.null(group.by)) {
#> group.by <- "temp_ident"
#> seurat_obj$temp_ident <- Idents(seurat_obj)
#> }
#> valid_types <- c("numeric", "factor", "integer")
#> data_types <- sapply(traits, function(x) {
#> class(seurat_obj@meta.data[, x])
#> })
#> if (!all(data_types %in% valid_types)) {
#> incorrect <- traits[!(data_types %in% valid_types)]
#> stop(paste0("Invalid data types for ", paste(incorrect,
#> collapse = ", "), ". Accepted data types are numeric, factor, integer."))
#> }
#> if (any(data_types == "factor")) {
#> factor_traits <- traits[data_types == "factor"]
#> for (tr in factor_traits) {
#> warning(paste0("Trait ", tr, " is a factor with levels ",
#> paste0(levels(seurat_obj@meta.data[, tr]), collapse = ", "),
#> ". Levels will be converted to numeric IN THIS ORDER for the correlation, is this the expected order?"))
#> }
#> }
#> modules <- GetModules(seurat_obj, wgcna_name)
#> mods <- levels(modules$module)
#> mods <- mods[mods != "grey"]
#> trait_df <- seurat_obj@meta.data[, traits]
#> if (length(traits == 1)) {
#> trait_df <- data.frame(x = trait_df)
#> colnames(trait_df) <- traits
#> }
#> if (any(data_types == "factor")) {
#> factor_traits <- traits[data_types == "factor"]
#> for (tr in factor_traits) {
#> trait_df[, tr] <- as.numeric(trait_df[, tr])
#> }
#> }
#> cor_list <- list()
#> pval_list <- list()
#> fdr_list <- list()
#> temp <- Hmisc::rcorr(as.matrix(trait_df), as.matrix(MEs),
#> type = cor_method)
#> cur_cor <- temp$r[traits, mods]
#> cur_p <- temp$P[traits, mods]
#> p_df <- cur_p %>% reshape2::melt()
#> if (length(traits) == 1) {
#> tmp <- rep(mods, length(traits))
#> tmp <- factor(tmp, levels = mods)
#> tmp <- tmp[order(tmp)]
#> p_df$Var1 <- traits
#> p_df$Var2 <- tmp
#> rownames(p_df) <- 1:nrow(p_df)
#> p_df <- dplyr::select(p_df, c(Var1, Var2, value))
#> }
#> p_df <- p_df %>% dplyr::mutate(fdr = p.adjust(value, method = "fdr")) %>%
#> dplyr::select(c(Var1, Var2, fdr))
#> cur_fdr <- reshape2::dcast(p_df, Var1 ~ Var2, value.var = "fdr")
#> rownames(cur_fdr) <- cur_fdr$Var1
#> cur_fdr <- cur_fdr[, -1]
#> cor_list[["all_cells"]] <- cur_cor
#> pval_list[["all_cells"]] <- cur_p
#> fdr_list[["all_cells"]] <- cur_fdr
#> trait_df <- cbind(trait_df, seurat_obj@meta.data[, group.by])
#> colnames(trait_df)[ncol(trait_df)] <- "group"
#> MEs <- cbind(as.data.frame(MEs), seurat_obj@meta.data[, group.by])
#> colnames(MEs)[ncol(MEs)] <- "group"
#> if (class(seurat_obj@meta.data[, group.by]) == "factor") {
#> group_names <- levels(seurat_obj@meta.data[, group.by])
#> }
#> else {
#> group_names <- levels(as.factor(seurat_obj@meta.data[,
#> group.by]))
#> }
#> trait_list <- dplyr::group_split(trait_df, group, .keep = FALSE)
#> ME_list <- dplyr::group_split(MEs, group, .keep = FALSE)
#> names(trait_list) <- group_names
#> names(ME_list) <- group_names
#> for (i in names(trait_list)) {
#> temp <- Hmisc::rcorr(as.matrix(trait_list[[i]]), as.matrix(ME_list[[i]]))
#> cur_cor <- temp$r[traits, mods]
#> cur_p <- temp$P[traits, mods]
#> p_df <- cur_p %>% reshape2::melt()
#> if (length(traits) == 1) {
#> tmp <- rep(mods, length(traits))
#> tmp <- factor(tmp, levels = mods)
#> tmp <- tmp[order(tmp)]
#> p_df$Var1 <- traits
#> p_df$Var2 <- tmp
#> rownames(p_df) <- 1:nrow(p_df)
#> p_df <- dplyr::select(p_df, c(Var1, Var2, value))
#> }
#> p_df <- p_df %>% dplyr::mutate(fdr = p.adjust(value,
#> method = "fdr")) %>% dplyr::select(c(Var1, Var2,
#> fdr))
#> cur_fdr <- reshape2::dcast(p_df, Var1 ~ Var2, value.var = "fdr")
#> rownames(cur_fdr) <- cur_fdr$Var1
#> cur_fdr <- cur_fdr[, -1]
#> cor_list[[i]] <- cur_cor
#> pval_list[[i]] <- cur_p
#> fdr_list[[i]] <- as.matrix(cur_fdr)
#> }
#> mt_cor <- list(cor = cor_list, pval = pval_list, fdr = fdr_list)
#> if (!is.null(subset_by)) {
#> seurat_full <- SetModuleTraitCorrelation(seurat_full,
#> mt_cor, wgcna_name)
#> seurat_obj <- seurat_full
#> }
#> else {
#> seurat_obj <- SetModuleTraitCorrelation(seurat_obj, mt_cor,
#> wgcna_name)
#> }
#> seurat_obj
#> }
#> <bytecode: 0x7f855720ca70>
#> <environment: namespace:hdWGCNA>