GroupHeatmap

GroupHeatmap

Usage

GroupHeatmap(
  srt,
  features = NULL,
  group.by = NULL,
  split.by = NULL,
  within_groups = FALSE,
  grouping.var = NULL,
  numerator = NULL,
  cells = NULL,
  aggregate_fun = base::mean,
  exp_cutoff = 0,
  border = TRUE,
  flip = FALSE,
  slot = "counts",
  assay = NULL,
  exp_method = c("zscore", "raw", "fc", "log2fc", "log1p"),
  exp_legend_title = NULL,
  limits = NULL,
  lib_normalize = identical(slot, "counts"),
  libsize = NULL,
  feature_split = NULL,
  feature_split_by = NULL,
  n_split = NULL,
  split_order = NULL,
  split_method = c("kmeans", "hclust", "mfuzz"),
  decreasing = FALSE,
  fuzzification = NULL,
  cluster_features_by = NULL,
  cluster_rows = FALSE,
  cluster_columns = FALSE,
  cluster_row_slices = FALSE,
  cluster_column_slices = FALSE,
  show_row_names = FALSE,
  show_column_names = FALSE,
  row_names_side = ifelse(flip, "left", "right"),
  column_names_side = ifelse(flip, "bottom", "top"),
  row_names_rot = 0,
  column_names_rot = 90,
  row_title = NULL,
  column_title = NULL,
  row_title_side = "left",
  column_title_side = "top",
  row_title_rot = 0,
  column_title_rot = ifelse(flip, 90, 0),
  anno_terms = FALSE,
  anno_keys = FALSE,
  anno_features = FALSE,
  terms_width = unit(4, "in"),
  terms_fontsize = 8,
  keys_width = unit(2, "in"),
  keys_fontsize = c(6, 10),
  features_width = unit(2, "in"),
  features_fontsize = c(6, 10),
  IDtype = "symbol",
  species = "Homo_sapiens",
  db_update = FALSE,
  db_version = "latest",
  db_combine = FALSE,
  convert_species = FALSE,
  Ensembl_version = 103,
  mirror = NULL,
  db = "GO_BP",
  TERM2GENE = NULL,
  TERM2NAME = NULL,
  minGSSize = 10,
  maxGSSize = 500,
  GO_simplify = FALSE,
  GO_simplify_cutoff = "p.adjust < 0.05",
  simplify_method = "Wang",
  simplify_similarityCutoff = 0.7,
  pvalueCutoff = NULL,
  padjustCutoff = 0.05,
  topTerm = 5,
  show_termid = FALSE,
  topWord = 20,
  words_excluded = NULL,
  nlabel = 20,
  features_label = NULL,
  label_size = 10,
  label_color = "black",
  add_bg = FALSE,
  bg_alpha = 0.5,
  add_dot = FALSE,
  dot_size = unit(8, "mm"),
  add_reticle = FALSE,
  reticle_color = "grey",
  add_violin = FALSE,
  fill.by = "feature",
  fill_palette = "Dark2",
  fill_palcolor = NULL,
  heatmap_palette = "RdBu",
  heatmap_palcolor = NULL,
  group_palette = "Paired",
  group_palcolor = NULL,
  cell_split_palette = "simspec",
  cell_split_palcolor = NULL,
  feature_split_palette = "simspec",
  feature_split_palcolor = NULL,
  cell_annotation = NULL,
  cell_annotation_palette = "Paired",
  cell_annotation_palcolor = NULL,
  cell_annotation_params = if (flip) list(width = unit(10, "mm")) else list(height =
    unit(10, "mm")),
  feature_annotation = NULL,
  feature_annotation_palette = "Dark2",
  feature_annotation_palcolor = NULL,
  feature_annotation_params = if (flip) list(height = unit(5, "mm")) else list(width =
    unit(5, "mm")),
  use_raster = NULL,
  raster_device = "png",
  raster_by_magick = FALSE,
  height = NULL,
  width = NULL,
  units = "inch",
  seed = 11,
  ht_params = list()
)

Arguments

srt: A Seurat object.
features: The features to include in the heatmap.
group.by: A character vector specifying the groups to group by. Default is NULL.
split.by: A character vector specifying the variable to split the heatmap by. Default is NULL.
within_groups: A logical value indicating whether to create separate heatmap scales for each group or within each group. Default is FALSE.
grouping.var: A character vector that specifies another variable for grouping, such as certain conditions. The default value is NULL.
numerator: A character vector specifying the value to use as the numerator in the grouping.var grouping. Default is NULL.
cells: A character vector specifying the cells to include in the heatmap. Default is NULL.
aggregate_fun: A function to use for aggregating data within groups. Default is base::mean.
exp_cutoff: A numeric value specifying the threshold for cell counting if add_dot is TRUE. Default is 0.
border: A logical value indicating whether to add a border to the heatmap. Default is TRUE.
flip: A logical value indicating whether to flip the heatmap. Default is FALSE.
slot: A character vector specifying the slot in the Seurat object to use. Default is "counts".
assay: A character vector specifying the assay in the Seurat object to use. Default is NULL.
exp_method: A character vector specifying the method for calculating expression values. Default is "zscore" with options "zscore", "raw", "fc", "log2fc", "log1p".
exp_legend_title: A character vector specifying the title for the legend of expression value. Default is NULL.
limits: A two-length numeric vector specifying the limits for the color scale. Default is NULL.
lib_normalize: A logical value indicating whether to normalize the data by library size.
libsize: A numeric vector specifying the library size for each cell. Default is NULL.
feature_split: A factor specifying how to split the features. Default is NULL.
feature_split_by: A character vector specifying which group.by to use when splitting features (into n_split feature clusters). Default is NULL.
n_split: An integer specifying the number of feature splits (feature clusters) to create. Default is NULL.
split_order: A numeric vector specifying the order of splits. Default is NULL.
split_method: A character vector specifying the method for splitting features. Default is "kmeans" with options "kmeans", "hclust", "mfuzz").
decreasing: A logical value indicating whether to sort feature splits in decreasing order. Default is FALSE.
fuzzification: A numeric value specifying the fuzzification coefficient. Default is NULL.
cluster_features_by: A character vector specifying which group.by to use when clustering features. Default is NULL. By default, this parameter is set to NULL, which means that all groups will be used.
cluster_rows: A logical value indicating whether to cluster rows in the heatmap. Default is FALSE.
cluster_columns: A logical value indicating whether to cluster columns in the heatmap. Default is FALSE.
cluster_row_slices: A logical value indicating whether to cluster row slices in the heatmap. Default is FALSE.
cluster_column_slices: A logical value indicating whether to cluster column slices in the heatmap. Default is FALSE.
show_row_names: A logical value indicating whether to show row names in the heatmap. Default is FALSE.
show_column_names: A logical value indicating whether to show column names in the heatmap. Default is FALSE.
row_names_side: A character vector specifying the side to place row names.
column_names_side: A character vector specifying the side to place column names.
row_names_rot: A numeric value specifying the rotation angle for row names. Default is 0.
column_names_rot: A numeric value specifying the rotation angle for column names. Default is 90.
row_title: A character vector specifying the title for rows. Default is NULL.
column_title: A character vector specifying the title for columns. Default is NULL.
row_title_side: A character vector specifying the side to place row title. Default is "left".
column_title_side: A character vector specifying the side to place column title. Default is "top".
row_title_rot: A numeric value specifying the rotation angle for row title. Default is 0.
column_title_rot: A numeric value specifying the rotation angle for column title.
anno_terms: A logical value indicating whether to include term annotations. Default is FALSE.
anno_keys: A logical value indicating whether to include key annotations. Default is FALSE.
anno_features: A logical value indicating whether to include feature annotations. Default is FALSE.
terms_width: A unit specifying the width of term annotations. Default is unit(4, "in").
terms_fontsize: A numeric vector specifying the font size(s) for term annotations. Default is 8.
keys_width: A unit specifying the width of key annotations. Default is unit(2, "in").
keys_fontsize: A two-length numeric vector specifying the minimum and maximum font size(s) for key annotations. Default is c(6, 10).
features_width: A unit specifying the width of feature annotations. Default is unit(2, "in").
features_fontsize: A two-length numeric vector specifying the minimum and maximum font size(s) for feature annotations. Default is c(6, 10).
IDtype: A character vector specifying the type of IDs for features. Default is "symbol".
species: A character vector specifying the species for features. Default is "Homo_sapiens".
db_update: A logical value indicating whether to update the database. Default is FALSE.
db_version: A character vector specifying the version of the database. Default is "latest".
db_combine: A logical value indicating whether to use a combined database. Default is FALSE.
convert_species: A logical value indicating whether to use a species-converted database if annotation is missing for species. Default is FALSE.
Ensembl_version: An integer specifying the Ensembl version. Default is 103.
mirror: A character vector specifying the mirror for the Ensembl database. Default is NULL.
db: A character vector specifying the database to use. Default is "GO_BP".
TERM2GENE: A data.frame specifying the TERM2GENE mapping for the database. Default is NULL.
TERM2NAME: A data.frame specifying the TERM2NAME mapping for the database. Default is NULL.
minGSSize: An integer specifying the minimum gene set size for the database. Default is 10.
maxGSSize: An integer specifying the maximum gene set size for the database. Default is 500.
GO_simplify: A logical value indicating whether to simplify gene ontology terms. Default is FALSE.
GO_simplify_cutoff: A character vector specifying the cutoff for GO simplification. Default is "p.adjust < 0.05".
simplify_method: A character vector specifying the method for GO simplification. Default is "Wang".
simplify_similarityCutoff: A numeric value specifying the similarity cutoff for GO simplification. Default is 0.7.
pvalueCutoff: A numeric vector specifying the p-value cutoff(s) for significance. Default is NULL.
padjustCutoff: A numeric value specifying the adjusted p-value cutoff for significance. Default is 0.05.
topTerm: An integer specifying the number of top terms to include. Default is 5.
show_termid: A logical value indicating whether to show term IDs. Default is FALSE.
topWord: An integer specifying the number of top words to include. Default is 20.
words_excluded: A character vector specifying the words to exclude. Default is NULL.
nlabel: An integer specifying the number of labels to include. Default is 0.
features_label: A character vector specifying the features to label. Default is NULL.
label_size: A numeric value specifying the size of labels. Default is 10.
label_color: A character vector specifying the color of labels. Default is "black".
add_bg: A logical value indicating whether to add a background to the heatmap. Default is FALSE.
bg_alpha: A numeric value specifying the alpha value for the background color. Default is 0.5.
add_dot: A logical value indicating whether to add dots to the heatmap. The size of dot represents percentage of expressed cells based on the specified exp_cutoff. Default is FALSE.
dot_size: A unit specifying the base size of the dots. Default is unit(8, "mm").
add_reticle: A logical value indicating whether to add reticles to the heatmap. Default is FALSE.
reticle_color: A character vector specifying the color of the reticles. Default is "grey".
add_violin: A logical value indicating whether to add violins to the heatmap. Default is FALSE.
fill.by: A character vector specifying what to fill the violin. Possible values are "group", "feature", or "expression". Default is "feature".
fill_palette: A character vector specifying the palette to use for fill. Default is "Dark2".
fill_palcolor: A character vector specifying the fill color to use. Default is NULL.
heatmap_palette: A character vector specifying the palette to use for the heatmap. Default is "RdBu".
heatmap_palcolor: A character vector specifying the heatmap color to use. Default is NULL.
group_palette: A character vector specifying the palette to use for groups. Default is "Paired".
group_palcolor: A character vector specifying the group color to use. Default is NULL.
cell_split_palette: A character vector specifying the palette to use for cell splits. Default is "simspec".
cell_split_palcolor: A character vector specifying the cell split color to use. Default is NULL.
feature_split_palette: A character vector specifying the palette to use for feature splits. Default is "simspec".
feature_split_palcolor: A character vector specifying the feature split color to use. Default is NULL.
cell_annotation: A character vector specifying the cell annotation(s) to include. Default is NULL.
cell_annotation_palette: A character vector specifying the palette to use for cell annotations. The length of the vector should match the number of cell_annotation. Default is "Paired".
cell_annotation_palcolor: A list of character vector specifying the cell annotation color(s) to use. The length of the list should match the number of cell_annotation. Default is NULL.
cell_annotation_params: A list specifying additional parameters for cell annotations. Default is a list with width = unit(1, "cm") if flip is TRUE, else a list with height = unit(1, "cm").
feature_annotation: A character vector specifying the feature annotation(s) to include. Default is NULL.
feature_annotation_palette: A character vector specifying the palette to use for feature annotations. The length of the vector should match the number of feature_annotation. Default is "Dark2".
feature_annotation_palcolor: A list of character vector specifying the feature annotation color to use. The length of the list should match the number of feature_annotation. Default is NULL.
feature_annotation_params: A list specifying additional parameters for feature annotations. Default is an empty list.
use_raster: A logical value indicating whether to use a raster device for plotting. Default is NULL.
raster_device: A character vector specifying the raster device to use. Default is "png".
raster_by_magick: A logical value indicating whether to use the 'magick' package for raster. Default is FALSE.
height: A numeric vector specifying the height(s) of the heatmap body. Default is NULL.
width: A numeric vector specifying the width(s) of the heatmap body. Default is NULL.
units: A character vector specifying the units for the height and width. Default is "inch".
seed: An integer specifying the random seed. Default is 11.
ht_params: A list specifying additional parameters passed to the ComplexHeatmap::Heatmap function. Default is an empty list.

Value

A list with the following elements:

plotThe heatmap plot.
matrix_listA list of matrix for each group.by used in the heatmap.
feature_splitNULL or a factor if splitting is performed in the heatmap.
cell_metadataMeta data of cells used to generate the heatmap.
cell_metadataMeta data of features used to generate the heatmap.
enrichmentNULL or a enrichment result generated by RunEnrichment when any of the parameters anno_terms, anno_keys, or anno_features is set to TRUE.

Examples

library(dplyr)
data("pancreas_sub")
ht1 <- GroupHeatmap(pancreas_sub,
  features = c(
    "Sox9", "Anxa2", "Bicc1", # Ductal
    "Neurog3", "Hes6", # EPs
    "Fev", "Neurod1", # Pre-endocrine
    "Rbp4", "Pyy", # Endocrine
    "Ins1", "Gcg", "Sst", "Ghrl" # Beta, Alpha, Delta, Epsilon
  ),
  group.by = c("CellType", "SubCellType")
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht1$plot

panel_fix(ht1$plot, height = 4, width = 6, raster = TRUE, dpi = 50)


pancreas_sub <- RunDEtest(pancreas_sub, group_by = "CellType")
#> Warning: Data in the 'data' slot is raw counts. Perform NormalizeData(LogNormalize) on the data.
#> [2023-11-21 07:21:22.592122] Start DEtest
#> Workers: 2
#> Find all markers(wilcox) among 5 groups...
#> 
  |                                                                                                                    
  |                                                                                                              |   0%
#> 
#> 
#> 
  |                                                                                                                    
  |============================================                                                                  |  40%
#> 
#> 
#> 
#> 
  |                                                                                                                    
  |==============================================================================================================| 100%
#> 
#> [2023-11-21 07:21:32.613376] DEtest done
#> Elapsed time:10.02 secs
de_filter <- filter(pancreas_sub@tools$DEtest_CellType$AllMarkers_wilcox, p_val_adj < 0.05 & avg_log2FC > 1)

ht2 <- GroupHeatmap(
  srt = pancreas_sub, features = de_filter$gene, group.by = "CellType",
  split.by = "Phase", cell_split_palette = "Dark2",
  cluster_rows = TRUE, cluster_columns = TRUE
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
#> `use_raster` is automatically set to TRUE for a matrix with more than 2000 rows. You can control
#> `use_raster` argument by explicitly setting TRUE/FALSE to it.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht2$plot


ht3 <- GroupHeatmap(
  srt = pancreas_sub, features = de_filter$gene, feature_split = de_filter$group1, group.by = "CellType",
  species = "Mus_musculus", db = "GO_BP", anno_terms = TRUE, anno_keys = TRUE, anno_features = TRUE
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
#> [2023-11-21 07:21:43.521111] Start Enrichment
#> Workers: 2
#> Species: Mus_musculus
#> Loading cached db: GO_BP version:3.17.0 nterm:16027 created:2023-11-21 07:14:20.545084
#> Convert ID types for the database: GO_BP
#> Connect to the Ensembl archives...
#> Using the 103 version of biomart...
#> Connecting to the biomart...
#> Searching the dataset mmusculus ...
#> Connecting to the dataset mmusculus_gene_ensembl ...
#> Converting the geneIDs...
#> Error in collect(., Inf): Failed to collect lazy table.
#> Caused by error in `db_collect()`:
#> ! Arguments in `...` must be used.
#> ✖ Problematic argument:
#> • ..1 = Inf
#> ℹ Did you misspell an argument name?
ht3$plot
#> Error in eval(expr, envir, enclos): object 'ht3' not found

pancreas_sub <- AnnotateFeatures(pancreas_sub, species = "Mus_musculus", db = c("TF", "CSPA"))
#> Species: Mus_musculus
#> Loading cached db: TF version:AnimalTFDB4 nterm:2 created:2023-11-21 07:05:33.872428
#> Loading cached db: CSPA version:CSPA nterm:1 created:2023-11-21 07:05:36.02141
de_top <- de_filter %>%
  group_by(gene) %>%
  top_n(1, avg_log2FC) %>%
  group_by(group1) %>%
  top_n(3, avg_log2FC)
ht4 <- GroupHeatmap(pancreas_sub,
  features = de_top$gene, feature_split = de_top$group1, group.by = "CellType",
  heatmap_palette = "YlOrRd",
  cell_annotation = c("Phase", "G2M_score", "Neurod2"), cell_annotation_palette = c("Dark2", "Paired", "Paired"),
  cell_annotation_params = list(height = unit(10, "mm")),
  feature_annotation = c("TF", "CSPA"),
  feature_annotation_palcolor = list(c("gold", "steelblue"), c("forestgreen")),
  add_dot = TRUE, add_bg = TRUE, nlabel = 0, show_row_names = TRUE
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht4$plot


ht5 <- GroupHeatmap(pancreas_sub,
  features = de_top$gene, feature_split = de_top$group1, group.by = "CellType",
  heatmap_palette = "YlOrRd",
  cell_annotation = c("Phase", "G2M_score", "Neurod2"), cell_annotation_palette = c("Dark2", "Paired", "Paired"),
  cell_annotation_params = list(width = unit(10, "mm")),
  feature_annotation = c("TF", "CSPA"),
  feature_annotation_palcolor = list(c("gold", "steelblue"), c("forestgreen")),
  add_dot = TRUE, add_bg = TRUE,
  flip = TRUE, column_title_rot = 45, nlabel = 0, show_row_names = TRUE
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht5$plot


ht6 <- GroupHeatmap(pancreas_sub,
  features = de_top$gene, feature_split = de_top$group1, group.by = "CellType",
  add_violin = TRUE, cluster_rows = TRUE,
  nlabel = 0, show_row_names = TRUE
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht6$plot


ht7 <- GroupHeatmap(pancreas_sub,
  features = de_top$gene, feature_split = de_top$group1, group.by = "CellType",
  add_violin = TRUE, fill.by = "expression", fill_palette = "Blues", cluster_rows = TRUE,
  nlabel = 0, show_row_names = TRUE
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht7$plot


ht8 <- GroupHeatmap(pancreas_sub,
  features = de_top$gene, group.by = "CellType", split.by = "Phase", n_split = 4,
  cluster_rows = TRUE, cluster_columns = TRUE, cluster_row_slices = TRUE, cluster_column_slices = TRUE,
  add_dot = TRUE, add_reticle = TRUE, heatmap_palette = "viridis",
  nlabel = 0, show_row_names = TRUE,
  ht_params = list(row_gap = unit(0, "mm"), row_names_gp = gpar(fontsize = 10))
)
#> 'magick' package is suggested to install to give better rasterization.
#> 
#> Set `ht_opt$message = FALSE` to turn off this message.
ht8$plot

Usage

Arguments

Value

See also

Examples