scplotter to work with CODEX data prepared by Giotto¶
See: https://drieslab.github.io/Giotto_website/articles/codex_mouse_spleen.html
Go back to scplotter documentation: https://pwwang.github.io/scplotter/
InĀ [Ā ]:
# GiottoData::getSpatialDataset(
# dataset = "codex_spleen",
# directory = "data/codex_spleen",
# verbose = TRUE,
# dryrun = FALSE
# )
Warning message in GiottoData::getSpatialDataset(dataset = "codex_spleen", directory = "data/codex_spleen", : āThe output directory does not exist and will be created ā Warning message in data.table::fread(datasets_file, sep = "\t"): āDiscarded single-line footer: <<sg_mini_kidney https://github.com/drieslab/spatial-datasets/data/2023_spatial_genomics_mouse_kidney/Raw.zip >>ā Selected dataset links for: codex_spleen
dataset <char> 1: codex_spleen spatial_locs <char> 1: https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/cell_locations/codex_BALBc_3_coord.txt expr_matrix <char> 1: https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/count_matrix/codex_BALBc_3_expression.txt.gz metadata <char> 1: https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/cell_locations/codex_BALBc_3_annotation.txt|https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/cell_locations/cell_type_annotation.csv segmentations <char> 1:
Download expression matrix: Download spatial locations: Download metadata:
NULL
InĀ [3]:
library(Giotto)
# Ensure Giotto can access a python env
genv_exists <- suppressMessages(checkGiottoEnvironment())
print(genv_exists)
python_path <- file.path(Sys.getenv("HOME"), "miniconda3", "envs", "giotto_env", "bin", "python")
Sys.setenv(RETICULATE_PYTHON = python_path)
invisible(capture.output(suppressMessages(set_giotto_python_path(python_path = python_path))))
# library(scplotter)
devtools::load_all()
[1] TRUE
ā¹ Loading scplotter
InĀ [11]:
library(Giotto)
## Set instructions
results_folder <- "data/codex_spleen.results"
instructions <- createGiottoInstructions(
save_dir = results_folder,
save_plot = FALSE,
show_plot = TRUE,
return_plot = TRUE,
python_path = python_path
)
data_path <- "data/codex_spleen/"
# 2. create giotto object from provided paths ####
expr_path <- paste0(data_path, "codex_BALBc_3_expression.txt.gz")
loc_path <- paste0(data_path, "codex_BALBc_3_coord.txt")
meta_path <- paste0(data_path, "codex_BALBc_3_annotation.txt")
# read in data information
# expression info
codex_expression <- readExprMatrix(expr_path, transpose = FALSE)
# cell coordinate info
codex_locations <- data.table::fread(loc_path)
# metadata
codex_metadata <- data.table::fread(meta_path)
## stitch x.y tile coordinates to global coordinates
xtilespan <- 1344
ytilespan <- 1008
# TODO: expand the documentation and input format of stitchTileCoordinates. Probably not enough information for new users.
stitch_file <- stitchTileCoordinates(location_file = codex_metadata,
Xtilespan = xtilespan,
Ytilespan = ytilespan)
codex_locations <- stitch_file[,.(Xcoord, Ycoord)]
# create Giotto object
codex_test <- createGiottoObject(expression = codex_expression,
spatial_locs = codex_locations,
instructions = instructions)
codex_metadata$cell_ID <- as.character(codex_metadata$cellID)
codex_test <- addCellMetadata(codex_test, new_metadata = codex_metadata,
by_column = TRUE,
column_cell_ID = "cell_ID")
# subset Giotto object
cell_metadata <- pDataDT(codex_test)
cell_IDs_to_keep <- cell_metadata[Imaging_phenotype_cell_type != "dirt" & Imaging_phenotype_cell_type != "noid" & Imaging_phenotype_cell_type != "capsule",]$cell_ID
codex_test <- subsetGiotto(codex_test,
cell_ids = cell_IDs_to_keep)
## filter
codex_test <- filterGiotto(gobject = codex_test,
expression_threshold = 1,
feat_det_in_min_cells = 10,
min_det_feats_per_cell = 2,
expression_values = "raw",
verbose = TRUE)
codex_test <- normalizeGiotto(gobject = codex_test,
scalefactor = 6000,
verbose = TRUE,
log_norm = FALSE,
library_size_norm = FALSE,
scale_feats = FALSE,
scale_cells = TRUE)
## add gene & cell statistics
codex_test <- addStatistics(gobject = codex_test,
expression_values = "normalized")
## adjust expression matrix for technical or known variables
codex_test <- adjustGiottoMatrix(gobject = codex_test,
expression_values = "normalized",
batch_columns = "sample_Xtile_Ytile",
covariate_columns = NULL,
return_gobject = TRUE,
update_slot = "custom")
python already initialized in this session active environment : 'giotto_env' python version : 3.10
completed 1: preparation completed 2: subset expression data completed 3: subset spatial locations completed 4: subset cell metadata completed 5: subset feature metadata completed 6: subset spatial network(s) completed 7: subsetted dimension reductions completed 8: subsetted nearest network(s) completed 9: subsetted spatial enrichment results
Feature type: rna Number of cells removed: 2 out of 80019 Number of feats removed: 0 out of 30
Setting expression [cell][rna] normalized Setting expression [cell][rna] scaled calculating statistics for "normalized" expression Warning message: āThe `update_slot` argument of `adjustGiottoMatrix()` is deprecated as of <NA> 4.1.7. ā¹ Please use the `name` argument instead. ā¹ The deprecated feature was likely used in the base package. Please report the issue to the authors.ā Setting expression [cell][rna] custom
InĀ [16]:
options(repr.plot.width = 7, repr.plot.height = 7)
SpatDimPlot(codex_test, color_by = "lightblue", size = 0.25)
InĀ [19]:
options(repr.plot.width = 14, repr.plot.height = 7)
SpatDimPlot(
codex_test,
group_by = "sample_Xtile_Ytile",
size = 0.2
)
InĀ [20]:
# PCA
codex_test <- runPCA(gobject = codex_test,
expression_values = "normalized",
scale_unit = TRUE,
method = "factominer")
# UMAP
codex_test <- runUMAP(codex_test,
dimensions_to_use = 1:14,
n_components = 2,
n_threads = 12)
## sNN network (default)
codex_test <- createNearestNetwork(gobject = codex_test,
dimensions_to_use = 1:14,
k = 20)
## 0.1 resolution
codex_test <- doLeidenCluster(gobject = codex_test,
resolution = 0.5,
n_iterations = 100,
name = "leiden")
clusters_cell_types <- c("naive B cells", "B cells", "B cells", "naive B cells",
"B cells", "macrophages", "erythroblasts",
"erythroblasts", "erythroblasts", "CD8 + T cells",
"Naive T cells", "CD4+ T cells", "Naive T cells",
"CD4+ T cells", "Dendritic cells", "NK cells",
"Dendritic cells", "Plasma cells", "endothelial cells",
"monocytes")
names(clusters_cell_types) <- c(2, 15, 13, 5, 8, 9, 19, 1, 10, 3, 12, 14, 4, 6,
7, 16, 17, 18, 11, 20)
codex_test <- annotateGiotto(gobject = codex_test,
annotation_vector = clusters_cell_types,
cluster_column = "leiden",
name = "cell_types")
cell_metadatadata <- pDataDT(codex_test)
subset_cell_ids <- cell_metadatadata[sample_Xtile_Ytile=="BALBc-3_X04_Y08"]$cell_ID
codex_test_zone1 <- subsetGiotto(codex_test,
cell_ids = subset_cell_ids)
"hvf" was not found in the gene metadata information. all genes will be used. Warning message in .run_pca_factominer(x = t_flex(expr_values), scale = scale_unit, : āncp > ncol(x), will be set to ncol(x)ā Setting dimension reduction [cell][rna] pca Setting dimension reduction [cell][rna] umap
InĀ [32]:
options(repr.plot.width = 7, repr.plot.height = 7)
codex_test@cell_metadata$cell$rna$leiden <- factor(
as.character(codex_test@cell_metadata$cell$rna$leiden),
levels = unique(as.character(sort(codex_test@cell_metadata$cell$rna$leiden))))
SpatDimPlot(
codex_test,
group_by = "leiden",
size = 0.2
)
InĀ [34]:
options(repr.plot.width = 12, repr.plot.height = 7)
SpatDimPlot(
codex_test,
group_by = "Imaging_phenotype_cell_type",
size = 0.2
)
InĀ [36]:
options(repr.plot.width = 8, repr.plot.height = 5)
SpatDimPlot(
codex_test_zone1,
group_by = "Imaging_phenotype_cell_type",
size = 1
)
InĀ [39]:
options(repr.plot.width = 10, repr.plot.height = 5)
SpatFeaturePlot(
codex_test_zone1,
features = c("CD8a","CD19"),
layer = "scaled",
size = 1
)
InĀ [4]:
x <- sessionInfo()
x <- capture.output(print(x))
# hide the BLAS/LAPACK paths
x <- x[!startsWith(x, "BLAS/LAPACK:")]
cat(paste(x, collapse = "\n"))
R version 4.4.3 (2025-02-28) Platform: x86_64-conda-linux-gnu Running under: Red Hat Enterprise Linux 8.10 (Ootpa) Matrix products: default locale: [1] LC_CTYPE=en_US.UTF-8 LC_NUMERIC=C [3] LC_TIME=en_US.UTF-8 LC_COLLATE=C [5] LC_MONETARY=en_US.UTF-8 LC_MESSAGES=en_US.UTF-8 [7] LC_PAPER=en_US.UTF-8 LC_NAME=C [9] LC_ADDRESS=C LC_TELEPHONE=C [11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C time zone: America/Chicago tzcode source: system (glibc) attached base packages: [1] stats graphics grDevices utils datasets methods base other attached packages: [1] scplotter_0.4.0 Giotto_4.2.1 GiottoClass_0.4.7 loaded via a namespace (and not attached): [1] fs_1.6.6 matrixStats_1.5.0 [3] spatstat.sparse_3.1-0 bitops_1.0-9 [5] devtools_2.4.5 httr_1.4.7 [7] RColorBrewer_1.1-3 repr_1.1.7 [9] profvis_0.4.0 tools_4.4.3 [11] sctransform_0.4.2 backports_1.5.0 [13] R6_2.6.1 uwot_0.2.3 [15] lazyeval_0.2.2 urlchecker_1.0.1 [17] withr_3.0.2 sp_2.2-0 [19] gridExtra_2.3 GiottoUtils_0.2.5 [21] progressr_0.15.1 quantreg_6.00 [23] cli_3.6.5 Biobase_2.62.0 [25] spatstat.explore_3.4-3 fastDummies_1.7.5 [27] iNEXT_3.0.1 Seurat_5.3.0 [29] spatstat.data_3.1-6 ggridges_0.5.6 [31] pbapply_1.7-2 pbdZMQ_0.3-14 [33] stringdist_0.9.15 parallelly_1.45.0 [35] sessioninfo_1.2.3 VGAM_1.1-13 [37] rstudioapi_0.17.1 generics_0.1.4 [39] shape_1.4.6.1 gtools_3.9.5 [41] ica_1.0-3 spatstat.random_3.4-1 [43] dplyr_1.1.4 Matrix_1.7-3 [45] S4Vectors_0.40.2 abind_1.4-5 [47] terra_1.8-42 lifecycle_1.0.4 [49] SummarizedExperiment_1.32.0 SparseArray_1.2.4 [51] Rtsne_0.17 grid_4.4.3 [53] promises_1.3.2 crayon_1.5.3 [55] miniUI_0.1.2 lattice_0.22-7 [57] cowplot_1.1.3 pillar_1.10.2 [59] GenomicRanges_1.54.1 rjson_0.2.23 [61] future.apply_1.20.0 codetools_0.2-20 [63] glue_1.8.0 spatstat.univar_3.1-3 [65] data.table_1.17.4 remotes_2.5.0 [67] vctrs_0.6.5 png_0.1-8 [69] spam_2.11-1 testthat_3.2.3 [71] gtable_0.3.6 assertthat_0.2.1 [73] cachem_1.1.0 S4Arrays_1.2.1 [75] mime_0.13 tidygraph_1.3.0 [77] survival_3.8-3 SingleCellExperiment_1.24.0 [79] ellipsis_0.3.2 scRepertoire_2.2.1 [81] fitdistrplus_1.2-2 ROCR_1.0-11 [83] nlme_3.1-168 usethis_3.1.0 [85] RcppAnnoy_0.0.22 evd_2.3-7.1 [87] GenomeInfoDb_1.38.8 rprojroot_2.0.4 [89] irlba_2.3.5.1 KernSmooth_2.23-26 [91] plotthis_0.7.0 colorspace_2.1-1 [93] BiocGenerics_0.48.1 tidyselect_1.2.1 [95] compiler_4.4.3 SparseM_1.84-2 [97] xml2_1.3.8 desc_1.4.3 [99] ggdendro_0.2.0 DelayedArray_0.28.0 [101] plotly_4.10.4 checkmate_2.3.2 [103] scales_1.4.0 lmtest_0.9-40 [105] rappdirs_0.3.3 stringr_1.5.1 [107] digest_0.6.37 goftest_1.2-3 [109] spatstat.utils_3.1-4 XVector_0.42.0 [111] htmltools_0.5.8.1 GiottoVisuals_0.2.12 [113] pkgconfig_2.0.3 base64enc_0.1-3 [115] MatrixGenerics_1.14.0 fastmap_1.2.0 [117] rlang_1.1.6 GlobalOptions_0.1.2 [119] htmlwidgets_1.6.4 shiny_1.10.0 [121] farver_2.1.2 zoo_1.8-14 [123] jsonlite_2.0.0 RCurl_1.98-1.17 [125] magrittr_2.0.3 GenomeInfoDbData_1.2.11 [127] dotCall64_1.2 patchwork_1.3.0 [129] IRkernel_1.3.2 Rcpp_1.0.14 [131] evmix_2.12 ggnewscale_0.5.1 [133] viridis_0.6.5 reticulate_1.42.0 [135] truncdist_1.0-2 stringi_1.8.7 [137] ggalluvial_0.12.5 ggraph_2.2.1 [139] brio_1.1.5 zlibbioc_1.48.2 [141] MASS_7.3-64 plyr_1.8.9 [143] pkgbuild_1.4.8 parallel_4.4.3 [145] listenv_0.9.1 ggrepel_0.9.6 [147] forcats_1.0.0 deldir_2.0-4 [149] graphlayouts_1.2.2 IRdisplay_1.1 [151] splines_4.4.3 gridtext_0.1.5 [153] tensor_1.5 circlize_0.4.16 [155] colorRamp2_0.1.0 igraph_2.0.3 [157] uuid_1.2-1 spatstat.geom_3.4-1 [159] cubature_2.1.4 RcppHNSW_0.6.0 [161] reshape2_1.4.4 stats4_4.4.3 [163] pkgload_1.4.0 evaluate_1.0.3 [165] SeuratObject_5.1.0 tweenr_2.0.3 [167] httpuv_1.6.15 MatrixModels_0.5-4 [169] RANN_2.6.2 tidyr_1.3.1 [171] purrr_1.0.4 polyclip_1.10-7 [173] future_1.58.0 scattermore_1.2 [175] ggplot2_3.5.2 ggforce_0.4.2 [177] xtable_1.8-4 RSpectra_0.16-2 [179] later_1.4.2 viridisLite_0.4.2 [181] gsl_2.1-8 tibble_3.2.1 [183] memoise_2.0.1 IRanges_2.36.0 [185] cluster_2.1.8.1 globals_0.18.0