scplotter to work with CODEX data prepared by Giotto¶

See: https://drieslab.github.io/Giotto_website/articles/codex_mouse_spleen.html

Go back to scplotter documentation: https://pwwang.github.io/scplotter/

InĀ [Ā ]:
# GiottoData::getSpatialDataset(
#   dataset = "codex_spleen",
#   directory = "data/codex_spleen",
#   verbose = TRUE,
#   dryrun = FALSE
# )
Warning message in GiottoData::getSpatialDataset(dataset = "codex_spleen", directory = "data/codex_spleen", :
ā€œThe output directory does not exist and will be created 
ā€
Warning message in data.table::fread(datasets_file, sep = "\t"):
ā€œDiscarded single-line footer: <<sg_mini_kidney	https://github.com/drieslab/spatial-datasets/data/2023_spatial_genomics_mouse_kidney/Raw.zip	>>ā€
Selected dataset links for: codex_spleen


        dataset
         <char>
1: codex_spleen
                                                                                                                       spatial_locs
                                                                                                                             <char>
1: https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/cell_locations/codex_BALBc_3_coord.txt
                                                                                                                              expr_matrix
                                                                                                                                   <char>
1: https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/count_matrix/codex_BALBc_3_expression.txt.gz
                                                                                                                                                                                                                                                                  metadata
                                                                                                                                                                                                                                                                    <char>
1: https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/cell_locations/codex_BALBc_3_annotation.txt|https://raw.githubusercontent.com/drieslab/spatial-datasets/master/data/2018_codex_spleen/cell_locations/cell_type_annotation.csv
   segmentations
          <char>
1:              

Download expression matrix:



Download spatial locations:



Download metadata:

NULL
InĀ [3]:
library(Giotto)

# Ensure Giotto can access a python env
genv_exists <- suppressMessages(checkGiottoEnvironment())
print(genv_exists)

python_path <- file.path(Sys.getenv("HOME"), "miniconda3", "envs", "giotto_env", "bin", "python")
Sys.setenv(RETICULATE_PYTHON = python_path)

invisible(capture.output(suppressMessages(set_giotto_python_path(python_path = python_path))))

# library(scplotter)
devtools::load_all()
[1] TRUE
ℹ Loading scplotter
InĀ [11]:
library(Giotto)

## Set instructions
results_folder <- "data/codex_spleen.results"

instructions <- createGiottoInstructions(
    save_dir = results_folder,
    save_plot = FALSE,
    show_plot = TRUE,
    return_plot = TRUE,
    python_path = python_path
)

data_path <- "data/codex_spleen/"

# 2. create giotto object from provided paths ####
expr_path <- paste0(data_path, "codex_BALBc_3_expression.txt.gz")
loc_path <- paste0(data_path, "codex_BALBc_3_coord.txt")
meta_path <- paste0(data_path, "codex_BALBc_3_annotation.txt")

# read in data information

# expression info
codex_expression <- readExprMatrix(expr_path, transpose = FALSE)
# cell coordinate info
codex_locations <- data.table::fread(loc_path)
# metadata
codex_metadata <- data.table::fread(meta_path)

## stitch x.y tile coordinates to global coordinates
xtilespan <- 1344
ytilespan <- 1008

# TODO: expand the documentation and input format of stitchTileCoordinates. Probably not enough information for new users.
stitch_file <- stitchTileCoordinates(location_file = codex_metadata,
                                     Xtilespan = xtilespan,
                                     Ytilespan = ytilespan)
codex_locations <- stitch_file[,.(Xcoord, Ycoord)]

# create Giotto object
codex_test <- createGiottoObject(expression = codex_expression,
                                 spatial_locs = codex_locations,
                                 instructions = instructions)

codex_metadata$cell_ID <- as.character(codex_metadata$cellID)
codex_test <- addCellMetadata(codex_test, new_metadata = codex_metadata,
                              by_column = TRUE,
                              column_cell_ID = "cell_ID")

# subset Giotto object
cell_metadata <- pDataDT(codex_test)
cell_IDs_to_keep <- cell_metadata[Imaging_phenotype_cell_type != "dirt" & Imaging_phenotype_cell_type != "noid" & Imaging_phenotype_cell_type != "capsule",]$cell_ID

codex_test <- subsetGiotto(codex_test,
                           cell_ids = cell_IDs_to_keep)

## filter
codex_test <- filterGiotto(gobject = codex_test,
                           expression_threshold = 1,
                           feat_det_in_min_cells = 10,
                           min_det_feats_per_cell = 2,
                           expression_values = "raw",
                           verbose = TRUE)

codex_test <- normalizeGiotto(gobject = codex_test,
                              scalefactor = 6000,
                              verbose = TRUE,
                              log_norm = FALSE,
                              library_size_norm = FALSE,
                              scale_feats = FALSE,
                              scale_cells = TRUE)

## add gene & cell statistics
codex_test <- addStatistics(gobject = codex_test,
                            expression_values = "normalized")

## adjust expression matrix for technical or known variables
codex_test <- adjustGiottoMatrix(gobject = codex_test,
                                 expression_values = "normalized",
                                 batch_columns = "sample_Xtile_Ytile",
                                 covariate_columns = NULL,
                                 return_gobject = TRUE,
                                 update_slot = "custom")
python already initialized in this session
 active environment : 'giotto_env'
 python version : 3.10

completed 1: preparation

completed 2: subset expression data

completed 3: subset spatial locations

completed 4: subset cell metadata

completed 5: subset feature metadata

completed 6: subset spatial network(s)

completed 7: subsetted dimension reductions

completed 8: subsetted nearest network(s)

completed 9: subsetted spatial enrichment results

Feature type:  rna 
Number of cells removed:  2  out of  80019 
Number of feats removed:  0  out of  30 
Setting expression [cell][rna] normalized

Setting expression [cell][rna] scaled

calculating statistics for "normalized" expression

Warning message:
ā€œThe `update_slot` argument of `adjustGiottoMatrix()` is deprecated as of <NA>
4.1.7.
ℹ Please use the `name` argument instead.
ℹ The deprecated feature was likely used in the base package.
  Please report the issue to the authors.ā€
Setting expression [cell][rna] custom

InĀ [16]:
options(repr.plot.width = 7, repr.plot.height = 7)

SpatDimPlot(codex_test, color_by = "lightblue", size = 0.25)
No description has been provided for this image
InĀ [19]:
options(repr.plot.width = 14, repr.plot.height = 7)

SpatDimPlot(
    codex_test,
    group_by = "sample_Xtile_Ytile",
    size = 0.2
)
No description has been provided for this image
InĀ [20]:
# PCA
codex_test <- runPCA(gobject = codex_test,
                     expression_values = "normalized",
                     scale_unit = TRUE,
                     method = "factominer")
# UMAP
codex_test <- runUMAP(codex_test,
                      dimensions_to_use = 1:14,
                      n_components = 2,
                      n_threads = 12)
## sNN network (default)
codex_test <- createNearestNetwork(gobject = codex_test,
                                   dimensions_to_use = 1:14,
                                   k = 20)

## 0.1 resolution
codex_test <- doLeidenCluster(gobject = codex_test,
                              resolution = 0.5,
                              n_iterations = 100,
                              name = "leiden")

clusters_cell_types <- c("naive B cells", "B cells", "B cells", "naive B cells",
                         "B cells", "macrophages", "erythroblasts",
                         "erythroblasts", "erythroblasts", "CD8 + T cells",
                         "Naive T cells", "CD4+ T cells", "Naive T cells",
                         "CD4+ T cells", "Dendritic cells", "NK cells",
                         "Dendritic cells", "Plasma cells", "endothelial cells",
                         "monocytes")

names(clusters_cell_types) <- c(2, 15, 13, 5, 8, 9, 19, 1, 10, 3, 12, 14, 4, 6,
                                7, 16, 17, 18, 11, 20)

codex_test <- annotateGiotto(gobject = codex_test,
                             annotation_vector = clusters_cell_types,
                             cluster_column = "leiden",
                             name = "cell_types")

cell_metadatadata <- pDataDT(codex_test)
subset_cell_ids <- cell_metadatadata[sample_Xtile_Ytile=="BALBc-3_X04_Y08"]$cell_ID

codex_test_zone1 <- subsetGiotto(codex_test,
                                 cell_ids = subset_cell_ids)
"hvf" was not found in the gene metadata information.
 all genes will be used.

Warning message in .run_pca_factominer(x = t_flex(expr_values), scale = scale_unit, :
ā€œncp > ncol(x), will be set to ncol(x)ā€
Setting dimension reduction [cell][rna] pca

Setting dimension reduction [cell][rna] umap

InĀ [32]:
options(repr.plot.width = 7, repr.plot.height = 7)

codex_test@cell_metadata$cell$rna$leiden <- factor(
    as.character(codex_test@cell_metadata$cell$rna$leiden),
    levels = unique(as.character(sort(codex_test@cell_metadata$cell$rna$leiden))))

SpatDimPlot(
    codex_test,
    group_by = "leiden",
    size = 0.2
)
No description has been provided for this image
InĀ [34]:
options(repr.plot.width = 12, repr.plot.height = 7)

SpatDimPlot(
    codex_test,
    group_by = "Imaging_phenotype_cell_type",
    size = 0.2
)
No description has been provided for this image
InĀ [36]:
options(repr.plot.width = 8, repr.plot.height = 5)

SpatDimPlot(
    codex_test_zone1,
    group_by = "Imaging_phenotype_cell_type",
    size = 1
)
No description has been provided for this image
InĀ [39]:
options(repr.plot.width = 10, repr.plot.height = 5)

SpatFeaturePlot(
    codex_test_zone1,
    features = c("CD8a","CD19"),
    layer = "scaled",
    size = 1
)
No description has been provided for this image
InĀ [4]:
x <- sessionInfo()
x <- capture.output(print(x))
# hide the BLAS/LAPACK paths
x <- x[!startsWith(x, "BLAS/LAPACK:")]
cat(paste(x, collapse = "\n"))
R version 4.4.3 (2025-02-28)
Platform: x86_64-conda-linux-gnu
Running under: Red Hat Enterprise Linux 8.10 (Ootpa)

Matrix products: default

locale:
 [1] LC_CTYPE=en_US.UTF-8       LC_NUMERIC=C              
 [3] LC_TIME=en_US.UTF-8        LC_COLLATE=C              
 [5] LC_MONETARY=en_US.UTF-8    LC_MESSAGES=en_US.UTF-8   
 [7] LC_PAPER=en_US.UTF-8       LC_NAME=C                 
 [9] LC_ADDRESS=C               LC_TELEPHONE=C            
[11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C       

time zone: America/Chicago
tzcode source: system (glibc)

attached base packages:
[1] stats     graphics  grDevices utils     datasets  methods   base     

other attached packages:
[1] scplotter_0.4.0   Giotto_4.2.1      GiottoClass_0.4.7

loaded via a namespace (and not attached):
  [1] fs_1.6.6                    matrixStats_1.5.0          
  [3] spatstat.sparse_3.1-0       bitops_1.0-9               
  [5] devtools_2.4.5              httr_1.4.7                 
  [7] RColorBrewer_1.1-3          repr_1.1.7                 
  [9] profvis_0.4.0               tools_4.4.3                
 [11] sctransform_0.4.2           backports_1.5.0            
 [13] R6_2.6.1                    uwot_0.2.3                 
 [15] lazyeval_0.2.2              urlchecker_1.0.1           
 [17] withr_3.0.2                 sp_2.2-0                   
 [19] gridExtra_2.3               GiottoUtils_0.2.5          
 [21] progressr_0.15.1            quantreg_6.00              
 [23] cli_3.6.5                   Biobase_2.62.0             
 [25] spatstat.explore_3.4-3      fastDummies_1.7.5          
 [27] iNEXT_3.0.1                 Seurat_5.3.0               
 [29] spatstat.data_3.1-6         ggridges_0.5.6             
 [31] pbapply_1.7-2               pbdZMQ_0.3-14              
 [33] stringdist_0.9.15           parallelly_1.45.0          
 [35] sessioninfo_1.2.3           VGAM_1.1-13                
 [37] rstudioapi_0.17.1           generics_0.1.4             
 [39] shape_1.4.6.1               gtools_3.9.5               
 [41] ica_1.0-3                   spatstat.random_3.4-1      
 [43] dplyr_1.1.4                 Matrix_1.7-3               
 [45] S4Vectors_0.40.2            abind_1.4-5                
 [47] terra_1.8-42                lifecycle_1.0.4            
 [49] SummarizedExperiment_1.32.0 SparseArray_1.2.4          
 [51] Rtsne_0.17                  grid_4.4.3                 
 [53] promises_1.3.2              crayon_1.5.3               
 [55] miniUI_0.1.2                lattice_0.22-7             
 [57] cowplot_1.1.3               pillar_1.10.2              
 [59] GenomicRanges_1.54.1        rjson_0.2.23               
 [61] future.apply_1.20.0         codetools_0.2-20           
 [63] glue_1.8.0                  spatstat.univar_3.1-3      
 [65] data.table_1.17.4           remotes_2.5.0              
 [67] vctrs_0.6.5                 png_0.1-8                  
 [69] spam_2.11-1                 testthat_3.2.3             
 [71] gtable_0.3.6                assertthat_0.2.1           
 [73] cachem_1.1.0                S4Arrays_1.2.1             
 [75] mime_0.13                   tidygraph_1.3.0            
 [77] survival_3.8-3              SingleCellExperiment_1.24.0
 [79] ellipsis_0.3.2              scRepertoire_2.2.1         
 [81] fitdistrplus_1.2-2          ROCR_1.0-11                
 [83] nlme_3.1-168                usethis_3.1.0              
 [85] RcppAnnoy_0.0.22            evd_2.3-7.1                
 [87] GenomeInfoDb_1.38.8         rprojroot_2.0.4            
 [89] irlba_2.3.5.1               KernSmooth_2.23-26         
 [91] plotthis_0.7.0              colorspace_2.1-1           
 [93] BiocGenerics_0.48.1         tidyselect_1.2.1           
 [95] compiler_4.4.3              SparseM_1.84-2             
 [97] xml2_1.3.8                  desc_1.4.3                 
 [99] ggdendro_0.2.0              DelayedArray_0.28.0        
[101] plotly_4.10.4               checkmate_2.3.2            
[103] scales_1.4.0                lmtest_0.9-40              
[105] rappdirs_0.3.3              stringr_1.5.1              
[107] digest_0.6.37               goftest_1.2-3              
[109] spatstat.utils_3.1-4        XVector_0.42.0             
[111] htmltools_0.5.8.1           GiottoVisuals_0.2.12       
[113] pkgconfig_2.0.3             base64enc_0.1-3            
[115] MatrixGenerics_1.14.0       fastmap_1.2.0              
[117] rlang_1.1.6                 GlobalOptions_0.1.2        
[119] htmlwidgets_1.6.4           shiny_1.10.0               
[121] farver_2.1.2                zoo_1.8-14                 
[123] jsonlite_2.0.0              RCurl_1.98-1.17            
[125] magrittr_2.0.3              GenomeInfoDbData_1.2.11    
[127] dotCall64_1.2               patchwork_1.3.0            
[129] IRkernel_1.3.2              Rcpp_1.0.14                
[131] evmix_2.12                  ggnewscale_0.5.1           
[133] viridis_0.6.5               reticulate_1.42.0          
[135] truncdist_1.0-2             stringi_1.8.7              
[137] ggalluvial_0.12.5           ggraph_2.2.1               
[139] brio_1.1.5                  zlibbioc_1.48.2            
[141] MASS_7.3-64                 plyr_1.8.9                 
[143] pkgbuild_1.4.8              parallel_4.4.3             
[145] listenv_0.9.1               ggrepel_0.9.6              
[147] forcats_1.0.0               deldir_2.0-4               
[149] graphlayouts_1.2.2          IRdisplay_1.1              
[151] splines_4.4.3               gridtext_0.1.5             
[153] tensor_1.5                  circlize_0.4.16            
[155] colorRamp2_0.1.0            igraph_2.0.3               
[157] uuid_1.2-1                  spatstat.geom_3.4-1        
[159] cubature_2.1.4              RcppHNSW_0.6.0             
[161] reshape2_1.4.4              stats4_4.4.3               
[163] pkgload_1.4.0               evaluate_1.0.3             
[165] SeuratObject_5.1.0          tweenr_2.0.3               
[167] httpuv_1.6.15               MatrixModels_0.5-4         
[169] RANN_2.6.2                  tidyr_1.3.1                
[171] purrr_1.0.4                 polyclip_1.10-7            
[173] future_1.58.0               scattermore_1.2            
[175] ggplot2_3.5.2               ggforce_0.4.2              
[177] xtable_1.8-4                RSpectra_0.16-2            
[179] later_1.4.2                 viridisLite_0.4.2          
[181] gsl_2.1-8                   tibble_3.2.1               
[183] memoise_2.0.1               IRanges_2.36.0             
[185] cluster_2.1.8.1             globals_0.18.0