```r
#--- data-loading ---#
library(scRNAseq)
sce.nest <- NestorowaHSCData()

#--- gene-annotation ---#
library(AnnotationHub)
# Fetch AnnotationHub record AH73905 and use it to look up the SYMBOL and
# SEQNAME columns, treating the dataset's row names as GENEID keys.
ens.mm.v97 <- AnnotationHub()[["AH73905"]]
anno <- select(
    ens.mm.v97,
    keytype="GENEID",
    keys=rownames(sce.nest),
    columns=c("SYMBOL", "SEQNAME")
)
# match() puts the lookup result in the same order as the dataset's rows.
anno.order <- match(rownames(sce.nest), anno$GENEID)
rowData(sce.nest) <- anno[anno.order, ]

#--- quality-control ---#
library(scater)
# Per-cell QC metrics, with the "altexps_ERCC_percent" column passed as an
# additional percentage subset; cells flagged in qc$discard are removed.
stats <- perCellQCMetrics(sce.nest)
qc <- quickPerCellQC(stats, percent_subsets="altexps_ERCC_percent")
keep.cells <- !qc$discard
sce.nest <- sce.nest[, keep.cells]

#--- normalization ---#
library(scran)
# Seed is fixed immediately before quickCluster(); the resulting clusters are
# handed to computeSumFactors() before log-normalization.
set.seed(101000110)
clusters <- quickCluster(sce.nest)
sce.nest <- computeSumFactors(sce.nest, clusters=clusters)
sce.nest <- logNormCounts(sce.nest)

#--- variance-modelling ---#
# Note: the seed literal carries leading zeros (R reads it as 10101).
set.seed(00010101)
# Model per-gene variance against the "ERCC" spike-ins, then select the top
# genes with prop=0.1.
dec.nest <- modelGeneVarWithSpikes(sce.nest, "ERCC")
top.nest <- getTopHVGs(dec.nest, prop=0.1)
```

```r
#--- data-loading ---#
library(scRNAseq)
sce.grun.hsc <- GrunHSCData(ensembl=TRUE)

#--- gene-annotation ---#
library(AnnotationHub)
# Fetch AnnotationHub record AH73905 and use it to look up the SYMBOL and
# SEQNAME columns, treating the dataset's row names as GENEID keys.
ens.mm.v97 <- AnnotationHub()[["AH73905"]]
anno <- select(
    ens.mm.v97,
    keytype="GENEID",
    keys=rownames(sce.grun.hsc),
    columns=c("SYMBOL", "SEQNAME")
)
# match() puts the lookup result in the same order as the dataset's rows.
anno.order <- match(rownames(sce.grun.hsc), anno$GENEID)
rowData(sce.grun.hsc) <- anno[anno.order, ]

#--- quality-control ---#
library(scuttle)
stats <- perCellQCMetrics(sce.grun.hsc)
# QC is blocked on the protocol field; only cells whose protocol matches
# "sorted" are passed via `subset`.
from.sorted <- grepl("sorted", sce.grun.hsc$protocol)
qc <- quickPerCellQC(
    stats,
    batch=sce.grun.hsc$protocol,
    subset=from.sorted
)
# Remove every cell flagged in qc$discard.
keep.cells <- !qc$discard
sce.grun.hsc <- sce.grun.hsc[, keep.cells]
```

```r
#--- data-loading ---#
library(scRNAseq)
sce.paul <- PaulHSCData(ensembl=TRUE)

#--- gene-annotation ---#
library(AnnotationHub)
# Fetch AnnotationHub record AH73905 and use it to look up the SYMBOL and
# SEQNAME columns, treating the dataset's row names as GENEID keys.
ens.mm.v97 <- AnnotationHub()[["AH73905"]]
anno <- select(
    ens.mm.v97,
    keytype="GENEID",
    keys=rownames(sce.paul),
    columns=c("SYMBOL", "SEQNAME")
)
# match() puts the lookup result in the same order as the dataset's rows.
anno.order <- match(rownames(sce.paul), anno$GENEID)
rowData(sce.paul) <- anno[anno.order, ]

#--- quality-control ---#
library(scater)
stats <- perCellQCMetrics(sce.paul)
# First pass: QC blocked on Plate_ID, used only to read back the thresholds.
qc <- quickPerCellQC(stats, batch=sce.paul$Plate_ID)

# Detecting batches with unusually low threshold values.
lib.thresholds <- attr(qc$low_lib_size, "thresholds")["lower",]
nfeat.thresholds <- attr(qc$low_n_features, "thresholds")["lower",]
low.lib.batches <- names(lib.thresholds)[lib.thresholds < 100]
low.nfeat.batches <- names(nfeat.thresholds)[nfeat.thresholds < 100]
ignore <- union(low.lib.batches, low.nfeat.batches)

# Repeating the QC using only the "high-quality" batches.
in.good.batch <- !(sce.paul$Plate_ID %in% ignore)
qc2 <- quickPerCellQC(
    stats,
    batch=sce.paul$Plate_ID,
    subset=in.good.batch
)
# Filtering uses the second-pass result (qc2), not the first.
keep.cells <- !qc2$discard
sce.paul <- sce.paul[, keep.cells]
```

```
R version 4.4.0 RC (2024-04-16 r86468)
Platform: x86_64-pc-linux-gnu
Running under: Ubuntu 22.04.4 LTS

Matrix products: default
BLAS:   /home/biocbuild/bbs-3.20-bioc/R/lib/libRblas.so
LAPACK: /usr/lib/x86_64-linux-gnu/lapack/liblapack.so.3.10.0

locale:
 [1] LC_CTYPE=en_US.UTF-8       LC_NUMERIC=C
 [3] LC_TIME=en_GB              LC_COLLATE=C
 [5] LC_MONETARY=en_US.UTF-8    LC_MESSAGES=en_US.UTF-8
 [7] LC_PAPER=en_US.UTF-8       LC_NAME=C
 [9] LC_ADDRESS=C               LC_TELEPHONE=C
[11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C

time zone: America/New_York
tzcode source: system (glibc)

attached base packages:
[1] stats4    stats     graphics  grDevices utils     datasets  methods
[8] base

other attached packages:
 [1] TSCAN_1.41.1                TrajectoryUtils_1.11.1
 [3] scater_1.31.2               ggplot2_3.5.1
 [5] bluster_1.13.0              batchelor_1.19.1
 [7] scran_1.31.3                scuttle_1.13.1
 [9] SingleCellExperiment_1.25.1 SummarizedExperiment_1.33.3
[11] Biobase_2.63.1              GenomicRanges_1.55.4
[13] GenomeInfoDb_1.39.14        IRanges_2.37.1
[15] S4Vectors_0.41.7            BiocGenerics_0.49.1
[17] MatrixGenerics_1.15.1       matrixStats_1.3.0
[19] BiocStyle_2.31.0            rebook_1.13.0

loaded via a namespace (and not attached):
  [1] bitops_1.0-7              gridExtra_2.3
  [3] CodeDepends_0.6.6         rlang_1.1.3
  [5] magrittr_2.0.3            RcppAnnoy_0.0.22
  [7] compiler_4.4.0            mgcv_1.9-1
  [9] dir.expiry_1.11.0         DelayedMatrixStats_1.25.4
 [11] vctrs_0.6.5               combinat_0.0-8
 [13] pkgconfig_2.0.3           crayon_1.5.2
 [15] fastmap_1.1.1             XVector_0.43.1
 [17] labeling_0.4.3            caTools_1.18.2
 [19] utf8_1.2.4                promises_1.3.0
 [21] rmarkdown_2.26            graph_1.81.1
 [23] UCSC.utils_0.99.7         ggbeeswarm_0.7.2
 [25] xfun_0.43                 zlibbioc_1.49.3
 [27] cachem_1.0.8              beachmat_2.19.4
 [29] jsonlite_1.8.8            later_1.3.2
 [31] highr_0.10                DelayedArray_0.29.9
 [33] BiocParallel_1.37.1       irlba_2.3.5.1
 [35] parallel_4.4.0            cluster_2.1.6
 [37] R6_2.5.1                  bslib_0.7.0
 [39] limma_3.59.10             jquerylib_0.1.4
 [41] Rcpp_1.0.12               bookdown_0.39
 [43] knitr_1.46                httpuv_1.6.15
 [45] splines_4.4.0             Matrix_1.7-0
 [47] igraph_2.0.3              tidyselect_1.2.1
 [49] abind_1.4-5               yaml_2.3.8
 [51] viridis_0.6.5             gplots_3.1.3.1
 [53] codetools_0.2-20          plyr_1.8.9
 [55] lattice_0.22-6            tibble_3.2.1
 [57] shiny_1.8.1.1             withr_3.0.0
 [59] evaluate_0.23             mclust_6.1.1
 [61] pillar_1.9.0              BiocManager_1.30.22
 [63] filelock_1.0.3            KernSmooth_2.23-22
 [65] generics_0.1.3            fastICA_1.2-4
 [67] sparseMatrixStats_1.15.1  munsell_0.5.1
 [69] scales_1.3.0              xtable_1.8-4
 [71] gtools_3.9.5              glue_1.7.0
 [73] metapod_1.11.1            tools_4.4.0
 [75] BiocNeighbors_1.21.2      ScaledMatrix_1.11.1
 [77] locfit_1.5-9.9            XML_3.99-0.16.1
 [79] cowplot_1.1.3             grid_4.4.0
 [81] edgeR_4.1.33              colorspace_2.1-0
 [83] nlme_3.1-164              GenomeInfoDbData_1.2.12
 [85] beeswarm_0.4.0            BiocSingular_1.19.0
 [87] vipor_0.4.7               cli_3.6.2
 [89] rsvd_1.0.5                rappdirs_0.3.3
 [91] fansi_1.0.6               S4Arrays_1.3.7
 [93] viridisLite_0.4.2         dplyr_1.1.4
 [95] uwot_0.2.2                ResidualMatrix_1.13.0
 [97] gtable_0.3.5              sass_0.4.9
 [99] digest_0.6.35             SparseArray_1.3.7
[101] ggrepel_0.9.5             dqrng_0.3.2
[103] farver_2.1.1              htmltools_0.5.8.1
[105] lifecycle_1.0.4           httr_1.4.7
[107] mime_0.12                 statmod_1.5.0
```