```r
# Setup for the Nestorowa HSC dataset: load the data, attach gene annotation,
# drop low-quality cells, normalize, and model per-gene variance.
# Objects left behind: sce.nest, dec.nest, top.nest (plus the intermediates
# anno, stats, qc and clusters).

#--- data-loading ---#
library(scRNAseq)
sce.nest <- NestorowaHSCData()

#--- gene-annotation ---#
library(AnnotationHub)
# AnnotationHub record AH73905 (presumably the Ensembl mouse v97 annotation,
# judging by the variable name -- confirm against the hub metadata).
ens.mm.v97 <- AnnotationHub()[["AH73905"]]
anno <- select(ens.mm.v97, keys=rownames(sce.nest),
    keytype="GENEID", columns=c("SYMBOL", "SEQNAME"))
# match() reorders the annotation so that row i describes gene i of sce.nest;
# row names with no GENEID hit get an all-NA annotation row.
rowData(sce.nest) <- anno[match(rownames(sce.nest), anno$GENEID),]

#--- quality-control ---#
library(scater)
stats <- perCellQCMetrics(sce.nest)
# The ERCC alternative-experiment percentage is included as an extra QC metric.
qc <- quickPerCellQC(stats, percent_subsets="altexps_ERCC_percent")
sce.nest <- sce.nest[,!qc$discard]

#--- normalization ---#
library(scran)
set.seed(101000110)
clusters <- quickCluster(sce.nest)
sce.nest <- computeSumFactors(sce.nest, clusters=clusters)
sce.nest <- logNormCounts(sce.nest)

#--- variance-modelling ---#
# Leading zeros are not significant: R reads this literal as 10101.
set.seed(00010101)
dec.nest <- modelGeneVarWithSpikes(sce.nest, "ERCC")
# Keep the top 10% of genes as highly variable genes.
top.nest <- getTopHVGs(dec.nest, prop=0.1)
```

```r
# Setup for the Grun HSC dataset: load the data (Ensembl row names), attach
# gene annotation, and drop low-quality cells.
# Objects left behind: sce.grun.hsc (plus the intermediates anno, stats, qc).

#--- data-loading ---#
library(scRNAseq)
sce.grun.hsc <- GrunHSCData(ensembl=TRUE)

#--- gene-annotation ---#
library(AnnotationHub)
# AnnotationHub record AH73905 (presumably the Ensembl mouse v97 annotation,
# judging by the variable name -- confirm against the hub metadata).
ens.mm.v97 <- AnnotationHub()[["AH73905"]]
anno <- select(ens.mm.v97, keys=rownames(sce.grun.hsc),
    keytype="GENEID", columns=c("SYMBOL", "SEQNAME"))
# match() reorders the annotation so that row i describes gene i of
# sce.grun.hsc; row names with no GENEID hit get an all-NA annotation row.
rowData(sce.grun.hsc) <- anno[match(rownames(sce.grun.hsc), anno$GENEID),]

#--- quality-control ---#
library(scuttle)
stats <- perCellQCMetrics(sce.grun.hsc)
# Outlier thresholds are computed per protocol (batch=), but are estimated
# only from cells whose protocol label contains "sorted" (subset=); the
# resulting thresholds are still applied to every cell.
qc <- quickPerCellQC(stats, batch=sce.grun.hsc$protocol,
    subset=grepl("sorted", sce.grun.hsc$protocol))
sce.grun.hsc <- sce.grun.hsc[,!qc$discard]
```

```r
# Setup for the Paul HSC dataset: load the data (Ensembl row names), attach
# gene annotation, and drop low-quality cells using a two-pass, per-plate QC.
# Objects left behind: sce.paul (plus the intermediates anno, stats, qc,
# lib.thresholds, nfeat.thresholds, ignore and qc2).

#--- data-loading ---#
library(scRNAseq)
sce.paul <- PaulHSCData(ensembl=TRUE)

#--- gene-annotation ---#
library(AnnotationHub)
# AnnotationHub record AH73905 (presumably the Ensembl mouse v97 annotation,
# judging by the variable name -- confirm against the hub metadata).
ens.mm.v97 <- AnnotationHub()[["AH73905"]]
anno <- select(ens.mm.v97, keys=rownames(sce.paul),
    keytype="GENEID", columns=c("SYMBOL", "SEQNAME"))
# match() reorders the annotation so that row i describes gene i of sce.paul;
# row names with no GENEID hit get an all-NA annotation row.
rowData(sce.paul) <- anno[match(rownames(sce.paul), anno$GENEID),]

#--- quality-control ---#
library(scater)
stats <- perCellQCMetrics(sce.paul)
# First pass: thresholds computed separately for each plate.
qc <- quickPerCellQC(stats, batch=sce.paul$Plate_ID)

# Detecting batches with unusually low threshold values.
# The "lower" row of each thresholds attribute holds one value per plate.
lib.thresholds <- attr(qc$low_lib_size, "thresholds")["lower",]
nfeat.thresholds <- attr(qc$low_n_features, "thresholds")["lower",]
# A plate is ignored if either of its lower thresholds falls below 100.
ignore <- union(names(lib.thresholds)[lib.thresholds < 100],
    names(nfeat.thresholds)[nfeat.thresholds < 100])

# Repeating the QC using only the "high-quality" batches.
# Only the second-pass result (qc2) is used to filter the cells.
qc2 <- quickPerCellQC(stats, batch=sce.paul$Plate_ID,
    subset=!sce.paul$Plate_ID %in% ignore)
sce.paul <- sce.paul[,!qc2$discard]
```

``` R version 4.1.0 (2021-05-18) Platform: x86_64-pc-linux-gnu (64-bit) Running under: Ubuntu 20.04.2 LTS Matrix products: default BLAS: /home/biocbuild/bbs-3.13-bioc/R/lib/libRblas.so LAPACK: /home/biocbuild/bbs-3.13-bioc/R/lib/libRlapack.so locale: [1] LC_CTYPE=en_US.UTF-8 LC_NUMERIC=C [3] LC_TIME=en_US.UTF-8 LC_COLLATE=C [5] LC_MONETARY=en_US.UTF-8 LC_MESSAGES=en_US.UTF-8 [7] LC_PAPER=en_US.UTF-8 LC_NAME=C [9] LC_ADDRESS=C LC_TELEPHONE=C [11] LC_MEASUREMENT=en_US.UTF-8 LC_IDENTIFICATION=C attached base packages: [1] parallel stats4 stats graphics grDevices utils datasets [8] methods base other attached packages: [1] TSCAN_1.30.0 TrajectoryUtils_1.0.0 [3] scater_1.20.0 ggplot2_3.3.3 [5] bluster_1.2.0 batchelor_1.8.0 [7] scran_1.20.0 scuttle_1.2.0 [9] SingleCellExperiment_1.14.0 SummarizedExperiment_1.22.0 [11] Biobase_2.52.0 GenomicRanges_1.44.0 [13] GenomeInfoDb_1.28.0 IRanges_2.26.0 [15] S4Vectors_0.30.0 BiocGenerics_0.38.0 [17] MatrixGenerics_1.4.0 matrixStats_0.58.0 [19] BiocStyle_2.20.0 rebook_1.2.0 loaded via a namespace (and not attached): [1] ggbeeswarm_0.6.0 colorspace_2.0-1 [3] ellipsis_0.3.2 mclust_5.4.7 [5] XVector_0.32.0 BiocNeighbors_1.10.0 [7] farver_2.1.0 fansi_0.4.2 [9] splines_4.1.0 codetools_0.2-18 [11] sparseMatrixStats_1.4.0 knitr_1.33 [13] jsonlite_1.7.2 ResidualMatrix_1.2.0 [15] cluster_2.1.2 graph_1.70.0 [17] uwot_0.1.10 shiny_1.6.0 [19] BiocManager_1.30.15 compiler_4.1.0 [21] dqrng_0.3.0 fastmap_1.1.0 [23] assertthat_0.2.1 Matrix_1.3-3 [25] limma_3.48.0 later_1.2.0 [27] BiocSingular_1.8.0 htmltools_0.5.1.1 [29] tools_4.1.0 rsvd_1.0.5 [31] igraph_1.2.6 gtable_0.3.0 [33] glue_1.4.2 GenomeInfoDbData_1.2.6 [35] dplyr_1.0.6 rappdirs_0.3.3 [37] Rcpp_1.0.6 jquerylib_0.1.4 [39] vctrs_0.3.8 nlme_3.1-152 [41] DelayedMatrixStats_1.14.0 xfun_0.23 [43] stringr_1.4.0 beachmat_2.8.0 [45] mime_0.10 lifecycle_1.0.0 [47] irlba_2.3.3 gtools_3.8.2 [49] statmod_1.4.36 XML_3.99-0.6 [51] edgeR_3.34.0 zlibbioc_1.38.0 [53] scales_1.1.1 promises_1.2.0.1 [55] 
yaml_2.2.1 gridExtra_2.3 [57] sass_0.4.0 fastICA_1.2-2 [59] stringi_1.6.2 highr_0.9 [61] ScaledMatrix_1.0.0 caTools_1.18.2 [63] filelock_1.0.2 BiocParallel_1.26.0 [65] rlang_0.4.11 pkgconfig_2.0.3 [67] bitops_1.0-7 evaluate_0.14 [69] lattice_0.20-44 purrr_0.3.4 [71] CodeDepends_0.6.5 labeling_0.4.2 [73] cowplot_1.1.1 tidyselect_1.1.1 [75] RcppAnnoy_0.0.18 plyr_1.8.6 [77] magrittr_2.0.1 bookdown_0.22 [79] R6_2.5.0 gplots_3.1.1 [81] generics_0.1.0 metapod_1.0.0 [83] combinat_0.0-8 DelayedArray_0.18.0 [85] DBI_1.1.1 mgcv_1.8-35 [87] pillar_1.6.1 withr_2.4.2 [89] RCurl_1.98-1.3 tibble_3.1.2 [91] dir.expiry_1.0.0 crayon_1.4.1 [93] KernSmooth_2.23-20 utf8_1.2.1 [95] rmarkdown_2.8 viridis_0.6.1 [97] locfit_1.5-9.4 grid_4.1.0 [99] digest_0.6.27 xtable_1.8-4 [101] httpuv_1.6.1 munsell_0.5.0 [103] beeswarm_0.3.1 viridisLite_0.4.0 [105] vipor_0.4.5 bslib_0.2.5.1 ```