These exercises are about manipulate single-cell data with Bioconductor packages. Please download the counting matrix from DropBox and loading them into a Seurat object. Or you may also used the rds file data/scSeq_CKO_sceSub.rds.
library(DropletUtils)
library(DropletTestFiles)
<- "~path to the 10X counting matrix"
fname <- read10xCounts(fname, col.names=TRUE)
sce saveRDS(sce,"path to rds file")
library(DropletUtils)
# library(DropletTestFiles)
<- readRDS("data/scSeq_CKO_sceSub.rds") sce
## Warning in xy.coords(x, y, xlabel, ylabel, log): 1 y value <= 0 omitted from
## logarithmic plot
## DataFrame with 400000 rows and 5 columns
## Total LogProb PValue Limited FDR
## <integer> <numeric> <numeric> <logical> <numeric>
## CCACGGAAGCTCTCGG-1 0 NA NA NA NA
## TGTGGTAAGAGTCGGT-1 2 -11.1237 0.7561244 FALSE NA
## CCCTCCTTCGTCTGCT-1 2 -18.2572 0.0727927 FALSE NA
## ACTGAGTGTGTCGCTG-1 0 NA NA NA NA
## CGTAGCGTCTCTGCTG-1 0 NA NA NA NA
## ... ... ... ... ... ...
## AGAGCTTGTCCGACGT-1 0 NA NA NA NA
## GCTGCGACAATAGCAA-1 0 NA NA NA NA
## CGAACATAGTGAAGTT-1 2 -12.3017 0.632437 FALSE NA
## TAGCCGGCATGTCGAT-1 0 NA NA NA NA
## CGAGAAGAGCAGATCG-1 0 NA NA NA NA
## Mode FALSE TRUE NA's
## logical 3051 3943 393006
## Limited
## Sig FALSE TRUE
## FALSE 3051 0
## TRUE 62 3881
## Warning in (function (x, sizes, min.mean = NULL, positive = FALSE, scaling =
## NULL) : encountered non-positive size factor estimates
## ENSMUSG00000051951 ENSMUSG00000025902 ENSMUSG00000033845 ENSMUSG00000025903
## 1.669575e-07 1.669575e-07 1.407972e-04 5.201547e-05
## ENSMUSG00000104217 ENSMUSG00000033813
## 1.669575e-07 6.783772e-05
## Min. 1st Qu. Median Mean 3rd Qu. Max.
## 0.0000 0.2445 0.6309 0.8732 1.2381 7.3498
##
## no yes
## 3744 199
## Warning: Removed 905 rows containing non-finite values (stat_density).