3. Covid19 data QC¶
library(tictoc)
tic()
load(file = 'nCoV.list.rda')
toc()
112.838 sec elapsed
library(Seurat)
library(dplyr)
library(ggpubr)
o<-function(w,h) options(repr.plot.width=w, repr.plot.height=h)
sample 1¶
i=1
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/e81e5/e81e5a0a94bc7a43a72c2c87e6968bdc12ddd6a9" alt="output_3_1.png"
data:image/s3,"s3://crabby-images/1ab96/1ab96b1d038dc64d1a291a3a815a6697a865dc1b" alt="output_3_2.png"
data:image/s3,"s3://crabby-images/236fb/236fb9a1d6aa3e1cd5106c844d0b131590b63919" alt="output_3_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 5)
sample 2¶
i=2
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
data:image/s3,"s3://crabby-images/49728/49728ac8fd7521401d9ed28ff4052972d8d6831a" alt="output_7_0.png"
data:image/s3,"s3://crabby-images/c0d28/c0d280ab9154ccbe996ea8d3cc9bd2bfa57637bd" alt="output_7_1.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.mt < 5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 5)
sample 3¶
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.mt < 5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 5)
i=3
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/72cec/72cec6803d7fbccda2d9a688e70586bb8764ba0b" alt="output_11_1.png"
data:image/s3,"s3://crabby-images/928a0/928a00226bad2d0db2e2313c99a05e6e7408d19e" alt="output_11_2.png"
data:image/s3,"s3://crabby-images/002de/002de09178b4fa35a2a294875da3241a80157dfe" alt="output_11_3.png"
sample 4 (low quality)¶
i=4
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/5cc43/5cc438a62de486c36cc9c88759b35b3ac320de1e" alt="output_13_1.png"
Warning message in FeaturePlot(nCoV.list[[i]], features = c("PTPRC", "COL1A1", "EPCAM", :
“All cells have the same value (0) of COL1A1.”
data:image/s3,"s3://crabby-images/2fed1/2fed1e059ea9280da483114d695b234af4342d3c" alt="output_13_3.png"
data:image/s3,"s3://crabby-images/79e8d/79e8db1250e197f3559d92fd9a12f5f17bba027f" alt="output_13_4.png"
sample 5¶
i=5
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/9deb8/9deb81f707085a59ad01ac230b7bbca1bc170489" alt="output_15_1.png"
data:image/s3,"s3://crabby-images/8a620/8a6203d27b937dc6af7f9223bb0e5879b7bbce5d" alt="output_15_2.png"
data:image/s3,"s3://crabby-images/b6729/b6729020cc13c0d6fbe0d9cd0c8c6ccdfda17933" alt="output_15_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nFeature_RNA < 3500)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nCount_RNA < 20000)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.75)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 7.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , RNA_snn_res.1.2 != 15)
sample 6¶
i=6
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/4f803/4f803abd9dc88f50c07068d7c54e40f0d6d025d1" alt="output_18_1.png"
data:image/s3,"s3://crabby-images/7a848/7a848b9fef197cfe509d98cd336dec94a7d60f49" alt="output_18_2.png"
data:image/s3,"s3://crabby-images/f2ab4/f2ab48f471d7e71978f2e0c0746047c17fc2d2a3" alt="output_18_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nFeature_RNA < 4000)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nCount_RNA < 30000)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , RNA_snn_res.1.2 != 11)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , RNA_snn_res.1.2 != 12)
sample 7¶
i=7
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/77f29/77f290991b1b75bdef184c01c5a03d627bff5f25" alt="output_21_1.png"
data:image/s3,"s3://crabby-images/646bc/646bc8b72019c37aaa477d8d91fb4cc97e6af00f" alt="output_21_2.png"
data:image/s3,"s3://crabby-images/0456c/0456ce60aa11e2becc13224f93dd5e849622d99a" alt="output_21_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso<10)
sample 8¶
i=8
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/c20be/c20befc2ba0ae61431e0c4c96626b6626a884b4b" alt="output_24_1.png"
data:image/s3,"s3://crabby-images/8f7f9/8f7f9bab5046c1b98bca15daa487a6c9b21c31f9" alt="output_24_2.png"
data:image/s3,"s3://crabby-images/0f1fc/0f1fc48c34412201607b92c71ce127d7d551375b" alt="output_24_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 10)
sample 9¶
i=9
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/23fa7/23fa7416965e9b2e8f3169137f9e9325899ac183" alt="output_27_1.png"
data:image/s3,"s3://crabby-images/29bad/29bada69fa04744146bf683fe62a97d52cffdb91" alt="output_27_2.png"
data:image/s3,"s3://crabby-images/e86a3/e86a357a80698b6f78c7c6067bd05740ef724d18" alt="output_27_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 5 )
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nFeature_RNA >500 )
sample 10 (low quality)¶
i=10
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/00a7a/00a7a6faa97cd2d00871a0be591d19e2a9ae58ce" alt="output_30_1.png"
Warning message in FeaturePlot(nCoV.list[[i]], features = c("PTPRC", "COL1A1", "EPCAM", :
“All cells have the same value (0) of COL1A1.”
data:image/s3,"s3://crabby-images/916d3/916d399fd3f3403c3594ade5823474bf474aa5de" alt="output_30_3.png"
data:image/s3,"s3://crabby-images/8ebd9/8ebd9b23936a198a8d604cb6b2b9ed8cd54349df" alt="output_30_4.png"
sample 11 (low quality)¶
i=11
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/76fb0/76fb0e2a14de8bed92b9a2b13d2dd2cfeb815e4f" alt="output_32_1.png"
Warning message in FeaturePlot(nCoV.list[[i]], features = c("PTPRC", "COL1A1", "EPCAM", :
“All cells have the same value (0) of COL1A1.”
Warning message in FeaturePlot(nCoV.list[[i]], features = c("PTPRC", "COL1A1", "EPCAM", :
“All cells have the same value (0) of CD79A.”
data:image/s3,"s3://crabby-images/6af74/6af7466782c722f871be51232411104f35de73b9" alt="output_32_3.png"
data:image/s3,"s3://crabby-images/50a9e/50a9e95bbba674f3c0a01a4a361747c4dd0ff177" alt="output_32_4.png"
sample 12¶
i=12
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/a2403/a2403ba5863e4b6572bc05d3419924a4ca657f1a" alt="output_34_1.png"
data:image/s3,"s3://crabby-images/06b48/06b480ffcc0ce37c541d2952091e16e22b3f9414" alt="output_34_2.png"
data:image/s3,"s3://crabby-images/31896/318962efffe856ea90f592d7652c9e3047530218" alt="output_34_3.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nFeature_RNA < 5000)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , nCount_RNA < 40000)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 5)
sample 13¶
i=13
o(20,20)
ggarrange(
DimPlot(nCoV.list[[i]], label=T,repel=T, group.by="RNA_snn_res.1.2")&NoLegend()&
theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'hybrid_score')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.mt')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
FeaturePlot(nCoV.list[[i]], features = 'percent.disso')&
theme(legend.position=c(0.8,0.8),
axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
),
ncol=2,nrow=2
)
o(20,15)
ggarrange(
VlnPlot(nCoV.list[[i]], features = 'hybrid_score')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'nCount_RNA')&NoLegend()&scale_y_continuous(breaks=c(20000,40000,50000,60000,70000,80000)),
VlnPlot(nCoV.list[[i]], features = 'nFeature_RNA')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.mt')&NoLegend(),
VlnPlot(nCoV.list[[i]], features = 'percent.disso')&NoLegend(),
ncol=2, nrow=3
)
o(5*5, 5*3)
FeaturePlot(nCoV.list[[i]],
features = c("PTPRC","COL1A1","EPCAM","PECAM1","CD3D",
'ITGAM','ITGAX',"CD68",'S100A9',"FCGR3B",
'CD79A','CD4','CD8A','IL7R','CCR7',
"CD44","IL2RA",'ITGAE','SELL','CD69'),
ncol=5
)&theme(axis.line = element_blank(),
axis.title = element_blank(),
axis.text = element_blank(),
axis.ticks=element_blank()
)
Scale for 'y' is already present. Adding another scale for 'y', which will
replace the existing scale.
data:image/s3,"s3://crabby-images/fcf10/fcf10a5ca5881fe08522fa0b38abb1b9d0a8f526" alt="output_37_1.png"
Warning message in FeaturePlot(nCoV.list[[i]], features = c("PTPRC", "COL1A1", "EPCAM", :
“All cells have the same value (0) of FCGR3B.”
data:image/s3,"s3://crabby-images/88a04/88a045babd8b30df1f94d7be131074f5edefdf73" alt="output_37_3.png"
data:image/s3,"s3://crabby-images/5e25c/5e25c8f7f099e3ae72eb07d77b6ad91e6039ea7f" alt="output_37_4.png"
nCoV.list[[i]] <- subset(nCoV.list[[i]] , hybrid_score < 1.5)
nCoV.list[[i]] <- subset(nCoV.list[[i]] , percent.disso < 5)
reclustering¶
library(scds)
dissociation.genes.hs<-c("ACTG1","ANKRD1","ARID5A","ATF3","ATF4","BAG3","BHLHE40","CCNL1","CCRN4L",
"CEBPB","CEBPD","CEBPG","CSRNP1","CXCL1","CYR61","DCN","DDX3XX","DDX5","DES","DNAJA1","DNAJB1",
"DNAJB4","DUSP1","DUSP8","EGR1","EGR2","EIF1","EIF5","ERF","ERRFI1","FAM132B","FOS","FOSB","FOSL2",
"GADD45A","GADD45G","BRD2","BTG1","BTG2","GCC1","GEM","H3F3B","HIPK3","HSP90AA1","HSP90AB1",
"HSPA1A","HSPA1B","HSPA5","HSPA8","HSPB1","HSPE1","HSPH1","ID3","IDI1","IER2","IER3","IER5",
"IFRD1","IL6","IRF1","IRF8","ITPKC","JUN","JUNB","JUND","KCNE4","KLF2","KLF4","KLF6","KLF9",
"LITAF","LMNA","MAFF","MAFK","MCL1","MIDN","MIR22HG","MT1","MT2","MYADM","MYC","MYD88","NCKAP5L",
"NCOA7","NFKBIA","NFKBIZ","NOP58","NPPC","NR4A1","ODC1","OSGIN1","OXNAD1","PCF11","PDE4B","PER1",
"PHLDA1","PNP","PNRC1","PPP1CC","PPP1R15A","PXDC1","RAP1B","RASSF1","RHOB","RHOH","RIPK1","SAT1X",
"SBNO2","SDC4","SERPINE1","SKIL","SLC10A6","SLC38A2","SLC41A1","SOCS3","SQSTM1","SRF","SRSF5",
"SRSF7","STAT3","TAGLN2","TIPARP","TNFAIP3","TNFAIP6","TPM3","TPPP3","TRA2A","TRA2B","TRIB1",
"TUBB4B","TUBB6","UBC","USP2","WAC","ZC3H12A","ZFAND5","ZFP36","ZFP36L1","ZFP36L2","ZYX")
# normalize and identify variable features for each dataset independently
nCoV.list <- lapply(X = nCoV.list, FUN = function(x) {
DefaultAssay(x)<-'RNA'
x <- NormalizeData(x, verbose = F)
x <- FindVariableFeatures(x, selection.method = "vst", nfeatures = 2000, verbose = F)
x <- ScaleData(x, features = rownames(x), verbose = F)
x <- RunPCA(object = x, features = VariableFeatures(x), npcs = 50, verbose = F)
x <- FindNeighbors(x, reduction = "pca", dims = 1:30, verbose = F)
x <- RunUMAP(object=x,reduction = "pca", dims = 1:30, verbose = F)
x <- FindClusters(object=x, resolution = c(0.7,0.9,1.2),verbose = F)
(x %>%
as.SingleCellExperiment %>%
cxds_bcds_hybrid)@colData[,c('cxds_score','bcds_score','hybrid_score')
] %>% as.data.frame -> scds.doublet.profiles
meta <- merge(x@meta.data, scds.doublet.profiles, by.x=0, by.y=0)
rownames(meta) <- meta$Row.names
meta$Row.names <- NULL
x@meta.data <- meta
gset <- dissociation.genes.hs
gset <- gset[gset %in% rownames(x)]
x[["percent.disso"]]<-PercentageFeatureSet(x, features = gset)
x
})
library(tictoc)
tic()
save(nCoV.list,
file = 'nCoV.list.qc.rda',
compress = T, compression_level = 9)
toc()
2695.756 sec elapsed