-
Notifications
You must be signed in to change notification settings - Fork 2
/
10X Datasets UMI per marker.Rmd
123 lines (92 loc) · 3.62 KB
/
10X Datasets UMI per marker.Rmd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
---
title: "CITE-seq optimization - 10X datasets: UMI per marker plot"
author: "Terkild Brink Buus"
date: "30/3/2020"
output: github_document
---
```{r setup, include=FALSE}
knitr::opts_chunk$set(warning=FALSE, message=FALSE)
options(stringsAsFactors=FALSE)
```
## Load utilities
Including libraries, plotting and color settings and custom utility functions
```{r loadLibraries, results='hide', message=FALSE, warning=FALSE}
set.seed(114)
require("tidyverse", quietly=T)
library("Matrix", quietly=T)
## Load ggplot theme and defaults
source("R/ggplot_settings.R")
## Load helper functions
source("R/Utilities.R")
outdir <- "figures"
data.10X <- "data/data.10X.datasets.Rdata"
```
## Load data
10X datasets were preprocessed in the [Load unfiltered data vignette](Load-unfiltered-data.md)
```{r}
load(file=data.10X)
```
## Draw UMI per marker
These three 10X dataset used the same panel of antibodies at three conditions, 3' V3 chemistry at ~1,000 and ~10,000 cells or 5' at 10,000 cells using TotalSeqB or TotalSeqC antibodies, respectively.
```{r, fig.height=3, fig.width=7}
## Extract data from list into a combined data.frame
for(i in seq_along(data.10X.datasets)){
dataset <- data.10X.datasets[i]
kallisto <- data.10X.datasets.adt.kallisto[[dataset]]
cells <- intersect(data.10X.datasets.gex.aboveInf[[dataset]],colnames(kallisto))
total <- Matrix::rowSums(kallisto)
Cell <- Matrix::rowSums(kallisto[,cells])
EmptyDrop <- total-Cell
add <- data.frame(Dataset=dataset,Marker=names(Cell),Cell,EmptyDrop)
if(i == 1){
plotData <- add
} else {
plotData <- rbind(plotData,add)
}
}
## Convert data into "long format" for plotting with ggplot
plotData <- plotData %>% pivot_longer(c(-Marker, -Dataset))
## Rename isotype controls to get shorter names
plotData$Marker <- gsub("isotype_control_","",plotData$Marker)
plotData$subset <- factor(as.character(plotData$name), levels=c("EmptyDrop","Cell"))
plotData$Dataset <- factor(as.character(plotData$Dataset), levels=data.10X.datasets)
## Make plot
data.10X.markerBarplot <- ggplot(plotData, aes(x=Marker, y=value/10^6, fill=subset)) +
geom_bar(stat="identity", position="dodge", color="black", width=0.65) +
scale_y_continuous(expand=c(0,0,0.05,0)) +
scale_fill_manual(values=c("lightgrey","black")) +
labs(y=bquote("ADT UMI counts ("~10^6~")")) +
coord_flip() +
facet_wrap(~Dataset, nrow=1, scales="free_x") +
theme(axis.title.y=element_blank(),
legend.position=c(1,0.98),
legend.justification=c(1,1),
legend.title=element_blank(),
legend.background=element_blank())
```
## Final figure
```{r, fig.height=5, fig.width=7}
## Include knee_plots from preprocessing in the figure
data.10X.GEXrank <- cowplot::plot_grid(plotlist=data.10X.datasets.knee_plots,
labels=data.10X.datasets,
hjust=-0.65,
vjust=1.6,
label_size=7,
nrow=1)
p.figure <- cowplot::plot_grid(data.10X.GEXrank, data.10X.markerBarplot,
labels=c("A", "B"),
ncol=1,
rel_heights=c(2,3),
label_size=panel.label_size,
vjust=panel.label_vjust,
hjust=panel.label_hjust)
png(file=file.path(outdir,"Supplementary Figure S6.png"),
width=figure.width.full,
height=5,
units = figure.unit,
res=figure.resolution,
antialias=figure.antialias)
p.figure
dev.off()
p.figure
```