forked from nbbarrientos/LeafCutter
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathplot_leafcutter_effect.R
48 lines (35 loc) · 1.96 KB
/
plot_leafcutter_effect.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
library(data.table)
library(dplyr)
library(stringr)
library(ggplot2)
library(ggrepel)
cluster_sig = fread("PATH_TO_FILE/_cluster_significance.txt")
cluster_sig = cluster_sig[cluster_sig$status == "Success",]
effect = fread("PATH_TO_FILE/_effect_sizes.txt")
temp1 = str_split_fixed(effect$intron, ":", 4)
effect$cluster = paste0(temp1[,1],":",temp1[,4])
df1 = inner_join(effect, cluster_sig, by = c("cluster" = "cluster"))
df1$abs_deltapsi = abs(df1$Condition2 - df1$Condition1) #Conditions based on how the DS analysis was run with LeafCutter
df2 = group_by(df1, cluster) %>% summarise(max_deltapsi=max(abs_deltapsi))
df1$cluster_psi = paste0(df1$cluster,":",df1$abs_deltapsi)
df2$cluster_psi = paste0(df2$cluster,":",df2$max_deltapsi)
df3 = inner_join(df1, df2, by = c("cluster_psi"="cluster_psi"))
df3 = df3[!duplicated(df3$cluster.x),]
pval_threshold = 1e-6 #Calculate cluster-level significance
#Sets boolean variable to know which clusters are above significant thresholds for pvalue and deltapsi in volcano plot
df3$significant = ifelse(df3$p.adjust > pval_threshold, NA,
ifelse(df3$deltapsi < 0, "Significant_b0",
ifelse(df3$deltapsi > 0, "Significant_a0", NA)))
df3$genes = ifelse(is.na(df3$genes), df3$intron, df3$genes)
ggplot(df3, aes(x=deltapsi, y=-log10(p.adjust), color=significant)) +
geom_point(size = 1) +
scale_color_manual(values = c("orangered", "skyblue2"), na.value="gray89") +
geom_vline(xintercept = 0, color="black", size=0.5, linetype=2) +
geom_hline(yintercept = -log10(pval_threshold), color="black", size=0.5, linetype=2) +
geom_label_repel(data = subset(df3, df3$significant == "Significant_b0" | df3$significant == "Significant_a0"), aes(label=genes), size=3, col="black") +
xlab(expression(Delta*"PSI")) +
ylab(bquote(~-Log[10]~ 'Adjusted P-value')) +
ggtitle("You forgot to title the plot lol") +
theme_bw() +
theme(legend.position = "none",
plot.title = element_text(hjust = 0.5))