xxx object slots

  1. expression counts

  2. ground truth up genes

  3. ground truth down genes

  4. ground truth up gene sets

  5. ground truth down gene sets

  6. DE result (DESeq2)

  7. DE genes up observed

  8. DE genes down observed

  9. clusterProfiler default up gene sets

  10. clusterProfiler default down gene sets

  11. clusterProfiler BG fix up gene sets

  12. clusterProfiler BG fix down gene sets

  13. clusterProfiler FDR fix up gene sets

  14. clusterProfiler FDR fix down gene sets

  15. clusterProfiler BG and FDR fix up gene sets

  16. clusterProfiler BG and FDR fix down gene sets

  17. fora up gene sets

  18. fora down gene sets

  19. fgsea up gene sets

  20. fgsea down gene sets

Get count data

# Call countData() (defined outside this section) and keep the result as `a`;
# `a` is later passed to randomGeneSets() and agg_dge().
a <- countData()

Generate gene sets

# Build the gene-set collection from `a` with randomGeneSets(), requesting
# nsets = 200 and setsize = 30; the result is passed to agg_dge() later on.
gsets <- randomGeneSets(
  a,
  setsize = 30,
  nsets = 200
)

Run simulations over a range of parameters.

# run 1000 sims per parameter combination (see the SIMS column of the results)

# Name the six columns of the parameter grid; the simulation loop below refers
# to these parameters by the same names.
colnames(mygrid) <- c(
  "FRAC_DE", "FC", "N_REPS",
  "DGE_FUNC", "SUM_COUNT", "VARIANCE"
)

## 1    0.05 0.5      3   deseq2     2e+07      0.0
## 2    0.05 0.5      3   deseq2     2e+07      0.1
## 3    0.05 0.5      3   deseq2     2e+07      0.2
## 4    0.05 0.5      3   deseq2     2e+07      0.3
## 5    0.05 0.5      3   deseq2     2e+07      0.4
## 6    0.05 0.5      3   deseq2     2e+07      0.5
## 7    0.05 0.5      3   deseq2     2e+07      0.6

Now run the analysis.

# NOTE(review): this chunk did not parse as found (unbalanced parentheses, an
# unclosed function body and a dangling `res <-,res)`). It has been
# reconstructed from the surviving fragments; confirm against the original
# analysis script before relying on it.
res <- lapply(seq_len(nrow(mygrid)), function(i) {
  # Simulation parameters for this run are taken from row i of the grid.
  FRAC_DE <- mygrid[i, "FRAC_DE"]
  FC <- mygrid[i, "FC"]
  N_REPS <- mygrid[i, "N_REPS"]
  # as.character() guards against the column being stored as a factor.
  DGE_FUNC <- as.character(mygrid[i, "DGE_FUNC"])
  SUM_COUNT <- mygrid[i, "SUM_COUNT"]
  VARIANCE <- mygrid[i, "VARIANCE"]

  # SIMS is not a grid column, so it must already be defined earlier in the
  # script (the results table reports SIMS = 1000).
  x <- agg_dge(
    a, N_REPS, SUM_COUNT, VARIANCE, FRAC_DE, FC, SIMS, DGE_FUNC, gsets,
    cores = 32
  )

  # NOTE(review): the surviving `, x))` residue is consistent with
  # `as.data.frame(do.call(rbind, x))`; verify how agg_dge() shapes its result.
  as.data.frame(do.call(rbind, x))
})

# Stack the per-parameter-row results into a single table.
res <- do.call(rbind, res)


Now show the results.

# Render the combined simulation results as a kableExtra table.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
res %>%
  kbl(caption = "simulation_results") %>%
  kable_paper("hover", full_width = FALSE)
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
3 2e+07 0.0 0.05 0.5 1000 deseq2 9.922 0.280 18377.92 0.078 0.9725544 0.9922 0.9822790 clusterProfiler default
3 2e+07 0.0 0.05 0.5 1000 deseq2 9.949 0.496 18377.71 0.051 0.9525132 0.9949 0.9732453 clusterProfiler BG fix
3 2e+07 0.0 0.05 0.5 1000 deseq2 9.784 0.013 18378.19 0.216 0.9986731 0.9784 0.9884326 clusterProfiler FDR fix
3 2e+07 0.0 0.05 0.5 1000 deseq2 9.912 0.352 18377.85 0.088 0.9657054 0.9912 0.9782866 clusterProfiler BG and FDR fix
3 2e+07 0.0 0.05 0.5 1000 deseq2 9.912 0.352 18377.85 0.088 0.9657054 0.9912 0.9782866 fora
3 2e+07 0.0 0.05 0.5 1000 deseq2 9.981 0.700 18377.50 0.019 0.9344631 0.9981 0.9652338 fgsea
3 2e+07 0.1 0.05 0.5 1000 deseq2 9.783 0.279 18371.67 0.217 0.9722719 0.9783 0.9752766 clusterProfiler default
3 2e+07 0.1 0.05 0.5 1000 deseq2 9.832 0.453 18371.50 0.168 0.9559553 0.9832 0.9693862 clusterProfiler BG fix
3 2e+07 0.1 0.05 0.5 1000 deseq2 9.442 0.024 18371.93 0.558 0.9974646 0.9442 0.9701017 clusterProfiler FDR fix
3 2e+07 0.1 0.05 0.5 1000 deseq2 9.739 0.296 18371.66 0.261 0.9705032 0.9739 0.9721987 clusterProfiler BG and FDR fix
3 2e+07 0.1 0.05 0.5 1000 deseq2 9.739 0.296 18371.66 0.261 0.9705032 0.9739 0.9721987 fora
3 2e+07 0.1 0.05 0.5 1000 deseq2 9.981 0.557 18371.40 0.019 0.9471437 0.9981 0.9719544 fgsea
3 2e+07 0.2 0.05 0.5 1000 deseq2 8.642 0.395 18349.43 1.358 0.9562908 0.8642 0.9079162 clusterProfiler default
3 2e+07 0.2 0.05 0.5 1000 deseq2 8.812 0.485 18349.34 1.188 0.9478326 0.8812 0.9133026 clusterProfiler BG fix
3 2e+07 0.2 0.05 0.5 1000 deseq2 7.353 0.027 18349.80 2.647 0.9963415 0.7353 0.8461450 clusterProfiler FDR fix
3 2e+07 0.2 0.05 0.5 1000 deseq2 8.089 0.259 18349.56 1.911 0.9689746 0.8089 0.8817310 clusterProfiler BG and FDR fix
3 2e+07 0.2 0.05 0.5 1000 deseq2 8.089 0.259 18349.56 1.911 0.9689746 0.8089 0.8817310 fora
3 2e+07 0.2 0.05 0.5 1000 deseq2 9.858 0.531 18349.29 0.142 0.9488882 0.9858 0.9669920 fgsea
3 2e+07 0.3 0.05 0.5 1000 deseq2 5.263 0.349 18312.24 4.737 0.9378118 0.5263 0.6742250 clusterProfiler default
3 2e+07 0.3 0.05 0.5 1000 deseq2 5.656 0.429 18312.16 4.344 0.9294988 0.5656 0.7032639 clusterProfiler BG fix
3 2e+07 0.3 0.05 0.5 1000 deseq2 3.367 0.026 18312.57 6.633 0.9923372 0.3367 0.5028000 clusterProfiler FDR fix
3 2e+07 0.3 0.05 0.5 1000 deseq2 3.685 0.087 18312.51 6.315 0.9769353 0.3685 0.5351438 clusterProfiler BG and FDR fix
3 2e+07 0.3 0.05 0.5 1000 deseq2 3.685 0.087 18312.51 6.315 0.9769353 0.3685 0.5351438 fora
3 2e+07 0.3 0.05 0.5 1000 deseq2 9.169 0.575 18312.02 0.831 0.9409893 0.9169 0.9287885 fgsea
3 2e+07 0.4 0.05 0.5 1000 deseq2 2.146 0.276 18258.59 7.854 0.8860446 0.2146 0.3455160 clusterProfiler default
3 2e+07 0.4 0.05 0.5 1000 deseq2 2.560 0.387 18258.47 7.440 0.8686800 0.2560 0.3954584 clusterProfiler BG fix
3 2e+07 0.4 0.05 0.5 1000 deseq2 1.032 0.017 18258.85 8.968 0.9837941 0.1032 0.1868042 clusterProfiler FDR fix
3 2e+07 0.4 0.05 0.5 1000 deseq2 1.100 0.025 18258.84 8.900 0.9777778 0.1100 0.1977528 clusterProfiler BG and FDR fix
3 2e+07 0.4 0.05 0.5 1000 deseq2 1.100 0.025 18258.84 8.900 0.9777778 0.1100 0.1977528 fora
3 2e+07 0.4 0.05 0.5 1000 deseq2 7.162 0.421 18258.44 2.838 0.9444811 0.7162 0.8146505 fgsea
3 2e+07 0.5 0.05 0.5 1000 deseq2 0.624 0.256 18198.76 9.376 0.7090909 0.0624 0.1147059 clusterProfiler default
3 2e+07 0.5 0.05 0.5 1000 deseq2 0.758 0.347 18198.67 9.242 0.6859729 0.0758 0.1365151 clusterProfiler BG fix
3 2e+07 0.5 0.05 0.5 1000 deseq2 0.231 0.015 18199.00 9.769 0.9390244 0.0231 0.0450908 clusterProfiler FDR fix
3 2e+07 0.5 0.05 0.5 1000 deseq2 0.242 0.018 18199.00 9.758 0.9307692 0.0242 0.0471735 clusterProfiler BG and FDR fix
3 2e+07 0.5 0.05 0.5 1000 deseq2 0.242 0.018 18199.00 9.758 0.9307692 0.0242 0.0471735 fora
3 2e+07 0.5 0.05 0.5 1000 deseq2 4.391 0.281 18198.73 5.609 0.9398545 0.4391 0.5985551 fgsea
3 2e+07 0.6 0.05 0.5 1000 deseq2 0.316 0.255 18105.75 9.684 0.5534151 0.0316 0.0597862 clusterProfiler default
3 2e+07 0.6 0.05 0.5 1000 deseq2 0.369 0.323 18105.68 9.631 0.5332370 0.0369 0.0690236 clusterProfiler BG fix
3 2e+07 0.6 0.05 0.5 1000 deseq2 0.104 0.031 18105.97 9.896 0.7703704 0.0104 0.0205229 clusterProfiler FDR fix
3 2e+07 0.6 0.05 0.5 1000 deseq2 0.105 0.032 18105.97 9.895 0.7664234 0.0105 0.0207162 clusterProfiler BG and FDR fix
3 2e+07 0.6 0.05 0.5 1000 deseq2 0.105 0.032 18105.97 9.895 0.7664234 0.0105 0.0207162 fora
3 2e+07 0.6 0.05 0.5 1000 deseq2 2.145 0.180 18105.82 7.855 0.9225806 0.2145 0.3480730 fgsea



# Split the combined results into one data frame per enrichment method, keyed
# on the PWAY_FUNC label. which() skips rows whose comparison is NA, so the
# selected rows (and their row names) are the same ones subset() would return.
cp <- res[which(res$PWAY_FUNC == "clusterProfiler default"), , drop = FALSE]
cpbg <- res[which(res$PWAY_FUNC == "clusterProfiler BG fix"), , drop = FALSE]
cpfdr <- res[which(res$PWAY_FUNC == "clusterProfiler FDR fix"), , drop = FALSE]
cpbgfdr <- res[
  which(res$PWAY_FUNC == "clusterProfiler BG and FDR fix"), ,
  drop = FALSE
]
fo <- res[which(res$PWAY_FUNC == "fora"), , drop = FALSE]
fg <- res[which(res$PWAY_FUNC == "fgsea"), , drop = FALSE]

# Table of the clusterProfiler default rows.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
cp %>%
  kbl(caption = "clusterProfiler") %>%
  kable_paper("hover", full_width = FALSE)
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
1 3 2e+07 0.0 0.05 0.5 1000 deseq2 9.922 0.280 18377.92 0.078 0.9725544 0.9922 0.9822790 clusterProfiler default
7 3 2e+07 0.1 0.05 0.5 1000 deseq2 9.783 0.279 18371.67 0.217 0.9722719 0.9783 0.9752766 clusterProfiler default
13 3 2e+07 0.2 0.05 0.5 1000 deseq2 8.642 0.395 18349.43 1.358 0.9562908 0.8642 0.9079162 clusterProfiler default
19 3 2e+07 0.3 0.05 0.5 1000 deseq2 5.263 0.349 18312.24 4.737 0.9378118 0.5263 0.6742250 clusterProfiler default
25 3 2e+07 0.4 0.05 0.5 1000 deseq2 2.146 0.276 18258.59 7.854 0.8860446 0.2146 0.3455160 clusterProfiler default
31 3 2e+07 0.5 0.05 0.5 1000 deseq2 0.624 0.256 18198.76 9.376 0.7090909 0.0624 0.1147059 clusterProfiler default
37 3 2e+07 0.6 0.05 0.5 1000 deseq2 0.316 0.255 18105.75 9.684 0.5534151 0.0316 0.0597862 clusterProfiler default
# Table of the clusterProfiler rows with the background fix applied.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
cpbg %>%
  kbl(caption = "clusterProfiler with background bug fix") %>%
  kable_paper("hover", full_width = FALSE)
clusterProfiler with background bug fix
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
2 3 2e+07 0.0 0.05 0.5 1000 deseq2 9.949 0.496 18377.71 0.051 0.9525132 0.9949 0.9732453 clusterProfiler BG fix
8 3 2e+07 0.1 0.05 0.5 1000 deseq2 9.832 0.453 18371.50 0.168 0.9559553 0.9832 0.9693862 clusterProfiler BG fix
14 3 2e+07 0.2 0.05 0.5 1000 deseq2 8.812 0.485 18349.34 1.188 0.9478326 0.8812 0.9133026 clusterProfiler BG fix
20 3 2e+07 0.3 0.05 0.5 1000 deseq2 5.656 0.429 18312.16 4.344 0.9294988 0.5656 0.7032639 clusterProfiler BG fix
26 3 2e+07 0.4 0.05 0.5 1000 deseq2 2.560 0.387 18258.47 7.440 0.8686800 0.2560 0.3954584 clusterProfiler BG fix
32 3 2e+07 0.5 0.05 0.5 1000 deseq2 0.758 0.347 18198.67 9.242 0.6859729 0.0758 0.1365151 clusterProfiler BG fix
38 3 2e+07 0.6 0.05 0.5 1000 deseq2 0.369 0.323 18105.68 9.631 0.5332370 0.0369 0.0690236 clusterProfiler BG fix
# Table of the clusterProfiler rows with the FDR fix applied.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
cpfdr %>%
  kbl(caption = "clusterProfiler with FDR bug fix") %>%
  kable_paper("hover", full_width = FALSE)
clusterProfiler with FDR bug fix
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
3 3 2e+07 0.0 0.05 0.5 1000 deseq2 9.784 0.013 18378.19 0.216 0.9986731 0.9784 0.9884326 clusterProfiler FDR fix
9 3 2e+07 0.1 0.05 0.5 1000 deseq2 9.442 0.024 18371.93 0.558 0.9974646 0.9442 0.9701017 clusterProfiler FDR fix
15 3 2e+07 0.2 0.05 0.5 1000 deseq2 7.353 0.027 18349.80 2.647 0.9963415 0.7353 0.8461450 clusterProfiler FDR fix
21 3 2e+07 0.3 0.05 0.5 1000 deseq2 3.367 0.026 18312.57 6.633 0.9923372 0.3367 0.5028000 clusterProfiler FDR fix
27 3 2e+07 0.4 0.05 0.5 1000 deseq2 1.032 0.017 18258.85 8.968 0.9837941 0.1032 0.1868042 clusterProfiler FDR fix
33 3 2e+07 0.5 0.05 0.5 1000 deseq2 0.231 0.015 18199.00 9.769 0.9390244 0.0231 0.0450908 clusterProfiler FDR fix
39 3 2e+07 0.6 0.05 0.5 1000 deseq2 0.104 0.031 18105.97 9.896 0.7703704 0.0104 0.0205229 clusterProfiler FDR fix
# Table of the clusterProfiler rows with both the background and FDR fixes.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
cpbgfdr %>%
  kbl(caption = "clusterProfiler with background and FDR fixes") %>%
  kable_paper("hover", full_width = FALSE)
clusterProfiler with background and FDR fixes
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
4 3 2e+07 0.0 0.05 0.5 1000 deseq2 9.912 0.352 18377.85 0.088 0.9657054 0.9912 0.9782866 clusterProfiler BG and FDR fix
10 3 2e+07 0.1 0.05 0.5 1000 deseq2 9.739 0.296 18371.66 0.261 0.9705032 0.9739 0.9721987 clusterProfiler BG and FDR fix
16 3 2e+07 0.2 0.05 0.5 1000 deseq2 8.089 0.259 18349.56 1.911 0.9689746 0.8089 0.8817310 clusterProfiler BG and FDR fix
22 3 2e+07 0.3 0.05 0.5 1000 deseq2 3.685 0.087 18312.51 6.315 0.9769353 0.3685 0.5351438 clusterProfiler BG and FDR fix
28 3 2e+07 0.4 0.05 0.5 1000 deseq2 1.100 0.025 18258.84 8.900 0.9777778 0.1100 0.1977528 clusterProfiler BG and FDR fix
34 3 2e+07 0.5 0.05 0.5 1000 deseq2 0.242 0.018 18199.00 9.758 0.9307692 0.0242 0.0471735 clusterProfiler BG and FDR fix
40 3 2e+07 0.6 0.05 0.5 1000 deseq2 0.105 0.032 18105.97 9.895 0.7664234 0.0105 0.0207162 clusterProfiler BG and FDR fix
# Table of the fora rows.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
fo %>%
  kbl(caption = "fora") %>%
  kable_paper("hover", full_width = FALSE)
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
5 3 2e+07 0.0 0.05 0.5 1000 deseq2 9.912 0.352 18377.85 0.088 0.9657054 0.9912 0.9782866 fora
11 3 2e+07 0.1 0.05 0.5 1000 deseq2 9.739 0.296 18371.66 0.261 0.9705032 0.9739 0.9721987 fora
17 3 2e+07 0.2 0.05 0.5 1000 deseq2 8.089 0.259 18349.56 1.911 0.9689746 0.8089 0.8817310 fora
23 3 2e+07 0.3 0.05 0.5 1000 deseq2 3.685 0.087 18312.51 6.315 0.9769353 0.3685 0.5351438 fora
29 3 2e+07 0.4 0.05 0.5 1000 deseq2 1.100 0.025 18258.84 8.900 0.9777778 0.1100 0.1977528 fora
35 3 2e+07 0.5 0.05 0.5 1000 deseq2 0.242 0.018 18199.00 9.758 0.9307692 0.0242 0.0471735 fora
41 3 2e+07 0.6 0.05 0.5 1000 deseq2 0.105 0.032 18105.97 9.895 0.7664234 0.0105 0.0207162 fora
# Table of the fgsea rows.
# FALSE is spelled out because `F` is an ordinary variable that can be reassigned.
fg %>%
  kbl(caption = "fg") %>%
  kable_paper("hover", full_width = FALSE)
N_REPS SUM_COUNT VARIANCE FRAC_DE FC SIMS DGE_FUNC true_pos false_pos true_neg false_neg p r f PWAY_FUNC
6 3 2e+07 0.0 0.05 0.5 1000 deseq2 9.981 0.700 18377.50 0.019 0.9344631 0.9981 0.9652338 fgsea
12 3 2e+07 0.1 0.05 0.5 1000 deseq2 9.981 0.557 18371.40 0.019 0.9471437 0.9981 0.9719544 fgsea
18 3 2e+07 0.2 0.05 0.5 1000 deseq2 9.858 0.531 18349.29 0.142 0.9488882 0.9858 0.9669920 fgsea
24 3 2e+07 0.3 0.05 0.5 1000 deseq2 9.169 0.575 18312.02 0.831 0.9409893 0.9169 0.9287885 fgsea
30 3 2e+07 0.4 0.05 0.5 1000 deseq2 7.162 0.421 18258.44 2.838 0.9444811 0.7162 0.8146505 fgsea
36 3 2e+07 0.5 0.05 0.5 1000 deseq2 4.391 0.281 18198.73 5.609 0.9398545 0.4391 0.5985551 fgsea
42 3 2e+07 0.6 0.05 0.5 1000 deseq2 2.145 0.180 18105.82 7.855 0.9225806 0.2145 0.3480730 fgsea
# Precision, recall and F1 against the added variance, one plot per metric.
# The legend names six tools, so every tool is drawn, each in its legend
# colour (previously only the clusterProfiler default series was plotted).
par(mar = c(5.1, 5.1, 2.1, 2.1))

# Per-tool result frames, in legend order so colours and labels line up.
sim_tools <- list(
  "CP default" = cp, "CP BG fix" = cpbg, "CP FDR fix" = cpfdr,
  "CP BG and FDR fix" = cpbgfdr, "fora" = fo, "fgsea" = fg
)
sim_cols <- c("black", "orange", "darkgreen", "purple", "red", "blue")
# Result column -> plot title.
sim_metrics <- c(p = "precision", r = "recall", f = "f1")

for (metric in names(sim_metrics)) {
  # The first tool opens the plot and fixes the axes.
  plot(cp$VARIANCE, cp[[metric]],
    ylim = c(0, 1), type = "b", pch = 19, col = sim_cols[1],
    xlab = "variance added", ylab = "index", main = sim_metrics[[metric]]
  )
  # The remaining tools are overlaid on the same axes.
  for (k in seq_along(sim_tools)[-1]) {
    lines(sim_tools[[k]]$VARIANCE, sim_tools[[k]][[metric]],
      type = "b", pch = 19, col = sim_cols[k]
    )
  }
  # As before, the legend is drawn on the precision plot only.
  if (metric == "p") {
    legend("bottomleft",
      inset = .02, title = "tool", legend = names(sim_tools),
      col = sim_cols, horiz = FALSE, cex = 1.0, pch = 19, lwd = 2
    )
  }
}

# Write the precision / recall / F1 figure to fig3_sim.png.
png("fig3_sim.png", width = 7, height = 5, units = "in", res = 150, pointsize = 12)
# The file name has no page counter, so each new page would overwrite the
# previous one and only the last plot would be kept. A 1 x 3 layout keeps all
# three panels on a single page.
par(mfrow = c(1, 3), mar = c(5.1, 5.1, 2.1, 2.1))

# Per-tool result frames, in legend order so colours and labels line up.
sim_tools <- list(
  "CP default" = cp, "CP BG fix" = cpbg, "CP FDR fix" = cpfdr,
  "CP BG and FDR fix" = cpbgfdr, "fora" = fo, "fgsea" = fg
)
sim_cols <- c("black", "orange", "darkgreen", "purple", "red", "blue")
# Result column -> panel title.
sim_metrics <- c(p = "precision", r = "recall", f = "f1")

for (metric in names(sim_metrics)) {
  # The first tool opens the panel and fixes the axes.
  plot(cp$VARIANCE, cp[[metric]],
    ylim = c(0, 1), type = "b", pch = 19, col = sim_cols[1],
    xlab = "variance added", ylab = "index", main = sim_metrics[[metric]]
  )
  # The remaining tools are overlaid on the same axes.
  for (k in seq_along(sim_tools)[-1]) {
    lines(sim_tools[[k]]$VARIANCE, sim_tools[[k]][[metric]],
      type = "b", pch = 19, col = sim_cols[k]
    )
  }
  # Legend on the precision panel only, with the same colours as the on-screen
  # version (the colours were missing from this legend before).
  if (metric == "p") {
    legend("bottomleft",
      inset = .02, title = "tool", legend = names(sim_tools),
      col = sim_cols, horiz = FALSE, cex = 1.0, pch = 19, lwd = 2
    )
  }
}

# Close the device so the PNG file is flushed to disk.
dev.off()
## png 
##   2

Barplot is simpler.

# Mean precision and recall per tool across all variance settings, as named
# numeric vectors (the names are the tool labels).
bar_tools <- list(
  "CP default" = cp, "CP BG fix" = cpbg, "CP FDR fix" = cpfdr,
  "CP BG and FDR fix" = cpbgfdr, "fora" = fo, "fgsea" = fg
)
prec <- vapply(bar_tools, function(d) mean(d$p), numeric(1))
rec <- vapply(bar_tools, function(d) mean(d$r), numeric(1))

# F1 as the harmonic mean of the averaged precision and recall. Note that this
# is computed from the two means, not by averaging the per-run `f` column.
# Vectorised arithmetic keeps the tool names and needs no index loop.
f1 <- 2 / (1 / rec + 1 / prec)

# Margins (bottom, left, top, right) for the current device.
par(mar = c(9.1, 3.5, 2.1, 1.1))

# Open the PNG device for fig3_bars.png and apply the same margins to it.
# NOTE(review): no plotting call or dev.off() is visible after this point in
# this section, although the console output below shows a device being closed;
# confirm against the original script.
png(
  "fig3_bars.png",
  width = 7, height = 5, units = "in", res = 150, pointsize = 12
)
par(mar = c(9.1, 3.5, 2.1, 1.1))
## png 
##   2

