index.html annotation.html macrophage_estimation_parasite.html macrophage_expression_parasite.html

In this document, we will perform a series of differential expression analyses using the data which survived sample estimation.

1 Gene Ontology searches

Let's set up some simple data sets for goseq/clusterProfiler/topGO.

I think a bunch of the material in this sheet is actually now obsolete.

1.1 Extracting ontology annotations from the TriTrypDB

## Inputs shared by the ontology tools.  Only goseq consumes gene lengths;
## clusterProfiler and topGO do not.  lp_lengths and lp_goids are created
## outside of this chunk.
## Earlier way of building the length table, kept for reference:
##   gene_lengths <- all_genes[,c("geneid","genesize")]
##   colnames(gene_lengths) <- c("ID", "width")
colnames(lp_lengths) <- c("ID", "width")

## The GO table is a 2 column data frame named 'ID' (gene name) and 'GO'
## (GO name).  The original author suspected the goseq() wrapper no longer
## requires this exact layout, but it is kept regardless.
## Earlier flat-file import, kept for reference; the table was passed through
## unique() because it mixed multiple sources:
##   go_ids <- read.table("reference/go/tcruzi_all_go.tab.gz", header=0, sep="\t")
##   colnames(go_ids) <- c("ID","GO","ontology","term","source")
##   go_ids <- unique(go_ids[,c("ID","GO")])
##   goid_file <- "reference/go/topgo_goids.tab.gz"
##   colnames(lp_goids) <- c("ID", "GO")

## Keep only the ID/GO columns, then rewrite every ID as "exon_<ID>.1" in a
## single paste0() call.
## NOTE(review): presumably this matches the feature names used by the
## expression data -- confirm against the upstream annotation.
lp_go <- lp_goids[, c("ID", "GO")]
lp_go$ID <- paste0("exon_", lp_go$ID, ".1")
## Extract one table from the significance results by walking the nested
## list: element "limma", then "ups", then the entry named "macro_chr-sh".
## NOTE(review): macro_batch_sig is not created anywhere in the visible code;
## the captured output on the next line shows it was missing when this
## document was last rendered -- confirm which upstream step should define it.
test_sig <- macro_batch_sig[["limma"]][["ups"]][["macro_chr-sh"]]
## Error in eval(expr, envir, enclos): object 'macro_batch_sig' not found
## Print the dimensions of the extracted object; this fails as well whenever
## the lookup above did not create test_sig.
dim(test_sig)
## Error in eval(expr, envir, enclos): object 'test_sig' not found
## hmm maybe there are insufficient genes for gene ontology...
## The goseq invocations below are disabled.
## NOTE(review): the second variant reads macrobatch$limma$ups$macro_sh_vs_macro_ch,
## i.e. a different object and contrast name than the live lookup above --
## verify which naming is current before re-enabling any of these.
##macrobatch_shch_up_goseq <- simple_goseq(sig_genes=test_sig,
##                                         go_db=lp_go,
##                                         length_db=lp_lengths)
##macrobatch_shch_up_goseq <- sm(simple_goseq(sig_genes=macrobatch$limma$ups$macro_sh_vs_macro_ch,
##                                            go_db=lp_goids, length_db=lp_lengths))
##macrobatch_shch_up_excel <- sm(write_goseq_data(macrobatch_shch_up_goseq,
##                                                excel=paste0("excel/macrobatch_shch_up_goseq-v", ver, ".xlsx")))
LS0tCnRpdGxlOiAiUk5Bc2VxIG9mIEwucGFuYW1lbnNpczogUGFyYXNpdGUgR2VuZSBPbnRvbG9neS4iCmF1dGhvcjogImF0YiBhYmVsZXdAZ21haWwuY29tIgpkYXRlOiAiYHIgU3lzLkRhdGUoKWAiCm91dHB1dDoKIGh0bWxfZG9jdW1lbnQ6CiAgY29kZV9kb3dubG9hZDogdHJ1ZQogIGNvZGVfZm9sZGluZzogc2hvdwogIGZpZ19jYXB0aW9uOiB0cnVlCiAgZmlnX2hlaWdodDogNwogIGZpZ193aWR0aDogNwogIGhpZ2hsaWdodDogZGVmYXVsdAogIGtlZXBfbWQ6IGZhbHNlCiAgbW9kZTogc2VsZmNvbnRhaW5lZAogIG51bWJlcl9zZWN0aW9uczogdHJ1ZQogIHNlbGZfY29udGFpbmVkOiB0cnVlCiAgdGhlbWU6IHJlYWRhYmxlCiAgdG9jOiB0cnVlCiAgdG9jX2Zsb2F0OgogICAgY29sbGFwc2VkOiBmYWxzZQogICAgc21vb3RoX3Njcm9sbDogZmFsc2UKLS0tCgoKPHN0eWxlPgogIDwhLS0gRG9jdW1lbnQgcHJlbHVkZSByZXZpc2lvbiAyMDE2LTEwIC0tPgogIGJvZHkgLm1haW4tY29udGFpbmVyIHsKICAgIG1heC13aWR0aDogMTYwMHB4Owp9Cjwvc3R5bGU+CgpgYGB7ciBvcHRpb25zLCBpbmNsdWRlPUZBTFNFfQojIyBUaGVzZSBhcmUgdGhlIG9wdGlvbnMgSSB0ZW5kIHRvIGZhdm9yCmxpYnJhcnkoImhwZ2x0b29scyIpCnR0IDwtIGRldnRvb2xzOjpsb2FkX2FsbCgifi9ocGdsdG9vbHMiKQprbml0cjo6b3B0c19rbml0JHNldCgKICAgIHByb2dyZXNzID0gVFJVRSwKICAgIHZlcmJvc2UgPSBUUlVFLAogICAgd2lkdGggPSA5MCwKICAgIGVjaG8gPSBUUlVFKQprbml0cjo6b3B0c19jaHVuayRzZXQoCiAgICBlcnJvciA9IFRSVUUsCiAgICBmaWcud2lkdGggPSA4LAogICAgZmlnLmhlaWdodCA9IDgsCiAgICBkcGkgPSA5NikKb3B0aW9ucygKICAgIGRpZ2l0cyA9IDQsCiAgICBzdHJpbmdzQXNGYWN0b3JzID0gRkFMU0UsCiAgICBrbml0ci5kdXBsaWNhdGUubGFiZWwgPSAiYWxsb3ciKQpnZ3Bsb3QyOjp0aGVtZV9zZXQoZ2dwbG90Mjo6dGhlbWVfYncoYmFzZV9zaXplPTEwKSkKc2V0LnNlZWQoMSkKcm1kX2ZpbGUgPC0gIm1hY3JvcGhhZ2Vfb250b2xvZ3lfcGFyYXNpdGUuUm1kIgp2ZXIgPC0gIjIwMTcwMjAyIgpgYGAKCltpbmRleC5odG1sXShpbmRleC5odG1sKSBbYW5ub3RhdGlvbi5odG1sXShhbm5vdGF0aW9uLmh0bWwpClttYWNyb3BoYWdlX2VzdGltYXRpb25fcGFyYXNpdGUuaHRtbF0obWFjcm9waGFnZV9lc3RpbWF0aW9uX3BhcmFzaXRlLmh0bWwpClttYWNyb3BoYWdlX2V4cHJlc3Npb25fcGFyYXNpdGUuaHRtbF0obWFjcm9waGFnZV9leHByZXNzaW9uX3BhcmFzaXRlLmh0bWwpCgpgYGB7ciByZW5kZXJpbmcsIGluY2x1ZGU9RkFMU0UsIGV2YWw9RkFMU0V9CiMjIFRoaXMgYmxvY2sgaXMgdXNlZCB0byByZW5kZXIgYSBkb2N1bWVudCBmcm9tIHdpdGhpbiBpdC4Kcm1hcmtkb3duOjpyZW5kZXIocm1kX2ZpbGUpCgojIyBBbiBleHRyYSByZW5kZXJlciBmb3IgcGRmIG91dHB1dApybWFya2Rvd246OnJlbmRlcihybWRfZmls
ZSwgb3V0cHV0X2Zvcm1hdD0icGRmX2RvY3VtZW50Iiwgb3V0cHV0X29wdGlvbnM9Yygic2tpcF9odG1sIikpCiMjIE9yIHRvIHNhdmUvbG9hZCBsYXJnZSBSZGF0YSBmaWxlcy4KaHBnbHRvb2xzOjo6c2F2ZW1lKCkKaHBnbHRvb2xzOjo6bG9hZG1lKCkKcm0obGlzdD1scygpKQpgYGAKCkluIHRoaXMgZG9jdW1lbnQsIHdlIHdpbGwgcGVyZm9ybSBhIHNlcmllcyBvZiBkaWZmZXJlbnRpYWwgZXhwcmVzc2lvbiBhbmFseXNlcyB1c2luZyB0aGUgZGF0YSB3aGljaCBzdXJ2aXZlZCBzYW1wbGUgZXN0aW1hdGlvbi4KCmBgYHtyIGxvYWRtZSwgaW5jbHVkZT1GQUxTRX0KdG1wIDwtIHNtKGxvYWRtZShmaWxlbmFtZT0ibWFjcm9waGFnZV9leHByZXNzaW9uX3BhcmFzaXRlLnJkYS54eiIpKQpgYGAKCiMgR2VuZSBPbnRvbG9neSBzZWFyY2hlcwoKTGV0cyBzZXQgdXAgc29tZSBzaW1wbGUgZGF0YSBzZXRzIGZvciBnb3NlcS9jbHVzdGVyUHJvZmlsZXIvdG9wR08KCkkgdGhpbmsgYSBidW5jaCBvZiB0aGUgbWF0ZXJpYWwgaW4gdGhpcyBzaGVldCBpcyBhY3R1YWxseSBub3cgb2Jzb2xldGUuCgojIyBFeHRyYWN0aW5nIG9udG9sb2d5IGFubm90YXRpb25zIGZyb20gdGhlIFRyaVRyeXBEQgoKYGBge3IgZ29zZXFfcHJlcGFyYXRpb259CiMjIGdvc2VxIHVzZXMgdGhlIGdlbmUgbGVuZ3RocywgY2x1c3RlcnByb2ZpbGVyIGFuZCB0b3BnbyBkb24ndAojIyBnZW5lX2xlbmd0aHMgPC0gYWxsX2dlbmVzWyxjKCJnZW5laWQiLCJnZW5lc2l6ZSIpXQojIyBjb2xuYW1lcyhnZW5lX2xlbmd0aHMpIDwtIGMoIklEIiwgIndpZHRoIikKY29sbmFtZXMobHBfbGVuZ3RocykgPC0gYygiSUQiLCAid2lkdGgiKQojIyBnb19pZHMgbmVlZHMgdG8gYmUgYSAyIGNvbHVtbiBkYXRhIGZyYW1lIHdpdGggbmFtZXMgJ0lEJywgJ0dPJyB3aGljaCBhcmUKIyMgZ2VuZSBuYW1lcyBhbmQgR08gbmFtZXMgcmVzcGVjdGl2ZWx5LiAgSSBhY3R1YWxseSB0aGluayBJIG1hZGUgbXkgZ29zZXEoKSBmdW5jdGlvbgojIyBzbWFydCBlbm91Z2ggdGhhdCB0aGlzIGlzIG5vIGxvbmdlciBuZWVkZWQsIGJ1dCBub25ldGhlbGVzcy4KCiMjIGdvX2lkcyA8LSByZWFkLnRhYmxlKCJyZWZlcmVuY2UvZ28vdGNydXppX2FsbF9nby50YWIuZ3oiLCBoZWFkZXI9MCwgc2VwPSJcdCIpCiMjIGNvbG5hbWVzKGdvX2lkcykgPC0gYygiSUQiLCJHTyIsIm9udG9sb2d5IiwidGVybSIsInNvdXJjZSIpCiMjIFNpbmNlIHRoZXJlIGFyZSBtdWx0aXBsZSBzb3VyY2VzLCBJIGFtIGRvaW5nIGEgdW5pcXVlIG9mIHRoZSB0YWJsZS4uLgojIyBnb19pZHMgPC0gdW5pcXVlKGdvX2lkc1ssYygiSUQiLCJHTyIpXSkKIyMgZ29pZF9maWxlIDwtICJyZWZlcmVuY2UvZ28vdG9wZ29fZ29pZHMudGFiLmd6IgoKIyMgY29sbmFtZXMobHBfZ29pZHMpIDwtIGMoIklEIiwgIkdPIikKbHBfZ28gPC0gbHBfZ29pZHNbLCBjKCJJRCIsIkdPIildCmxwX2dvJElEIDwtIHBhc3RlMCgiZXhvbl8iLCBscF9nbyRJRCkKbHBfZ28k
SUQgPC0gcGFzdGUwKGxwX2dvJElELCAiLjEiKQpgYGAKCmBgYHtyIGdvc2VxX2NsYnJfdGltZXMxfQp0ZXN0X3NpZyA8LSBtYWNyb19iYXRjaF9zaWdbWyJsaW1tYSJdXVtbInVwcyJdXVtbIm1hY3JvX2Noci1zaCJdXQpkaW0odGVzdF9zaWcpCiMjIGhtbSBtYXliZSB0aGVyZSBhcmUgaW5zdWZmaWNpZW50IGdlbmVzIGZvciBnZW5lIG9udG9sb2d5Li4uCiMjbWFjcm9iYXRjaF9zaGNoX3VwX2dvc2VxIDwtIHNpbXBsZV9nb3NlcShzaWdfZ2VuZXM9dGVzdF9zaWcsCiMjICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICBnb19kYj1scF9nbywKIyMgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgIGxlbmd0aF9kYj1scF9sZW5ndGhzKQojI21hY3JvYmF0Y2hfc2hjaF91cF9nb3NlcSA8LSBzbShzaW1wbGVfZ29zZXEoc2lnX2dlbmVzPW1hY3JvYmF0Y2gkbGltbWEkdXBzJG1hY3JvX3NoX3ZzX21hY3JvX2NoLAojIyAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgZ29fZGI9bHBfZ29pZHMsIGxlbmd0aF9kYj1scF9sZW5ndGhzKSkKIyNtYWNyb2JhdGNoX3NoY2hfdXBfZXhjZWwgPC0gc20od3JpdGVfZ29zZXFfZGF0YShtYWNyb2JhdGNoX3NoY2hfdXBfZ29zZXEsCiMjICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgZXhjZWw9cGFzdGUwKCJleGNlbC9tYWNyb2JhdGNoX3NoY2hfdXBfZ29zZXEtdiIsIHZlciwgIi54bHN4IikpKQpgYGAK