1 Contrasts

# Contrasts handed to combine_de_tables() via its keepers argument.  Each
# entry names one contrast and lists the pair of conditions it compares
# (presumably numerator first, denominator second -- confirm against hpgltools).
zymodeme_keeper <- list(zymodeme = c("z23", "z22"))
susceptibility_keepers <- list(
  resistant_sensitive = c("resistant", "sensitive"),
  resistant_ambiguous = c("resistant", "ambiguous"),
  sensitive_ambiguous = c("sensitive", "ambiguous")
)

1.1 Zymodeme enzyme gene IDs

Najib read me an email listing off the gene names associated with the zymodeme classification. I took those names and cross referenced them against the Leishmania panamensis gene annotations and found the following:

They are:

  1. ALAT: LPAL13_120010900 – alanine aminotransferase
  2. ASAT: LPAL13_340013000 – aspartate aminotransferase
  3. G6PD: LPAL13_000054100 – glucose-6-phosphate 1-dehydrogenase
  4. NH: LPAL13_140006100, LPAL13_180018500 – inosine-guanine nucleoside hydrolase
  5. MPI: LPAL13_320022300 (maybe) – mannose phosphate isomerase (I chose phosphomannose isomerase)

Given these 6 gene IDs (NH has two gene IDs associated with it), I can do some looking for specific differences among the various samples.

1.1.1 Expression levels of zymodeme genes

The following creates a colorspace (red to green) heatmap showing the observed expression of these genes in every sample.

# Gene IDs of the zymodeme marker enzymes; my_names carries the short label
# for the ID at the same position.
# NOTE(review): "other" is not a gene ID -- confirm the trailing placeholder
# is intentional.
my_genes <- c(
  "LPAL13_120010900",
  "LPAL13_340013000",
  "LPAL13_000054100",
  "LPAL13_140006100",
  "LPAL13_180018500",
  "LPAL13_320022300",
  "other"
)
my_names <- c(
  "ALAT",
  "ASAT",
  "G6PD",
  "NHv1",
  "NHv2",
  "MPI",
  "other"
)

# Restrict the two-strain experiment to the IDs in my_genes (method = "keep").
zymo_six_genes <- exclude_genes_expt(
  lp_two_strains,
  ids = my_genes,
  method = "keep"
)
## Note, I renamed this to subset_genes().
## remove_genes_expt(), before removal, there were 8710 genes, now there are 6.
## There are 93 samples which kept less than 90 percent counts.
## TMRC20001 TMRC20065 TMRC20005 TMRC20066 TMRC20039 TMRC20037 TMRC20038 TMRC20067 
##   0.12101   0.12835   0.13438   0.10804   0.13756   0.11451   0.11446   0.10858 
## TMRC20068 TMRC20041 TMRC20015 TMRC20009 TMRC20010 TMRC20016 TMRC20011 TMRC20012 
##   0.11269   0.12840   0.11072   0.11376   0.10292   0.10451   0.10967   0.11676 
## TMRC20013 TMRC20017 TMRC20014 TMRC20018 TMRC20019 TMRC20070 TMRC20020 TMRC20021 
##   0.11865   0.10594   0.10591   0.11517   0.12027   0.11179   0.11100   0.10764 
## TMRC20022 TMRC20024 TMRC20036 TMRC20069 TMRC20033 TMRC20026 TMRC20031 TMRC20076 
##   0.12952   0.11481   0.12100   0.11631   0.11188   0.13633   0.10013   0.12403 
## TMRC20073 TMRC20055 TMRC20079 TMRC20071 TMRC20078 TMRC20094 TMRC20042 TMRC20058 
##   0.12398   0.13783   0.12639   0.12003   0.13420   0.12021   0.13766   0.11900 
## TMRC20072 TMRC20059 TMRC20048 TMRC20057 TMRC20088 TMRC20056 TMRC20060 TMRC20077 
##   0.14675   0.10984   0.10679   0.13443   0.12936   0.13510   0.10882   0.12810 
## TMRC20074 TMRC20063 TMRC20053 TMRC20052 TMRC20064 TMRC20075 TMRC20051 TMRC20050 
##   0.12494   0.12239   0.12145   0.11690   0.12051   0.11261   0.13149   0.11526 
## TMRC20049 TMRC20062 TMRC20110 TMRC20080 TMRC20043 TMRC20083 TMRC20054 TMRC20085 
##   0.14480   0.13429   0.13812   0.12120   0.11306   0.12235   0.12723   0.12316 
## TMRC20046 TMRC20093 TMRC20089 TMRC20047 TMRC20090 TMRC20044 TMRC20045 TMRC20105 
##   0.13182   0.13588   0.11884   0.12391   0.11566   0.13691   0.12812   0.12219 
## TMRC20108 TMRC20109 TMRC20098 TMRC20096 TMRC20097 TMRC20101 TMRC20092 TMRC20082 
##   0.11601   0.11684   0.11771   0.11364   0.11706   0.11784   0.11465   0.10358 
## TMRC20102 TMRC20099 TMRC20100 TMRC20091 TMRC20084 TMRC20087 TMRC20103 TMRC20104 
##   0.11399   0.11888   0.10820   0.12935   0.11273   0.12564   0.13704   0.11723 
## TMRC20086 TMRC20107 TMRC20081 TMRC20106 TMRC20095 
##   0.10752   0.09364   0.10335   0.09894   0.06566
# rpkm-convert, filter and log2-transform the six-gene subset, then draw it as
# a heatmap with the short enzyme names as row labels.
strain_norm <- normalize_expt(
  zymo_six_genes,
  convert = "rpkm",
  filter = TRUE,
  transform = "log2"
)
## Removing 0 low-count genes (6 remaining).
zymo_heatmap <- plot_sample_heatmap(
  strain_norm,
  row_label = my_names
)
zymo_heatmap

# Same heatmap over every gene that survives filtering, for comparison with
# the six-gene view.
lp_norm <- normalize_expt(
  lp_two_strains,
  filter = TRUE,
  convert = "rpkm",
  norm = "quant",
  transform = "log2"
)
## Removing 151 low-count genes (8559 remaining).
## transform_counts: Found 109 values equal to 0, adding 1 to the matrix.
zymo_heatmap_all <- plot_sample_heatmap(lp_norm)
zymo_heatmap_all

1.2 Compare to highly expressed, variant genes

I want to compare the above heatmap with one composed of all genes with some ‘significantly high’ expression value and also a non-negligible coefficient of variation.

# Keep only the genes that pass the coefficient-of-variation filter
# (cv_min = 0.9), then normalize them for plotting.
zymo_high_genes <- normalize_expt(lp_two_strains, filter = "cv", cv_min = 0.9)
## Removing 5564 low-count genes (3146 remaining).
high_strain_norm <- normalize_expt(zymo_high_genes, convert = "rpkm",
                                   norm = "quant", transform = "log2")
## transform_counts: Found 476 values equal to 0, adding 1 to the matrix.
# No row_label here: my_names only holds labels for the six zymodeme genes and
# cannot describe the rows of this much larger matrix.
zymo_heatmap <- plot_sample_heatmap(high_strain_norm)
zymo_heatmap

I think this plot suggests that the difference between the two primary strains is not really one of a few specific genes, but instead a global pattern.

2 Zymodeme differential expression

2.1 No attempt at batch estimation

# Use the categorical zymodeme call as the condition, then drop any sample
# whose condition is 'unknown'.
two_zymo <- subset_expt(
  set_expt_conditions(lp_two_strains, fact = "zymodemecategorical"),
  subset = "condition!='unknown'"
)
## The numbers of samples by condition are:
## 
## z21 z22 z23 z24 
##   7  43  41   2
## subset_expt(): There were 93, now there are 93 samples.
# All pairwise contrasts with no batch term in the model.
zymo_de_nobatch <- all_pairwise(
  two_zymo,
  filter = TRUE,
  model_batch = FALSE
)
## 
## z21 z22 z23 z24 
##   7  43  41   2
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
zymo_de_nobatch
## Error in eval(expr, envir, enclos): object 'zymo_de_nobatch' not found
## Including the plots causes the rda file to balloon to 3.4Gb in the following invocation.
## Removing them results in... holy crap 2.1Mb
# Combine the contrast listed in zymodeme_keeper, passing rda and xlsx paths.
zymo_table_nobatch <- combine_de_tables(
  zymo_de_nobatch,
  keepers = zymodeme_keeper,
  rda = glue("rda/zymo_tables_nobatch-v{ver}.rda"),
  excel = glue("excel/zymo_tables_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'zymo_de_nobatch' not found
zymo_table_nobatch
## Error in eval(expr, envir, enclos): object 'zymo_table_nobatch' not found
# Extract the significant genes according to the DESeq2 results.
zymo_sig_nobatch <- extract_significant_genes(
  zymo_table_nobatch,
  according_to = "deseq",
  current_id = "GID",
  required_id = "GID",
  gmt = glue("excel/zymodeme_nobatch-v{ver}.gmt"),
  excel = glue("excel/zymo_sig_nobatch_deseq-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'zymo_table_nobatch' not found
zymo_sig_nobatch
## Error in eval(expr, envir, enclos): object 'zymo_sig_nobatch' not found

2.1.1 Plot DE genes without batch estimation/adjustment

# DESeq2 MA plot for the 'zymodeme' contrast of the no-batch tables.
zymo_table_nobatch[["plots"]][["zymodeme"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'zymo_table_nobatch' not found
# DESeq2 volcano plot for the same contrast.
zymo_table_nobatch[["plots"]][["zymodeme"]][["deseq_vol_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'zymo_table_nobatch' not found

Log ratio, mean average plot and volcano plot of the comparison of the two primary zymodeme transcriptomes. When the transcriptomes of the two main strains (43 and 41 samples of z2.2 and z2.3) were compared without any attempt at batch/surrogate estimation with DESeq2, 45 and 85 genes were observed as significantly higher in strain z2.3 and z2.2 respectively using a cutoff of 1.0 logFC and 0.05 FDR adjusted p-value. There remain a large number of genes which are likely significantly different between the two strains, but fall below the 2-fold difference required for ‘significance.’ This follows prior observations that the parasite transcriptomes are constitutively expressed.

When the same data was plotted via a volcano plot, the relatively small range of fold changes compared to the large range of adjusted p-values is visible.

2.2 Attempt SVA estimate

# Repeat the pairwise contrasts with model_batch = "svaseq".
zymo_de_sva <- all_pairwise(
  two_zymo,
  filter = TRUE,
  model_batch = "svaseq"
)
## 
## z21 z22 z23 z24 
##   7  43  41   2
## Removing 0 low-count genes (8559 remaining).
## Setting 495 low elements to zero.
## transform_counts: Found 495 values equal to 0, adding 1 to the matrix.
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
zymo_de_sva
## Error in eval(expr, envir, enclos): object 'zymo_de_sva' not found
# Combine the contrast listed in zymodeme_keeper, passing rda and xlsx paths.
zymo_table_sva <- combine_de_tables(
  zymo_de_sva,
  keepers = zymodeme_keeper,
  rda = glue("rda/zymo_tables_sva-v{ver}.rda"),
  excel = glue("excel/zymo_tables_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'zymo_de_sva' not found
zymo_table_sva
## Error in eval(expr, envir, enclos): object 'zymo_table_sva' not found
# Extract the significant genes according to the DESeq2 results.
zymo_sig_sva <- extract_significant_genes(
  zymo_table_sva,
  according_to = "deseq",
  current_id = "GID",
  required_id = "GID",
  gmt = glue("excel/zymodeme_sva-v{ver}.gmt"),
  excel = glue("excel/zymo_sig_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'zymo_table_sva' not found
zymo_sig_sva
## Error in eval(expr, envir, enclos): object 'zymo_sig_sva' not found

2.2.1 Plot zymodeme DE genes with sva batch estimation/adjustment

When estimates from SVA were included in the statistical model used by edgeR, DESeq2, and limma, a nearly identical view of the data emerged. I think this shows, with a high degree of confidence, that sva is not having a significant effect on this dataset.

# DESeq2 MA plot for the 'zymodeme' contrast of the sva tables.
zymo_table_sva[["plots"]][["zymodeme"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'zymo_table_sva' not found
# DESeq2 volcano plot for the same contrast.
zymo_table_sva[["plots"]][["zymodeme"]][["deseq_vol_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'zymo_table_sva' not found

3 Parasite Susceptibility to Drug (Current)

This susceptibility comparison is using the ‘current’ dataset.

# Susceptibility contrasts on the current dataset, no batch term in the model.
sus_de_nobatch <- all_pairwise(
  lp_susceptibility,
  filter = TRUE,
  model_batch = FALSE
)
## 
## resistant sensitive   unknown 
##        47        49         5
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
sus_de_nobatch
## Error in eval(expr, envir, enclos): object 'sus_de_nobatch' not found
# Combine the contrasts listed in susceptibility_keepers.
sus_table_nobatch <- combine_de_tables(
  sus_de_nobatch,
  keepers = susceptibility_keepers,
  rda = glue("rda/sus_tables_nobatch-v{ver}.rda"),
  excel = glue("excel/sus_tables_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sus_de_nobatch' not found
sus_table_nobatch
## Error in eval(expr, envir, enclos): object 'sus_table_nobatch' not found
# Unlike the other extractions in this document, no according_to is given here.
sus_sig_nobatch <- extract_significant_genes(
  sus_table_nobatch,
  excel = glue("excel/sus_sig_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sus_table_nobatch' not found
# Susceptibility contrasts on the current dataset with model_batch = "svaseq".
sus_de_sva <- all_pairwise(
  lp_susceptibility,
  filter = TRUE,
  model_batch = "svaseq"
)
## 
## resistant sensitive   unknown 
##        47        49         5
## Removing 0 low-count genes (8576 remaining).
## Setting 636 low elements to zero.
## transform_counts: Found 636 values equal to 0, adding 1 to the matrix.
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
sus_de_sva
## Error in eval(expr, envir, enclos): object 'sus_de_sva' not found
# Combine the contrasts listed in susceptibility_keepers.
sus_table_sva <- combine_de_tables(
  sus_de_sva,
  keepers = susceptibility_keepers,
  rda = glue("rda/sus_tables_sva-v{ver}.rda"),
  excel = glue("excel/sus_tables_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sus_de_sva' not found
sus_table_sva
## Error in eval(expr, envir, enclos): object 'sus_table_sva' not found
# Extract the significant genes according to the DESeq2 results.
sus_sig_sva <- extract_significant_genes(
  sus_table_sva,
  according_to = "deseq",
  excel = glue("excel/sus_sig_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sus_table_sva' not found
sus_sig_sva
## Error in eval(expr, envir, enclos): object 'sus_sig_sva' not found
## To get a more true sense of sensitive vs resistant with sva, we kind of need to get rid of the
## unknown samples and perhaps the ambiguous.
# Two successive subsets: first drop 'ambiguous', then drop 'unknown'.
no_ambiguous <- subset_expt(
  subset_expt(lp_susceptibility, subset = "condition!='ambiguous'"),
  subset = "condition!='unknown'"
)
## subset_expt(): There were 101, now there are 101 samples.
## subset_expt(): There were 101, now there are 96 samples.
no_ambiguous_de_sva <- all_pairwise(
  no_ambiguous,
  filter = TRUE,
  model_batch = "svaseq"
)
## 
## resistant sensitive 
##        47        49
## Removing 0 low-count genes (8565 remaining).
## Setting 423 low elements to zero.
## transform_counts: Found 423 values equal to 0, adding 1 to the matrix.
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
no_ambiguous_de_sva
## Error in eval(expr, envir, enclos): object 'no_ambiguous_de_sva' not found
## Let us see if my keeper code will fail hard or soft with extra contrasts...
no_ambiguous_table_sva <- combine_de_tables(
  no_ambiguous_de_sva,
  keepers = susceptibility_keepers,
  excel = glue("excel/no_ambiguous_tables_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'no_ambiguous_de_sva' not found
no_ambiguous_table_sva
## Error in eval(expr, envir, enclos): object 'no_ambiguous_table_sva' not found
# Extract the significant genes according to the DESeq2 results.
no_ambiguous_sig_sva <- extract_significant_genes(
  no_ambiguous_table_sva,
  according_to = "deseq",
  excel = glue("excel/no_ambiguous_sig_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'no_ambiguous_table_sva' not found
no_ambiguous_sig_sva
## Error in eval(expr, envir, enclos): object 'no_ambiguous_sig_sva' not found

3.0.1 Plot Susceptibility DE genes with sva batch estimation/adjustment

# DESeq2 MA and volcano plots for the 'resistant_sensitive' contrast, shown
# for three analyses in turn: no batch term, sva, and sva on the subset with
# ambiguous/unknown samples removed.
sus_table_nobatch[["plots"]][["resistant_sensitive"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'sus_table_nobatch' not found
sus_table_nobatch[["plots"]][["resistant_sensitive"]][["deseq_vol_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'sus_table_nobatch' not found
sus_table_sva[["plots"]][["resistant_sensitive"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'sus_table_sva' not found
sus_table_sva[["plots"]][["resistant_sensitive"]][["deseq_vol_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'sus_table_sva' not found
no_ambiguous_table_sva[["plots"]][["resistant_sensitive"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'no_ambiguous_table_sva' not found
no_ambiguous_table_sva[["plots"]][["resistant_sensitive"]][["deseq_vol_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'no_ambiguous_table_sva' not found

Given that resistance/sensitivity tends to be correlated with strain, one might expect similar results. One caveat in this context though: there are fewer strains with resistance/sensitivity definitions. Thus, when the analysis was repeated without the ambiguous/unknown samples, a few more genes were observed as significant.

4 Comparing DE results from strain/sensitivity

## zymo_table_sva[["plots"]][["zymodeme"]][["deseq_ma_plots"]][["plot"]]
# Pull the combined tables for the zymodeme and resistant/sensitive contrasts
# (both from the sva analyses).
zy_df <- zymo_table_sva[["data"]][["zymodeme"]]
## Error in eval(expr, envir, enclos): object 'zymo_table_sva' not found
sus_df <- sus_table_sva[["data"]][["resistant_sensitive"]]
## Error in eval(expr, envir, enclos): object 'sus_table_sva' not found
# Join on the row names so every row carries both DESeq2 logFC values
# (.x = zymodeme table, .y = susceptibility table).
both_df <- merge(zy_df, sus_df, by = "row.names")
## Error in h(simpleError(msg, call)): error in evaluating the argument 'x' in selecting a method for function 'merge': object 'zy_df' not found
plot_df <- both_df[, c("deseq_logfc.x", "deseq_logfc.y")]
## Error in eval(expr, envir, enclos): object 'both_df' not found
rownames(plot_df) <- both_df[["Row.names"]]
## Error in eval(expr, envir, enclos): object 'both_df' not found
# Label each column in the order of its keeper, c("z23", "z22") and
# c("resistant", "sensitive"), so both labels follow the same orientation.
# NOTE(review): assumes the first keeper element is the numerator -- confirm.
colnames(plot_df) <- c("z23_vs_z22", "resistant_vs_sensitive")
## Error: object 'plot_df' not found
compare <- plot_linear_scatter(plot_df)
## Error in eval(expr, envir, enclos): object 'plot_df' not found
# Write the scatter to a png, then show it and the correlation inline.
pp(file = "images/compare_sus_zy.png")
compare$scatter
## Error in compare$scatter: object of type 'closure' is not subsettable
dev.off()
## png 
##   2
compare$scatter
## Error in compare$scatter: object of type 'closure' is not subsettable
compare$cor
## Error in compare$cor: object of type 'closure' is not subsettable

5 Parasite Susceptibility to Drug (Historical)

This susceptibility comparison is using the historical dataset.

# Susceptibility contrasts on the historical dataset, no batch term.
sushist_de_nobatch <- all_pairwise(
  lp_susceptibility_historical,
  filter = TRUE,
  model_batch = FALSE
)
## 
## ambiguous resistant sensitive   unknown 
##         5        12        29        55
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
sushist_de_nobatch
## Error in eval(expr, envir, enclos): object 'sushist_de_nobatch' not found
# Combine the contrasts listed in susceptibility_keepers.
sushist_table_nobatch <- combine_de_tables(
  sushist_de_nobatch,
  keepers = susceptibility_keepers,
  excel = glue("excel/sushist_tables_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sushist_de_nobatch' not found
sushist_table_nobatch
## Error in eval(expr, envir, enclos): object 'sushist_table_nobatch' not found
sushist_sig_nobatch <- extract_significant_genes(
  sushist_table_nobatch,
  excel = glue("excel/sushist_sig_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sushist_table_nobatch' not found
sushist_sig_nobatch
## Error in eval(expr, envir, enclos): object 'sushist_sig_nobatch' not found
# Susceptibility contrasts on the historical dataset with model_batch = "svaseq".
sushist_de_sva <- all_pairwise(
  lp_susceptibility_historical,
  filter = TRUE,
  model_batch = "svaseq"
)
## 
## ambiguous resistant sensitive   unknown 
##         5        12        29        55
## Removing 0 low-count genes (8576 remaining).
## Setting 374 low elements to zero.
## transform_counts: Found 374 values equal to 0, adding 1 to the matrix.
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
sushist_de_sva
## Error in eval(expr, envir, enclos): object 'sushist_de_sva' not found
# Combine the contrasts listed in susceptibility_keepers.
sushist_table_sva <- combine_de_tables(
  sushist_de_sva,
  keepers = susceptibility_keepers,
  excel = glue("excel/sushist_tables_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sushist_de_sva' not found
sushist_table_sva
## Error in eval(expr, envir, enclos): object 'sushist_table_sva' not found
# Extract the significant genes according to the DESeq2 results.
sushist_sig_sva <- extract_significant_genes(
  sushist_table_sva,
  according_to = "deseq",
  excel = glue("excel/sushist_sig_sva-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'sushist_table_sva' not found
sushist_sig_sva
## Error in eval(expr, envir, enclos): object 'sushist_sig_sva' not found

6 Cure/Fail association

##cf_nb_input <- subset_expt(cf_expt, subset="condition!='unknown'")
# Cure vs. fail contrasts, first with no batch term in the model.
cf_de_nobatch <- all_pairwise(
  lp_cf_known,
  filter = TRUE,
  model_batch = FALSE
)
## 
## cure fail 
##   40   37
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
cf_de_nobatch
## Error in eval(expr, envir, enclos): object 'cf_de_nobatch' not found
# No keepers are passed for the cure/fail tables.
cf_table_nobatch <- combine_de_tables(
  cf_de_nobatch,
  excel = glue("excel/cf_tables_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'cf_de_nobatch' not found
cf_table_nobatch
## Error in eval(expr, envir, enclos): object 'cf_table_nobatch' not found
cf_sig_nobatch <- extract_significant_genes(
  cf_table_nobatch,
  excel = glue("excel/cf_sig_nobatch-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'cf_table_nobatch' not found
cf_sig_nobatch
## Error in eval(expr, envir, enclos): object 'cf_sig_nobatch' not found
# The same contrasts again with model_batch = "svaseq".
cf_de <- all_pairwise(
  lp_cf_known,
  filter = TRUE,
  model_batch = "svaseq"
)
## 
## cure fail 
##   40   37
## Removing 0 low-count genes (8548 remaining).
## Setting 118 low elements to zero.
## transform_counts: Found 118 values equal to 0, adding 1 to the matrix.
## Error in results[[type]] <- a_result: attempt to select less than one element in OneIndex
cf_de
## Error in eval(expr, envir, enclos): object 'cf_de' not found
cf_table <- combine_de_tables(
  cf_de,
  excel = glue("excel/cf_tables-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'cf_de' not found
cf_table
## Error in eval(expr, envir, enclos): object 'cf_table' not found
cf_sig <- extract_significant_genes(
  cf_table,
  excel = glue("excel/cf_sig-v{ver}.xlsx")
)
## Error in eval(expr, envir, enclos): object 'cf_table' not found
cf_sig
## Error in eval(expr, envir, enclos): object 'cf_sig' not found

6.1 Cure/Fail DE plots

It is not surprising that few or no genes are deemed significantly differentially expressed across samples which were taken from cure or fail patients.

# DESeq2 MA plot of fail_vs_cure from the no-batch tables.
cf_table_nobatch[["plots"]][["fail_vs_cure"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'cf_table_nobatch' not found
# Same plot from the sva tables: once between pp() and dev.off() with
# images/cf_ma.png as the target file, then once more for inline display.
dev <- pp(file = "images/cf_ma.png")
cf_table[["plots"]][["fail_vs_cure"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'cf_table' not found
closed <- dev.off()
cf_table[["plots"]][["fail_vs_cure"]][["deseq_ma_plots"]][["plot"]]
## Error in eval(expr, envir, enclos): object 'cf_table' not found

7 Combining the macrophage infected amastigotes with in-vitro promastigotes

One query we have not yet addressed: what are the similarities and differences among the strains used to infect the macrophage samples and the promastigote samples used in the TMRC2 parasite data?

In my container image, this dataset is not currently loaded, so turning this off.

## I just fixed this in the datasets Rmd, but until that propagates just set it manually
# Give both experiments the same annotation value before combining them.
annotation(lp_expt) <- annotation(lp_macrophage)
# NOTE(review): tmrc2_macrophage_norm is not used again in the visible code.
tmrc2_macrophage_norm <- normalize_expt(lp_macrophage, transform="log2", convert="cpm",
                                        norm="quant", filter=TRUE)
all_tmrc2 <- combine_expts(lp_expt, lp_macrophage)

# Derive a 'stage' column.  The order of these statements matters.
all_nosb <- all_tmrc2
# Default every sample to promastigote.
pData(all_nosb)[["stage"]] <- "promastigote"
# Replace NA treatments with "undefined" so the string comparisons below
# never see NA.
na_idx <- is.na(pData(all_nosb)[["macrophagetreatment"]])
pData(all_nosb)[na_idx, "macrophagetreatment"] <- "undefined"
# Drop the samples whose macrophagetreatment is 'inf_sb'.
all_nosb <- subset_expt(all_nosb, subset="macrophagetreatment!='inf_sb'")
# Samples with macrophagetreatment 'inf' are relabelled as amastigote.
ama_idx <- pData(all_nosb)[["macrophagetreatment"]] == "inf"
pData(all_nosb)[ama_idx, "stage" ] <- "amastigote"
# Copy stage into the batch column.
pData(all_nosb)[["batch"]] <- pData(all_nosb)[["stage"]]

I think the above picture is sort of the opposite of what we want to compare in a DE analysis for this set of data, e.g. we want to compare promastigotes to amastigotes?

# Make the previous condition the batch factor and 'stage' the condition.
all_nosb <- set_expt_conditions(
  set_expt_batches(all_nosb, fact = "condition"),
  fact = "stage"
)
# Subset to the z22, z23 and unknown zymodeme samples.
# NOTE(review): the contrasts below run on all_nosb, not on this subset.
two_zymo <- subset_expt(
  all_nosb,
  subset = "zymodemecategorical=='z22'|zymodemecategorical=='z23'|zymodemecategorical=='unknown'"
)

# Pairwise contrasts by stage with model_batch = "svaseq", then the combined
# and significant tables with their xlsx paths.
pro_ama <- all_pairwise(
  all_nosb,
  filter = TRUE,
  model_batch = "svaseq"
)
pro_ama_table <- combine_de_tables(
  pro_ama,
  excel = glue("excel/tmrc2_pro_vs_ama_table-v{ver}.xlsx")
)
pro_ama_sig <- extract_significant_genes(
  pro_ama_table,
  excel = glue("excel/tmrc2_pro_vs_ama_sig-v{ver}.xlsx")
)

7.0.1 Plot promastigote/amastigote DE genes

# DESeq2 MA plot for the promastigote_vs_amastigote contrast.
pro_ama_table[["plots"]][["promastigote_vs_amastigote"]][["deseq_ma_plots"]][["plot"]]

I am a little surprised by this plot, I somewhat expected there to be few genes which passed the 2-fold difference demarcation line.

# Record the R session and package versions used for this build.
pander::pander(sessionInfo())

R version 4.3.1 (2023-06-16)

Platform: x86_64-conda-linux-gnu (64-bit)

locale: C

attached base packages: stats4, stats, graphics, grDevices, utils, datasets, methods and base

other attached packages: ruv(v.0.9.7.1), hpgltools(v.1.0), testthat(v.3.1.10), Matrix(v.1.6-1.1), glue(v.1.6.2), SummarizedExperiment(v.1.30.2), GenomicRanges(v.1.52.0), GenomeInfoDb(v.1.38.5), IRanges(v.2.36.0), S4Vectors(v.0.40.2), MatrixGenerics(v.1.12.3), matrixStats(v.1.0.0), Biobase(v.2.62.0), BiocGenerics(v.0.48.1) and Heatplus(v.3.8.0)

loaded via a namespace (and not attached): fs(v.1.6.3), bitops(v.1.0-7), enrichplot(v.1.20.3), devtools(v.2.4.5), HDO.db(v.0.99.1), httr(v.1.4.7), RColorBrewer(v.1.1-3), doParallel(v.1.0.17), profvis(v.0.3.8), tools(v.4.3.1), backports(v.1.4.1), utf8(v.1.2.3), R6(v.2.5.1), lazyeval(v.0.2.2), mgcv(v.1.9-0), urlchecker(v.1.0.1), withr(v.2.5.1), prettyunits(v.1.2.0), gridExtra(v.2.3), preprocessCore(v.1.62.1), cli(v.3.6.2), scatterpie(v.0.2.1), sass(v.0.4.7), mvtnorm(v.1.2-3), genefilter(v.1.82.1), Rsamtools(v.2.16.0), yulab.utils(v.0.1.0), gson(v.0.1.0), DOSE(v.3.26.1), sessioninfo(v.1.2.2), limma(v.3.56.2), rstudioapi(v.0.15.0), RSQLite(v.2.3.4), generics(v.0.1.3), gridGraphics(v.0.5-1), BiocIO(v.1.10.0), gtools(v.3.9.4), zip(v.2.3.0), dplyr(v.1.1.3), GO.db(v.3.17.0), fansi(v.1.0.4), abind(v.1.4-5), lifecycle(v.1.0.4), yaml(v.2.3.7), edgeR(v.3.42.4), gplots(v.3.1.3), qvalue(v.2.32.0), BiocFileCache(v.2.8.0), grid(v.4.3.1), blob(v.1.2.4), promises(v.1.2.1), crayon(v.1.5.2), miniUI(v.0.1.1.1), lattice(v.0.21-9), cowplot(v.1.1.1), GenomicFeatures(v.1.52.2), annotate(v.1.78.0), KEGGREST(v.1.42.0), pillar(v.1.9.0), knitr(v.1.44.1), fgsea(v.1.26.0), rjson(v.0.2.21), boot(v.1.3-28.1), corpcor(v.1.6.10), codetools(v.0.2-19), fastmatch(v.1.1-4), downloader(v.0.4), ggfun(v.0.1.3), data.table(v.1.14.8), remotes(v.2.4.2.1), vctrs(v.0.6.5), png(v.0.1-8), treeio(v.1.24.3), Rdpack(v.2.5), gtable(v.0.3.4), cachem(v.1.0.8), openxlsx(v.4.2.5.2), xfun(v.0.40), rbibutils(v.2.2.15), S4Arrays(v.1.0.6), mime(v.0.12), tidygraph(v.1.2.3), survival(v.3.5-7), iterators(v.1.0.14), ellipsis(v.0.3.2), nlme(v.3.1-163), pbkrtest(v.0.5.2), ggtree(v.3.8.2), usethis(v.2.2.2), bit64(v.4.0.5), progress(v.1.2.2), EnvStats(v.2.8.1), filelock(v.1.0.2), rprojroot(v.2.0.3), bslib(v.0.5.1), KernSmooth(v.2.23-22), colorspace(v.2.1-0), DBI(v.1.2.0), DESeq2(v.1.40.2), tidyselect(v.1.2.0), processx(v.3.8.2), bit(v.4.0.5), compiler(v.4.3.1), curl(v.5.2.0), graph(v.1.78.0), xml2(v.1.3.5), desc(v.1.4.2), 
DelayedArray(v.0.26.7), plotly(v.4.10.2), shadowtext(v.0.1.2), rtracklayer(v.1.60.1), scales(v.1.2.1), caTools(v.1.18.2), remaCor(v.0.0.16), callr(v.3.7.3), rappdirs(v.0.3.3), stringr(v.1.5.0), digest(v.0.6.33), minqa(v.1.2.6), variancePartition(v.1.30.2), rmarkdown(v.2.25), aod(v.1.3.2), XVector(v.0.42.0), RhpcBLASctl(v.0.23-42), htmltools(v.0.5.6), pkgconfig(v.2.0.3), lme4(v.1.1-34), dbplyr(v.2.3.4), fastmap(v.1.1.1), rlang(v.1.1.2), htmlwidgets(v.1.6.2), shiny(v.1.7.5), farver(v.2.1.1), jquerylib(v.0.1.4), jsonlite(v.1.8.8), BiocParallel(v.1.34.2), GOSemSim(v.2.26.1), RCurl(v.1.98-1.13), magrittr(v.2.0.3), GenomeInfoDbData(v.1.2.11), ggplotify(v.0.1.2), patchwork(v.1.1.3), munsell(v.0.5.0), Rcpp(v.1.0.11), ape(v.5.7-1), viridis(v.0.6.4), stringi(v.1.7.12), ggraph(v.2.1.0), brio(v.1.1.3), zlibbioc(v.1.48.0), MASS(v.7.3-60), plyr(v.1.8.9), pkgbuild(v.1.4.2), parallel(v.4.3.1), ggrepel(v.0.9.3), forcats(v.1.0.0), Biostrings(v.2.70.1), graphlayouts(v.1.0.1), splines(v.4.3.1), pander(v.0.6.5), hms(v.1.1.3), locfit(v.1.5-9.8), ps(v.1.7.5), fastcluster(v.1.2.3), igraph(v.1.5.1), reshape2(v.1.4.4), biomaRt(v.2.56.1), pkgload(v.1.3.3), XML(v.3.99-0.14), evaluate(v.0.22), nloptr(v.2.0.3), PROPER(v.1.32.0), foreach(v.1.5.2), tweenr(v.2.0.2), httpuv(v.1.6.11), tidyr(v.1.3.0), purrr(v.1.0.2), polyclip(v.1.10-6), ggplot2(v.3.4.3), ggforce(v.0.4.1), broom(v.1.0.5), xtable(v.1.8-4), restfulr(v.0.0.15), tidytree(v.0.4.5), later(v.1.3.1), viridisLite(v.0.4.2), tibble(v.3.2.1), clusterProfiler(v.4.8.3), aplot(v.0.2.1), memoise(v.2.0.1), AnnotationDbi(v.1.64.1), GenomicAlignments(v.1.36.0), sva(v.3.48.0) and GSEABase(v.1.62.0)

# Report the hpgltools commit used for this build.
message(paste0("This is hpgltools commit: ", get_git_commit()))
## If you wish to reproduce this exact build of hpgltools, invoke the following:
## > git clone http://github.com/abelew/hpgltools.git
## > git reset 996769878223fb869c8fa3e1496bffec3a7de7f6
## This is hpgltools commit: Mon Jan 8 16:36:00 2024 -0500: 996769878223fb869c8fa3e1496bffec3a7de7f6
# NOTE(review): the message announces a save, but the saveme() call below is
# commented out and loadme() runs instead -- confirm this is intentional.
message(paste0("Saving to ", savefile))
## Saving to 03differential_expression.rda.xz
##  tmp <- sm(saveme(filename = savefile))
tmp <- loadme(filename = savefile)
