1 Annotation version: 20180822

1.1 Genome annotation input

There are a few methods of importing annotation data into R. The following are two attempts, the second is currently being used in these analyses.

1.1.1 AnnotationHub

AnnotationHub is a newer service and has promise to be an excellent top-level resource for gathering annotation data.

tt <- sm(library(AnnotationHub))
ah <- AnnotationHub()

## snapshotDate(): 2020-04-27

orgdbs <- query(ah, "OrgDB")
annot_lm <- query(ah, c("OrgDB", "Friedlin"))
lm_name <- names(annot_lm)
annot_lm <- annot_lm[[lm_name[[2]]]]

## downloading 1 resources

## retrieving 1 resource

## loading from cache

## Loading required package: AnnotationDbi

## Loading required package: stats4

## Loading required package: IRanges

## Loading required package: S4Vectors

## 
## Attaching package: 'S4Vectors'

## The following object is masked from 'package:base':
## 
##     expand.grid

txtdbs <- query(ah, "TxDb")

## AH48429 appears to be panamensis
##annot_lp <- annot_lp[["AH48429"]]
annot_lp <- query(ah, c("OrgDB", "panamensis"))
lp_name <- names(annot_lp)
annot_lp <- annot_lp[[lp_name[[2]]]]

## downloading 1 resources

## retrieving 1 resource

## loading from cache

1.2 OrganismDb

Since this document was originally written, I have made substantial changes to how I create, load, and manipulate the eupathdb annotation data. As a result, this needs to be significantly reworked.

AnnotationHub is the new and fancier version of what OrganismDb does. Keith already made these for the parasites though, lets try and use one of those.

testing_panamensis <- make_eupath_organismdbi("panamensis")
testing_braziliensis <- make_eupath_organismdbi("braziliensis")
testing_donovani <- make_eupath_organismdbi("donovani")
testing_mexicana <- make_eupath_organismdbi("mexicana")
testing_major <- make_eupath_organismdbi("major")
testing_crith <- make_eupath_organismdbi("Crithidia")

Assuming the above packages got created, we may load them and extract the annotation data.

major_names <- get_eupath_pkgnames("major")

## Error in get_eupath_pkgnames("major"): could not find function "get_eupath_pkgnames"

major_names$orgdb

## Error in eval(expr, envir, enclos): object 'major_names' not found

wanted_fields <- c("cds_length", "chromosome", "entrez_gene_id" , "gene_name_or_symbol",
                   "gene_strand", "gid", "go_go_id", "go_go_term_name", "go_ontology",
                   "interpro_description" ,"interpro_e_value", "type_gene_type")


lm_org <- load_orgdb_annotations(major_names$orgdb, keytype="gid", fields=wanted_fields)

## Error in load_orgdb_annotations(major_names$orgdb, keytype = "gid", fields = wanted_fields): object 'major_names' not found

panamensis_names <- get_eupath_pkgnames("panamensis")

## Error in get_eupath_pkgnames("panamensis"): could not find function "get_eupath_pkgnames"

panamensis_names$orgdb

## Error in eval(expr, envir, enclos): object 'panamensis_names' not found

lp_org <- load_orgdb_annotations(panamensis_names$orgdb, keytype="gid", fields=wanted_fields)

## Error in load_orgdb_annotations(panamensis_names$orgdb, keytype = "gid", : object 'panamensis_names' not found

braziliensis_names <- get_eupath_pkgnames("braziliensis")

## Error in get_eupath_pkgnames("braziliensis"): could not find function "get_eupath_pkgnames"

braziliensis_names$orgdb

## Error in eval(expr, envir, enclos): object 'braziliensis_names' not found

lb_org <- load_orgdb_annotations(braziliensis_names$orgdb, keytype="gid", fields=wanted_fields)

## Error in load_orgdb_annotations(braziliensis_names$orgdb, keytype = "gid", : object 'braziliensis_names' not found

donovani_names <- get_eupath_pkgnames("donovani")

## Error in get_eupath_pkgnames("donovani"): could not find function "get_eupath_pkgnames"

donovani_names$orgdb

## Error in eval(expr, envir, enclos): object 'donovani_names' not found

ld_org <- load_orgdb_annotations(donovani_names$orgdb, keytype="gid", fields=wanted_fields)

## Error in load_orgdb_annotations(donovani_names$orgdb, keytype = "gid", : object 'donovani_names' not found

mexicana_names <- get_eupath_pkgnames("mexicana")

## Error in get_eupath_pkgnames("mexicana"): could not find function "get_eupath_pkgnames"

mexicana_names$orgdb

## Error in eval(expr, envir, enclos): object 'mexicana_names' not found

lmex_org <- load_orgdb_annotations(mexicana_names$orgdb, keytype="gid", fields=wanted_fields)

## Error in load_orgdb_annotations(mexicana_names$orgdb, keytype = "gid", : object 'mexicana_names' not found

fasciculata_names <- get_eupath_pkgnames("rithidia")

## Error in get_eupath_pkgnames("rithidia"): could not find function "get_eupath_pkgnames"

fasciculata_names$orgdb

## Error in eval(expr, envir, enclos): object 'fasciculata_names' not found

cf_org <- load_orgdb_annotations(fasciculata_names$orgdb, keytype="gid", fields=wanted_fields)

## Error in load_orgdb_annotations(fasciculata_names$orgdb, keytype = "gid", : object 'fasciculata_names' not found

1.3 Read a gff file

In contrast, it is possible to load most annotations of interest directly from the gff files used in the alignments. More in-depth information for the human transcriptome may be extracted from biomart.

## The old way of getting genome/annotation data
lp_gff <- "reference/lpanamensis.gff"
lb_gff <- "reference/lbraziliensis.gff"
hs_gff <- "reference/hsapiens.gtf"

lp_fasta <- "reference/lpanamensis.fasta.xz"
lb_fasta <- "reference/lbraziliensis.fasta.xz"
hs_fasta <- "reference/hsapiens.fasta.xz"

lp_annotations <- sm(load_gff_annotations(lp_gff, type="gene"))
rownames(lp_annotations) <- paste0("exon_", lp_annotations$web_id, ".1")

lb_annotations <- sm(load_gff_annotations(lb_gff, type="gene"))
hs_gff_annot <- sm(load_gff_annotations(hs_gff, id_col="gene_id"))

hs_annotations <- sm(load_biomart_annotations())$annotation
hs_annotations$ID <- hs_annotations$geneID
rownames(hs_annotations) <- make.names(hs_annotations[["ensembl_gene_id"]], unique=TRUE)

1.4 Getting ontology data

## Try using biomart
hs_go_biomart <- sm(load_biomart_go())
## or the org.Hs.eg.db sqlite database
tt <- sm(library("Homo.sapiens"))
hs <- Homo.sapiens
##hs_go_ensembl <- load_orgdb_go(hs, hs_annotations$geneID)
##dim(hs_go_biomart)
##dim(hs_go_ensembl)
##hs_goids <- hs_go_biomart

## While testing, I called this desc, that will need to change.
##lp_tooltips <- make_tooltips(lp_annotations)
##lb_tooltips <- make_tooltips(lb_annotations)

lp_lengths <- lp_annotations[, c("ID", "width")]
lb_lengths <- lb_annotations[, c("ID", "width")]
hs_lengths <- hs_annotations[, c("geneID", "length")]

## Error in `[.data.frame`(hs_annotations, , c("geneID", "length")): undefined columns selected

lp_goids <- read.csv(file="reference/lpan_go.txt.xz", sep="\t", header=FALSE)
lb_goids <- read.csv(file="reference/lbraz_go.txt.xz", sep="\t", header=FALSE)
colnames(lp_goids) <- c("ID","GO","ont","name","source","tag")
colnames(lb_goids) <- c("ID","GO","ont","name","source","tag")

2 Putting the pieces together

The macrophage experiment has samples across 2 contexts, the host and parasite. The following block sets up one experiment for each. If you open the all_samples-species.xlsx files, you will note immediately that a few different attempts were made at ascertaining the most likely experimental factors that contributed to the readily apparent batch effects.

2.1 The human transcriptome mappings

Keep in mind that if I change the experimental design with new annotations, I must therefore regenerate the following.

hs_final_annotations <- hs_annotations
hs_final_annotations <- hs_final_annotations[, c("ensembl_transcript_id", "ensembl_gene_id",
                                                 "hgnc_symbol", "description", "gene_biotype")]
note <- "New experimental design factors by snp added 2016-09-20"

hs_expt <- create_expt("sample_sheets/all_samples-combined.xlsx",
                       gene_info=hs_final_annotations,
                       file_column="humanfile",
                       notes=note)

## Reading the sample metadata.

## Dropped 1 rows from the sample metadata because they were blank.

## The sample definitions comprises: 50 rows(samples) and 56 columns(metadata fields).

## Reading count tables.

## Reading count files with read.table().

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0241/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0242/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0243/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0244/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0245/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0246/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0247/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0248/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0315/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0316/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0317/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0318/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0319/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0320/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0321/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0322/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0630/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0631/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0632/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0633/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0634/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0635/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0636/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0637/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0638/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0639/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0640/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0641/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0642/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0643/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0644/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0645/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0646/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0647/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0648/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0649/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0650/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0651/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0652/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0653/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0654/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0655/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0656/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0657/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0658/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0659/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0660/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0661/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0662/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## /mnt/sshfs/cbcbsub01/fs/cbcb-lab/nelsayed/scratch/atb/rnaseq/lpanamensis_2016/preprocessing/hpgl0663/outputs/tophat_hsapiens/accepted_paired.count.xz contains 51046 rows and merges to 51046 rows.

## Finished reading count data.

## Matched 43897 annotations and counts.

## Bringing together the count matrix and gene information.

## Some annotations were lost in merging, setting them to 'undefined'.

## Saving the expressionset to 'expt.rda'.

## The final expressionset has 51041 rows and 50 columns.

head(hs_expt$design, n=1)

##          sampleid pathogenstrain experimentname              tubelabel alias
## HPGL0241 HPGL0241           none     macrophage TM130-Nil (Blue label)   Nil
##          condition batch anotherbatch snpclade snpcladev2 snpcladev3
## HPGL0241     uninf     a            a    undef      undef      undef
##          pathogenstrain1   label donor  time pctmappedparasite pctcategory
## HPGL0241            none uninf_1  d130 undef             undef           0
##               state sourcelab expperson pathogen  host hostcelltype
## HPGL0241 uninfected       Ade   Adriana     none Human   Human macs
##          noofhostcells infectionperiodhpitimeofharvest moiexposure
## HPGL0241    Max 2 mill           2h - 24h chase period        <NA>
##          parasitespercell  pctinf rnangul rnaqcpassed libraryconst libqcpassed
## HPGL0241          unknown unknown     468           Y    Wanderson           Y
##          index         descriptonandremarks observation lowercaseid
## HPGL0241     1 Uninfected human macrophages        <NA>    hpgl0241
##                                                                        humanfile
## HPGL0241 preprocessing/hpgl0241/outputs/tophat_hsapiens/accepted_paired.count.xz
##          parasitefile bcftable salmonreads hssalmonmapped hssalmonmaprate
## HPGL0241        undef    undef    46628648       26156539           0.561
##          lpsalmonmapped lpsalmonmaprate tophatpairs hstophataligned hstophatpct
## HPGL0241             NA              NA    46319335        40905961      0.8831
##          hstophatmulti hstophatdiscordant hstophatconcordantpct lptophataligned
## HPGL0241       1374099            1430888                0.8522              NA
##          lptophatpct lptophatmulti lptophatdiscordant lpconcordantpct
## HPGL0241          NA            NA                 NA              NA
##          variantpositions file
## HPGL0241               NA null

cds_entries <- fData(hs_expt)
cds_entries <- cds_entries[["Type"]] == "protein_coding"
hs_cds_expt <- hs_expt
hs_cds_expt$expressionset <- hs_cds_expt$expressionset[cds_entries, ]
new_cds_entries <- fData(hs_cds_expt)

2.2 The parasite transcriptome mappings

parasite_expt <- sm(create_expt("sample_sheets/all_samples-combined.xlsx",
                             gene_info=lp_annotations, file_column="parasitefile"))
head(parasite_expt$design, n=3)

##          sampleid pathogenstrain experimentname  tubelabel        alias
## HPGL0242 HPGL0242          s2271     macrophage TM130-2271 Self-Healing
## HPGL0243 HPGL0243          s2272     macrophage TM130-2272 Self-Healing
## HPGL0244 HPGL0244          s5433     macrophage TM130-5433      Chronic
##          condition batch anotherbatch  snpclade snpcladev2 snpcladev3
## HPGL0242        sh     a            a     white  whitepink      right
## HPGL0243        sh     a            a     white  whitepink      right
## HPGL0244       chr     a            a blue_self       blue       left
##          pathogenstrain1    label donor  time pctmappedparasite pctcategory
## HPGL0242           s2271  sh_2271  d130 undef                30           3
## HPGL0243           s2272  sh_2272  d130 undef                30           3
## HPGL0244           s5433 chr_5433  d130 undef                15           1
##              state sourcelab expperson pathogen  host hostcelltype
## HPGL0242 self_heal       Ade   Adriana       Lp Human   Human macs
## HPGL0243 self_heal       Ade   Adriana       Lp Human   Human macs
## HPGL0244   chronic       Ade   Adriana       Lp Human   Human macs
##          noofhostcells infectionperiodhpitimeofharvest        moiexposure
## HPGL0242    Max 2 mill           2h - 24h chase period 0.0486111111111111
## HPGL0243    Max 2 mill           2h - 24h chase period 0.0486111111111111
## HPGL0244    Max 2 mill           2h - 24h chase period 0.0486111111111111
##          parasitespercell  pctinf rnangul rnaqcpassed libraryconst libqcpassed
## HPGL0242          unknown unknown     276           Y    Wanderson           Y
## HPGL0243          unknown unknown     532           Y    Wanderson           Y
## HPGL0244          unknown unknown     261           Y    Wanderson           Y
##          index        descriptonandremarks observation lowercaseid
## HPGL0242     8 Infected human macrophages.        <NA>    hpgl0242
## HPGL0243    10  Infected human macrophages        <NA>    hpgl0243
## HPGL0244    27  Infected human macrophages        <NA>    hpgl0244
##                                                                        humanfile
## HPGL0242 preprocessing/hpgl0242/outputs/tophat_hsapiens/accepted_paired.count.xz
## HPGL0243 preprocessing/hpgl0243/outputs/tophat_hsapiens/accepted_paired.count.xz
## HPGL0244 preprocessing/hpgl0244/outputs/tophat_hsapiens/accepted_paired.count.xz
##                                                                        parasitefile
## HPGL0242 preprocessing/hpgl0242/outputs/tophat_lpanamensis/accepted_paired.count.xz
## HPGL0243 preprocessing/hpgl0243/outputs/tophat_lpanamensis/accepted_paired.count.xz
## HPGL0244 preprocessing/hpgl0244/outputs/tophat_lpanamensis/accepted_paired.count.xz
##                                                 bcftable salmonreads
## HPGL0242 preprocessing/outputs/hpgl0242_parsed_count.txt    42742857
## HPGL0243 preprocessing/outputs/hpgl0243_parsed_count.txt    46796079
## HPGL0244 preprocessing/outputs/hpgl0244_parsed_count.txt    47150925
##          hssalmonmapped hssalmonmaprate lpsalmonmapped lpsalmonmaprate
## HPGL0242       17945935          0.4199        8023463         0.18771
## HPGL0243       21046460          0.4497        6823750         0.14582
## HPGL0244       25281958          0.5362        3761371         0.07977
##          tophatpairs hstophataligned hstophatpct hstophatmulti
## HPGL0242    42612353        25394266      0.5959        869649
## HPGL0243    47344642        31160297      0.6582       1000248
## HPGL0244    46925604        36379602      0.7753       1070964
##          hstophatdiscordant hstophatconcordantpct lptophataligned lptophatpct
## HPGL0242             784620                0.5775        13117819      0.3078
## HPGL0243             924296                0.6386        11581460      0.2446
## HPGL0244             991929                0.7541         5755998      0.1227
##          lptophatmulti lptophatdiscordant lpconcordantpct variantpositions file
## HPGL0242        350277             263923          0.3016             3930 null
## HPGL0243        319338             245169          0.2394               NA null
## HPGL0244        154830             116414          0.1202            85981 null

3 Supplemental Table 1

Table S1 is going to be a summary of the metadata in all_samples-combined This may also include some of the numbers regarding mapping %, etc.

Wanted columns: * Sample ID: HPGLxxxx * Donor Code: TM130 or PG1xx * Cell Type: Macrophage or PBMC * Infection Status: Infected or Uninfected * Disease Outcome: Chronic or Self-Healing or NA * Batch: A or B (macrophage); NA for PBMC * Number of reads that passed Illumina filter * Number of reads after trimming * Number of reads mapped - human * % reads mapped - human * Number of reads mapped - L.panamensis * % reads mapped - L.panamensis

Use the Tcruzi colors. * A1 is a large title: “Macrophage Samples” * Row 2 is the blue column headings * 3-m contains Macrophage metadata * m+1 is blank * m+2 is a large title: “PBMC Samples” * m+3-n contains PBMC metadata

4 End

At this point, we should have everything necessary to perform the various analyses of the 4 sub-experiments. So save the current data for reuse elsewhere.

The experimental design is available here.

if (!isTRUE(get0("skip_load"))) {
  pander::pander(sessionInfo())
  message(paste0("This is hpgltools commit: ", get_git_commit()))
  this_save <- paste0(gsub(pattern="\\.Rmd", replace="", x=rmd_file), "-v", ver, ".rda.xz")
  message(paste0("Saving to ", this_save))
  tmp <- sm(saveme(filename=this_save))
}

## If you wish to reproduce this exact build of hpgltools, invoke the following:

## > git clone http://github.com/abelew/hpgltools.git

## > git reset 71e9e0510e6a865fc024d8cf57090f2f02602a35

## This is hpgltools commit: Fri Jun 26 13:06:16 2020 -0400: 71e9e0510e6a865fc024d8cf57090f2f02602a35

## Saving to index-v20180822.rda.xz

LS0tCnRpdGxlOiAiTC5wYW5hbWVuc2lzIDIwMTY6IEFubm90YXRpb24gZGF0YS4iCmF1dGhvcjogImF0YiBhYmVsZXdAZ21haWwuY29tIgpkYXRlOiAiYHIgU3lzLkRhdGUoKWAiCm91dHB1dDoKIGh0bWxfZG9jdW1lbnQ6CiAgY29kZV9kb3dubG9hZDogdHJ1ZQogIGNvZGVfZm9sZGluZzogc2hvdwogIGZpZ19jYXB0aW9uOiB0cnVlCiAgZmlnX2hlaWdodDogNwogIGZpZ193aWR0aDogNwogIGhpZ2hsaWdodDogZGVmYXVsdAogIGtlZXBfbWQ6IGZhbHNlCiAgbW9kZTogc2VsZmNvbnRhaW5lZAogIG51bWJlcl9zZWN0aW9uczogdHJ1ZQogIHNlbGZfY29udGFpbmVkOiB0cnVlCiAgdGhlbWU6IHJlYWRhYmxlCiAgdG9jOiB0cnVlCiAgdG9jX2Zsb2F0OgogICAgY29sbGFwc2VkOiBmYWxzZQogICAgc21vb3RoX3Njcm9sbDogZmFsc2UKLS0tCgo8c3R5bGU+CiAgYm9keSAubWFpbi1jb250YWluZXIgewogICAgbWF4LXdpZHRoOiAxNjAwcHg7CiAgfQo8L3N0eWxlPgoKYGBge3Igb3B0aW9ucywgaW5jbHVkZT1GQUxTRX0KaWYgKCFpc1RSVUUoZ2V0MCgic2tpcF9sb2FkIikpKSB7CiAgbGlicmFyeShocGdsdG9vbHMpCiAgdHQgPC0gZGV2dG9vbHM6OmxvYWRfYWxsKCIvZGF0YS9ocGdsdG9vbHMiKQogIGtuaXRyOjpvcHRzX2tuaXQkc2V0KHByb2dyZXNzPVRSVUUsCiAgICAgICAgICAgICAgICAgICAgICAgdmVyYm9zZT1UUlVFLAogICAgICAgICAgICAgICAgICAgICAgIHdpZHRoPTkwLAogICAgICAgICAgICAgICAgICAgICAgIGVjaG89VFJVRSkKICBrbml0cjo6b3B0c19jaHVuayRzZXQoZXJyb3I9VFJVRSwKICAgICAgICAgICAgICAgICAgICAgICAgZmlnLndpZHRoPTgsCiAgICAgICAgICAgICAgICAgICAgICAgIGZpZy5oZWlnaHQ9OCwKICAgICAgICAgICAgICAgICAgICAgICAgZHBpPTk2KQogIG9sZF9vcHRpb25zIDwtIG9wdGlvbnMoZGlnaXRzPTQsCiAgICAgICAgICAgICAgICAgICAgICAgICBzdHJpbmdzQXNGYWN0b3JzPUZBTFNFLAogICAgICAgICAgICAgICAgICAgICAgICAga25pdHIuZHVwbGljYXRlLmxhYmVsPSJhbGxvdyIpCiAgZ2dwbG90Mjo6dGhlbWVfc2V0KGdncGxvdDI6OnRoZW1lX2J3KGJhc2Vfc2l6ZT0xMCkpCiAgdmVyIDwtICIyMDE4MDgyMiIKICBwcmV2aW91c19maWxlIDwtICJpbmRleC5SbWQiCgogIHRtcCA8LSB0cnkoc20obG9hZG1lKGZpbGVuYW1lPXBhc3RlMChnc3ViKHBhdHRlcm49IlxcLlJtZCIsIHJlcGxhY2U9IiIsIHg9cHJldmlvdXNfZmlsZSksICItdiIsIHZlciwgIi5yZGEueHoiKSkpKQogIHJtZF9maWxlIDwtICJpbmRleC5SbWQiCn0KYGBgCgojIEFubm90YXRpb24gdmVyc2lvbjogYHIgdmVyYAoKIyMgR2Vub21lIGFubm90YXRpb24gaW5wdXQKClRoZXJlIGFyZSBhIGZldyBtZXRob2RzIG9mIGltcG9ydGluZyBhbm5vdGF0aW9uIGRhdGEgaW50byBSLiAgVGhlIGZvbGxvd2luZyBhcmUgdHdvIGF0dGVtcHRzLCB0aGUKc2Vjb25kIGlzIGN1cnJlbnRseSBiZWluZyB1c2VkIGluIHRoZXNlIGFuYWx5c2VzLgoKIyMjIEFubm90YXRpb25IdWIKCkFubm90YXRpb25IdWIgaXMgYSBuZXdlciBzZXJ2aWNlIGFuZCBoYXMgcHJvbWlzZSB0byBiZSBhbiBleGNlbGxlbnQgdG9wLWxldmVsIHJlc291cmNlIGZvciBnYXRoZXJpbmcKYW5ub3RhdGlvbiBkYXRhLgoKYGBge3IgZGF0YV9pbnB1dF9nZW5vbWV9CnR0IDwtIHNtKGxpYnJhcnkoQW5ub3RhdGlvbkh1YikpCmFoIDwtIEFubm90YXRpb25IdWIoKQpvcmdkYnMgPC0gcXVlcnkoYWgsICJPcmdEQiIpCmFubm90X2xtIDwtIHF1ZXJ5KGFoLCBjKCJPcmdEQiIsICJGcmllZGxpbiIpKQpsbV9uYW1lIDwtIG5hbWVzKGFubm90X2xtKQphbm5vdF9sbSA8LSBhbm5vdF9sbVtbbG1fbmFtZVtbMl1dXV0KdHh0ZGJzIDwtIHF1ZXJ5KGFoLCAiVHhEYiIpCgojIyBBSDQ4NDI5IGFwcGVhcnMgdG8gYmUgcGFuYW1lbnNpcwojI2Fubm90X2xwIDwtIGFubm90X2xwW1siQUg0ODQyOSJdXQphbm5vdF9scCA8LSBxdWVyeShhaCwgYygiT3JnREIiLCAicGFuYW1lbnNpcyIpKQpscF9uYW1lIDwtIG5hbWVzKGFubm90X2xwKQphbm5vdF9scCA8LSBhbm5vdF9scFtbbHBfbmFtZVtbMl1dXV0KYGBgCgojIyBPcmdhbmlzbURiCgpTaW5jZSB0aGlzIGRvY3VtZW50IHdhcyBvcmlnaW5hbGx5IHdyaXR0ZW4sIEkgaGF2ZSBtYWRlIHN1YnN0YW50aWFsIGNoYW5nZXMgdG8KaG93IEkgY3JlYXRlLCBsb2FkLCBhbmQgbWFuaXB1bGF0ZSB0aGUgZXVwYXRoZGIgYW5ub3RhdGlvbiBkYXRhLiAgQXMgYSByZXN1bHQsCnRoaXMgbmVlZHMgdG8gYmUgc2lnbmlmaWNhbnRseSByZXdvcmtlZC4KCkFubm90YXRpb25IdWIgaXMgdGhlIG5ldyBhbmQgZmFuY2llciB2ZXJzaW9uIG9mIHdoYXQgT3JnYW5pc21EYiBkb2VzLiAgS2VpdGggYWxyZWFkeQptYWRlIHRoZXNlIGZvciB0aGUgcGFyYXNpdGVzIHRob3VnaCwgbGV0cyB0cnkgYW5kIHVzZSBvbmUgb2YgdGhvc2UuCgpgYGB7ciBtYWtlX29yZ2RiLCBldmFsPUZBTFNFfQp0ZXN0aW5nX3BhbmFtZW5zaXMgPC0gbWFrZV9ldXBhdGhfb3JnYW5pc21kYmkoInBhbmFtZW5zaXMiKQp0ZXN0aW5nX2JyYXppbGllbnNpcyA8LSBtYWtlX2V1cGF0aF9vcmdhbmlzbWRiaSgiYnJhemlsaWVuc2lzIikKdGVzdGluZ19kb25vdmFuaSA8LSBtYWtlX2V1cGF0aF9vcmdhbmlzbWRiaSgiZG9ub3ZhbmkiKQp0ZXN0aW5nX21leGljYW5hIDwtIG1ha2VfZXVwYXRoX29yZ2FuaXNtZGJpKCJtZXhpY2FuYSIpCnRlc3RpbmdfbWFqb3IgPC0gbWFrZV9ldXBhdGhfb3JnYW5pc21kYmkoIm1ham9yIikKdGVzdGluZ19jcml0aCA8LSBtYWtlX2V1cGF0aF9vcmdhbmlzbWRiaSgiQ3JpdGhpZGlhIikKYGBgCgpBc3N1bWluZyB0aGUgYWJvdmUgcGFja2FnZXMgZ290IGNyZWF0ZWQsIHdlIG1heSBsb2FkIHRoZW0gYW5kIGV4dHJhY3QgdGhlIGFubm90YXRpb24gZGF0YS4KCmBgYHtyIGxwYW5hbWVuc2lzX29yZ2RifQptYWpvcl9uYW1lcyA8LSBnZXRfZXVwYXRoX3BrZ25hbWVzKCJtYWpvciIpCm1ham9yX25hbWVzJG9yZ2RiCgp3YW50ZWRfZmllbGRzIDwtIGMoImNkc19sZW5ndGgiLCAiY2hyb21vc29tZSIsICJlbnRyZXpfZ2VuZV9pZCIgLCAiZ2VuZV9uYW1lX29yX3N5bWJvbCIsCiAgICAgICAgICAgICAgICAgICAiZ2VuZV9zdHJhbmQiLCAiZ2lkIiwgImdvX2dvX2lkIiwgImdvX2dvX3Rlcm1fbmFtZSIsICJnb19vbnRvbG9neSIsCiAgICAgICAgICAgICAgICAgICAiaW50ZXJwcm9fZGVzY3JpcHRpb24iICwiaW50ZXJwcm9fZV92YWx1ZSIsICJ0eXBlX2dlbmVfdHlwZSIpCgoKbG1fb3JnIDwtIGxvYWRfb3JnZGJfYW5ub3RhdGlvbnMobWFqb3JfbmFtZXMkb3JnZGIsIGtleXR5cGU9ImdpZCIsIGZpZWxkcz13YW50ZWRfZmllbGRzKQoKcGFuYW1lbnNpc19uYW1lcyA8LSBnZXRfZXVwYXRoX3BrZ25hbWVzKCJwYW5hbWVuc2lzIikKcGFuYW1lbnNpc19uYW1lcyRvcmdkYgpscF9vcmcgPC0gbG9hZF9vcmdkYl9hbm5vdGF0aW9ucyhwYW5hbWVuc2lzX25hbWVzJG9yZ2RiLCBrZXl0eXBlPSJnaWQiLCBmaWVsZHM9d2FudGVkX2ZpZWxkcykKCmJyYXppbGllbnNpc19uYW1lcyA8LSBnZXRfZXVwYXRoX3BrZ25hbWVzKCJicmF6aWxpZW5zaXMiKQpicmF6aWxpZW5zaXNfbmFtZXMkb3JnZGIKbGJfb3JnIDwtIGxvYWRfb3JnZGJfYW5ub3RhdGlvbnMoYnJhemlsaWVuc2lzX25hbWVzJG9yZ2RiLCBrZXl0eXBlPSJnaWQiLCBmaWVsZHM9d2FudGVkX2ZpZWxkcykKCmRvbm92YW5pX25hbWVzIDwtIGdldF9ldXBhdGhfcGtnbmFtZXMoImRvbm92YW5pIikKZG9ub3ZhbmlfbmFtZXMkb3JnZGIKbGRfb3JnIDwtIGxvYWRfb3JnZGJfYW5ub3RhdGlvbnMoZG9ub3ZhbmlfbmFtZXMkb3JnZGIsIGtleXR5cGU9ImdpZCIsIGZpZWxkcz13YW50ZWRfZmllbGRzKQoKbWV4aWNhbmFfbmFtZXMgPC0gZ2V0X2V1cGF0aF9wa2duYW1lcygibWV4aWNhbmEiKQptZXhpY2FuYV9uYW1lcyRvcmdkYgpsbWV4X29yZyA8LSBsb2FkX29yZ2RiX2Fubm90YXRpb25zKG1leGljYW5hX25hbWVzJG9yZ2RiLCBrZXl0eXBlPSJnaWQiLCBmaWVsZHM9d2FudGVkX2ZpZWxkcykKCmZhc2NpY3VsYXRhX25hbWVzIDwtIGdldF9ldXBhdGhfcGtnbmFtZXMoInJpdGhpZGlhIikKZmFzY2ljdWxhdGFfbmFtZXMkb3JnZGIKY2Zfb3JnIDwtIGxvYWRfb3JnZGJfYW5ub3RhdGlvbnMoZmFzY2ljdWxhdGFfbmFtZXMkb3JnZGIsIGtleXR5cGU9ImdpZCIsIGZpZWxkcz13YW50ZWRfZmllbGRzKQpgYGAKCiMjIFJlYWQgYSBnZmYgZmlsZQoKSW4gY29udHJhc3QsIGl0IGlzIHBvc3NpYmxlIHRvIGxvYWQgbW9zdCBhbm5vdGF0aW9ucyBvZiBpbnRlcmVzdCBkaXJlY3RseSBmcm9tIHRoZSBnZmYgZmlsZXMgdXNlZCBpbgp0aGUgYWxpZ25tZW50cy4gIE1vcmUgaW4tZGVwdGggaW5mb3JtYXRpb24gZm9yIHRoZSBodW1hbiB0cmFuc2NyaXB0b21lIG1heSBiZSBleHRyYWN0ZWQgZnJvbSBiaW9tYXJ0LgoKYGBge3IgZ2Vub21lX2lucHV0fQojIyBUaGUgb2xkIHdheSBvZiBnZXR0aW5nIGdlbm9tZS9hbm5vdGF0aW9uIGRhdGEKbHBfZ2ZmIDwtICJyZWZlcmVuY2UvbHBhbmFtZW5zaXMuZ2ZmIgpsYl9nZmYgPC0gInJlZmVyZW5jZS9sYnJhemlsaWVuc2lzLmdmZiIKaHNfZ2ZmIDwtICJyZWZlcmVuY2UvaHNhcGllbnMuZ3RmIgoKbHBfZmFzdGEgPC0gInJlZmVyZW5jZS9scGFuYW1lbnNpcy5mYXN0YS54eiIKbGJfZmFzdGEgPC0gInJlZmVyZW5jZS9sYnJhemlsaWVuc2lzLmZhc3RhLnh6Igpoc19mYXN0YSA8LSAicmVmZXJlbmNlL2hzYXBpZW5zLmZhc3RhLnh6IgoKbHBfYW5ub3RhdGlvbnMgPC0gc20obG9hZF9nZmZfYW5ub3RhdGlvbnMobHBfZ2ZmLCB0eXBlPSJnZW5lIikpCnJvd25hbWVzKGxwX2Fubm90YXRpb25zKSA8LSBwYXN0ZTAoImV4b25fIiwgbHBfYW5ub3RhdGlvbnMkd2ViX2lkLCAiLjEiKQoKbGJfYW5ub3RhdGlvbnMgPC0gc20obG9hZF9nZmZfYW5ub3RhdGlvbnMobGJfZ2ZmLCB0eXBlPSJnZW5lIikpCmhzX2dmZl9hbm5vdCA8LSBzbShsb2FkX2dmZl9hbm5vdGF0aW9ucyhoc19nZmYsIGlkX2NvbD0iZ2VuZV9pZCIpKQoKaHNfYW5ub3RhdGlvbnMgPC0gc20obG9hZF9iaW9tYXJ0X2Fubm90YXRpb25zKCkpJGFubm90YXRpb24KaHNfYW5ub3RhdGlvbnMkSUQgPC0gaHNfYW5ub3RhdGlvbnMkZ2VuZUlECnJvd25hbWVzKGhzX2Fubm90YXRpb25zKSA8LSBtYWtlLm5hbWVzKGhzX2Fubm90YXRpb25zW1siZW5zZW1ibF9nZW5lX2lkIl1dLCB1bmlxdWU9VFJVRSkKYGBgCgojIyBHZXR0aW5nIG9udG9sb2d5IGRhdGEKCmBgYHtyIG9udG9sb2d5fQojIyBUcnkgdXNpbmcgYmlvbWFydApoc19nb19iaW9tYXJ0IDwtIHNtKGxvYWRfYmlvbWFydF9nbygpKQojIyBvciB0aGUgb3JnLkhzLmVnLmRiIHNxbGl0ZSBkYXRhYmFzZQp0dCA8LSBzbShsaWJyYXJ5KCJIb21vLnNhcGllbnMiKSkKaHMgPC0gSG9tby5zYXBpZW5zCiMjaHNfZ29fZW5zZW1ibCA8LSBsb2FkX29yZ2RiX2dvKGhzLCBoc19hbm5vdGF0aW9ucyRnZW5lSUQpCiMjZGltKGhzX2dvX2Jpb21hcnQpCiMjZGltKGhzX2dvX2Vuc2VtYmwpCiMjaHNfZ29pZHMgPC0gaHNfZ29fYmlvbWFydAoKIyMgV2hpbGUgdGVzdGluZywgSSBjYWxsZWQgdGhpcyBkZXNjLCB0aGF0IHdpbGwgbmVlZCB0byBjaGFuZ2UuCiMjbHBfdG9vbHRpcHMgPC0gbWFrZV90b29sdGlwcyhscF9hbm5vdGF0aW9ucykKIyNsYl90b29sdGlwcyA8LSBtYWtlX3Rvb2x0aXBzKGxiX2Fubm90YXRpb25zKQoKbHBfbGVuZ3RocyA8LSBscF9hbm5vdGF0aW9uc1ssIGMoIklEIiwgIndpZHRoIildCmxiX2xlbmd0aHMgPC0gbGJfYW5ub3RhdGlvbnNbLCBjKCJJRCIsICJ3aWR0aCIpXQpoc19sZW5ndGhzIDwtIGhzX2Fubm90YXRpb25zWywgYygiZ2VuZUlEIiwgImxlbmd0aCIpXQoKbHBfZ29pZHMgPC0gcmVhZC5jc3YoZmlsZT0icmVmZXJlbmNlL2xwYW5fZ28udHh0Lnh6Iiwgc2VwPSJcdCIsIGhlYWRlcj1GQUxTRSkKbGJfZ29pZHMgPC0gcmVhZC5jc3YoZmlsZT0icmVmZXJlbmNlL2xicmF6X2dvLnR4dC54eiIsIHNlcD0iXHQiLCBoZWFkZXI9RkFMU0UpCmNvbG5hbWVzKGxwX2dvaWRzKSA8LSBjKCJJRCIsIkdPIiwib250IiwibmFtZSIsInNvdXJjZSIsInRhZyIpCmNvbG5hbWVzKGxiX2dvaWRzKSA8LSBjKCJJRCIsIkdPIiwib250IiwibmFtZSIsInNvdXJjZSIsInRhZyIpCmBgYAoKIyBQdXR0aW5nIHRoZSBwaWVjZXMgdG9nZXRoZXIKClRoZSBtYWNyb3BoYWdlIGV4cGVyaW1lbnQgaGFzIHNhbXBsZXMgYWNyb3NzIDIgY29udGV4dHMsIHRoZSBob3N0IGFuZCBwYXJhc2l0ZS4gIFRoZSBmb2xsb3dpbmcgYmxvY2sKc2V0cyB1cCBvbmUgZXhwZXJpbWVudCBmb3IgZWFjaC4gIElmIHlvdSBvcGVuIHRoZSBhbGxfc2FtcGxlcy1zcGVjaWVzLnhsc3ggZmlsZXMsIHlvdSB3aWxsIG5vdGUKaW1tZWRpYXRlbHkgdGhhdCBhIGZldyBkaWZmZXJlbnQgYXR0ZW1wdHMgd2VyZSBtYWRlIGF0IGFzY2VydGFpbmluZyB0aGUgbW9zdCBsaWtlbHkgZXhwZXJpbWVudGFsCmZhY3RvcnMgdGhhdCBjb250cmlidXRlZCB0byB0aGUgcmVhZGlseSBhcHBhcmVudCBiYXRjaCBlZmZlY3RzLgoKIyMgVGhlIGh1bWFuIHRyYW5zY3JpcHRvbWUgbWFwcGluZ3MKCktlZXAgaW4gbWluZCB0aGF0IGlmIEkgY2hhbmdlIHRoZSBleHBlcmltZW50YWwgZGVzaWduIHdpdGggbmV3IGFubm90YXRpb25zLCBJIG11c3QKdGhlcmVmb3JlIHJlZ2VuZXJhdGUgdGhlIGZvbGxvd2luZy4KCmBgYHtyIGhzX2V4cHR9CmhzX2ZpbmFsX2Fubm90YXRpb25zIDwtIGhzX2Fubm90YXRpb25zCmhzX2ZpbmFsX2Fubm90YXRpb25zIDwtIGhzX2ZpbmFsX2Fubm90YXRpb25zWywgYygiZW5zZW1ibF90cmFuc2NyaXB0X2lkIiwgImVuc2VtYmxfZ2VuZV9pZCIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAgICAiaGduY19zeW1ib2wiLCAiZGVzY3JpcHRpb24iLCAiZ2VuZV9iaW90eXBlIildCm5vdGUgPC0gIk5ldyBleHBlcmltZW50YWwgZGVzaWduIGZhY3RvcnMgYnkgc25wIGFkZGVkIDIwMTYtMDktMjAiCgpoc19leHB0IDwtIGNyZWF0ZV9leHB0KCJzYW1wbGVfc2hlZXRzL2FsbF9zYW1wbGVzLWNvbWJpbmVkLnhsc3giLAogICAgICAgICAgICAgICAgICAgICAgIGdlbmVfaW5mbz1oc19maW5hbF9hbm5vdGF0aW9ucywKICAgICAgICAgICAgICAgICAgICAgICBmaWxlX2NvbHVtbj0iaHVtYW5maWxlIiwKICAgICAgICAgICAgICAgICAgICAgICBub3Rlcz1ub3RlKQpoZWFkKGhzX2V4cHQkZGVzaWduLCBuPTEpCgpjZHNfZW50cmllcyA8LSBmRGF0YShoc19leHB0KQpjZHNfZW50cmllcyA8LSBjZHNfZW50cmllc1tbIlR5cGUiXV0gPT0gInByb3RlaW5fY29kaW5nIgpoc19jZHNfZXhwdCA8LSBoc19leHB0CmhzX2Nkc19leHB0JGV4cHJlc3Npb25zZXQgPC0gaHNfY2RzX2V4cHQkZXhwcmVzc2lvbnNldFtjZHNfZW50cmllcywgXQpuZXdfY2RzX2VudHJpZXMgPC0gZkRhdGEoaHNfY2RzX2V4cHQpCmBgYAoKIyMgVGhlIHBhcmFzaXRlIHRyYW5zY3JpcHRvbWUgbWFwcGluZ3MKCmBgYHtyIHBhcmFzaXRlX2V4cHR9CnBhcmFzaXRlX2V4cHQgPC0gc20oY3JlYXRlX2V4cHQoInNhbXBsZV9zaGVldHMvYWxsX3NhbXBsZXMtY29tYmluZWQueGxzeCIsCiAgICAgICAgICAgICAgICAgICAgICAgICAgICAgZ2VuZV9pbmZvPWxwX2Fubm90YXRpb25zLCBmaWxlX2NvbHVtbj0icGFyYXNpdGVmaWxlIikpCmhlYWQocGFyYXNpdGVfZXhwdCRkZXNpZ24sIG49MykKYGBgCgojIFN1cHBsZW1lbnRhbCBUYWJsZSAxCgpUYWJsZSBTMSBpcyBnb2luZyB0byBiZSBhIHN1bW1hcnkgb2YgdGhlIG1ldGFkYXRhIGluIGFsbF9zYW1wbGVzLWNvbWJpbmVkClRoaXMgbWF5IGFsc28gaW5jbHVkZSBzb21lIG9mIHRoZSBudW1iZXJzIHJlZ2FyZGluZyBtYXBwaW5nICUsIGV0Yy4KCldhbnRlZCBjb2x1bW5zOgogICogU2FtcGxlIElEOiAgSFBHTHh4eHgKICAqIERvbm9yIENvZGU6IFRNMTMwIG9yIFBHMXh4CiAgKiBDZWxsIFR5cGU6ICBNYWNyb3BoYWdlIG9yIFBCTUMKICAqIEluZmVjdGlvbiBTdGF0dXM6ICBJbmZlY3RlZCBvciBVbmluZmVjdGVkCiAgKiBEaXNlYXNlIE91dGNvbWU6ICBDaHJvbmljIG9yIFNlbGYtSGVhbGluZyBvciBOQQogICogQmF0Y2g6IEEgb3IgQiAobWFjcm9waGFnZSk7IE5BIGZvciBQQk1DCiAgKiBOdW1iZXIgb2YgcmVhZHMgdGhhdCBwYXNzZWQgSWxsdW1pbmEgZmlsdGVyCiAgKiBOdW1iZXIgb2YgcmVhZHMgYWZ0ZXIgdHJpbW1pbmcKICAqIE51bWJlciBvZiByZWFkcyBtYXBwZWQgLSBodW1hbgogICogJSByZWFkcyBtYXBwZWQgLSBodW1hbgogICogTnVtYmVyIG9mIHJlYWRzIG1hcHBlZCAtIEwucGFuYW1lbnNpcwogICogJSByZWFkcyBtYXBwZWQgLSBMLnBhbmFtZW5zaXMKCiAgVXNlIHRoZSBUY3J1emkgY29sb3JzLgogICogQTEgaXMgYSBsYXJnZSB0aXRsZTogIk1hY3JvcGhhZ2UgU2FtcGxlcyIKICAqIFJvdyAyIGlzIHRoZSBibHVlIGNvbHVtbiBoZWFkaW5ncwogICogMy1tIGNvbnRhaW5zIE1hY3JvcGhhZ2UgbWV0YWRhdGEKICAqIG0rMSBpcyBibGFuawogICogbSsyIGlzIGEgbGFyZ2UgdGl0bGU6ICJQQk1DIFNhbXBsZXMiCiAgKiBtKzMtbiBjb250YWlucyBQQk1DIG1ldGFkYXRhCgoKIyBFbmQKCkF0IHRoaXMgcG9pbnQsIHdlIHNob3VsZCBoYXZlIGV2ZXJ5dGhpbmcgbmVjZXNzYXJ5IHRvIHBlcmZvcm0gdGhlIHZhcmlvdXMgYW5hbHlzZXMgb2YgdGhlIDQgc3ViLWV4cGVyaW1lbnRzLiAgU28gc2F2ZSB0aGUgY3VycmVudCBkYXRhIGZvciByZXVzZSBlbHNld2hlcmUuCgpUaGUgZXhwZXJpbWVudGFsIGRlc2lnbiBpcyBhdmFpbGFibGUgW2hlcmVdKHNhbXBsZV9zaGVldHMvYWxsX3NhbXBsZXMtY29tYmluZWQueGxzeCIpLgoKYGBge3Igc2F2ZW1lfQppZiAoIWlzVFJVRShnZXQwKCJza2lwX2xvYWQiKSkpIHsKICBwYW5kZXI6OnBhbmRlcihzZXNzaW9uSW5mbygpKQogIG1lc3NhZ2UocGFzdGUwKCJUaGlzIGlzIGhwZ2x0b29scyBjb21taXQ6ICIsIGdldF9naXRfY29tbWl0KCkpKQogIHRoaXNfc2F2ZSA8LSBwYXN0ZTAoZ3N1YihwYXR0ZXJuPSJcXC5SbWQiLCByZXBsYWNlPSIiLCB4PXJtZF9maWxlKSwgIi12IiwgdmVyLCAiLnJkYS54eiIpCiAgbWVzc2FnZShwYXN0ZTAoIlNhdmluZyB0byAiLCB0aGlzX3NhdmUpKQogIHRtcCA8LSBzbShzYXZlbWUoZmlsZW5hbWU9dGhpc19zYXZlKSkKfQpgYGAK

L.panamensis 2016: Annotation data.

atb abelew@gmail.com

2020-07-06