% Bibliography database: palaeogenomics journal articles (four records).
%
% Layout convention: one field per line, aligned "=" signs, fields ordered
% author / title / journal / volume / number / pages / year / publisher /
% address / issn / doi / language / abstract.
%
% Clean-up applied to the repository export this file was built from:
%   * The "series" field was a verbatim copy of "journal" in every record
%     and has been dropped.
%   * Page ranges use a double hyphen without surrounding spaces.
%   * Journal titles are stored in title case without catalogue subtitles;
%     the journal with ISSN 2073-4425 is spelled "Genes" everywhere and its
%     publisher "MDPI" everywhere.
%   * Proper nouns and acronyms in titles are brace-protected so that
%     sentence-casing styles do not lowercase them.

% NOTE(review): pages = {22} looks like a page count, not a locator. The DOI
% suffix suggests article number 50 -- confirm against the publisher page
% before changing the field.
@article{BarlowHartmannGonzalezetal.2020,
  author    = {Barlow, Axel and Hartmann, Stefanie and Gonzalez, Javier and Hofreiter, Michael and Paijmans, Johanna L. A.},
  title     = {Consensify},
  journal   = {Genes},
  volume    = {11},
  number    = {1},
  pages     = {22},
  year      = {2020},
  publisher = {MDPI},
  address   = {Basel},
  issn      = {2073-4425},
  doi       = {10.3390/genes11010050},
  language  = {en},
  abstract  = {A standard practise in palaeogenome analysis is the conversion of mapped short read data into pseudohaploid sequences, frequently by selecting a single high-quality nucleotide at random from the stack of mapped reads. This controls for biases due to differential sequencing coverage, but it does not control for differential rates and types of sequencing error, which are frequently large and variable in datasets obtained from ancient samples. These errors have the potential to distort phylogenetic and population clustering analyses, and to mislead tests of admixture using D statistics. We introduce Consensify, a method for generating pseudohaploid sequences, which controls for biases resulting from differential sequencing coverage while greatly reducing error rates. The error correction is derived directly from the data itself, without the requirement for additional genomic resources or simplifying assumptions such as contemporaneous sampling. For phylogenetic and population clustering analysis, we find that Consensify is less affected by artefacts than methods based on single read sampling. For D statistics, Consensify is more resistant to false positives and appears to be less affected by biases resulting from different laboratory protocols than other frequently used methods. Although Consensify is developed with palaeogenomic data in mind, it is applicable for any low to medium coverage short read datasets. We predict that Consensify will be a useful tool for future studies of palaeogenomes.},
}

% NOTE(review): no issue number was present in the export. pages = {8} looks
% like a page count; the DOI suffix suggests article number 106691 -- confirm.
@article{YuanShengPreicketal.2020,
  author    = {Yuan, Junxia and Sheng, Guilian and Preick, Michaela and Sun, Boyang and Hou, Xindong and Chen, Shungang and Taron, Ulrike Helene and Barlow, Axel and Wang, Linying and Hu, Jiaming and Deng, Tao and Lai, Xulong and Hofreiter, Michael},
  title     = {Mitochondrial genomes of {Late} {Pleistocene} caballine horses from {China} belong to a separate clade},
  journal   = {Quaternary Science Reviews},
  volume    = {250},
  pages     = {8},
  year      = {2020},
  publisher = {Elsevier},
  address   = {Amsterdam},
  issn      = {0277-3791},
  doi       = {10.1016/j.quascirev.2020.106691},
  language  = {en},
  abstract  = {There were several species of Equus in northern China during the Late Pleistocene, including Equus przewalskii and Equus dalianensis. A number of morphological studies have been carried out on E. przewalskii and E. dalianensis, but their evolutionary history is still unresolved. In this study, we retrieved near-complete mitochondrial genomes from E. dalianensis and E. przewalskii specimens excavated from Late Pleistocene strata in northeastern China. Phylogenetic analyses revealed that caballoid horses were divided into two subclades: the New World and the Old World caballine horse subclades. The Old World caballine horses comprise of two deep phylogenetic lineages, with modern and ancient Equus caballus and modern E. przewalskii forming lineage I, and the individuals in this study together with one Yakut specimen forming lineage II. Our results indicate that Chinese Late Pleistocene caballoid horses showed a closer relationship to other Eurasian caballine horses than that to Pleistocene horses from North America. In addition, phylogenetic analyses suggested a close relationship between E. dalianensis and the Chinese fossil E. przewalskii, in agreement with previous researches based on morphological analyses. Interestingly, E. dalianensis and the fossil E. przewalskii were intermixed rather than split into distinct lineages, suggesting either that gene flow existed between these two species or that morphology-based species assignment of palaeontological specimens is not always correct. Moreover, Bayesian analysis showed that the divergence time between the New World and the Old World caballoid horses was at 1.02 Ma (95\% CI: 0.86-1.24 Ma), and the two Old World lineages (I \& II) split at 0.88 Ma (95\% CI: 0.69-1.13 Ma), which indicates that caballoid horses seem to have evolved into different populations in the Old World soon after they migrated from North America via the Bering Land Bridge. Finally, the TMRCA of E. dalianensis was estimated at 0.20 Ma (95\% CI: 0.15-0.28 Ma), and it showed a relative low genetic diversity compared with other Equus species.},
}

@article{AlbertiGonzalezPaijmansetal.2018,
  author    = {Alberti, Federica and Gonzalez, Javier and Paijmans, Johanna L. A. and Basler, Nikolas and Preick, Michaela and Henneberger, Kirstin and Trinks, Alexandra and Rabeder, Gernot and Conard, Nicholas J. and Muenzel, Susanne C. and Joger, Ulrich and Fritsch, Guido and Hildebrandt, Thomas and Hofreiter, Michael and Barlow, Axel},
  title     = {Optimized {DNA} sampling of ancient bones using Computed Tomography scans},
  journal   = {Molecular Ecology Resources},
  volume    = {18},
  number    = {6},
  pages     = {1196--1208},
  year      = {2018},
  publisher = {Wiley},
  address   = {Hoboken},
  issn      = {1755-098X},
  doi       = {10.1111/1755-0998.12911},
  language  = {en},
  abstract  = {The prevalence of contaminant microbial DNA in ancient bone samples represents the principal limiting factor for palaeogenomic studies, as it may comprise more than 99\% of DNA molecules obtained. Efforts to exclude or reduce this contaminant fraction have been numerous but also variable in their success. Here, we present a simple but highly effective method to increase the relative proportion of endogenous molecules obtained from ancient bones. Using computed tomography (CT) scanning, we identify the densest region of a bone as optimal for sampling. This approach accurately identifies the densest internal regions of petrous bones, which are known to be a source of high-purity ancient DNA. For ancient long bones, CT scans reveal a high-density outermost layer, which has been routinely removed and discarded prior to DNA extraction. For almost all long bones investigated, we find that targeted sampling of this outermost layer provides an increase in endogenous DNA content over that obtained from softer, trabecular bone. This targeted sampling can produce as much as 50-fold increase in the proportion of endogenous DNA, providing a directly proportional reduction in sequencing costs for shotgun sequencing experiments. The observed increases in endogenous DNA proportion are not associated with any reduction in absolute endogenous molecule recovery. Although sampling the outermost layer can result in higher levels of human contamination, some bones were found to have more contamination associated with the internal bone structures. Our method is highly consistent, reproducible and applicable across a wide range of bone types, ages and species. We predict that this discovery will greatly extend the potential to study ancient populations and species in the genomics era.},
}

% This record was exported twice under the same citation key and the same
% DOI. The copies differed only in journal spelling ("Genes" vs. "Genese"),
% publisher ("Molecular Diversity Preservation International" vs. "MDPI")
% and pages ("1 -- 12" vs. "12"). They are merged here: journal and page
% range follow the first copy, the publisher uses the short form found in
% the second copy and in the other Genes record of this file.
@article{TaronLellBarlowetal.2018,
  author    = {Taron, Ulrike H. and Lell, Moritz and Barlow, Axel and Paijmans, Johanna L. A.},
  title     = {Testing of Alignment Parameters for Ancient Samples},
  journal   = {Genes},
  volume    = {9},
  number    = {3},
  pages     = {1--12},
  year      = {2018},
  publisher = {MDPI},
  address   = {Basel},
  issn      = {2073-4425},
  doi       = {10.3390/genes9030157},
  language  = {en},
  abstract  = {High-throughput sequence data retrieved from ancient or other degraded samples has led to unprecedented insights into the evolutionary history of many species, but the analysis of such sequences also poses specific computational challenges. The most commonly used approach involves mapping sequence reads to a reference genome. However, this process becomes increasingly challenging with an elevated genetic distance between target and reference or with the presence of contaminant sequences with high sequence similarity to the target species. The evaluation and testing of mapping efficiency and stringency are thus paramount for the reliable identification and analysis of ancient sequences. In this paper, we present 'TAPAS', (Testing of Alignment Parameters for Ancient Samples), a computational tool that enables the systematic testing of mapping tools for ancient data by simulating sequence data reflecting the properties of an ancient dataset and performing test runs using the mapping software and parameter settings of interest. We showcase TAPAS by using it to assess and improve mapping strategy for a degraded sample from a banded linsang (Prionodon linsang), for which no closely related reference is currently available. This enables a 1.8-fold increase of the number of mapped reads without sacrificing mapping specificity. The increase of mapped reads effectively reduces the need for additional sequencing, thus making more economical use of time, resources, and sample material.},
}