@article{YuanShengPreicketal.2020, author = {Yuan, Junxia and Sheng, Guilian and Preick, Michaela and Sun, Boyang and Hou, Xindong and Chen, Shungang and Taron, Ulrike Helene and Barlow, Axel and Wang, Linying and Hu, Jiaming and Deng, Tao and Lai, Xulong and Hofreiter, Michael}, title = {Mitochondrial genomes of Late Pleistocene caballine horses from China belong to a separate clade}, series = {Quaternary science reviews : the international multidisciplinary research and review journal}, volume = {250}, journal = {Quaternary science reviews : the international multidisciplinary research and review journal}, publisher = {Elsevier}, address = {Amsterdam [u.a.]}, issn = {0277-3791}, doi = {10.1016/j.quascirev.2020.106691}, pages = {8}, year = {2020}, abstract = {There were several species of Equus in northern China during the Late Pleistocene, including Equus przewalskii and Equus dalianensis. A number of morphological studies have been carried out on E. przewalskii and E. dalianensis, but their evolutionary history is still unresolved. In this study, we retrieved near-complete mitochondrial genomes from E. dalianensis and E. przewalskii specimens excavated from Late Pleistocene strata in northeastern China. Phylogenetic analyses revealed that caballoid horses were divided into two subclades: the New World and the Old World caballine horse subclades. The Old World caballine horses comprise of two deep phylogenetic lineages, with modern and ancient Equus caballus and modern E. przewalskii forming lineage I, and the individuals in this study together with one Yakut specimen forming lineage II. Our results indicate that Chinese Late Pleistocene caballoid horses showed a closer relationship to other Eurasian caballine horses than that to Pleistocene horses from North America. In addition, phylogenetic analyses suggested a close relationship between E. dalianensis and the Chinese fossil E. przewalskii, in agreement with previous researches based on morphological analyses. Interestingly, E. dalianensis and the fossil E. przewalskii were intermixed rather than split into distinct lineages, suggesting either that gene flow existed between these two species or that morphology-based species assignment of palaeontological specimens is not always correct. Moreover, Bayesian analysis showed that the divergence time between the New World and the Old World caballoid horses was at 1.02 Ma (95\% CI: 0.86-1.24 Ma), and the two Old World lineages (I \& II) split at 0.88 Ma (95\% CI: 0.69-1.13 Ma), which indicates that caballoid horses seem to have evolved into different populations in the Old World soon after they migrated from North America via the Bering Land Bridge. Finally, the TMRCA of E. dalianensis was estimated at 0.20 Ma (95\% CI: 0.15-0.28 Ma), and it showed a relative low genetic diversity compared with other Equus species.}, language = {en} } @article{BarlowHartmannGonzalezetal.2020, author = {Barlow, Axel and Hartmann, Stefanie and Gonzalez, Javier and Hofreiter, Michael and Paijmans, Johanna L. A.}, title = {Consensify}, series = {Genes / Molecular Diversity Preservation International}, volume = {11}, journal = {Genes / Molecular Diversity Preservation International}, number = {1}, publisher = {MDPI}, address = {Basel}, issn = {2073-4425}, doi = {10.3390/genes11010050}, pages = {22}, year = {2020}, abstract = {A standard practise in palaeogenome analysis is the conversion of mapped short read data into pseudohaploid sequences, frequently by selecting a single high-quality nucleotide at random from the stack of mapped reads. This controls for biases due to differential sequencing coverage, but it does not control for differential rates and types of sequencing error, which are frequently large and variable in datasets obtained from ancient samples. These errors have the potential to distort phylogenetic and population clustering analyses, and to mislead tests of admixture using D statistics. We introduce Consensify, a method for generating pseudohaploid sequences, which controls for biases resulting from differential sequencing coverage while greatly reducing error rates. The error correction is derived directly from the data itself, without the requirement for additional genomic resources or simplifying assumptions such as contemporaneous sampling. For phylogenetic and population clustering analysis, we find that Consensify is less affected by artefacts than methods based on single read sampling. For D statistics, Consensify is more resistant to false positives and appears to be less affected by biases resulting from different laboratory protocols than other frequently used methods. Although Consensify is developed with palaeogenomic data in mind, it is applicable for any low to medium coverage short read datasets. We predict that Consensify will be a useful tool for future studies of palaeogenomes.}, language = {en} } @misc{GambaJonesTeasdaleetal.2014, author = {Gamba, Cristina and Jones, Eppie R. and Teasdale, Matthew D. and McLaughlin, Russell L. and Gonz{\´a}lez-Fortes, Gloria M. and Mattiangeli, Valeria and Dombor{\´o}czki, L{\´a}szl{\´o} and Kőv{\´a}ri, Ivett and Pap, Ildik{\´o} and Anders, Alexandra and Whittle, Alasdair and Dani, J{\´a}nos and Raczky, P{\´a}l and Higham, Thomas F. G. and Hofreiter, Michael and Bradley, Daniel G. and Pinhasi, Ron}, title = {Genome flux and stasis in a five millennium transect of European prehistory}, series = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe}, volume = {5}, journal = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Mathematisch-Naturwissenschaftliche Reihe}, number = {1332}, issn = {1866-8372}, doi = {10.25932/publishup-43799}, url = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-437999}, pages = {9}, year = {2014}, abstract = {The Great Hungarian Plain was a crossroads of cultural transformations that have shaped European prehistory. Here we analyse a 5,000-year transect of human genomes, sampled from petrous bones giving consistently excellent endogenous DNA yields, from 13 Hungarian Neolithic, Copper, Bronze and Iron Age burials including two to high (similar to 22x) and seven to similar to 1x coverage, to investigate the impact of these on Europe's genetic landscape. These data suggest genomic shifts with the advent of the Neolithic, Bronze and Iron Ages, with interleaved periods of genome stability. The earliest Neolithic context genome shows a European hunter-gatherer genetic signature and a restricted ancestral population size, suggesting direct contact between cultures after the arrival of the first farmers into Europe. The latest, Iron Age, sample reveals an eastern genomic influence concordant with introduced Steppe burial rites. We observe transition towards lighter pigmentation and surprisingly, no Neolithic presence of lactase persistence.}, language = {en} } @article{HofreiterHartmann2020, author = {Hofreiter, Michael and Hartmann, Stefanie}, title = {Reconstructing protein-coding sequences from ancient DNA}, series = {Odorant binding and chemosensory proteins}, volume = {642}, journal = {Odorant binding and chemosensory proteins}, publisher = {Academic Press, an imprint of Elsevier}, address = {Cambridge, MA.}, isbn = {978-0-12-821157-1}, issn = {0076-6879}, doi = {10.1016/bs.mie.2020.05.008}, pages = {21 -- 33}, year = {2020}, abstract = {Obtaining information about functional details of proteins of extinct species is of critical importance for a better understanding of the real-life appearance, behavior and ecology of these lost entries in the book of life. In this chapter, we discuss the possibilities to retrieve the necessary DNA sequence information from paleogenomic data obtained from fossil specimens, which can then be used to express and subsequently analyze the protein of interest. We discuss the problems specific to ancient DNA, including mis-coding lesions, short read length and incomplete paleogenome assemblies. Finally, we discuss an alternative, but currently rarely used approach, direct PCR amplification, which is especially useful for comparatively short proteins.}, language = {en} } @phdthesis{Schulte2022, author = {Schulte, Luise}, title = {Dynamics of Larix (Mill.) species in Siberia during the last 50,000 years inferred from sedimentary ancient DNA}, doi = {10.25932/publishup-55878}, url = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-558782}, school = {Universit{\"a}t Potsdam}, pages = {xi, 121}, year = {2022}, abstract = {The deciduous needle tree larch (Larix Mill.) covers more than 80\% of the Asian boreal forests. Only a few Larix species constitute the vast forests and these species differ markedly in their ecological traits, most importantly in their ability to grow on and stabilize underlying permafrost. The pronounced dominance of the summergreen larches makes the Asian boreal forests unique, as the rest of the northern hemisphere boreal forests is almost exclusively dominated by evergreen needle-leaf forests. Global warming is impacting the whole world but is especially pronounced in the arctic and boreal regions. Although adapted to extreme climatic conditions, larch forests are sensitive to varying climatic conditions. By their sheer size, changes in Asian larch forests as range shifts or changes in species composition and the resulting vegetation-climate feedbacks are of global relevance. It is however still uncertain if larch forests will persist under the ongoing warming climate or if they will be replaced by evergreen forests. It is therefore of great importance to understand how these ecosystems will react to future climate warmings and if they will maintain their dominance. One step in the better understanding of larch dynamics is to study how the vast dominant forests developed and why they only established in northern Asia. A second step is to study how the species reacted to past changes in the climate. The first objective of this thesis was to review and identify factors promoting Asian larch dominance. I achieved this by synthesizing and comparing reported larch occurrences and influencing components on the northern hemisphere continents in the present and in the past. The second objective was to find a possibility to directly study past Larix populations in Siberia and specifically their genetic variation, enabling the study of geographic movements. For this, I established chloroplast enrichment by hybridization capture from sedimentary ancient DNA (sedaDNA) isolated from lake sediment records. The third objective was to use the established method to track past larch populations, their glacial refugia during the Last Glacial Maximum (LGM) around 21,000 years before present (ka BP), and their post-glacial migration patterns. To study larch promoting factors, I compared the present state of larch species ranges, areas of dominance, their bioclimatic niches, and the distribution on different extents and thaw depths of permafrost. The species comparison showed that the bioclimatic niches greatly overlap between the American and Asian species and that it is only in the extremely continental climates in which only the Asian larch species can persist. I revealed that the area of dominance is strongly connected to permafrost extent but less linked to permafrost seasonal thaw depths. Comparisons of the paleorecord of larch between the continents suggest differences in the recolonization history. Outside of northern Asia and Alaska, glacial refugial populations of larch were confined to the southern regions and thus recolonization could only occur as migration from south to north. Alaskan larch populations could not establish wide-range dominant forest which could be related to their own genetically depletion as separated refugial population. In Asia, it is still unclear whether or not the northern refugial populations contributed and enhanced the postglacial colonization or whether they were replaced by populations invading from the south in the course of climate warming. Asian larch dominance is thus promoted partly by adaptions to extremely continental climates and by adaptations to grow on continuous permafrost but could be also connected to differences in glacial survival and recolonization history of Larix species. Except for extremely rare macrofossil findings of fossilized cones, traditional methods to study past vegetation are not able to distinguish between larch species or populations. Within the scope of this thesis, I therefore established a method to retrieve genetic information of past larch populations to distinguish between species. Using the Larix chloroplast genome as target, I successfully applied the method of DNA target enrichment by hybridization capture on sedaDNA samples from lake records and showed that it is able to distinguish between larch species. I then used the method on samples from lake records from across Siberia dating back up to 50 ka BP. The results allowed me to address the question of glacial survival and post-glacial recolonization mode in Siberian larch species. The analyzed pattern showed that LGM refugia were almost exclusively constituted by L. gmelinii, even in sites of current L. sibirica distribution. For included study sites, L. sibirica migrated into its extant northern distribution area only in the Holocene. Consequently, the post-glacial recolonization of L. sibirica was not enhanced by northern glacial refugia. In case of sites in extant distribution area of L. gmelinii, the absence of a genetic turn-over point to a continuous population rather than an invasion of southern refugia. The results suggest that climate has a strong influence on the distribution of Larix species and that species may also respond differently to future climate warming. Because species differ in their ecological characteristics, species distribution is also relevant with respect to further feedbacks between vegetation and climate. With this thesis, I give an overview of present and past larch occurrences and evaluate which factors promote their dominance. Furthermore, I provide the tools to study past Larix species and give first important insights into the glacial history of Larix populations.}, language = {en} } @article{MohandesanSpellerPetersetal.2017, author = {Mohandesan, Elmira and Speller, Camilla F. and Peters, Joris and Uerpmann, Hans-Peter and Uerpmann, Margarethe and De Cupere, Bea and Hofreiter, Michael and Burger, Pamela A.}, title = {Combined hybridization capture and shotgun sequencing for ancient DNA analysis of extinct wild and domestic dromedary camel}, series = {Molecular ecology resources}, volume = {17}, journal = {Molecular ecology resources}, number = {2}, publisher = {Wiley}, address = {Hoboken}, issn = {1755-098X}, doi = {10.1111/1755-0998.12551}, pages = {300 -- 313}, year = {2017}, abstract = {The performance of hybridization capture combined with next-generation sequencing (NGS) has seen limited investigation with samples from hot and arid regions until now. We applied hybridization capture and shotgun sequencing to recover DNA sequences from bone specimens of ancient-domestic dromedary (Camelus dromedarius) and its extinct ancestor, the wild dromedary from Jordan, Syria, Turkey and the Arabian Peninsula, respectively. Our results show that hybridization capture increased the percentage of mitochondrial DNA (mtDNA) recovery by an average 187-fold and in some cases yielded virtually complete mitochondrial (mt) genomes at multifold coverage in a single capture experiment. Furthermore, we tested the effect of hybridization temperature and time by using a touchdown approach on a limited number of samples. We observed no significant difference in the number of unique dromedary mtDNA reads retrieved with the standard capture compared to the touchdown method. In total, we obtained 14 partial mitochondrial genomes from ancient-domestic dromedaries with 17-95\% length coverage and 1.27-47.1-fold read depths for the covered regions. Using whole-genome shotgun sequencing, we successfully recovered endogenous dromedary nuclear DNA (nuDNA) from domestic and wild dromedary specimens with 1-1.06-fold read depths for covered regions. Our results highlight that despite recent methodological advances, obtaining ancient DNA (aDNA) from specimens recovered from hot, arid environments is still problematic. Hybridization protocols require specific optimization, and samples at the limit of DNA preservation need multiple replications of DNA extraction and hybridization capture as has been shown previously for Middle Pleistocene specimens.}, language = {en} } @article{ThomasCarvalhoHaileetal.2017, author = {Thomas, Jessica E. and Carvalho, Gary R. and Haile, James and Martin, Michael D. and Castruita, Jose A. Samaniego and Niemann, Jonas and Sinding, Mikkel-Holger S. and Sandoval-Velasco, Marcela and Rawlence, Nicolas J. and Fuller, Errol and Fjeldsa, Jon and Hofreiter, Michael and Stewart, John R. and Gilbert, M. Thomas P. and Knapp, Michael}, title = {An ‛Aukward' tale}, series = {Genes}, volume = {8}, journal = {Genes}, number = {6}, publisher = {MDPI}, address = {Basel}, issn = {2073-4425}, doi = {10.3390/genes8060164}, pages = {164}, year = {2017}, abstract = {One hundred and seventy-three years ago, the last two Great Auks, Pinguinus impennis, ever reliably seen were killed. Their internal organs can be found in the collections of the Natural History Museum of Denmark, but the location of their skins has remained a mystery. In 1999, Great Auk expert Errol Fuller proposed a list of five potential candidate skins in museums around the world. Here we take a palaeogenomic approach to test which—if any—of Fuller's candidate skins likely belong to either of the two birds. Using mitochondrial genomes from the five candidate birds (housed in museums in Bremen, Brussels, Kiel, Los Angeles, and Oldenburg) and the organs of the last two known individuals, we partially solve the mystery that has been on Great Auk scholars' minds for generations and make new suggestions as to the whereabouts of the still-missing skin from these two birds.}, language = {en} } @phdthesis{Huang2021, author = {Huang, Sichao}, title = {Past and present biodiversity in northeastern Siberia inferred from sedimentary DNA metabarcoding}, school = {Universit{\"a}t Potsdam}, year = {2021}, abstract = {The arctic-boreal treeline is a transition zone from taiga to tundra covering a vast area in Siberia. It often features large environmental gradients and reacts sensitively to changes in the environment. For example, the expansion of shrubs and a northward movement of the treeline are observable in Siberia as a response to the warming climate. The changes in vegetation across the treeline are known to influence the water chemistry in the lakes. This causes further alteration to the composition and diversity of sensitive aquatic organisms such as diatoms and macrophytes. Despite the rising awareness of the complex climate-feedback mechanisms of terrestrial plants, the understanding of their assembly rules and about responses of aquatic biomes in the surrounding treeline lakes is still limited. The goal of this thesis is to examine the previous and present biodiversity of terrestrial and freshwater biomes from the Siberian treeline ecotone, as well as their reactions to environmental changes. In particular, this thesis attempts to examine the performance of applying sedimentary DNA metabarcoding in terrestrial plants, aquatic macrophytes and diatoms, their spatial patterns along the environmental gradients and their temporal patterns throughout the climate transition from the late Pleistocene to Holocene. Sedimentary DNA metabarcoding combined with next-generation sequencing is applied as a primary tool to explore the composition and diversity of terrestrial plants, diatoms and aquatic macrophytes. The main study area is located in Chukotka of northeastern Siberia in the Arctic, a biodiversity hotspot due to its continental location and the diverse habitats of the glacial refugium. The modern diatom diversity was assessed with a specific diatom metabarcoding marker and morphological identification. Both approaches agree to a dominance of Fragilariaceae and Aulacoseiraceae, as well as on the environmental influential indicators of the diatom community. The high diversity of Fragilariaceae identified in the thermokarst lakes is found to follow the vegetation gradient along the treeline, suggesting that diatom metabarcoding can decipher relationships between diatom assemblage shifts and the relevant environmental changes. In particular, the metabarcoding approach detects diversification of fragilarioids in glacial lakes which is not visible using morphology. Sedimentary ancient DNA records indicate a vegetation mosaic of forb-dominated steppe-tundra during 28-19 ka, followed by a shift to dwarf-shrub tundra during 19-14 ka. During the most recent 14 thousand years, the vegetation consists of deciduous shrublands, then a change to boreal forest is observed. Investigations on the alpha diversity of the vegetation show that species richness is unexpectedly highest during pre-LGM, which is likely related to the extensive area that allows for more taxa. The optimum Holocene warming during 9-6 ka is not accompanied by a high richness as widely believed, but with an evenly distributed community by the fulfilment of erect shrubs. Furthermore, changes in taxonomic and phylogenetic diversity show complementary results in understanding community diversity. The composition and richness in the modern macrophytes community from Siberian Arctic and Chinese alpine are best co-influenced by July temperature and electrical conductivity.. Past macrophyte turnover during the late Pleistocene-Holocene is less noticeable in Siberia, whereas a pronounced community change from emergent to submerged plants is detected from Chinese alpine regions at about 14 ka due to increasing temperature and varying water conductivity. Finally, sedimentary DNA metabarcoding is a cost-effective and powerful proxy for ecological application, whereas completeness of the reference library, coverage and resolution of the metabarcoding marker are the major limitations of sedimentary DNA based diversity monitoring. The composition and richness in modern vegetation and macrophytes across broad spatial gradients is constrained by environmental variables, suggesting a potential usage for environmental monitoring. Diatom distributions are driven by different water variables along the treeline. Past records indicate that the shrub coverage has a noticeable influence on the assemblies of both terrestrial plants and aquatic macrophytes, though the shift in macrophyte community is relatively minor in the past 28 thousand years. In the long-term, the shrub expansion may eventually result in a genetically more diverse vegetation community but reduced species richness. When exceeding the optimal temperatures, further warming may lead to a decrease and putative loss of macrophytes and diatoms.}, language = {en} } @article{TaronLellBarlowetal.2018, author = {Taron, Ulrike H. and Lell, Moritz and Barlow, Axel and Paijmans, Johanna L. A.}, title = {Testing of Alignment Parameters for Ancient Samples}, series = {Genese}, volume = {9}, journal = {Genese}, number = {3}, publisher = {MDPI}, address = {Basel}, issn = {2073-4425}, doi = {10.3390/genes9030157}, pages = {12}, year = {2018}, abstract = {High-throughput sequence data retrieved from ancient or other degraded samples has led to unprecedented insights into the evolutionary history of many species, but the analysis of such sequences also poses specific computational challenges. The most commonly used approach involves mapping sequence reads to a reference genome. However, this process becomes increasingly challenging with an elevated genetic distance between target and reference or with the presence of contaminant sequences with high sequence similarity to the target species. The evaluation and testing of mapping efficiency and stringency are thus paramount for the reliable identification and analysis of ancient sequences. In this paper, we present 'TAPAS', (Testing of Alignment Parameters for Ancient Samples), a computational tool that enables the systematic testing of mapping tools for ancient data by simulating sequence data reflecting the properties of an ancient dataset and performing test runs using the mapping software and parameter settings of interest. We showcase TAPAS by using it to assess and improve mapping strategy for a degraded sample from a banded linsang (Prionodon linsang), for which no closely related reference is currently available. This enables a 1.8-fold increase of the number of mapped reads without sacrificing mapping specificity. The increase of mapped reads effectively reduces the need for additional sequencing, thus making more economical use of time, resources, and sample material.}, language = {en} } @article{AlbertiGonzalezPaijmansetal.2018, author = {Alberti, Federica and Gonzalez, Javier and Paijmans, Johanna L. A. and Basler, Nikolas and Preick, Michaela and Henneberger, Kirstin and Trinks, Alexandra and Rabeder, Gernot and Conard, Nicholas J. and Muenzel, Susanne C. and Joger, Ulrich and Fritsch, Guido and Hildebrandt, Thomas and Hofreiter, Michael and Barlow, Axel}, title = {Optimized DNA sampling of ancient bones using Computed Tomography scans}, series = {Molecular ecology resources}, volume = {18}, journal = {Molecular ecology resources}, number = {6}, publisher = {Wiley}, address = {Hoboken}, issn = {1755-098X}, doi = {10.1111/1755-0998.12911}, pages = {1196 -- 1208}, year = {2018}, abstract = {The prevalence of contaminant microbial DNA in ancient bone samples represents the principal limiting factor for palaeogenomic studies, as it may comprise more than 99\% of DNA molecules obtained. Efforts to exclude or reduce this contaminant fraction have been numerous but also variable in their success. Here, we present a simple but highly effective method to increase the relative proportion of endogenous molecules obtained from ancient bones. Using computed tomography (CT) scanning, we identify the densest region of a bone as optimal for sampling. This approach accurately identifies the densest internal regions of petrous bones, which are known to be a source of high-purity ancient DNA. For ancient long bones, CT scans reveal a high-density outermost layer, which has been routinely removed and discarded prior to DNA extraction. For almost all long bones investigated, we find that targeted sampling of this outermost layer provides an increase in endogenous DNA content over that obtained from softer, trabecular bone. This targeted sampling can produce as much as 50-fold increase in the proportion of endogenous DNA, providing a directly proportional reduction in sequencing costs for shotgun sequencing experiments. The observed increases in endogenous DNA proportion are not associated with any reduction in absolute endogenous molecule recovery. Although sampling the outermost layer can result in higher levels of human contamination, some bones were found to have more contamination associated with the internal bone structures. Our method is highly consistent, reproducible and applicable across a wide range of bone types, ages and species. We predict that this discovery will greatly extend the potential to study ancient populations and species in the genomics era.}, language = {en} }