% PhD thesis by Hannes Horn (2017): (meta-)genomic data from host-associated microorganisms.
% The abstract is kept verbatim as exported from the source record.
@phdthesis{Horn2017,
  author   = {Horn, Hannes},
  title    = {Analysis and interpretation of (meta-)genomic data from host-associated microorganisms},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2017},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-152035},
  language = {en},
  subject  = {Bakterien},
  abstract = {Host-microbe interactions are the key to understand why and how microbes inhabit specific environments. With the scientific fields of microbial genomics and metagenomics, evolving on an unprecedented scale, one is able to gain insights in these interactions on a molecular and ecological level. The goal of this PhD thesis was to make (meta-)genomic data accessible, integrate it in a comparative manner and to gain comprehensive taxonomic and functional insights into bacterial strains and communities derived from two different environments: the phyllosphere of Arabidopsis thaliana and the mesohyl interior of marine sponges. This thesis focused first on the de novo assembly of bacterial genomes. A 5-step protocol was developed, each step including a quality control. The examination of different assembly software in a comparative way identified SPAdes as most suitable. The protocol enables the user to chose the best tailored assembly. Contamination issues were solved by an initial filtering of the data and methods normally used for the binning of metagenomic datasets. This step is missed in many published assembly pipelines. The described protocol offers assemblies of high quality ready for downstream analysis. Subsequently, assemblies generated with the developed protocol were annotated and explored in terms of their function. In a first study, the genome of a phyllosphere bacterium, Williamsia sp. ARP1, was analyzed, offering many adaptions to the leaf habitat: it can deal with temperature shifts, react to oxygen species, produces mycosporins as protection against UV-light, and is able to uptake photosynthates. 
Further, its taxonomic position within the Actinomycetales was infered from 16S rRNA and comparative genomics showing the close relation between the genera Williamsia and Gordonia. In a second study, six sponge-derived actinomycete genomes were investigated for secondary metabolism. By use of state-of-the-art software, these strains exhibited numerous gene clusters, mostly linked to polykethide synthases, non-ribosomal peptide synthesis, terpenes, fatty acids and saccharides. Subsequent predictions on these clusters offered a great variety of possible produced compounds with antibiotic, antifungal or anti-cancer activity. These analysis highlight the potential for the synthesis of natural products and the use of genomic data as screening toolkit. In a last study, three sponge-derived and one seawater metagenomes were functionally compared. Different signatures regarding the microbial composition and GC-distribution were observed between the two environments. With a focus on bacerial defense systems, the data indicates a pronounced repertoire of sponge associated bacteria for bacterial defense systems, in particular, Clustered Regularly Interspaced Short Palindromic Repeats, restriction modification system, DNA phosphorothioation and phage growth limitation. In addition, characterizing genes for secondary metabolite cluster differed between sponge and seawater microbiomes. Moreover, a variety of Type I polyketide synthases were only found within the sponge microbiomes. With that, metagenomics are shown to be a useful tool for the screening of secondary metabolite genes. 
Furthermore, enriched defense systems are highlighted as feature of sponge-associated microbes and marks them as a selective trait.},
}

% PhD thesis by Konrad Ulrich Foerstner (2008): computational analysis of metagenomic data.
% The abstract is kept verbatim as exported from the source record.
@phdthesis{Foerstner2008,
  author   = {F{\"o}rstner, Konrad Ulrich},
  title    = {Computational analysis of metagenomic data: delineation of compositional features and screens for desirable enzymes},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2008},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-33577},
  language = {en},
  subject  = {Bioinformatik},
  abstract = {The topic of my doctorial research was the computational analysis of metagenomic data. A metagenome comprises the genomic information from all the microorganisms within a certain environment. The currently available metagenomic data sets cover only parts of these usually huge metagenomes due to the high technical and financial effort of such sequencing endeavors. During my thesis I developed bioinformatic tools and applied them to analyse genomic features of different metagenomic data sets and to search for enzymes of importance for biotechnology or pharmaceutical applications in those sequence collections. In these studies nine metagenomic projects (with up to 41 subsamples) were analysed. These samples originated from diverse environments like farm soil, acid mine drainage, microbial mats on whale bones, marine water, fresh water, water treatment sludges and the human gut flora. Additionally, data sets of conventionally retrieved sequence data were taken into account and compared with each other},
}