@phdthesis{Ankenbrand2018, author = {Ankenbrand, Markus Johannes}, title = {Squeezing more information out of biological data - development and application of bioinformatic tools for ecology, evolution and genomics}, url = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-156344}, school = {Universit{\"a}t W{\"u}rzburg}, year = {2018}, abstract = {New experimental methods have drastically accelerated the pace and quantity at which biological data is generated. High-throughput DNA sequencing is one of the pivotal new technologies. It offers a number of novel applications in various fields of biology, including ecology, evolution, and genomics. However, together with those opportunities many new challenges arise. Specialized algorithms and software are required to cope with the amount of data, often requiring substantial training in bioinformatic methods. Another way to make those data accessible to non-bioinformaticians is the development of programs with intuitive user interfaces. In my thesis I developed analyses and programs to tackle current problems with high-throughput data in biology. In the field of ecology this covers the establishment of the bioinformatic workflow for pollen DNA meta-barcoding. Furthermore, I developed an application that facilitates the analysis of ecological communities in the context of their traits. Information from multiple public databases have been aggregated and can now be mapped automatically to existing community tables for interactive inspection. In evolution the new data are used to reconstruct phylogenetic trees from multiple genes. I developed the tool bcgTree to automate this process for bacteria. Many plant genomes have been sequenced in current years. Sequencing reads of those projects also contain data from the chloroplasts. The tool chloroExtractor supports the targeted extraction and analysis of the chloroplast genome. To compare the structure of multiple genomes specialized software is required for calculation and visualization of the relationships. I developed AliTV to address this. In contrast to existing programs for this task it allows interactive adjustments of produced graphics. Thus, facilitating the discovery of biologically relevant information. Another application I developed helps to analyze transcriptomes even if no reference genome is present. This is achieved by aggregating the different pieces of information, like functional annotation and expression level, for each transcript in a web platform. Scientists can then search, filter, subset, and visualize the transcriptome. Together the methods and tools expedite insights into biological systems that were not possible before.}, language = {en} } @article{CarradecPelletierDaSilvaetal.2018, author = {Carradec, Quentin and Pelletier, Eric and Da Silva, Corinne and Alberti, Adriana and Seeleuthner, Yoann and Blanc-Mathieu, Romain and Lima-Mendez, Gipsi and Rocha, Fabio and Tirichine, Leila and Labadie, Karine and Kirilovsky, Amos and Bertrand, Alexis and Engelen, Stefan and Madoui, Mohammed-Amin and M{\´e}heust, Rapha{\"e}l and Poulain, Julie and Romac, Sarah and Richter, Daniel J. and Yoshikawa, Genki and Dimier, C{\´e}line and Kandels-Lewis, Stefanie and Picheral, Marc and Searson, Sarah and Jaillon, Olivier and Aury, Jean-Marc and Karsenti, Eric and Sullivan, Matthew B. and Sunagawa, Shinichi and Bork, Peer and Not, Fabrice and Hingamp, Pascal and Raes, Jeroen and Guidi, Lionel and Ogata, Hiroyuki and de Vargas, Colomban and Iudicone, Daniele and Bowler, Chris and Wincker, Patrick}, title = {A global ocean atlas of eukaryotic gene}, series = {Nature Communications}, volume = {9}, journal = {Nature Communications}, organization = {Tara Oceans Coordinators}, doi = {10.1038/s41467-017-02342-1}, url = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-222250}, year = {2018}, abstract = {While our knowledge about the roles of microbes and viruses in the ocean has increased tremendously due to recent advances in genomics and metagenomics, research on marine microbial eukaryotes and zooplankton has benefited much less from these new technologies because of their larger genomes, their enormous diversity, and largely unexplored physiologies. Here, we use a metatranscriptomics approach to capture expressed genes in open ocean Tara Oceans stations across four organismal size fractions. The individual sequence reads cluster into 116 million unigenes representing the largest reference collection of eukaryotic transcripts from any single biome. The catalog is used to unveil functions expressed by eukaryotic marine plankton, and to assess their functional biogeography. Almost half of the sequences have no similarity with known proteins, and a great number belong to new gene families with a restricted distribution in the ocean. Overall, the resource provides the foundations for exploring the roles of marine eukaryotes in ocean ecology and biogeochemistry.}, language = {en} }