% PhD thesis (2018): bioinformatic tools for ecology, evolution and genomics.
% The abstract is kept verbatim as supplied with the record.
% NOTE(review): this entry has no doi field, unlike the following entry;
% confirm whether a DOI exists before adding one.
@phdthesis{Ankenbrand2018,
  author   = {Ankenbrand, Markus Johannes},
  title    = {Squeezing more information out of biological data -- development and application of bioinformatic tools for ecology, evolution and genomics},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2018},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-156344},
  abstract = {New experimental methods have drastically accelerated the pace and quantity at which biological data is generated. High-throughput DNA sequencing is one of the pivotal new technologies. It offers a number of novel applications in various fields of biology, including ecology, evolution, and genomics. However, together with those opportunities many new challenges arise. Specialized algorithms and software are required to cope with the amount of data, often requiring substantial training in bioinformatic methods. Another way to make those data accessible to non-bioinformaticians is the development of programs with intuitive user interfaces. In my thesis I developed analyses and programs to tackle current problems with high-throughput data in biology. In the field of ecology this covers the establishment of the bioinformatic workflow for pollen DNA meta-barcoding. Furthermore, I developed an application that facilitates the analysis of ecological communities in the context of their traits. Information from multiple public databases have been aggregated and can now be mapped automatically to existing community tables for interactive inspection. In evolution the new data are used to reconstruct phylogenetic trees from multiple genes. I developed the tool bcgTree to automate this process for bacteria. Many plant genomes have been sequenced in current years. Sequencing reads of those projects also contain data from the chloroplasts. The tool chloroExtractor supports the targeted extraction and analysis of the chloroplast genome.
To compare the structure of multiple genomes specialized software is required for calculation and visualization of the relationships. I developed AliTV to address this. In contrast to existing programs for this task it allows interactive adjustments of produced graphics. Thus, facilitating the discovery of biologically relevant information. Another application I developed helps to analyze transcriptomes even if no reference genome is present. This is achieved by aggregating the different pieces of information, like functional annotation and expression level, for each transcript in a web platform. Scientists can then search, filter, subset, and visualize the transcriptome. Together the methods and tools expedite insights into biological systems that were not possible before.},
  language = {en},
}

% PhD thesis (2019): DNA binding preferences of the SREBP family of
% transcription regulators. "DNA" is brace-protected in the title so that
% sentence-casing bibliography styles do not lowercase the acronym.
% The abstract is kept verbatim as supplied with the record.
@phdthesis{delOlmoToledo2019,
  author   = {del Olmo Toledo, Valentina},
  title    = {Evolution of {DNA} binding preferences in a family of eukaryotic transcription regulators},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2019},
  doi      = {10.25972/OPUS-18789},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-187890},
  abstract = {Regulation of gene expression by the control of transcription is essential for any cell to adapt to the environment and survive. Transcription regulators, i.e. sequence-specific DNA binding proteins that regulate gene expression, are central elements within the gene networks of most organisms. Transcription regulators are grouped into distinct families based on structural features that determine, to a large extent, the DNA sequence(s) that they can recognise and bind. Less is known, however, about how the DNA binding preferences can diversify within transcription regulator families during evolutionary timescales, and how such diversification can affect the biology of the organism.
In this dissertation I study the SREBP (sterol regulatory element binding protein) family of transcriptional regulators in yeasts, and in Candida albicans in particular, as an experimental system to address these questions. The SREBPs are conserved from fungi to humans and represent a subgroup of basic helix-loop-helix DNA binding proteins. Early chromatin immunoprecipitation experiments with SREBPs from humans and yeasts showed that these proteins bound in vivo to the canonical DNA sequence, termed E-box, most basic helix-loop-helix proteins bind to. By contrast, most recent analysis carried out with less-studied fungal SREBPs revealed a non-canonical DNA motif to be the most overrepresented sequence in the bound regions. This study aims to establish the intrinsic DNA binding preferences of key branches of this family and to determine how the divergence in DNA binding affinities originated. To this end, I combined phylogenetic and ancestral reconstruction with extensive biochemical characterisation of key SREBP proteins. The results indicated that while the most-studied SREBPs (in mammals) indeed show preference for the E-box, a second branch of the family preferentially binds the non-E-box, and a third one is able to bind both sequences with similar affinity. The preference for one or the other DNA sequence is an intrinsic property of each protein because their purified DNA binding domain was sufficient to recapitulate their in vivo binding preference. The ancestor that gave rise to these two different types of SREBPs (the branch that binds E-box and the one that binds non-E-box DNA) appears to be a protein with a broader DNA binding capability that had a slight preference for the non-canonical motif. Thus, the results imply these two branches originated by either enhancing the original ancestral preference for non-E-box or tilting it towards the E-box DNA and flipping the preference for this sequence.
The main function associated with members of the SREBP family in most eukaryotes is the control of lipid biosynthesis. I have further studied the function of these proteins in the lineage that encompasses the human associated yeast C. albicans. Strikingly, the three SREBPs present in the fungus' genome contribute to the colonisation of the mammalian gut by regulating cellular processes unrelated to lipid metabolism. Here I describe that two of the three C. albicans SREBPs form a regulatory cascade that regulates morphology and cell wall modifications under anaerobic conditions, whereas the third SREBP has been shown to be involved in the regulation of glycolysis genes. Therefore, I posit that the described diversification in DNA binding specificity in these proteins and the concomitant expansion of targets of regulation were key in enabling this fungal lineage to associate with animals.},
  subject  = {Candida albicans},
  language = {en},
}