% Bibliography records; the url fields are URN resolver links (presumably a
% repository export -- confirm the source before re-exporting over this file).
% Conventions used below:
%   * one field per line, accents written as LaTeX escapes (classic BibTeX safe)
%   * genus names and acronyms in titles are brace-protected against recasing
%   * electronic article numbers (e12345) are stored in the pages field
%   * recurring journal names are defined once as string macros

@string{plosone = {{PLOS} {ONE}}}

% NOTE(review): the required journal field is missing and the record has no DOI.
% Presumably Genome Biology 12(10):R98 (2011) -- confirm before adding.
@article{AlbrechtSharmaDittrichetal.2011,
  author   = {Albrecht, Marco and Sharma, Cynthia M. and Dittrich, Marcus T. and M{\"u}ller, Tobias and Reinhardt, Richard and Vogel, J{\"o}rg and Rudel, Thomas},
  title    = {The Transcriptional Landscape of {Chlamydia} pneumoniae},
  year     = {2011},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-69116},
  abstract = {Background: Gene function analysis of the obligate intracellular bacterium Chlamydia pneumoniae is hampered by the facts that this organism is inaccessible to genetic manipulations and not cultivable outside the host. The genomes of several strains have been sequenced; however, very little information is available on the gene structure and transcriptome of C. pneumoniae. Results: Using a differential RNA-sequencing approach with specific enrichment of primary transcripts, we defined the transcriptome of purified elementary bodies and reticulate bodies of C. pneumoniae strain CWL-029; 565 transcriptional start sites of annotated genes and novel transcripts were mapped. Analysis of adjacent genes for cotranscription revealed 246 polycistronic transcripts. In total, a distinct transcription start site or an affiliation to an operon could be assigned to 862 out of 1,074 annotated protein coding genes. Semi-quantitative analysis of mapped cDNA reads revealed significant differences for 288 genes in the RNA levels of genes isolated from elementary bodies and reticulate bodies. We have identified and in part confirmed 75 novel putative non-coding RNAs. The detailed map of transcription start sites at single nucleotide resolution allowed for the first time a comprehensive and saturating analysis of promoter consensus sequences in Chlamydia. Conclusions: The precise transcriptional landscape as a complement to the genome sequence will provide new insights into the organization, control and function of genes. Novel non-coding RNAs and identified common promoter motifs will help to understand gene regulation of this important human pathogen.},
  subject  = {Chlamydia pneumoniae},
  language = {en},
}

% NOTE(review): first author corrected from "Biju, Joseph" to "Joseph, Biju"
% (family name Joseph) -- verify against the published author list.
% The citation key is kept as exported so existing citations still resolve.
@article{BijuSchwarzLinkeetal.2011,
  author   = {Joseph, Biju and Schwarz, Roland and Linke, Burkhard and Blom, Jochen and Becker, Anke and Claus, Heike and Goesmann, Alexander and Frosch, Matthias and M{\"u}ller, Tobias and Vogel, Ulrich and Schoen, Christoph},
  title    = {Virulence Evolution of the Human Pathogen {Neisseria} meningitidis by Recombination in the Core and Accessory Genome},
  journal  = plosone,
  volume   = {6},
  number   = {4},
  pages    = {e18441},
  year     = {2011},
  doi      = {10.1371/journal.pone.0018441},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-137960},
  abstract = {Background Neisseria meningitidis is a naturally transformable, facultative pathogen colonizing the human nasopharynx. Here, we analyze on a genome-wide level the impact of recombination on gene-complement diversity and virulence evolution in N. meningitidis. We combined comparative genome hybridization using microarrays (mCGH) and multilocus sequence typing (MLST) of 29 meningococcal isolates with computational comparison of a subset of seven meningococcal genome sequences. Principal Findings We found that lateral gene transfer of minimal mobile elements as well as prophages are major forces shaping meningococcal population structure. Extensive gene content comparison revealed novel associations of virulence with genetic elements besides the recently discovered meningococcal disease associated (MDA) island. In particular, we identified an association of virulence with a recently described canonical genomic island termed IHT-E and a differential distribution of genes encoding RTX toxin- and two-partner secretion systems among hyperinvasive and non-hyperinvasive lineages. By computationally screening also the core genome for signs of recombination, we provided evidence that about 40\% of the meningococcal core genes are affected by recombination primarily within metabolic genes as well as genes involved in DNA replication and repair. By comparison with the results of previous mCGH studies, our data indicated that genetic structuring as revealed by mCGH is stable over time and highly similar for isolates from different geographic origins. Conclusions Recombination comprising lateral transfer of entire genes as well as homologous intragenic recombination has a profound impact on meningococcal population structure and genome composition. Our data support the hypothesis that meningococcal virulence is polygenic in nature and that differences in metabolism might contribute to virulence.},
  language = {en},
}

% NOTE(review): the required journal field is missing and the record has no DOI.
% Presumably BMC Systems Biology 6:72 (2012) -- confirm before adding.
@article{BeisserGrohmeKopkaetal.2012,
  author   = {Beisser, Daniela and Grohme, Markus A. and Kopka, Joachim and Frohme, Marcus and Schill, Ralph O. and Hengherr, Steffen and Dandekar, Thomas and Klau, Gunnar W. and Dittrich, Marcus and M{\"u}ller, Tobias},
  title    = {Integrated pathway modules using time-course metabolic profiles and {EST} data from {Milnesium} tardigradum},
  year     = {2012},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-75241},
  abstract = {Background: Tardigrades are multicellular organisms, resistant to extreme environmental changes such as heat, drought, radiation and freezing. They outlast these conditions in an inactive form (tun) to escape damage to cellular structures and cell death. Tardigrades are apparently able to prevent or repair such damage and are therefore a crucial model organism for stress tolerance. Cultures of the tardigrade Milnesium tardigradum were dehydrated by removing the surrounding water to induce tun formation. During this process and the subsequent rehydration, metabolites were measured in a time series by GC-MS. Additionally expressed sequence tags are available, especially libraries generated from the active and inactive state. The aim of this integrated analysis is to trace changes in tardigrade metabolism and identify pathways responsible for their extreme resistance against physical stress. Results: In this study we propose a novel integrative approach for the analysis of metabolic networks to identify modules of joint shifts on the transcriptomic and metabolic levels. We derive a tardigrade-specific metabolic network represented as an undirected graph with 3,658 nodes (metabolites) and 4,378 edges (reactions). Time course metabolite profiles are used to score the network nodes showing a significant change over time. The edges are scored according to information on enzymes from the EST data. Using this combined information, we identify a key subnetwork (functional module) of concerted changes in metabolic pathways, specific for de- and rehydration. The module is enriched in reactions showing significant changes in metabolite levels and enzyme abundance during the transition. It resembles the cessation of a measurable metabolism (e.g. glycolysis and amino acid anabolism) during the tun formation, the production of storage metabolites and bioprotectants, such as DNA stabilizers, and the generation of amino acids and cellular components from monosaccharides as carbon and energy source during rehydration. Conclusions: The functional module identifies relationships among changed metabolites (e.g. spermidine) and reactions and provides first insights into important altered metabolic pathways. With sparse and diverse data available, the presented integrated metabolite network approach is suitable to integrate all existing data and analyse it in a combined manner.},
  subject  = {Milnesium tardigradum},
  language = {en},
}

% NOTE(review): the export had the article id e3806 in the number field; it is
% stored in pages here, like the other electronic article numbers in this file.
% The value 61 is kept in volume as exported -- presumably it is the issue
% number of this journal; confirm.
@article{MergetKoetschanHackletal.2012,
  author   = {Merget, Benjamin and Koetschan, Christian and Hackl, Thomas and F{\"o}rster, Frank and Dandekar, Thomas and M{\"u}ller, Tobias and Schultz, J{\"o}rg and Wolf, Matthias},
  title    = {The {ITS2} {Database}},
  journal  = {Journal of Visualized Experiments},
  volume   = {61},
  pages    = {e3806},
  year     = {2012},
  doi      = {10.3791/3806},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-124600},
  abstract = {The internal transcribed spacer 2 (ITS2) has been used as a phylogenetic marker for more than two decades. As ITS2 research mainly focused on the very variable ITS2 sequence, it confined this marker to low-level phylogenetics only. However, the combination of the ITS2 sequence and its highly conserved secondary structure improves the phylogenetic resolution and allows phylogenetic inference at multiple taxonomic ranks, including species delimitation. The ITS2 Database presents an exhaustive dataset of internal transcribed spacer 2 sequences from NCBI GenBank accurately reannotated. Following an annotation by profile Hidden Markov Models (HMMs), the secondary structure of each sequence is predicted. First, it is tested whether a minimum energy based fold (direct fold) results in a correct, four helix conformation. If this is not the case, the structure is predicted by homology modeling. In homology modeling, an already known secondary structure is transferred to another ITS2 sequence, whose secondary structure was not able to fold correctly in a direct fold. The ITS2 Database is not only a database for storage and retrieval of ITS2 sequence-structures. It also provides several tools to process your own ITS2 sequences, including annotation, structural prediction, motif detection and BLAST search on the combined sequence-structure information. Moreover, it integrates trimmed versions of 4SALE and ProfDistS for multiple sequence-structure alignment calculation and Neighbor Joining tree reconstruction. Together they form a coherent analysis pipeline from an initial set of sequences to a phylogeny based on sequence and secondary structure. In a nutshell, this workbench simplifies first phylogenetic analyses to only a few mouse-clicks, while additionally providing tools and data for comprehensive large-scale analyses.},
  language = {en},
}

@article{FoersterBeisserGrohmeetal.2012,
  author   = {F{\"o}rster, Frank and Beisser, Daniela and Grohme, Markus A. and Liang, Chunguang and Mali, Brahim and Siegl, Alexander Matthias and Engelmann, Julia C. and Shkumatov, Alexander V. and Schokraie, Elham and M{\"u}ller, Tobias and Schn{\"o}lzer, Martina and Schill, Ralph O. and Frohme, Marcus and Dandekar, Thomas},
  title    = {Transcriptome analysis in tardigrade species reveals specific molecular pathways for stress adaptations},
  journal  = {Bioinformatics and biology insights},
  volume   = {6},
  pages    = {69--96},
  year     = {2012},
  doi      = {10.4137/BBI.S9150},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-123089},
  abstract = {Tardigrades have unique stress-adaptations that allow them to survive extremes of cold, heat, radiation and vacuum. To study this, encoded protein clusters and pathways from an ongoing transcriptome study on the tardigrade \textit{Milnesium tardigradum} were analyzed using bioinformatics tools and compared to expressed sequence tags (ESTs) from \textit{Hypsibius dujardini}, revealing major pathways involved in resistance against extreme environmental conditions. ESTs are available on the Tardigrade Workbench along with software and databank updates. Our analysis reveals that RNA stability motifs for \textit{M. tardigradum} are different from typical motifs known from higher animals. \textit{M. tardigradum} and \textit{H. dujardini} protein clusters and conserved domains imply metabolic storage pathways for glycogen, glycolipids and specific secondary metabolism as well as stress response pathways (including heat shock proteins, bmh2, and specific repair pathways). Redox-, DNA-, stress- and protein protection pathways complement specific repair capabilities to achieve the strong robustness of \textit{M. tardigradum}. These pathways are partly conserved in other animals and their manipulation could boost stress adaptation even in human cells. However, the unique combination of resistance and repair pathways make tardigrades and \textit{M. tardigradum} in particular so highly stress resistant.},
  language = {en},
}

@article{StaigerCadotKooteretal.2012,
  author   = {Staiger, Christine and Cadot, Sidney and Kooter, Raul and Dittrich, Marcus and M{\"u}ller, Tobias and Klau, Gunnar W. and Wessels, Lodewyk F. A.},
  title    = {A Critical Evaluation of Network and Pathway-Based Classifiers for Outcome Prediction in Breast Cancer},
  journal  = plosone,
  volume   = {7},
  number   = {4},
  pages    = {e34796},
  year     = {2012},
  doi      = {10.1371/journal.pone.0034796},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-131323},
  abstract = {Recently, several classifiers that combine primary tumor data, like gene expression data, and secondary data sources, such as protein-protein interaction networks, have been proposed for predicting outcome in breast cancer. In these approaches, new composite features are typically constructed by aggregating the expression levels of several genes. The secondary data sources are employed to guide this aggregation. Although many studies claim that these approaches improve classification performance over single genes classifiers, the gain in performance is difficult to assess. This stems mainly from the fact that different breast cancer data sets and validation procedures are employed to assess the performance. Here we address these issues by employing a large cohort of six breast cancer data sets as benchmark set and by performing an unbiased evaluation of the classification accuracies of the different approaches. Contrary to previous claims, we find that composite feature classifiers do not outperform simple single genes classifiers. We investigate the effect of (1) the number of selected features; (2) the specific gene set from which features are selected; (3) the size of the training set and (4) the heterogeneity of the data set on the performance of composite feature and single genes classifiers. Strikingly, we find that randomization of secondary data sources, which destroys all biological information in these sources, does not result in a deterioration in performance of composite feature classifiers. Finally, we show that when a proper correction for gene set size is performed, the stability of single genes sets is similar to the stability of composite feature sets. Based on these results there is currently no reason to prefer prognostic classifiers based on composite features over single genes classifiers for predicting outcome in breast cancer.},
  language = {en},
}

% volume and pages were absent from the export; they follow the pattern of the
% other records of this journal in this file (2011 = 6, 2012 = 7, 2014 = 9;
% e-number = DOI suffix without leading zeros). NOTE(review): confirm.
@article{WolfChenSongetal.2013,
  author   = {Wolf, Matthias and Chen, Shilin and Song, Jingyuan and Ankenbrand, Markus and M{\"u}ller, Tobias},
  title    = {Compensatory Base Changes in {ITS2} Secondary Structures Correlate with the Biological Species Concept Despite Intragenomic Variability in {ITS2} Sequences -- A Proof of Concept},
  journal  = plosone,
  volume   = {8},
  pages    = {e66726},
  year     = {2013},
  doi      = {10.1371/journal.pone.0066726},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-96450},
  abstract = {Compensatory base changes (CBCs) in internal transcribed spacer 2 (ITS2) rDNA secondary structures correlate with Ernst Mayr's biological species concept. This hypothesis also referred to as the CBC species concept recently was subjected to large-scale testing, indicating two distinct probabilities. (1) If there is a CBC then there are two different species with a probability of $\sim$0.93. (2) If there is no CBC then there is the same species with a probability of $\sim$0.76. In ITS2 research, however, the main problem is the multicopy nature of ITS2 sequences. Most recently, 454 pyrosequencing data have been used to characterize more than 5000 intragenomic variations of ITS2 regions from 178 plant species, demonstrating that mutation of ITS2 is frequent, with a mean of 35 variants per species, respectively per individual organism. In this study, using those 454 data, the CBC criterion is reconsidered in the light of intragenomic variability, a proof of concept, a necessary criterion, expecting no intragenomic CBCs in variant ITS2 copies. In accordance with the CBC species concept, we could demonstrate that the probability that there is no intragenomic CBC is $\sim$0.99.},
  language = {en},
}

% journal, volume and pages were absent from the export; they are derived from
% the DOI (journal.pone prefix, suffix 0086571) and from the other 2014 record
% of this journal in this file. NOTE(review): confirm, and add the issue number.
@article{FlorenMupepeleMuelleretal.2014,
  author   = {Floren, Andreas and Mupepele, Anne-Christine and M{\"u}ller, Tobias and Dittrich, Marcus},
  title    = {Are Temperate Canopy Spiders Tree-Species Specific?},
  journal  = plosone,
  volume   = {9},
  pages    = {e86571},
  year     = {2014},
  doi      = {10.1371/journal.pone.0086571},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-111413},
  abstract = {Arboreal spiders in deciduous and coniferous trees were investigated on their distribution and diversity. Insecticidal knock-down was used to comprehensively sample spiders from 175 trees from 2001 to 2003 in the Bia{\l}owie{\.z}a forest and three remote forests in Poland. We identified 140 species from 9273 adult spiders. Spider communities were distinguished between deciduous and coniferous trees. The richest fauna was collected from Quercus where beta diversity was also highest. A tree-species-specific pattern was clearly observed for Alnus, Carpinus, Picea and Pinus trees and also for those tree species that were fogged in only four or three replicates, namely Betula and Populus. This hitherto unrecognised association was mainly due to the community composition of common species identified in a Dufrene-Legendre indicator species analysis. It was not caused by spatial or temporal autocorrelation. Explaining tree-species specificity for generalist predators like spiders is difficult and has to involve physical and ecological tree parameters like linkage with the abundance of prey species. However, neither did we find a consistent correlation of prey group abundances with spiders nor could differences in spider guild composition explain the observed pattern. Our results hint towards the importance of deterministic mechanisms structuring communities of generalist canopy spiders although the casual relationship is not yet understood.},
  language = {en},
}

@article{KoetschanKittelmannLuetal.2014,
  author   = {Koetschan, Christian and Kittelmann, Sandra and Lu, Jingli and Al-Halbouni, Djamila and Jarvis, Graeme N. and M{\"u}ller, Tobias and Wolf, Matthias and Janssen, Peter H.},
  title    = {Internal Transcribed Spacer 1 Secondary Structure Analysis Reveals a Common Core throughout the Anaerobic Fungi ({Neocallimastigomycota})},
  journal  = plosone,
  volume   = {9},
  number   = {3},
  pages    = {e91928},
  year     = {2014},
  doi      = {10.1371/journal.pone.0091928},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-117058},
  abstract = {The internal transcribed spacer (ITS) is a popular barcode marker for fungi and in particular the ITS1 has been widely used for the anaerobic fungi (phylum Neocallimastigomycota). A good number of validated reference sequences of isolates as well as a large number of environmental sequences are available in public databases. Its highly variable nature predisposes the ITS1 for low level phylogenetics; however, it complicates the establishment of reproducible alignments and the reconstruction of stable phylogenetic trees at higher taxonomic levels (genus and above). Here, we overcame these problems by proposing a common core secondary structure of the ITS1 of the anaerobic fungi employing a Hidden Markov Model-based ITS1 sequence annotation and a helix-wise folding approach. We integrated the additional structural information into phylogenetic analyses and present for the first time an automated sequence-structure-based taxonomy of the ITS1 of the anaerobic fungi. The methodology developed is transferable to the ITS1 of other fungal groups, and the robust taxonomy will facilitate and improve high-throughput anaerobic fungal community structure analysis of samples from various environments.},
  language = {en},
}

% journal was absent from the export; it is derived from the DOI (nar prefix).
% NOTE(review): volume, issue and page range are still missing -- add them from
% the publisher record.
@article{RemmeleXianAlbrechtetal.2014,
  author   = {Remmele, Christian W. and Xian, Yibo and Albrecht, Marco and Faulstich, Michaela and Fraunholz, Martin and Heinrichs, Elisabeth and Dittrich, Marcus T. and M{\"u}ller, Tobias and Reinhardt, Richard and Rudel, Thomas},
  title    = {Transcriptional landscape and essential genes of {Neisseria} gonorrhoeae},
  journal  = {Nucleic Acids Research},
  year     = {2014},
  doi      = {10.1093/nar/gku762},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-113676},
  abstract = {The WHO has recently classified Neisseria gonorrhoeae as a super-bacterium due to the rapid spread of antibiotic resistant derivatives and an overall dramatic increase in infection incidences. Genome sequencing has identified potential genes, however, little is known about the transcriptional organization and the presence of non-coding RNAs in gonococci. We performed RNA sequencing to define the transcriptome and the transcriptional start sites of all gonococcal genes and operons. Numerous new transcripts including 253 potentially non-coding RNAs transcribed from intergenic regions or antisense to coding genes were identified. Strikingly, strong antisense transcription was detected for the phase-variable opa genes coding for a family of adhesins and invasins in pathogenic Neisseria, that may have regulatory functions. Based on the defined transcriptional start sites, promoter motifs were identified. We further generated and sequenced a high density Tn5 transposon library to predict a core of 827 gonococcal essential genes, 133 of which have no known function. Our combined RNA-Seq and Tn-Seq approach establishes a detailed map of gonococcal genes and defines the first core set of essential gonococcal genes.},
  language = {en},
}