% Journal-article records (repository export), one field per line.
% Conventions used below:
%   - page ranges use a double hyphen; electronic article IDs are stored in "pages"
%   - braces inside titles protect proper nouns and acronyms from style recasing
%   - non-ASCII letters in names are written as LaTeX escapes

@article{WheelerBarquistKingsleyetal.2016,
  author   = {Wheeler, Nicole E. and Barquist, Lars and Kingsley, Robert A. and Gardner, Paul P.},
  title    = {A profile-based method for identifying functional divergence of orthologous genes in bacterial genomes},
  journal  = {Bioinformatics},
  volume   = {32},
  number   = {23},
  pages    = {3566--3574},
  year     = {2016},
  doi      = {10.1093/bioinformatics/btw518},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-186502},
  language = {en},
  abstract = {Motivation: Next generation sequencing technologies have provided us with a wealth of information on genetic variation, but predicting the functional significance of this variation is a difficult task. While many comparative genomics studies have focused on gene flux and large scale changes, relatively little attention has been paid to quantifying the effects of single nucleotide polymorphisms and indels on protein function, particularly in bacterial genomics. Results: We present a hidden Markov model based approach we call delta-bitscore (DBS) for identifying orthologous proteins that have diverged at the amino acid sequence level in a way that is likely to impact biological function. We benchmark this approach with several widely used datasets and apply it to a proof-of-concept study of orthologous proteomes in an investigation of host adaptation in Salmonella enterica. We highlight the value of the method in identifying functional divergence of genes, and suggest that this tool may be a better approach than the commonly used dN/dS metric for identifying functionally significant genetic changes occurring in recently diverged organisms.},
}

@article{WestermannBarquistVogel2017,
  author   = {Westermann, Alexander J. and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Resolving host-pathogen interactions by dual {RNA-seq}},
  journal  = {PLoS Pathogens},
  volume   = {13},
  number   = {2},
  pages    = {e1006033},
  year     = {2017},
  doi      = {10.1371/journal.ppat.1006033},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-171921},
  language = {en},
  abstract = {The transcriptome is a powerful proxy for the physiological state of a cell, healthy or diseased. As a result, transcriptome analysis has become a key tool in understanding the molecular changes that accompany bacterial infections of eukaryotic cells. Until recently, such transcriptomic studies have been technically limited to analyzing mRNA expression changes in either the bacterial pathogen or the infected eukaryotic host cell. However, the increasing sensitivity of high-throughput RNA sequencing now enables ``dual RNA-seq'' studies, simultaneously capturing all classes of coding and noncoding transcripts in both the pathogen and the host. In the five years since the concept of dual RNA-seq was introduced, the technique has been applied to a range of infection models. This has not only led to a better understanding of the physiological changes in pathogen and host during the course of an infection but has also revealed hidden molecular phenotypes of virulence-associated small noncoding RNAs that were not visible in standard infection assays. Here, we use the knowledge gained from these recent studies to suggest experimental and computational guidelines for the design of future dual RNA-seq studies. We conclude this review by discussing prospective applications of the technique.},
}

@article{ReadMillsJohnsonetal.2016,
  author   = {Read, Hannah M. and Mills, Grant and Johnson, Sarah and Tsai, Peter and Dalton, James and Barquist, Lars and Print, Cristin G. and Patrick, Wayne M. and Wiles, Siouxsie},
  title    = {The in vitro and in vivo effects of constitutive light expression on a bioluminescent strain of the mouse enteropathogen {Citrobacter} rodentium},
  journal  = {PeerJ},
  volume   = {4},
  pages    = {e2130},
  year     = {2016},
  doi      = {10.7717/peerj.2130},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-166576},
  language = {en},
  abstract = {Bioluminescent reporter genes, such as those from fireflies and bacteria, let researchers use light production as a non-invasive and non-destructive surrogate measure of microbial numbers in a wide variety of environments. As bioluminescence needs microbial metabolites, tagging microorganisms with luciferases means only live metabolically active cells are detected. Despite the wide use of bioluminescent reporter genes, very little is known about the impact of continuous (also called constitutive) light expression on tagged bacteria. We have previously made a bioluminescent strain of Citrobacter rodentium, a bacterium which infects laboratory mice in a similar way to how enteropathogenic Escherichia coli (EPEC) and enterohaemorrhagic E. coli (EHEC) infect humans. In this study, we compared the growth of the bioluminescent C. rodentium strain ICC180 with its non-bioluminescent parent (strain ICC169) in a wide variety of environments. To understand more about the metabolic burden of expressing light, we also compared the growth profiles of the two strains under approximately 2,000 different conditions. We found that constitutive light expression in ICC180 was near-neutral in almost every non-toxic environment tested. However, we also found that the non-bioluminescent parent strain has a competitive advantage over ICC180 during infection of adult mice, although this was not enough for ICC180 to be completely outcompeted. In conclusion, our data suggest that constitutive light expression is not metabolically costly to C. rodentium and supports the view that bioluminescent versions of microbes can be used as a substitute for their non-bioluminescent parents to study bacterial behaviour in a wide variety of environments.},
}

@article{PrezzaRyanMaedleretal.2022,
  author   = {Prezza, Gianluca and Ryan, Daniel and M{\"a}dler, Gohar and Reichardt, Sarah and Barquist, Lars and Westermann, Alexander J.},
  title    = {Comparative genomics provides structural and functional insights into {Bacteroides} {RNA} biology},
  journal  = {Molecular Microbiology},
  volume   = {117},
  number   = {1},
  pages    = {67--85},
  year     = {2022},
  doi      = {10.1111/mmi.14793},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-259594},
  language = {en},
  abstract = {Bacteria employ noncoding RNA molecules for a wide range of biological processes, including scaffolding large molecular complexes, catalyzing chemical reactions, defending against phages, and controlling gene expression. Secondary structures, binding partners, and molecular mechanisms have been determined for numerous small noncoding RNAs (sRNAs) in model aerobic bacteria. However, technical hurdles have largely prevented analogous analyses in the anaerobic gut microbiota. While experimental techniques are being developed to investigate the sRNAs of gut commensals, computational tools and comparative genomics can provide immediate functional insight. Here, using Bacteroides thetaiotaomicron as a representative microbiota member, we illustrate how comparative genomics improves our understanding of RNA biology in an understudied gut bacterium. We investigate putative RNA-binding proteins and predict a Bacteroides cold-shock protein homolog to have an RNA-related function. We apply an in silico protocol incorporating both sequence and structural analysis to determine the consensus structures and conservation of nine Bacteroides noncoding RNA families. Using structure probing, we validate and refine these predictions and deposit them in the Rfam database. Through synteny analyses, we illustrate how genomic coconservation can serve as a predictor of sRNA function. Altogether, this work showcases the power of RNA informatics for investigating the RNA biology of anaerobic microbiota members.},
}

@article{OkoroBarquistConnoretal.2015,
  author   = {Okoro, Chinyere K. and Barquist, Lars and Connor, Thomas R. and Harris, Simon R. and Clare, Simon and Stevens, Mark P. and Arends, Mark J. and Hale, Christine and Kane, Leanne and Pickard, Derek J. and Hill, Jennifer and Harcourt, Katherine and Parkhill, Julian and Dougan, Gordon and Kingsley, Robert A.},
  title    = {Signatures of adaptation in human invasive {Salmonella} {Typhimurium} {ST313} populations from {sub-Saharan} {Africa}},
  journal  = {PLoS Neglected Tropical Diseases},
  volume   = {9},
  number   = {3},
  pages    = {e0003611},
  year     = {2015},
  doi      = {10.1371/journal.pntd.0003611},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-143779},
  language = {en},
  abstract = {Two lineages of Salmonella enterica serovar Typhimurium (S. Typhimurium) of multi-locus sequence type ST313 have been linked with the emergence of invasive Salmonella disease across sub-Saharan Africa. The expansion of these lineages has a temporal association with the HIV pandemic and antibiotic usage. We analysed the whole genome sequence of 129 ST313 isolates representative of the two lineages and found evidence of lineage-specific genome degradation, with some similarities to that observed in S. Typhi. Individual ST313 S. Typhimurium isolates exhibit a distinct metabolic signature and modified enteropathogenesis in both a murine and cattle model of colitis, compared to S. Typhimurium outside of the ST313 lineages. These data define phenotypes that distinguish ST313 isolates from other S. Typhimurium and may represent adaptation to a distinct pathogenesis and lifestyle linked to an immuno-compromised human population.},
}

@article{MichauxHansenJennichesetal.2020,
  author   = {Michaux, Charlotte and Hansen, Elisabeth E. and Jenniches, Laura and Gerovac, Milan and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Single-Nucleotide {RNA} Maps for the Two Major Nosocomial Pathogens {Enterococcus} faecalis and {Enterococcus} faecium},
  journal  = {Frontiers in Cellular and Infection Microbiology},
  volume   = {10},
  year     = {2020},
  issn     = {2235-2988},
  doi      = {10.3389/fcimb.2020.600325},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-217947},
  language = {en},
  abstract = {Enterococcus faecalis and faecium are two major representative clinical strains of the Enterococcus genus and are sadly notorious to be part of the top agents responsible for nosocomial infections. Despite their critical implication in worldwide public healthcare, essential and available resources such as deep transcriptome annotations remain poor, which also limits our understanding of post-transcriptional control small regulatory RNA (sRNA) functions in these bacteria. Here, using the dRNA-seq technique in combination with ANNOgesic analysis, we successfully mapped and annotated transcription start sites (TSS) of both E. faecalis V583 and E. faecium AUS0004 at single nucleotide resolution. Analyzing bacteria in late exponential phase, we capture $\sim$40\% (E. faecalis) and 43\% (E. faecium) of the annotated protein-coding genes, determine 5$'$ and 3$'$ UTR (untranslated region) length, and detect instances of leaderless mRNAs. The transcriptome maps revealed sRNA candidates in both bacteria, some found in previous studies and new ones. Expression of candidate sRNAs is being confirmed under biologically relevant environmental conditions. This comprehensive global TSS mapping atlas provides a valuable resource for RNA biology and gene expression analysis in the Enterococci. It can be accessed online at www.helmholtz-hiri.de/en/datasets/enterococcus through an instance of the genomic viewer JBrowse.},
}

@article{MichauxGerovacHansenetal.2023,
  author   = {Michaux, Charlotte and Gerovac, Milan and Hansen, Elisabeth E. and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {{Grad-seq} analysis of {Enterococcus} faecalis and {Enterococcus} faecium provides a global view of {RNA} and protein complexes in these two opportunistic pathogens},
  journal  = {microLife},
  volume   = {4},
  year     = {2023},
  doi      = {10.1093/femsml/uqac027},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-313311},
  language = {en},
  abstract = {Enterococcus faecalis and Enterococcus faecium are major nosocomial pathogens. Despite their relevance to public health and their role in the development of bacterial antibiotic resistance, relatively little is known about gene regulation in these species. RNA-protein complexes serve crucial functions in all cellular processes associated with gene expression, including post-transcriptional control mediated by small regulatory RNAs (sRNAs). Here, we present a new resource for the study of enterococcal RNA biology, employing the Grad-seq technique to comprehensively predict complexes formed by RNA and proteins in E. faecalis V583 and E. faecium AUS0004. Analysis of the generated global RNA and protein sedimentation profiles led to the identification of RNA-protein complexes and putative novel sRNAs. Validating our data sets, we observe well-established cellular RNA-protein complexes such as the 6S RNA-RNA polymerase complex, suggesting that 6S RNA-mediated global control of transcription is conserved in enterococci. Focusing on the largely uncharacterized RNA-binding protein KhpB, we use the RIP-seq technique to predict that KhpB interacts with sRNAs, tRNAs, and untranslated regions of mRNAs, and might be involved in the processing of specific tRNAs. Collectively, these datasets provide departure points for in-depth studies of the cellular interactome of enterococci that should facilitate functional discovery in these and related Gram-positive species. Our data are available to the community through a user-friendly Grad-seq browser that allows interactive searches of the sedimentation profiles (https://resources.helmholtz-hiri.de/gradseqef/).},
}

@article{LindgreenUmuLaietal.2014,
  author   = {Lindgreen, Stinus and Umu, Sinan U{\u{g}}ur and Lai, Alicia Sook-Wei and Eldai, Hisham and Liu, Wenting and McGimpsey, Stephanie and Wheeler, Nicole E. and Biggs, Patrick J. and Thomson, Nick R. and Barquist, Lars and Poole, Anthony M. and Gardner, Paul P.},
  title    = {Robust Identification of Noncoding {RNA} from Transcriptomes Requires Phylogenetically-Informed Sampling},
  journal  = {PLOS Computational Biology},
  volume   = {10},
  number   = {10},
  pages    = {e1003907},
  year     = {2014},
  doi      = {10.1371/journal.pcbi.1003907},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-115259},
  language = {en},
  abstract = {Noncoding RNAs are integral to a wide range of biological processes, including translation, gene regulation, host-pathogen interactions and environmental sensing. While genomics is now a mature field, our capacity to identify noncoding RNA elements in bacterial and archaeal genomes is hampered by the difficulty of de novo identification. The emergence of new technologies for characterizing transcriptome outputs, notably RNA-seq, are improving noncoding RNA identification and expression quantification. However, a major challenge is to robustly distinguish functional outputs from transcriptional noise. To establish whether annotation of existing transcriptome data has effectively captured all functional outputs, we analysed over 400 publicly available RNA-seq datasets spanning 37 different Archaea and Bacteria. Using comparative tools, we identify close to a thousand highly-expressed candidate noncoding RNAs. However, our analyses reveal that capacity to identify noncoding RNA outputs is strongly dependent on phylogenetic sampling. Surprisingly, and in stark contrast to protein-coding genes, the phylogenetic window for effective use of comparative methods is perversely narrow: aggregating public datasets only produced one phylogenetic cluster where these tools could be used to robustly separate unannotated noncoding RNAs from a null hypothesis of transcriptional noise. Our results show that for the full potential of transcriptomics data to be realized, a change in experimental design is paramount: effective transcriptomics requires phylogeny-aware sampling.},
}

@article{HombergerHaywardBarquistetal.2023,
  author   = {Homberger, Christina and Hayward, Regan J. and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Improved bacterial single-cell {RNA-seq} through automated {MATQ-seq} and {Cas9-based} removal of {rRNA} reads},
  journal  = {mBio},
  volume   = {14},
  number   = {2},
  year     = {2023},
  doi      = {10.1128/mbio.03557-22},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-350059},
  language = {en},
  abstract = {Bulk RNA sequencing technologies have provided invaluable insights into host and bacterial gene expression and associated regulatory networks. Nevertheless, the majority of these approaches report average expression across cell populations, hiding the true underlying expression patterns that are often heterogeneous in nature. Due to technical advances, single-cell transcriptomics in bacteria has recently become reality, allowing exploration of these heterogeneous populations, which are often the result of environmental changes and stressors. In this work, we have improved our previously published bacterial single-cell RNA sequencing (scRNA-seq) protocol that is based on multiple annealing and deoxycytidine (dC) tailing-based quantitative scRNA-seq (MATQ-seq), achieving a higher throughput through the integration of automation. We also selected a more efficient reverse transcriptase, which led to reduced cell loss and higher workflow robustness. Moreover, we successfully implemented a Cas9-based rRNA depletion protocol into the MATQ-seq workflow. Applying our improved protocol on a large set of single Salmonella cells sampled over different growth conditions revealed improved gene coverage and a higher gene detection limit compared to our original protocol and allowed us to detect the expression of small regulatory RNAs, such as GcvB or CsrB at a single-cell level. In addition, we confirmed previously described phenotypic heterogeneity in Salmonella in regard to expression of pathogenicity-associated genes. Overall, the low percentage of cell loss and high gene detection limit makes the improved MATQ-seq protocol particularly well suited for studies with limited input material, such as analysis of small bacterial populations in host niches or intracellular bacteria. IMPORTANCE: Gene expression heterogeneity among isogenic bacteria is linked to clinically relevant scenarios, like biofilm formation and antibiotic tolerance. The recent development of bacterial single-cell RNA sequencing (scRNA-seq) enables the study of cell-to-cell variability in bacterial populations and the mechanisms underlying these phenomena. Here, we report a scRNA-seq workflow based on MATQ-seq with increased robustness, reduced cell loss, and improved transcript capture rate and gene coverage. Use of a more efficient reverse transcriptase and the integration of an rRNA depletion step, which can be adapted to other bacterial single-cell workflows, was instrumental for these improvements. Applying the protocol to the foodborne pathogen Salmonella, we confirmed transcriptional heterogeneity across and within different growth phases and demonstrated that our workflow captures small regulatory RNAs at a single-cell level. Due to low cell loss and high transcript capture rates, this protocol is uniquely suited for experimental settings in which the starting material is limited, such as infected tissues.},
}

@article{HombergerBarquistVogel2022,
  author   = {Homberger, Christina and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Ushering in a new era of single-cell transcriptomics in bacteria},
  journal  = {microLife},
  volume   = {3},
  year     = {2022},
  doi      = {10.1093/femsml/uqac020},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-313292},
  language = {en},
  abstract = {Transcriptome analysis of individual cells by single-cell RNA-seq (scRNA-seq) has become routine for eukaryotic tissues, even being applied to whole multicellular organisms. In contrast, developing methods to read the transcriptome of single bacterial cells has proven more challenging, despite a general perception of bacteria as much simpler than eukaryotes. Bacterial cells are harder to lyse, their RNA content is about two orders of magnitude lower than that of eukaryotic cells, and bacterial mRNAs are less stable than their eukaryotic counterparts. Most importantly, bacterial transcripts lack functional poly(A) tails, precluding simple adaptation of popular standard eukaryotic scRNA-seq protocols that come with the double advantage of specific mRNA amplification and concomitant depletion of rRNA. However, thanks to very recent breakthroughs in methodology, bacterial scRNA-seq is now feasible. This short review will discuss recently published bacterial scRNA-seq approaches (MATQ-seq, microSPLiT, and PETRI-seq) and a spatial transcriptomics approach based on multiplexed in situ hybridization (par-seqFISH). Together, these novel approaches will not only enable a new understanding of cell-to-cell variation in bacterial gene expression, they also promise a new microbiology by enabling high-resolution profiling of gene activity in complex microbial consortia such as the microbiome or pathogens as they invade, replicate, and persist in host tissue.},
}