% Bibliography database: ten journal articles (2016 to 2023), listed newest first.
%
% Conventions used in this file:
%   - one field per line, in the order
%     author, title, journal, volume, number, pages, year, issn, doi, url, abstract, language
%   - page ranges are written with a double hyphen (--)
%   - title words that must keep their capitalisation (acronyms, genus names,
%     protein and method names) are wrapped in braces so that sentence-casing
%     styles leave them alone
%   - the journal name is stored only in the journal field; it is not repeated
%     in a series field
%   - abstracts use LaTeX markup instead of raw non-ASCII symbols or characters
%     that LaTeX would interpret (tilde, greater-than sign, straight double quotes)

% Grad-seq resource for E. faecalis and E. faecium (microLife 4).
@article{MichauxGerovacHansenetal.2023,
  author   = {Michaux, Charlotte and Gerovac, Milan and Hansen, Elisabeth E. and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Grad-seq analysis of {Enterococcus} faecalis and {Enterococcus} faecium provides a global view of {RNA} and protein complexes in these two opportunistic pathogens},
  journal  = {microLife},
  volume   = {4},
  year     = {2023},
  doi      = {10.1093/femsml/uqac027},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-313311},
  abstract = {Enterococcus faecalis and Enterococcus faecium are major nosocomial pathogens. Despite their relevance to public health and their role in the development of bacterial antibiotic resistance, relatively little is known about gene regulation in these species. RNA-protein complexes serve crucial functions in all cellular processes associated with gene expression, including post-transcriptional control mediated by small regulatory RNAs (sRNAs). Here, we present a new resource for the study of enterococcal RNA biology, employing the Grad-seq technique to comprehensively predict complexes formed by RNA and proteins in E. faecalis V583 and E. faecium AUS0004. Analysis of the generated global RNA and protein sedimentation profiles led to the identification of RNA-protein complexes and putative novel sRNAs. Validating our data sets, we observe well-established cellular RNA-protein complexes such as the 6S RNA-RNA polymerase complex, suggesting that 6S RNA-mediated global control of transcription is conserved in enterococci. Focusing on the largely uncharacterized RNA-binding protein KhpB, we use the RIP-seq technique to predict that KhpB interacts with sRNAs, tRNAs, and untranslated regions of mRNAs, and might be involved in the processing of specific tRNAs. Collectively, these datasets provide departure points for in-depth studies of the cellular interactome of enterococci that should facilitate functional discovery in these and related Gram-positive species. Our data are available to the community through a user-friendly Grad-seq browser that allows interactive searches of the sedimentation profiles (https://resources.helmholtz-hiri.de/gradseqef/).},
  language = {en}
}

% Automated MATQ-seq with Cas9-based rRNA depletion (mBio 14, issue 2).
@article{HombergerHaywardBarquistetal.2023,
  author   = {Homberger, Christina and Hayward, Regan J. and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Improved bacterial single-cell {RNA-seq} through automated {MATQ-seq} and {Cas9-based} removal of {rRNA} reads},
  journal  = {mBio},
  volume   = {14},
  number   = {2},
  year     = {2023},
  doi      = {10.1128/mbio.03557-22},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-350059},
  abstract = {Bulk RNA sequencing technologies have provided invaluable insights into host and bacterial gene expression and associated regulatory networks. Nevertheless, the majority of these approaches report average expression across cell populations, hiding the true underlying expression patterns that are often heterogeneous in nature. Due to technical advances, single-cell transcriptomics in bacteria has recently become reality, allowing exploration of these heterogeneous populations, which are often the result of environmental changes and stressors. In this work, we have improved our previously published bacterial single-cell RNA sequencing (scRNA-seq) protocol that is based on multiple annealing and deoxycytidine (dC) tailing-based quantitative scRNA-seq (MATQ-seq), achieving a higher throughput through the integration of automation. We also selected a more efficient reverse transcriptase, which led to reduced cell loss and higher workflow robustness. Moreover, we successfully implemented a Cas9-based rRNA depletion protocol into the MATQ-seq workflow. Applying our improved protocol on a large set of single Salmonella cells sampled over different growth conditions revealed improved gene coverage and a higher gene detection limit compared to our original protocol and allowed us to detect the expression of small regulatory RNAs, such as GcvB or CsrB at a single-cell level. In addition, we confirmed previously described phenotypic heterogeneity in Salmonella in regard to expression of pathogenicity-associated genes. Overall, the low percentage of cell loss and high gene detection limit makes the improved MATQ-seq protocol particularly well suited for studies with limited input material, such as analysis of small bacterial populations in host niches or intracellular bacteria. IMPORTANCE: Gene expression heterogeneity among isogenic bacteria is linked to clinically relevant scenarios, like biofilm formation and antibiotic tolerance. The recent development of bacterial single-cell RNA sequencing (scRNA-seq) enables the study of cell-to-cell variability in bacterial populations and the mechanisms underlying these phenomena. Here, we report a scRNA-seq workflow based on MATQ-seq with increased robustness, reduced cell loss, and improved transcript capture rate and gene coverage. Use of a more efficient reverse transcriptase and the integration of an rRNA depletion step, which can be adapted to other bacterial single-cell workflows, was instrumental for these improvements. Applying the protocol to the foodborne pathogen Salmonella, we confirmed transcriptional heterogeneity across and within different growth phases and demonstrated that our workflow captures small regulatory RNAs at a single-cell level. Due to low cell loss and high transcript capture rates, this protocol is uniquely suited for experimental settings in which the starting material is limited, such as infected tissues.},
  language = {en}
}

% Comparative genomics of Bacteroides RNA biology (Molecular Microbiology 117, issue 1).
@article{PrezzaRyanMaedleretal.2022,
  author   = {Prezza, Gianluca and Ryan, Daniel and M{\"a}dler, Gohar and Reichardt, Sarah and Barquist, Lars and Westermann, Alexander J.},
  title    = {Comparative genomics provides structural and functional insights into {Bacteroides} {RNA} biology},
  journal  = {Molecular Microbiology},
  volume   = {117},
  number   = {1},
  pages    = {67--85},
  year     = {2022},
  doi      = {10.1111/mmi.14793},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-259594},
  abstract = {Bacteria employ noncoding RNA molecules for a wide range of biological processes, including scaffolding large molecular complexes, catalyzing chemical reactions, defending against phages, and controlling gene expression. Secondary structures, binding partners, and molecular mechanisms have been determined for numerous small noncoding RNAs (sRNAs) in model aerobic bacteria. However, technical hurdles have largely prevented analogous analyses in the anaerobic gut microbiota. While experimental techniques are being developed to investigate the sRNAs of gut commensals, computational tools and comparative genomics can provide immediate functional insight. Here, using Bacteroides thetaiotaomicron as a representative microbiota member, we illustrate how comparative genomics improves our understanding of RNA biology in an understudied gut bacterium. We investigate putative RNA-binding proteins and predict a Bacteroides cold-shock protein homolog to have an RNA-related function. We apply an in silico protocol incorporating both sequence and structural analysis to determine the consensus structures and conservation of nine Bacteroides noncoding RNA families. Using structure probing, we validate and refine these predictions and deposit them in the Rfam database. Through synteny analyses, we illustrate how genomic coconservation can serve as a predictor of sRNA function. Altogether, this work showcases the power of RNA informatics for investigating the RNA biology of anaerobic microbiota members.},
  language = {en}
}

% Short review of bacterial single-cell transcriptomics (microLife 3).
@article{HombergerBarquistVogel2022,
  author   = {Homberger, Christina and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Ushering in a new era of single-cell transcriptomics in bacteria},
  journal  = {microLife},
  volume   = {3},
  year     = {2022},
  doi      = {10.1093/femsml/uqac020},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-313292},
  abstract = {Transcriptome analysis of individual cells by single-cell RNA-seq (scRNA-seq) has become routine for eukaryotic tissues, even being applied to whole multicellular organisms. In contrast, developing methods to read the transcriptome of single bacterial cells has proven more challenging, despite a general perception of bacteria as much simpler than eukaryotes. Bacterial cells are harder to lyse, their RNA content is about two orders of magnitude lower than that of eukaryotic cells, and bacterial mRNAs are less stable than their eukaryotic counterparts. Most importantly, bacterial transcripts lack functional poly(A) tails, precluding simple adaptation of popular standard eukaryotic scRNA-seq protocols that come with the double advantage of specific mRNA amplification and concomitant depletion of rRNA. However, thanks to very recent breakthroughs in methodology, bacterial scRNA-seq is now feasible. This short review will discuss recently published bacterial scRNA-seq approaches (MATQ-seq, microSPLiT, and PETRI-seq) and a spatial transcriptomics approach based on multiplexed in situ hybridization (par-seqFISH). Together, these novel approaches will not only enable a new understanding of cell-to-cell variation in bacterial gene expression, they also promise a new microbiology by enabling high-resolution profiling of gene activity in complex microbial consortia such as the microbiome or pathogens as they invade, replicate, and persist in host tissue.},
  language = {en}
}

% Meningococcal minimal ProQ and its RNA targets (Nature Communications 11).
@article{BauriedlGerovacHeidrichetal.2020,
  author   = {Bauriedl, Saskia and Gerovac, Milan and Heidrich, Nadja and Bischler, Thorsten and Barquist, Lars and Vogel, J{\"o}rg and Schoen, Christoph},
  title    = {The minimal meningococcal {ProQ} protein has an intrinsic capacity for structure-based global {RNA} recognition},
  journal  = {Nature Communications},
  volume   = {11},
  year     = {2020},
  doi      = {10.1038/s41467-020-16650-6},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-230040},
  abstract = {FinO-domain proteins are a widespread family of bacterial RNA-binding proteins with regulatory functions. Their target spectrum ranges from a single RNA pair, in the case of plasmid-encoded FinO, to global RNA regulons, as with enterobacterial ProQ. To assess whether the FinO domain itself is intrinsically selective or promiscuous, we determine in vivo targets of Neisseria meningitidis, which consists of solely a FinO domain. UV-CLIP-seq identifies associations with 16 small non-coding sRNAs and 166 mRNAs. Meningococcal ProQ predominantly binds to highly structured regions and generally acts to stabilize its RNA targets. Loss of ProQ alters transcript levels of $>$250 genes, demonstrating that this minimal ProQ protein impacts gene expression globally. Phenotypic analyses indicate that ProQ promotes oxidative stress resistance and DNA damage repair. We conclude that FinO domain proteins recognize some abundant type of RNA shape and evolve RNA binding selectivity through acquisition of additional regions that constrain target recognition. FinO-domain proteins are bacterial RNA-binding proteins with a wide range of target specificities. Here, the authors employ UV CLIP-seq and show that minimal ProQ protein of Neisseria meningitidis binds to various small non-coding RNAs and mRNAs involved in virulence.},
  language = {en}
}

% Transcription start site maps for E. faecalis and E. faecium (Frontiers in Cellular and Infection Microbiology 10).
@article{MichauxHansenJennichesetal.2020,
  author   = {Michaux, Charlotte and Hansen, Elisabeth E. and Jenniches, Laura and Gerovac, Milan and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Single-Nucleotide {RNA} Maps for the Two Major Nosocomial Pathogens {Enterococcus} faecalis and {Enterococcus} faecium},
  journal  = {Frontiers in Cellular and Infection Microbiology},
  volume   = {10},
  year     = {2020},
  issn     = {2235-2988},
  doi      = {10.3389/fcimb.2020.600325},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-217947},
  abstract = {Enterococcus faecalis and faecium are two major representative clinical strains of the Enterococcus genus and are sadly notorious to be part of the top agents responsible for nosocomial infections. Despite their critical implication in worldwide public healthcare, essential and available resources such as deep transcriptome annotations remain poor, which also limits our understanding of post-transcriptional control small regulatory RNA (sRNA) functions in these bacteria. Here, using the dRNA-seq technique in combination with ANNOgesic analysis, we successfully mapped and annotated transcription start sites (TSS) of both E. faecalis V583 and E. faecium AUS0004 at single nucleotide resolution. Analyzing bacteria in late exponential phase, we capture $\sim$40\% (E. faecalis) and 43\% (E. faecium) of the annotated protein-coding genes, determine 5$'$ and 3$'$ UTR (untranslated region) length, and detect instances of leaderless mRNAs. The transcriptome maps revealed sRNA candidates in both bacteria, some found in previous studies and new ones. Expression of candidate sRNAs is being confirmed under biologically relevant environmental conditions. This comprehensive global TSS mapping atlas provides a valuable resource for RNA biology and gene expression analysis in the Enterococci. It can be accessed online at www.helmholtz-hiri.de/en/datasets/enterococcus through an instance of the genomic viewer JBrowse.},
  language = {en}
}

% Review of dual RNA-seq for host-pathogen studies (PLoS Pathogens 13, issue 2).
@article{WestermannBarquistVogel2017,
  author   = {Westermann, Alexander J. and Barquist, Lars and Vogel, J{\"o}rg},
  title    = {Resolving host-pathogen interactions by dual {RNA-seq}},
  journal  = {PLoS Pathogens},
  volume   = {13},
  number   = {2},
  year     = {2017},
  doi      = {10.1371/journal.ppat.1006033},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-171921},
  abstract = {The transcriptome is a powerful proxy for the physiological state of a cell, healthy or diseased. As a result, transcriptome analysis has become a key tool in understanding the molecular changes that accompany bacterial infections of eukaryotic cells. Until recently, such transcriptomic studies have been technically limited to analyzing mRNA expression changes in either the bacterial pathogen or the infected eukaryotic host cell. However, the increasing sensitivity of high-throughput RNA sequencing now enables ``dual RNA-seq'' studies, simultaneously capturing all classes of coding and noncoding transcripts in both the pathogen and the host. In the five years since the concept of dual RNA-seq was introduced, the technique has been applied to a range of infection models. This has not only led to a better understanding of the physiological changes in pathogen and host during the course of an infection but has also revealed hidden molecular phenotypes of virulence-associated small noncoding RNAs that were not visible in standard infection assays. Here, we use the knowledge gained from these recent studies to suggest experimental and computational guidelines for the design of future dual RNA-seq studies. We conclude this review by discussing prospective applications of the technique.},
  language = {en}
}

% Primary transcriptome and Hfq interactome of N. meningitidis (Nucleic Acids Research 45, issue 10).
@article{HeidrichBauriedlBarquistetal.2017,
  author   = {Heidrich, Nadja and Bauriedl, Saskia and Barquist, Lars and Li, Lei and Schoen, Christoph and Vogel, J{\"o}rg},
  title    = {The primary transcriptome of {Neisseria} meningitidis and its interaction with the {RNA} chaperone {Hfq}},
  journal  = {Nucleic Acids Research},
  volume   = {45},
  number   = {10},
  pages    = {6147--6167},
  year     = {2017},
  doi      = {10.1093/nar/gkx168},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-170828},
  abstract = {Neisseria meningitidis is a human commensal that can also cause life-threatening meningitis and septicemia. Despite growing evidence for RNA-based regulation in meningococci, their transcriptome structure and output of regulatory small RNAs (sRNAs) are incompletely understood. Using dRNA-seq, we have mapped at single-nucleotide resolution the primary transcriptome of N. meningitidis strain 8013. Annotation of 1625 transcriptional start sites defines transcription units for most protein-coding genes but also reveals a paucity of classical $\sigma^{70}$-type promoters, suggesting the existence of activators that compensate for the lack of -35 consensus sequences in N. meningitidis. The transcriptome maps also reveal 65 candidate sRNAs, a third of which were validated by northern blot analysis. Immunoprecipitation with the RNA chaperone Hfq drafts an unexpectedly large post-transcriptional regulatory network in this organism, comprising 23 sRNAs and hundreds of potential mRNA targets. Based on this data, using a newly developed gfp reporter system we validate an Hfq-dependent mRNA repression of the putative colonization factor PrpB by the two trans-acting sRNAs RcoF1/2. Our genome-wide RNA compendium will allow for a better understanding of meningococcal transcriptome organization and riboregulation with implications for colonization of the human nasopharynx.},
  language = {en}
}

% Delta-bitscore method for functional divergence of orthologs (Bioinformatics 32, issue 23).
@article{WheelerBarquistKingsleyetal.2016,
  author   = {Wheeler, Nicole E. and Barquist, Lars and Kingsley, Robert A. and Gardner, Paul P.},
  title    = {A profile-based method for identifying functional divergence of orthologous genes in bacterial genomes},
  journal  = {Bioinformatics},
  volume   = {32},
  number   = {23},
  pages    = {3566--3574},
  year     = {2016},
  doi      = {10.1093/bioinformatics/btw518},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-186502},
  abstract = {Motivation: Next generation sequencing technologies have provided us with a wealth of information on genetic variation, but predicting the functional significance of this variation is a difficult task. While many comparative genomics studies have focused on gene flux and large scale changes, relatively little attention has been paid to quantifying the effects of single nucleotide polymorphisms and indels on protein function, particularly in bacterial genomics. Results: We present a hidden Markov model based approach we call delta-bitscore (DBS) for identifying orthologous proteins that have diverged at the amino acid sequence level in a way that is likely to impact biological function. We benchmark this approach with several widely used datasets and apply it to a proof-of-concept study of orthologous proteomes in an investigation of host adaptation in Salmonella enterica. We highlight the value of the method in identifying functional divergence of genes, and suggest that this tool may be a better approach than the commonly used dN/dS metric for identifying functionally significant genetic changes occurring in recently diverged organisms.},
  language = {en}
}

% TraDIS library preparation protocol and Bio-Tradis analysis pipeline (Bioinformatics 32, issue 7).
@article{BarquistMayhoCumminsetal.2016,
  author   = {Barquist, Lars and Mayho, Matthew and Cummins, Carla and Cain, Amy K. and Boinett, Christine J. and Page, Andrew J. and Langridge, Gemma C. and Quail, Michael A. and Keane, Jacqueline A. and Parkhill, Julian},
  title    = {The {TraDIS} toolkit: sequencing and analysis for dense transposon mutant libraries},
  journal  = {Bioinformatics},
  volume   = {32},
  number   = {7},
  pages    = {1109--1111},
  year     = {2016},
  doi      = {10.1093/bioinformatics/btw022},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-189667},
  abstract = {Transposon insertion sequencing is a high-throughput technique for assaying large libraries of otherwise isogenic transposon mutants providing insight into gene essentiality, gene function and genetic interactions. We previously developed the Transposon Directed Insertion Sequencing (TraDIS) protocol for this purpose, which utilizes shearing of genomic DNA followed by specific PCR amplification of transposon-containing fragments and Illumina sequencing. Here we describe an optimized high-yield library preparation and sequencing protocol for TraDIS experiments and a novel software pipeline for analysis of the resulting data. The Bio-Tradis analysis pipeline is implemented as an extensible Perl library which can either be used as is, or as a basis for the development of more advanced analysis tools. This article can serve as a general reference for the application of the TraDIS methodology.},
  language = {en}
}