% Doctoral theses (school field: Universit{\"a}t W{\"u}rzburg).
% Conventions used in this file: one field per line, LaTeX escapes instead of
% raw non-ASCII characters, and braces around title words whose capitalisation
% must survive style-driven sentence casing.

@phdthesis{Sauer2019,
  author   = {Sauer, Markus},
  title    = {{DHX36} function in {RNA} {G}-quadruplex-mediated posttranscriptional gene regulation},
  doi      = {10.25972/OPUS-18395},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-183954},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2019},
  abstract = {The expression of genetic information into proteins is a key aspect of life. The efficient and exact regulation of this process is essential for the cell to produce the correct amounts of these effector molecules to a given situation. For this purpose, eukaryotic cells have developed many different levels of transcriptional and posttranscriptional gene regulation. These mechanisms themselves heavily rely on interactions of proteins with associated nucleic acids. In the case of posttranscriptional gene regulation an orchestrated interplay between RNA-binding proteins, messenger RNAs (mRNA), and non-coding RNAs is compulsory to achieve this important function. A pivotal factor hereby are RNA secondary structures. One of the most stable and diverse representatives is the G-quadruplex structure (G4) implicated in many cellular mechanisms, such as mRNA processing and translation. In protein biosynthesis, G4s often act as obstacles but can also assist in this process. However, their presence has to be tightly regulated, a task which is often fulfilled by helicases. One of the best characterized G4-resolving factors is the DEAH-box protein DHX36. The in vitro function of this helicase is extensively described and individual reports aimed to address diverse cellular functions as well. Nevertheless, a comprehensive and systems-wide study on the function of this specific helicase was missing, so far. The here-presented doctoral thesis provides a detailed view on the global cellular function of DHX36.
The binding sites of this helicase were defined in a transcriptome-wide manner, a consensus binding motif was derived, and RNA targets as well as the effect this helicase exerts on them were examined. In human embryonic kidney cells, DHX36 is a mainly cytoplasmic protein preferentially binding to G-rich and G4-forming sequence motifs on more than 4,500 mRNAs. Loss of DHX36 leads to increased target mRNA levels whereas ribosome occupancy on and protein output of these transcripts are reduced. Furthermore, DHX36 knockout leads to higher RNA G4 levels and concomitant stress reactions in the cell. I hypothesize that, upon loss of this helicase, translationally-incompetent structured DHX36 target mRNAs, prone to localize in stress granules, accumulate in the cell. The cell reacts with basal stress to avoid cytotoxic effects produced by these mis-regulated and structured transcripts.},
  subject  = {RNS},
  language = {en}
}

@phdthesis{Hoer2020,
  author   = {H{\"o}r, Jens},
  title    = {Discovery of {RNA}/protein complexes by {Grad-seq}},
  doi      = {10.25972/OPUS-21181},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-211811},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2020},
  abstract = {Complex formation between macromolecules constitutes the foundation of most cellular processes. Most known complexes are made up of two or more proteins interacting in order to build a functional entity and therefore enabling activities which the single proteins could otherwise not fulfill. With the increasing knowledge about noncoding RNAs (ncRNAs) it has become evident that, similar to proteins, many of them also need to form a complex to be functional. This functionalization is usually executed by specific or global RNA-binding proteins (RBPs) that are specialized binders of a certain class of ncRNAs.
For instance, the enterobacterial global RBPs Hfq and ProQ together bind $>$80 \% of the known small regulatory RNAs (sRNAs), a class of ncRNAs involved in post-transcriptional regulation of gene expression. However, identification of RNA-protein interactions so far was performed individually by employing low-throughput biochemical methods and thereby hindered the discovery of such interactions, especially in less studied organisms such as Gram-positive bacteria. Using gradient profiling by sequencing (Grad-seq), the present thesis aimed to establish high-throughput, global RNA/protein complexome resources for Escherichia coli and Streptococcus pneumoniae in order to provide a new way to investigate RNA-protein as well as protein-protein interactions in these two important model organisms. In E. coli, Grad-seq revealed the sedimentation profiles of 4,095 ($\sim$85 \% of total) transcripts and 2,145 ($\sim$49 \% of total) proteins and with that reproduced its major ribonucleoprotein particles. Detailed analysis of the in-gradient distribution of the RNA and protein content uncovered two functionally unknown molecules---the ncRNA RyeG and the small protein YggL---to be ribosome-associated. Characterization of RyeG revealed it to encode for a 48 aa long, toxic protein that drastically increases lag times when overexpressed. YggL was shown to be bound by the 50S subunit of the 70S ribosome, possibly indicating involvement of YggL in ribosome biogenesis or translation of specific mRNAs. S. pneumoniae Grad-seq detected 2,240 ($\sim$88 \% of total) transcripts and 1,301 ($\sim$62 \% of total) proteins, whose gradient migration patterns were successfully reconstructed, and thereby represents the first RNA/protein complexome resource of a Gram-positive organism. The dataset readily verified many conserved major complexes for the first time in S. pneumoniae and led to the discovery of a specific interaction between the 3'$\rightarrow$5' exonuclease Cbf1 and the competence-regulating cia-dependent sRNAs (csRNAs).
Unexpectedly, trimming of the csRNAs by Cbf1 stabilized the former, thereby promoting their inhibitory function. cbf1 was further shown to be part of the late competence genes and as such to act as a negative regulator of competence.},
  subject  = {Multiproteinkomplex},
  language = {en}
}

% NOTE(review): unlike the two entries above, this entry carries no doi field;
% add it once the identifier has been confirmed against the repository record.
@phdthesis{Bischler2018,
  author   = {Bischler, Thorsten David},
  title    = {Data mining and software development for {RNA-seq}-based approaches in bacteria},
  url      = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-166108},
  school   = {Universit{\"a}t W{\"u}rzburg},
  year     = {2018},
  abstract = {RNA sequencing (RNA-seq) has in recent years become the preferred method for gene expression analysis and whole transcriptome annotation. While initial RNA-seq experiments focused on eukaryotic messenger RNAs (mRNAs), which can be purified from the cellular ribonucleic acid (RNA) pool with relative ease, more advanced protocols had to be developed for sequencing of microbial transcriptomes. The resulting RNA-seq data revealed an unexpected complexity of bacterial transcriptomes and the requirement for specific analysis methods, which in many cases is not covered by tools developed for processing of eukaryotic data. The aim of this thesis was the development and application of specific data analysis methods for different RNA-seq-based approaches used to gain insights into transcription and gene regulatory processes in prokaryotes. The differential RNA sequencing (dRNA-seq) approach allows for transcriptional start site (TSS) annotation by differentiating between primary transcripts with a 5'-triphosphate (5'-PPP) and processed transcripts with a 5'-monophosphate (5'-P). This method was applied in combination with an automated TSS annotation tool to generate global transcriptome maps for Escherichia coli (E. coli) and Helicobacter pylori (H. pylori). In the E. coli study we conducted different downstream analyses to gain a deeper understanding of the nature and properties of transcripts in our TSS map.
Here, we focused especially on putative antisense RNAs (asRNAs), an RNA class transcribed from the opposite strand of known protein-coding genes with the potential to regulate corresponding sense transcripts. Besides providing a set of putative asRNAs and experimental validation of candidates via Northern analysis, we analyzed and discussed different sources of variation in RNA-seq data. The aim of the H. pylori study was to provide a detailed description of the dRNA-seq approach and its application to a bacterial model organism. It includes information on experimental protocols and requirements for data analysis to generate a genome-wide TSS map. We show how the included TSS can be used to identify and analyze transcriptome and regulatory features and discuss challenges in terms of library preparation protocols, sequencing platforms, and data analysis including manual and automated TSS annotation. The TSS maps and associated transcriptome data from both H. pylori and E. coli were made available for visualization in an easily accessible online browser. Furthermore, a modified version of dRNA-seq was used to identify transcriptome targets of the RNA pyrophosphohydrolase (RppH) in H. pylori. RppH initiates 5'-end-dependent degradation of transcripts by converting the 5'-PPP of primary transcripts to a 5'-P. I developed an analysis method, which uses data from complementary DNA (cDNA) libraries specific for transcripts carrying a 5'-PPP, 5'-P or both, to specifically identify transcripts modified by RppH. For this, the method assessed the 5'-phosphorylation state and cellular concentration of transcripts in rppH deletion in comparison to strains with the intact gene. Several of the identified potential RppH targets were further validated via half-life measurements and quantification of their 5'-phosphorylation state in wild-type and mutant cells. Our findings suggest an important role for RppH in post-transcriptional gene regulation in H. pylori and related organisms.
In addition, we applied two RNA-seq-based approaches, RNA immunoprecipitation followed by sequencing (RIP-seq) and cross-linking immunoprecipitation followed by sequencing (CLIP-seq), to identify transcripts bound by Hfq and CsrA, two RNA-binding proteins (RBPs) with an important role in post-transcriptional regulation. For RIP-seq-based identification of CsrA binding regions in Campylobacter jejuni (C. jejuni), we used annotation-based analysis and, in addition, a self-developed peak calling method based on a sliding window approach. Both methods revealed flaA mRNA, encoding the major flagellin, as the main target and functional analysis of identified targets showed a significant enrichment of genes involved in flagella biosynthesis. Further experimental analysis revealed the role of flaA mRNA in post-transcriptional regulation. In comparison to RIP-seq, CLIP-seq allows mapping of RBP binding sites with a higher resolution. To identify these sites an approach called ``block-based peak calling'' was developed and resulting peaks were used to identify sequence and structural constraints required for interaction of Hfq and CsrA with Salmonella transcripts. Overall, the different RNA-seq-based approaches described in this thesis together with their associated analysis pipelines extended our knowledge on the transcriptional repertoire and modes of post-transcriptional regulation in bacteria. The global TSS maps, including further characterized asRNA candidates, putative RppH targets, and identified RBP interactomes will likely trigger similar global studies in the same or different organisms or will be used as a resource for closer examination of these features.},
  subject  = {Bakterien},
  language = {en}
}