% Journal article (German, English abstract): acceptance of CaseTrain training cases as a supplement to lectures.
@article{HoernleinMandelIflandetal.2011,
  author    = {H{\"o}rnlein, Alexander and Mandel, Alexander and Ifland, Marianus and L{\"u}neberg, Edeltraud and Deckert, J{\"u}rgen and Puppe, Frank},
  title     = {Akzeptanz medizinischer Trainingsf{\"a}lle als Erg{\"a}nzung zu Vorlesungen},
  journal   = {GMS Zeitschrift f{\"u}r Medizinische Ausbildung},
  volume    = {28},
  number    = {3},
  pages     = {Doc42},
  year      = {2011},
  doi       = {10.3205/zma000754},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-133569},
  abstract  = {Introduction: Medical training cases (virtual patients) are in widespread use for student education. Most publications report about development and experiences in one course with training cases. In this paper we compare the acceptance of different training case courses with different usages deployed as supplement to lectures of the medical faculty of Wuerzburg university during a period of three semesters. Methods: The training cases were developed with the authoring tool CaseTrain and are available for students via the Moodle-based eLearning platform WueCampus at Wuerzburg university. Various data about usage and acceptance is automatically collected. Results: From WS (winter semester) 08/09 till WS 09/10 19 courses with about 200 cases were available. In each semester, about 550 different medical students from W{\"u}rzburg and 50 students from other universities processed about 12000 training cases and filled in about 2000 evaluation forms. In different courses, the usage varied between less than 50 and more than 5000 processed cases. Discussion: Although students demand training cases as supplement to all lectures, the data show that the usage does not primarily depend on the quality of the available training cases. Instead, the training cases of nearly all case collections were processed extremely often shortly before the examination. It shows that the degree of usage depends primarily on the perceived relevance of the training cases for the examination.},
  language  = {de}
}
% Journal article (German, English abstract): effort analysis for computer-supported multiple-choice paper exams.
% NOTE(review): the fourth author is spelled "Lueneburg" here but "Lueneberg" in HoernleinMandelIflandetal.2011 -- confirm against the published records.
@article{MandelHoernleinIflandetal.2011,
  author    = {Mandel, Alexander and H{\"o}rnlein, Alexander and Ifland, Marianus and L{\"u}neburg, Edeltraud and Deckert, J{\"u}rgen and Puppe, Frank},
  title     = {Aufwandsanalyse f{\"u}r computerunterst{\"u}tzte Multiple-Choice Papierklausuren},
  journal   = {GMS Zeitschrift f{\"u}r Medizinische Ausbildung},
  volume    = {28},
  number    = {4},
  pages     = {1--15, Doc55},
  year      = {2011},
  doi       = {10.3205/zma000767},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-134386},
  abstract  = {Introduction: Multiple-choice-examinations are still fundamental for assessment in medical degree programs. In addition to content related research, the optimization of the technical procedure is an important question. Medical examiners face three options: paper-based examinations with or without computer support or completely electronic examinations. Critical aspects are the effort for formatting, the logistic effort during the actual examination, quality, promptness and effort of the correction, the time for making the documents available for inspection by the students, and the statistical analysis of the examination results. Methods: Since three semesters a computer program for input and formatting of MC-questions in medical and other paper-based examinations is used and continuously improved at Wuerzburg University. In the winter semester (WS) 2009/10 eleven, in the summer semester (SS) 2010 twelve and in WS 2010/11 thirteen medical examinations were accomplished with the program and automatically evaluated. For the last two semesters the remaining manual workload was recorded. Results: The cost of the formatting and the subsequent analysis including adjustments of the analysis of an average examination with about 140 participants and about 35 questions was 5-7 hours for exams without complications in the winter semester 2009/2010, about 2 hours in SS 2010 and about 1.5 hours in the winter semester 2010/11. Including exams with complications, the average time was about 3 hours per exam in SS 2010 and 2.67 hours for the WS 10/11. Discussion: For conventional multiple-choice exams the computer-based formatting and evaluation of paper-based exams offers a significant time reduction for lecturers in comparison with the manual correction of paper-based exams and compared to purely electronically conducted exams it needs a much simpler technological infrastructure and fewer staff during the exam.},
  language  = {de}
}
% Conference paper (German): NER component for detecting character references in 19th-century German novels.
% NOTE(review): no booktitle is given, although the inproceedings type requires one; pages = 7 may be a page count -- confirm both against the source record.
@inproceedings{JannidisRegerWeimeretal.2015,
  author    = {Jannidis, Fotis and Reger, Isabella and Weimer, Lukas and Krug, Markus and Puppe, Frank},
  title     = {Automatische Erkennung von Figuren in deutschsprachigen Romanen},
  year      = {2015},
  pages     = {7},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-143332},
  subject   = {Digital Humanities},
  language  = {de},
  abstract  = {Eine wichtige Grundlage f{\"u}r die quantitative Analyse von Erz{\"a}hltexten, etwa eine Netzwerkanalyse der Figurenkonstellation, ist die automatische Erkennung von Referenzen auf Figuren in Erz{\"a}hltexten, ein Sonderfall des generischen NLP-Problems der Named Entity Recognition. Bestehende, auf Zeitungstexten trainierte Modelle sind f{\"u}r literarische Texte nur eingeschr{\"a}nkt brauchbar, da die Einbeziehung von Appellativen in die Named Entity-Definition und deren h{\"a}ufige Verwendung in Romantexten zu einem schlechten Ergebnis f{\"u}hrt. Dieses Paper stellt eine anhand eines manuell annotierten Korpus auf deutschsprachige Romane des 19. Jahrhunderts angepasste NER-Komponente vor.}
}
% Journal article: ontology-driven information extraction from German transthoracic echocardiography reports.
% NOTE(review): number = 91 is presumably the article number rather than an issue (no pages are given) -- confirm and move to pages if so.
@article{ToepferCorovicFetteetal.2015,
  author    = {Toepfer, Martin and Corovic, Hamo and Fette, Georg and Kl{\"u}gl, Peter and St{\"o}rk, Stefan and Puppe, Frank},
  title     = {Fine-grained information extraction from {German} transthoracic echocardiography reports},
  journal   = {BMC Medical Informatics and Decision Making},
  volume    = {15},
  number    = {91},
  year      = {2015},
  doi       = {10.1186/s12911-015-0215-x},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-125509},
  abstract  = {Background Information extraction techniques that get structured representations out of unstructured data make a large amount of clinically relevant information about patients accessible for semantic applications. These methods typically rely on standardized terminologies that guide this process. Many languages and clinical domains, however, lack appropriate resources and tools, as well as evaluations of their applications, especially if detailed conceptualizations of the domain are required. For instance, German transthoracic echocardiography reports have not been targeted sufficiently before, despite of their importance for clinical trials. This work therefore aimed at development and evaluation of an information extraction component with a fine-grained terminology that enables to recognize almost all relevant information stated in German transthoracic echocardiography reports at the University Hospital of W{\"u}rzburg. Methods A domain expert validated and iteratively refined an automatically inferred base terminology. The terminology was used by an ontology-driven information extraction system that outputs attribute value pairs. The final component has been mapped to the central elements of a standardized terminology, and it has been evaluated according to documents with different layouts. Results The final system achieved state-of-the-art precision (micro average.996) and recall (micro average.961) on 100 test documents that represent more than 90 \% of all reports. In particular, principal aspects as defined in a standardized external terminology were recognized with f 1=.989 (micro average) and f 1=.963 (macro average). As a result of keyword matching and restraint concept extraction, the system obtained high precision also on unstructured or exceptionally short documents, and documents with uncommon layout.
Conclusions The developed terminology and the proposed information extraction system allow to extract fine-grained information from German semi-structured transthoracic echocardiography reports with very high precision and high recall on the majority of documents at the University Hospital of W{\"u}rzburg. Extracted results populate a clinical data warehouse which supports clinical research.},
  language  = {en}
}
% Journal article (German): U-Net based detection of handwritten underlinings in old prints.
@article{GehrkeBalbachRauchetal.2019,
  author    = {Gehrke, Alexander and Balbach, Nico and Rauch, Yong-Mi and Degkwitz, Andreas and Puppe, Frank},
  title     = {Erkennung von handschriftlichen Unterstreichungen in Alten Drucken},
  journal   = {Bibliothek Forschung und Praxis},
  volume    = {43},
  number    = {3},
  pages     = {447--452},
  year      = {2019},
  issn      = {1865-7648},
  doi       = {10.1515/bfp-2019-2083},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-193377},
  abstract  = {Die Erkennung handschriftlicher Artefakte wie Unterstreichungen in Buchdrucken erm{\"o}glicht R{\"u}ckschl{\"u}sse auf das Rezeptionsverhalten und die Provenienzgeschichte und wird auch f{\"u}r eine OCR ben{\"o}tigt. Dabei soll zwischen handschriftlichen Unterstreichungen und waagerechten Linien im Druck (z. B. Trennlinien usw.) unterschieden werden, da letztere nicht ausgezeichnet werden sollen. Im Beitrag wird ein Ansatz basierend auf einem auf Unterstreichungen trainierten Neuronalen Netz gem{\"a}{\ss} der U-Net Architektur vorgestellt, dessen Ergebnisse in einem zweiten Schritt mit heuristischen Regeln nachbearbeitet werden. Die Evaluationen zeigen, dass Unterstreichungen sehr gut erkannt werden, wenn bei der Binarisierung der Scans nicht zu viele Pixel der Unterstreichung wegen geringem Kontrast verloren gehen. Zuk{\"u}nftig sollen die Worte oberhalb der Unterstreichung mit OCR transkribiert werden und auch andere Artefakte wie handschriftliche Notizen in alten Drucken erkannt werden.},
  language  = {de}
}
% Journal article: FCN-based staff, symbol and melody detection for medieval square-notation manuscripts.
% NOTE(review): pages holds the article number taken from the DOI suffix, matching the other Applied Sciences entry -- confirm.
@article{WickHarteltPuppe2019,
  author    = {Wick, Christoph and Hartelt, Alexander and Puppe, Frank},
  title     = {Staff, symbol and melody detection of Medieval manuscripts written in square notation using deep Fully Convolutional Networks},
  journal   = {Applied Sciences},
  volume    = {9},
  number    = {13},
  pages     = {2646},
  year      = {2019},
  issn      = {2076-3417},
  doi       = {10.3390/app9132646},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-197248},
  abstract  = {Even today, the automatic digitisation of scanned documents in general, but especially the automatic optical music recognition (OMR) of historical manuscripts, still remains an enormous challenge, since both handwritten musical symbols and text have to be identified. This paper focuses on the Medieval so-called square notation developed in the 11th-12th century, which is already composed of staff lines, staves, clefs, accidentals, and neumes that are roughly spoken connected single notes. The aim is to develop an algorithm that captures both the neumes, and in particular its melody, which can be used to reconstruct the original writing. Our pipeline is similar to the standard OMR approach and comprises a novel staff line and symbol detection algorithm based on deep Fully Convolutional Networks (FCN), which perform pixel-based predictions for either staff lines or symbols and their respective types. Then, the staff line detection combines the extracted lines to staves and yields an F\(_1\)-score of over 99\% for both detecting lines and complete staves. For the music symbol detection, we choose a novel approach that skips the step to identify neumes and instead directly predicts note components (NCs) and their respective affiliation to a neume. Furthermore, the algorithm detects clefs and accidentals. Our algorithm predicts the symbol sequence of a staff with a diplomatic symbol accuracy rate (dSAR) of about 87\%, which includes symbol type and location. If only the NCs without their respective connection to a neume, all clefs and accidentals are of interest, the algorithm reaches an harmonic symbol accuracy rate (hSAR) of approximately 90\%. In general, the algorithm recognises a symbol in the manuscript with an F\(_1\)-score of over 96\%.},
  language  = {en}
}
% Journal article: OCR4all, an open-source (semi-)automatic OCR workflow for historical printings.
@article{ReulChristHarteltetal.2019,
  author    = {Reul, Christian and Christ, Dennis and Hartelt, Alexander and Balbach, Nico and Wehner, Maximilian and Springmann, Uwe and Wick, Christoph and Grundig, Christine and B{\"u}ttner, Andreas and Puppe, Frank},
  title     = {{OCR4all}---An open-source tool providing a (semi-)automatic {OCR} workflow for historical printings},
  journal   = {Applied Sciences},
  volume    = {9},
  number    = {22},
  pages     = {4853},
  year      = {2019},
  issn      = {2076-3417},
  doi       = {10.3390/app9224853},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-193103},
  abstract  = {Optical Character Recognition (OCR) on historical printings is a challenging task mainly due to the complexity of the layout and the highly variant typography. Nevertheless, in the last few years, great progress has been made in the area of historical OCR, resulting in several powerful open-source tools for preprocessing, layout analysis and segmentation, character recognition, and post-processing. The drawback of these tools often is their limited applicability by non-technical users like humanist scholars and in particular the combined use of several tools in a workflow. In this paper, we present an open-source OCR software called OCR4all, which combines state-of-the-art OCR components and continuous model training into a comprehensive workflow. While a variety of materials can already be processed fully automatically, books with more complex layouts require manual intervention by the users. This is mostly due to the fact that the required ground truth for training stronger mixed models (for segmentation, as well as text recognition) is not available, yet, neither in the desired quantity nor quality. To deal with this issue in the short run, OCR4all offers a comfortable GUI that allows error corrections not only in the final output, but already in early stages to minimize error propagations. In the long run, this constant manual correction produces large quantities of valuable, high quality training material, which can be used to improve fully automatic approaches. Further on, extensive configuration capabilities are provided to set the degree of automation of the workflow and to make adaptations to the carefully selected default parameters for specific printings, if necessary. During experiments, the fully automated application on 19th Century novels showed that OCR4all can considerably outperform the commercial state-of-the-art tool ABBYY Finereader on moderate layouts if suitably pretrained mixed OCR models are available.
Furthermore, on very complex early printed books, even users with minimal or no experience were able to capture the text with manageable effort and great quality, achieving excellent Character Error Rates (CERs) below 0.5\%. The architecture of OCR4all allows the easy integration (or substitution) of newly developed tools for its main components by standardized interfaces like PageXML, thus aiming at continual higher automation for historical printings.},
  language  = {en}
}
% Journal article: model-based fault detection and diagnosis for spacecraft, applied to the SONATE nano-satellite.
@article{DjebkoPuppeKayal2019,
  author    = {Djebko, Kirill and Puppe, Frank and Kayal, Hakan},
  title     = {Model-based fault detection and diagnosis for spacecraft with an application for the {SONATE} triple cube nano-satellite},
  journal   = {Aerospace},
  volume    = {6},
  number    = {10},
  pages     = {105},
  year      = {2019},
  issn      = {2226-4310},
  doi       = {10.3390/aerospace6100105},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-198836},
  abstract  = {The correct behavior of spacecraft components is the foundation of unhindered mission operation. However, no technical system is free of wear and degradation. A malfunction of one single component might significantly alter the behavior of the whole spacecraft and may even lead to a complete mission failure. Therefore, abnormal component behavior must be detected early in order to be able to perform counter measures. A dedicated fault detection system can be employed, as opposed to classical health monitoring, performed by human operators, to decrease the response time to a malfunction. In this paper, we present a generic model-based diagnosis system, which detects faults by analyzing the spacecraft's housekeeping data. The observed behavior of the spacecraft components, given by the housekeeping data is compared to their expected behavior, obtained through simulation. Each discrepancy between the observed and the expected behavior of a component generates a so-called symptom. Given the symptoms, the diagnoses are derived by computing sets of components whose malfunction might cause the observed discrepancies. We demonstrate the applicability of the diagnosis system by using modified housekeeping data of the qualification model of an actual spacecraft and outline the advantages and drawbacks of our approach.},
  language  = {en}
}
% Journal article: replicating medication trend studies with ad hoc information extraction in a clinical data warehouse.
@article{DietrichKrebsLimanetal.2019,
  author    = {Dietrich, Georg and Krebs, Jonathan and Liman, Leon and Fette, Georg and Ertl, Maximilian and Kaspar, Mathias and St{\"o}rk, Stefan and Puppe, Frank},
  title     = {Replicating medication trend studies using ad hoc information extraction in a clinical data warehouse},
  journal   = {BMC Medical Informatics and Decision Making},
  volume    = {19},
  pages     = {15},
  year      = {2019},
  doi       = {10.1186/s12911-018-0729-0},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-200409},
  abstract  = {Background Medication trend studies show the changes of medication over the years and may be replicated using a clinical Data Warehouse (CDW). Even nowadays, a lot of the patient information, like medication data, in the EHR is stored in the format of free text. As the conventional approach of information extraction (IE) demands a high developmental effort, we used ad hoc IE instead. This technique queries information and extracts it on the fly from texts contained in the CDW. Methods We present a generalizable approach of ad hoc IE for pharmacotherapy (medications and their daily dosage) presented in hospital discharge letters. We added import and query features to the CDW system, like error tolerant queries to deal with misspellings and proximity search for the extraction of the daily dosage. During the data integration process in the CDW, negated, historical and non-patient context data are filtered. For the replication studies, we used a drug list grouped by ATC (Anatomical Therapeutic Chemical Classification System) codes as input for queries to the CDW. Results We achieve an F1 score of 0.983 (precision 0.997, recall 0.970) for extracting medication from discharge letters and an F1 score of 0.974 (precision 0.977, recall 0.972) for extracting the dosage. We replicated three published medical trend studies for hypertension, atrial fibrillation and chronic kidney disease. Overall, 93\% of the main findings could be replicated, 68\% of sub-findings, and 75\% of all findings. One study could be completely replicated with all main and sub-findings. Conclusion A novel approach for ad hoc IE is presented. It is very suitable for basic medical texts like discharge letters and finding reports. Ad hoc IE is by definition more limited than conventional IE and does not claim to replace it, but it substantially exceeds the search capabilities of many CDWs and it is convenient to conduct replication studies fast and with high quality.},
  language  = {en}
}
% Journal article: rule-based information extraction (ARIES) with a multiple-myeloma ontology.
@article{LodaKrebsDanhofetal.2019,
  author    = {Loda, Sophia and Krebs, Jonathan and Danhof, Sophia and Schreder, Martin and Solimando, Antonio G. and Strifler, Susanne and Rasche, Leo and Kort{\"u}m, Martin and Kerscher, Alexander and Knop, Stefan and Puppe, Frank and Einsele, Hermann and Bittrich, Max},
  title     = {Exploration of artificial intelligence use with {ARIES} in multiple myeloma research},
  journal   = {Journal of Clinical Medicine},
  volume    = {8},
  number    = {7},
  pages     = {999},
  year      = {2019},
  issn      = {2077-0383},
  doi       = {10.3390/jcm8070999},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-197231},
  abstract  = {Background: Natural language processing (NLP) is a powerful tool supporting the generation of Real-World Evidence (RWE). There is no NLP system that enables the extensive querying of parameters specific to multiple myeloma (MM) out of unstructured medical reports. We therefore created a MM-specific ontology to accelerate the information extraction (IE) out of unstructured text. Methods: Our MM ontology consists of extensive MM-specific and hierarchically structured attributes and values. We implemented ``A Rule-based Information Extraction System'' (ARIES) that uses this ontology. We evaluated ARIES on 200 randomly selected medical reports of patients diagnosed with MM. Results: Our system achieved a high F1-Score of 0.92 on the evaluation dataset with a precision of 0.87 and recall of 0.98. Conclusions: Our rule-based IE system enables the comprehensive querying of medical reports. The IE accelerates the extraction of data and enables clinicians to faster generate RWE on hematological issues. RWE helps clinicians to make decisions in an evidence-based manner. Our tool easily accelerates the integration of research evidence into everyday clinical practice.},
  language  = {en}
}
% Journal article: automated transfer of clinical routine data from a hospital information system to a study database.
@article{KasparFetteHankeetal.2021,
  author    = {Kaspar, Mathias and Fette, Georg and Hanke, Monika and Ertl, Maximilian and Puppe, Frank and St{\"o}rk, Stefan},
  title     = {Automated provision of clinical routine data for a complex clinical follow-up study: A data warehouse solution},
  journal   = {Health Informatics Journal},
  volume    = {28},
  number    = {1},
  year      = {2021},
  doi       = {10.1177/14604582211058081},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-260828},
  abstract  = {A deep integration of routine care and research remains challenging in many respects. We aimed to show the feasibility of an automated transformation and transfer process feeding deeply structured data with a high level of granularity collected for a clinical prospective cohort study from our hospital information system to the study's electronic data capture system, while accounting for study-specific data and visits. We developed a system integrating all necessary software and organizational processes then used in the study. The process and key system components are described together with descriptive statistics to show its feasibility in general and to identify individual challenges in particular. Data of 2051 patients enrolled between 2014 and 2020 was transferred. We were able to automate the transfer of approximately 11 million individual data values, representing 95\% of all entered study data. These were recorded in n = 314 variables (28\% of all variables), with some variables being used multiple times for follow-up visits. Our validation approach allowed for constant good data quality over the course of the study. In conclusion, the automated transfer of multi-dimensional routine medical data from HIS to study databases using specific study data and visit structures is complex, yet viable.},
  language  = {en}
}
% Journal article: semi-automated video annotation framework and tool for gastroenterologists.
@article{KrenzerMakowskiHekaloetal.2022,
  author    = {Krenzer, Adrian and Makowski, Kevin and Hekalo, Amar and Fitting, Daniel and Troya, Joel and Zoller, Wolfram G. and Hann, Alexander and Puppe, Frank},
  title     = {Fast machine learning annotation in the medical domain: a semi-automated video annotation tool for gastroenterologists},
  journal   = {BioMedical Engineering OnLine},
  volume    = {21},
  number    = {1},
  year      = {2022},
  doi       = {10.1186/s12938-022-01001-x},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-300231},
  abstract  = {Background Machine learning, especially deep learning, is becoming more and more relevant in research and development in the medical domain. For all the supervised deep learning applications, data is the most critical factor in securing successful implementation and sustaining the progress of the machine learning model. Especially gastroenterological data, which often involves endoscopic videos, are cumbersome to annotate. Domain experts are needed to interpret and annotate the videos. To support those domain experts, we generated a framework. With this framework, instead of annotating every frame in the video sequence, experts are just performing key annotations at the beginning and the end of sequences with pathologies, e.g., visible polyps. Subsequently, non-expert annotators supported by machine learning add the missing annotations for the frames in-between. Methods In our framework, an expert reviews the video and annotates a few video frames to verify the object's annotations for the non-expert. In a second step, a non-expert has visual confirmation of the given object and can annotate all following and preceding frames with AI assistance. After the expert has finished, relevant frames will be selected and passed on to an AI model. This information allows the AI model to detect and mark the desired object on all following and preceding frames with an annotation. Therefore, the non-expert can adjust and modify the AI predictions and export the results, which can then be used to train the AI model. Results Using this framework, we were able to reduce workload of domain experts on average by a factor of 20 on our data. This is primarily due to the structure of the framework, which is designed to minimize the workload of the domain expert. Pairing this framework with a state-of-the-art semi-automated AI model enhances the annotation speed further.
Through a prospective study with 10 participants, we show that semi-automated annotation using our tool doubles the annotation speed of non-expert annotators compared to a well-known state-of-the-art annotation tool. Conclusion In summary, we introduce a framework for fast expert annotation for gastroenterologists, which reduces the workload of the domain expert considerably while maintaining a very high annotation quality. The framework incorporates a semi-automated annotation system utilizing trained object detection models. The software and framework are open-source.},
  language  = {en}
}
% Journal article: background knowledge in a deep-learning OMR pipeline for medieval monophonic music.
% NOTE(review): pages holds the article number taken from the DOI suffix, matching the other MDPI entries in this file -- confirm.
@article{HarteltPuppe2022,
  author    = {Hartelt, Alexander and Puppe, Frank},
  title     = {Optical Medieval Music Recognition using background knowledge},
  journal   = {Algorithms},
  volume    = {15},
  number    = {7},
  pages     = {221},
  year      = {2022},
  issn      = {1999-4893},
  doi       = {10.3390/a15070221},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-278756},
  abstract  = {This paper deals with the effect of exploiting background knowledge for improving an OMR (Optical Music Recognition) deep learning pipeline for transcribing medieval, monophonic, handwritten music from the 12th-14th century, whose usage has been neglected in the literature. Various types of background knowledge about overlapping notes and text, clefs, graphical connections (neumes) and their implications on the position in staff of the notes were used and evaluated. Moreover, the effect of different encoder/decoder architectures and of different datasets for training a mixed model and for document-specific fine-tuning based on an extended OMR pipeline with an additional post-processing step were evaluated. The use of background models improves all metrics and in particular the melody accuracy rate (mAR), which is based on the insert, delete and replace operations necessary to convert the generated melody into the correct melody. When using a mixed model and evaluating on a different dataset, our best model achieves without fine-tuning and without post-processing a mAR of 90.4\%, which is raised by nearly 30\% to 93.2\% mAR using background knowledge. With additional fine-tuning, the contribution of post-processing is even greater: the basic mAR of 90.5\% is raised by more than 50\% to 95.8\% mAR.},
  language  = {en}
}
% Journal article (German): societal perspectives of domain-specific AI for automated decision-making.
@article{Puppe2022,
  author    = {Puppe, Frank},
  title     = {Gesellschaftliche Perspektiven einer fachspezifischen KI f{\"u}r automatisierte Entscheidungen},
  journal   = {Informatik Spektrum},
  volume    = {45},
  number    = {2},
  pages     = {88--95},
  year      = {2022},
  issn      = {0170-6012},
  doi       = {10.1007/s00287-022-01443-6},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-324197},
  abstract  = {Die k{\"u}nstliche Intelligenz (KI) entwickelt sich rasant und hat bereits eindrucksvolle Erfolge zu verzeichnen, darunter {\"u}bermenschliche Kompetenz in den meisten Spielen und vielen Quizshows, intelligente Suchmaschinen, individualisierte Werbung, Spracherkennung, -ausgabe und -{\"u}bersetzung auf sehr hohem Niveau und hervorragende Leistungen bei der Bildverarbeitung, u. a. in der Medizin, der optischen Zeichenerkennung, beim autonomen Fahren, aber auch beim Erkennen von Menschen auf Bildern und Videos oder bei Deep Fakes f{\"u}r Fotos und Videos. Es ist zu erwarten, dass die KI auch in der Entscheidungsfindung Menschen {\"u}bertreffen wird; ein alter Traum der Expertensysteme, der durch Lernverfahren, Big Data und Zugang zu dem gesammelten Wissen im Web in greifbare N{\"a}he r{\"u}ckt. Gegenstand dieses Beitrags sind aber weniger die technischen Entwicklungen, sondern m{\"o}gliche gesellschaftliche Auswirkungen einer spezialisierten, kompetenten KI f{\"u}r verschiedene Bereiche der autonomen, d. h. nicht nur unterst{\"u}tzenden Entscheidungsfindung: als Fu{\ss}ballschiedsrichter, in der Medizin, f{\"u}r richterliche Entscheidungen und sehr spekulativ auch im politischen Bereich. Dabei werden Vor- und Nachteile dieser Szenarien aus gesellschaftlicher Sicht diskutiert.},
  subject   = {K{\"u}nstliche Intelligenz},
  language  = {de}
}
% Journal article: inter-eye correlation of 24-hour intraocular pressure measurements and glaucoma progression.
@article{DakroubVermaFuehringAgorastouetal.2022,
  author    = {Dakroub, Mohamad and Verma-Fuehring, Raoul and Agorastou, Vaia and Sch{\"o}n, Julian and Hillenkamp, Jost and Puppe, Frank and Loewen, Nils A.},
  title     = {Inter-eye correlation analysis of 24-h {IOPs} and glaucoma progression},
  journal   = {Graefe's Archive for Clinical and Experimental Ophthalmology},
  volume    = {260},
  number    = {10},
  pages     = {3349--3356},
  year      = {2022},
  doi       = {10.1007/s00417-022-05651-4},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-323831},
  abstract  = {Purpose To determine whether 24-h IOP monitoring can be a predictor for glaucoma progression and to analyze the inter-eye relationship of IOP, perfusion, and progression parameters. Methods We extracted data from manually drawn IOP curves with HIOP-Reader, a software suite we developed. The relationship between measured IOPs and mean ocular perfusion pressures (MOPP) to retinal nerve fiber layer (RNFL) thickness was analyzed. We determined the ROC curves for peak IOP (T\(_{max}\)), average IOP(T\(_{avg}\)), IOP variation (IOP\(_{var}\)), and historical IOP cut-off levels to detect glaucoma progression (rate of RNFL loss). Bivariate analysis was also conducted to check for various inter-eye relationships. Results Two hundred seventeen eyes were included. The average IOP was 14.8 \(\pm\) 3.5 mmHg, with a 24-h variation of 5.2 \(\pm\) 2.9 mmHg. A total of 52\% of eyes with RNFL progression data showed disease progression. There was no significant difference in T\(_{max}\), T\(_{avg}\), and IOP\(_{var}\) between progressors and non-progressors (all \(p > 0.05\)). Except for T\(_{avg}\) and the temporal RNFL, there was no correlation between disease progression in any quadrant and T\(_{max}\), T\(_{avg}\), and IOP\(_{var}\). Twenty-four-hour and outpatient IOP variables had poor sensitivities and specificities in detecting disease progression. The correlation of inter-eye parameters was moderate; correlation with disease progression was weak. Conclusion In line with our previous study, IOP data obtained during a single visit (outpatient or inpatient monitoring) make for a poor diagnostic tool, no matter the method deployed. Glaucoma progression and perfusion pressure in left and right eyes correlated weakly to moderately with each other. Key messages What is known: \textbullet{} Our prior study showed that manually obtained 24-hour inpatient IOP measurements in right eyes are poor predictors for glaucoma progression.
The inter-eye relationship of 24-hour IOP parameters and disease progression on optical coherence tomography (OCT) has not been examined. What we found: \textbullet{} 24-hour IOP profiles of left eyes from the same study were a poor diagnostic tool to detect worsening glaucoma. \textbullet{} Significant inter-eye correlations of various strengths were found for all tested parameters},
  language  = {en}
}
% Journal article: first clinical pilot of the publicly available EndoMind computer-aided polyp detection system.
@article{LuxBanckSassmannshausenetal.2022,
  author    = {Lux, Thomas J. and Banck, Michael and Sa{\ss}mannshausen, Zita and Troya, Joel and Krenzer, Adrian and Fitting, Daniel and Sudarevic, Boban and Zoller, Wolfram G. and Puppe, Frank and Meining, Alexander and Hann, Alexander},
  title     = {Pilot study of a new freely available computer-aided polyp detection system in clinical practice},
  journal   = {International Journal of Colorectal Disease},
  volume    = {37},
  number    = {6},
  pages     = {1349--1354},
  year      = {2022},
  doi       = {10.1007/s00384-022-04178-8},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-324459},
  abstract  = {Purpose Computer-aided polyp detection (CADe) systems for colonoscopy are already presented to increase adenoma detection rate (ADR) in randomized clinical trials. Those commercially available closed systems often do not allow for data collection and algorithm optimization, for example regarding the usage of different endoscopy processors. Here, we present the first clinical experiences of a, for research purposes publicly available, CADe system. Methods We developed an end-to-end data acquisition and polyp detection system named EndoMind. Examiners of four centers utilizing four different endoscopy processors used EndoMind during their clinical routine. Detected polyps, ADR, time to first detection of a polyp (TFD), and system usability were evaluated (NCT05006092). Results During 41 colonoscopies, EndoMind detected 29 of 29 adenomas in 66 of 66 polyps resulting in an ADR of 41.5\%. Median TFD was 130 ms (95\%-CI, 80-200 ms) while maintaining a median false positive rate of 2.2\% (95\%-CI, 1.7-2.8\%). The four participating centers rated the system using the System Usability Scale with a median of 96.3 (95\%-CI, 70-100). Conclusion EndoMind's ability to acquire data, detect polyps in real-time, and high usability score indicate substantial practical value for research and clinical practice. Still, clinical benefit, measured by ADR, has to be determined in a prospective randomized controlled trial.},
  language  = {en}
}
% Journal article: the KIETA pipeline for extracting tables and their key insights from scientific publications.
@article{KempfKrugPuppe2023,
  author    = {Kempf, Sebastian and Krug, Markus and Puppe, Frank},
  title     = {{KIETA}: Key-insight extraction from scientific tables},
  journal   = {Applied Intelligence},
  volume    = {53},
  number    = {8},
  pages     = {9513--9530},
  year      = {2023},
  issn      = {0924-669X},
  doi       = {10.1007/s10489-022-03957-8},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-324180},
  abstract  = {An important but very time consuming part of the research process is literature review. An already large and nevertheless growing ground set of publications as well as a steadily increasing publication rate continue to worsen the situation. Consequently, automating this task as far as possible is desirable. Experimental results of systems are key-insights of high importance during literature review and usually represented in form of tables. Our pipeline KIETA exploits these tables to contribute to the endeavor of automation by extracting them and their contained knowledge from scientific publications. The pipeline is split into multiple steps to guarantee modularity as well as analyzability, and agnosticism regarding the specific scientific domain up until the knowledge extraction step, which is based upon an ontology. Additionally, a dataset of corresponding articles has been manually annotated with information regarding table and knowledge extraction. Experiments show promising results that signal the possibility of an automated system, while also indicating limits of extracting knowledge from tables without any context.},
  language  = {en}
}
% Journal article: ENDOMIND-Advanced, an open-source real-time polyp-detection system for colonoscopy.
@article{KrenzerBanckMakowskietal.2023,
  author    = {Krenzer, Adrian and Banck, Michael and Makowski, Kevin and Hekalo, Amar and Fitting, Daniel and Troya, Joel and Sudarevic, Boban and Zoller, Wolfgang G. and Hann, Alexander and Puppe, Frank},
  title     = {A real-time polyp-detection system with clinical application in colonoscopy using deep convolutional neural networks},
  journal   = {Journal of Imaging},
  volume    = {9},
  number    = {2},
  year      = {2023},
  issn      = {2313-433X},
  doi       = {10.3390/jimaging9020026},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-304454},
  abstract  = {Colorectal cancer (CRC) is a leading cause of cancer-related deaths worldwide. The best method to prevent CRC is with a colonoscopy. During this procedure, the gastroenterologist searches for polyps. However, there is a potential risk of polyps being missed by the gastroenterologist. Automated detection of polyps helps to assist the gastroenterologist during a colonoscopy. There are already publications examining the problem of polyp detection in the literature. Nevertheless, most of these systems are only used in the research context and are not implemented for clinical application. Therefore, we introduce the first fully open-source automated polyp-detection system scoring best on current benchmark data and implementing it ready for clinical application. To create the polyp-detection system (ENDOMIND-Advanced), we combined our own collected data from different hospitals and practices in Germany with open-source datasets to create a dataset with over 500,000 annotated images. ENDOMIND-Advanced leverages a post-processing technique based on video detection to work in real-time with a stream of images. It is integrated into a prototype ready for application in clinical interventions. We achieve better performance compared to the best system in the literature and score a F1-score of 90.24\% on the open-source CVC-VideoClinicDB benchmark.},
  language  = {en}
}
% Journal article: deep-learning text-line and layout recognition for early printed documents using background knowledge.
@article{FischerHarteltPuppe2023,
  author    = {Fischer, Norbert and Hartelt, Alexander and Puppe, Frank},
  title     = {Line-level layout recognition of historical documents with background knowledge},
  journal   = {Algorithms},
  volume    = {16},
  number    = {3},
  year      = {2023},
  issn      = {1999-4893},
  doi       = {10.3390/a16030136},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-310938},
  abstract  = {Digitization and transcription of historic documents offer new research opportunities for humanists and are the topics of many edition projects. However, manual work is still required for the main phases of layout recognition and the subsequent optical character recognition (OCR) of early printed documents. This paper describes and evaluates how deep learning approaches recognize text lines and can be extended to layout recognition using background knowledge. The evaluation was performed on five corpora of early prints from the 15th and 16th Centuries, representing a variety of layout features. While the main text with standard layouts could be recognized in the correct reading order with a precision and recall of up to 99.9\%, also complex layouts were recognized at a rate as high as 90\% by using background knowledge, the full potential of which was revealed if many pages of the same source were transcribed.},
  language  = {en}
}
% Journal article: a radiology data warehouse for calculating and presenting key usage metrics, evaluated at 4 German hospitals.
@article{LimanMayFetteetal.2023,
  author    = {Liman, Leon and May, Bernd and Fette, Georg and Krebs, Jonathan and Puppe, Frank},
  title     = {Using a clinical data warehouse to calculate and present key metrics for the radiology department: implementation and performance evaluation},
  journal   = {JMIR Medical Informatics},
  volume    = {11},
  year      = {2023},
  issn      = {2291-9694},
  doi       = {10.2196/41808},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-349411},
  abstract  = {Background: Due to the importance of radiologic examinations, such as X-rays or computed tomography scans, for many clinical diagnoses, the optimal use of the radiology department is 1 of the primary goals of many hospitals. Objective: This study aims to calculate the key metrics of this use by creating a radiology data warehouse solution, where data from radiology information systems (RISs) can be imported and then queried using a query language as well as a graphical user interface (GUI). Methods: Using a simple configuration file, the developed system allowed for the processing of radiology data exported from any kind of RIS into a Microsoft Excel, comma-separated value (CSV), or JavaScript Object Notation (JSON) file. These data were then imported into a clinical data warehouse. Additional values based on the radiology data were calculated during this import process by implementing 1 of several provided interfaces. Afterward, the query language and GUI of the data warehouse were used to configure and calculate reports on these data. For the most common types of requested reports, a web interface was created to view their numbers as graphics. Results: The tool was successfully tested with the data of 4 different German hospitals from 2018 to 2021, with a total of 1,436,111 examinations. The user feedback was good, since all their queries could be answered if the available data were sufficient. The initial processing of the radiology data for using them with the clinical data warehouse took (depending on the amount of data provided by each hospital) between 7 minutes and 1 hour 11 minutes. Calculating 3 reports of different complexities on the data of each hospital was possible in 1-3 seconds for reports with up to 200 individual calculations and in up to 1.5 minutes for reports with up to 8200 individual calculations. Conclusions: A system was developed with the main advantage of being generic concerning the export of different RISs as well as concerning the configuration of queries for various reports. The queries could be configured easily using the GUI of the data warehouse, and their results could be exported into the standard formats Excel and CSV for further processing.},
  language  = {en}
}