@article{VollmerVollmerLangetal.2023,
  author    = {Vollmer, Andreas and Vollmer, Michael and Lang, Gernot and Straub, Anton and K{\"u}bler, Alexander and Gubik, Sebastian and Brands, Roman C. and Hartmann, Stefan and Saravi, Babak},
  title     = {Automated assessment of radiographic bone loss in the posterior maxilla utilizing a multi-object detection artificial intelligence algorithm},
  series = {Applied Sciences},
  volume    = {13},
  journal   = {Applied Sciences},
  number    = {3},
  issn      = {2076-3417},
  doi       = {10.3390/app13031858},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-305050},
  year      = {2023},
  abstract  = {Periodontitis is one of the most prevalent diseases worldwide. The degree of radiographic bone loss can be used to assess the course of therapy or the severity of the disease. Since automated bone loss detection has many benefits, our goal was to develop a multi-object detection algorithm based on artificial intelligence that would be able to detect and quantify radiographic bone loss using standard two-dimensional radiographic images in the maxillary posterior region. This study was conducted by combining three recent online databases and validating the results using an external validation dataset from our organization. There were 1414 images for training and testing and 341 for external validation in the final dataset. We applied a Keypoint RCNN with a ResNet-50-FPN backbone network for both boundary box and keypoint detection. The intersection over union (IoU) and the object keypoint similarity (OKS) were used for model evaluation. The evaluation of the boundary box metrics showed a moderate overlapping with the ground truth, revealing an average precision of up to 0.758. The average precision and recall over all five folds were 0.694 and 0.611, respectively. Mean average precision and recall for the keypoint detection were 0.632 and 0.579, respectively. Despite only using a small and heterogeneous set of images for training, our results indicate that the algorithm is able to learn the objects of interest, although without sufficient accuracy due to the limited number of images and a large amount of information available in panoramic radiographs. Considering the widespread availability of panoramic radiographs as well as the increasing use of online databases, the presented model can be further improved in the future to facilitate its implementation in clinics.},
  language  = {en}
}
@article{KrenzerMakowskiHekaloetal.2022,
  author    = {Krenzer, Adrian and Makowski, Kevin and Hekalo, Amar and Fitting, Daniel and Troya, Joel and Zoller, Wolfram G. and Hann, Alexander and Puppe, Frank},
  title     = {Fast machine learning annotation in the medical domain: a semi-automated video annotation tool for gastroenterologists},
  series = {BioMedical Engineering OnLine},
  volume    = {21},
  journal   = {BioMedical Engineering OnLine},
  number    = {1},
  doi       = {10.1186/s12938-022-01001-x},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-300231},
  year      = {2022},
  abstract  = {Background Machine learning, especially deep learning, is becoming more and more relevant in research and development in the medical domain. For all the supervised deep learning applications, data is the most critical factor in securing successful implementation and sustaining the progress of the machine learning model. Especially gastroenterological data, which often involves endoscopic videos, are cumbersome to annotate. Domain experts are needed to interpret and annotate the videos. To support those domain experts, we generated a framework. With this framework, instead of annotating every frame in the video sequence, experts are just performing key annotations at the beginning and the end of sequences with pathologies, e.g., visible polyps. Subsequently, non-expert annotators supported by machine learning add the missing annotations for the frames in-between. Methods In our framework, an expert reviews the video and annotates a few video frames to verify the object's annotations for the non-expert. In a second step, a non-expert has visual confirmation of the given object and can annotate all following and preceding frames with AI assistance. After the expert has finished, relevant frames will be selected and passed on to an AI model. This information allows the AI model to detect and mark the desired object on all following and preceding frames with an annotation. Therefore, the non-expert can adjust and modify the AI predictions and export the results, which can then be used to train the AI model. Results Using this framework, we were able to reduce workload of domain experts on average by a factor of 20 on our data. This is primarily due to the structure of the framework, which is designed to minimize the workload of the domain expert. Pairing this framework with a state-of-the-art semi-automated AI model enhances the annotation speed further. Through a prospective study with 10 participants, we show that semi-automated annotation using our tool doubles the annotation speed of non-expert annotators compared to a well-known state-of-the-art annotation tool. Conclusion In summary, we introduce a framework for fast expert annotation for gastroenterologists, which reduces the workload of the domain expert considerably while maintaining a very high annotation quality. The framework incorporates a semi-automated annotation system utilizing trained object detection models. The software and framework are open-source.},
  language  = {en}
}
@article{KrenzerBanckMakowskietal.2023,
  author    = {Krenzer, Adrian and Banck, Michael and Makowski, Kevin and Hekalo, Amar and Fitting, Daniel and Troya, Joel and Sudarevic, Boban and Zoller, Wolfgang G. and Hann, Alexander and Puppe, Frank},
  title     = {A real-time polyp-detection system with clinical application in colonoscopy using deep convolutional neural networks},
  series = {Journal of Imaging},
  volume    = {9},
  journal   = {Journal of Imaging},
  number    = {2},
  issn      = {2313-433X},
  doi       = {10.3390/jimaging9020026},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-304454},
  year      = {2023},
  abstract  = {Colorectal cancer (CRC) is a leading cause of cancer-related deaths worldwide. The best method to prevent CRC is with a colonoscopy. During this procedure, the gastroenterologist searches for polyps. However, there is a potential risk of polyps being missed by the gastroenterologist. Automated detection of polyps helps to assist the gastroenterologist during a colonoscopy. There are already publications examining the problem of polyp detection in the literature. Nevertheless, most of these systems are only used in the research context and are not implemented for clinical application. Therefore, we introduce the first fully open-source automated polyp-detection system scoring best on current benchmark data and implementing it ready for clinical application. To create the polyp-detection system (ENDOMIND-Advanced), we combined our own collected data from different hospitals and practices in Germany with open-source datasets to create a dataset with over 500,000 annotated images. ENDOMIND-Advanced leverages a post-processing technique based on video detection to work in real-time with a stream of images. It is integrated into a prototype ready for application in clinical interventions. We achieve better performance compared to the best system in the literature and score a F1-score of 90.24\% on the open-source CVC-VideoClinicDB benchmark.},
  language  = {en}
}
@article{HoeserKuenzer2020,
  author    = {Hoeser, Thorsten and Kuenzer, Claudia},
  title     = {Object detection and image segmentation with deep learning on Earth observation data: a review-part I: evolution and recent trends},
  series = {Remote Sensing},
  volume    = {12},
  journal   = {Remote Sensing},
  number    = {10},
  issn      = {2072-4292},
  doi       = {10.3390/rs12101667},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-205918},
  year      = {2020},
  abstract  = {Deep learning (DL) has great influence on large parts of science and increasingly established itself as an adaptive method for new challenges in the field of Earth observation (EO). Nevertheless, the entry barriers for EO researchers are high due to the dense and rapidly developing field mainly driven by advances in computer vision (CV). To lower the barriers for researchers in EO, this review gives an overview of the evolution of DL with a focus on image segmentation and object detection in convolutional neural networks (CNN). The survey starts in 2012, when a CNN set new standards in image recognition, and lasts until late 2019. Thereby, we highlight the connections between the most important CNN architectures and cornerstones coming from CV in order to alleviate the evaluation of modern DL models. Furthermore, we briefly outline the evolution of the most popular DL frameworks and provide a summary of datasets in EO. By discussing well performing DL architectures on these datasets as well as reflecting on advances made in CV and their impact on future research in EO, we narrow the gap between the reviewed, theoretical concepts from CV and practical application in EO.},
  language  = {en}
}
@article{HoeserBachoferKuenzer2020,
  author    = {Hoeser, Thorsten and Bachofer, Felix and Kuenzer, Claudia},
  title     = {Object detection and image segmentation with deep learning on Earth Observation data: a review — part II: applications},
  series = {Remote Sensing},
  volume    = {12},
  journal   = {Remote Sensing},
  number    = {18},
  issn      = {2072-4292},
  doi       = {10.3390/rs12183053},
  url       = {http://nbn-resolving.de/urn:nbn:de:bvb:20-opus-213152},
  year      = {2020},
  abstract  = {In Earth observation (EO), large-scale land-surface dynamics are traditionally analyzed by investigating aggregated classes. The increase in data with a very high spatial resolution enables investigations on a fine-grained feature level which can help us to better understand the dynamics of land surfaces by taking object dynamics into account. To extract fine-grained features and objects, the most popular deep-learning model for image analysis is commonly used: the convolutional neural network (CNN). In this review, we provide a comprehensive overview of the impact of deep learning on EO applications by reviewing 429 studies on image segmentation and object detection with CNNs. We extensively examine the spatial distribution of study sites, employed sensors, used datasets and CNN architectures, and give a thorough overview of applications in EO which used CNNs. Our main finding is that CNNs are in an advanced transition phase from computer vision to EO. Upon this, we argue that in the near future, investigations which analyze object dynamics with CNNs will have a significant impact on EO research. With a focus on EO applications in this Part II, we complete the methodological review provided in Part I.},
  language  = {en}
}