@comment{
  Bibliography entries, all dated 2021: journal articles, conference papers,
  one book and one book chapter.
  Conventions used below: one field per line; page ranges use an en dash (--);
  characters outside ASCII are written as LaTeX escapes; acronyms and proper
  nouns in titles are brace-protected; total page counts are kept in pagetotal
  and article numbers in pages.
}

@article{AlexyukBogoyavlenskiyAlexyuketal.2021,
  author    = {Alexyuk, Madina and Bogoyavlenskiy, Andrey and Alexyuk, Pavel and Moldakhanov, Yergali and Berezin, Vladimir and Digel, Ilya},
  title     = {Epipelagic microbiome of the {Small Aral Sea}: Metagenomic structure and ecological diversity},
  journal   = {MicrobiologyOpen},
  volume    = {10},
  number    = {1},
  pages     = {1--10},
  publisher = {Wiley},
  address   = {Weinheim},
  issn      = {2045-8827},
  doi       = {10.1002/mbo3.1142},
  year      = {2021},
  abstract  = {Microbial diversity studies regarding the aquatic communities that experienced or are experiencing environmental problems are essential for the comprehension of the remediation dynamics. In this pilot study, we present data on the phylogenetic and ecological structure of microorganisms from epipelagic water samples collected in the Small Aral Sea (SAS). The raw data were generated by massive parallel sequencing using the shotgun approach. As expected, most of the identified DNA sequences belonged to Terrabacteria and Actinobacteria (40\% and 37\% of the total reads, respectively). The occurrence of Deinococcus-Thermus, Armatimonadetes, Chloroflexi in the epipelagic SAS waters was less anticipated. Surprising was also the detection of sequences, which are characteristic for strict anaerobes---Ignavibacteria, hydrogen-oxidizing bacteria, and archaeal methanogenic species. We suppose that the observed very broad range of phylogenetic and ecological features displayed by the SAS reads demonstrates a more intensive mixing of water masses originating from diverse ecological niches of the Aral-Syr Darya River basin than presumed before.},
  language  = {en}
}

@inproceedings{MandekarJentschLutzetal.2021,
  author    = {Mandekar, Swati and Jentsch, Lina and Lutz, Kai and Behbahani, Mehdi and Melnykowycz, Mark},
  title     = {Earable design analysis for sleep {EEG} measurements},
  booktitle = {UbiComp '21},
  pages     = {171--175},
  doi       = {10.1145/3460418.3479328},
  year      = {2021},
  abstract  = {Conventional EEG devices cannot be used in everyday life and hence, past decade research has been focused on Ear-EEG for mobile, at-home monitoring for various applications ranging from emotion detection to sleep monitoring. As the area available for electrode contact in the ear is limited, the electrode size and location play a vital role for an Ear-EEG system. In this investigation, we present a quantitative study of ear-electrodes with two electrode sizes at different locations in a wet and dry configuration. Electrode impedance scales inversely with size and ranges from 450 k$\Omega$ to 1.29 M$\Omega$ for dry and from 22 k$\Omega$ to 42 k$\Omega$ for wet contact at 10 Hz. For any size, the location in the ear canal with the lowest impedance is ELE (Left Ear Superior), presumably due to increased contact pressure caused by the outer-ear anatomy. The results can be used to optimize signal pickup and SNR for specific applications. We demonstrate this by recording sleep spindles during sleep onset with high quality (5.27 $\mu$Vrms).},
  language  = {en}
}

@inproceedings{KloeserKohlKraftetal.2021,
  author    = {Kl{\"o}ser, Lars and Kohl, Philipp and Kraft, Bodo and Z{\"u}ndorf, Albert},
  title     = {Multi-attribute relation extraction ({MARE}): simplifying the application of relation extraction},
  booktitle = {Proceedings of the 2nd International Conference on Deep Learning Theory and Applications - DeLTA},
  pages     = {148--156},
  isbn      = {978-989-758-526-5},
  doi       = {10.5220/0010559201480156},
  year      = {2021},
  abstract  = {Natural language understanding's relation extraction makes innovative and encouraging novel business concepts possible and facilitates new digitilized decision-making processes. Current approaches allow the extraction of relations with a fixed number of entities as attributes. Extracting relations with an arbitrary amount of attributes requires complex systems and costly relation-trigger annotations to assist these systems. We introduce multi-attribute relation extraction (MARE) as an assumption-less problem formulation with two approaches, facilitating an explicit mapping from business use cases to the data annotations. Avoiding elaborated annotation constraints simplifies the application of relation extraction approaches. The evaluation compares our models to current state-of-the-art event extraction and binary relation extraction methods. Our approaches show improvement compared to these on the extraction of general multi-attribute relations.},
  language  = {en}
}

@article{JungMuellerStaat2021,
  author    = {Jung, Alexander and M{\"u}ller, Wolfram and Staat, Manfred},
  title     = {Corrigendum to ``{Wind} and fairness in ski jumping: A computer modelling analysis'' [{J. Biomech.} 75 (2018) 147--153]},
  journal   = {Journal of Biomechanics},
  volume    = {128},
  pages     = {110690},
  pagetotal = {1},
  publisher = {Elsevier},
  address   = {Amsterdam},
  issn      = {0021-9290},
  doi       = {10.1016/j.jbiomech.2021.110690},
  year      = {2021},
  language  = {en}
}

@article{HeelDiktaBraekers2021,
  author    = {van Heel, Mareike and Dikta, Gerhard and Braekers, Roel},
  title     = {Bootstrap based goodness-of-fit tests for binary multivariate regression models},
  journal   = {Journal of the Korean Statistical Society},
  volume    = {51},
  pagetotal = {28},
  publisher = {Springer Nature},
  address   = {Singapore},
  issn      = {2005-2863},
  doi       = {10.1007/s42952-021-00142-4},
  year      = {2021},
  abstract  = {We consider a binary multivariate regression model where the conditional expectation of a binary variable given a higher-dimensional input variable belongs to a parametric family. Based on this, we introduce a model-based bootstrap (MBB) for higher-dimensional input variables. This test can be used to check whether a sequence of independent and identically distributed observations belongs to such a parametric family. The approach is based on the empirical residual process introduced by Stute (Ann Statist 25:613-641, 1997). In contrast to Stute and Zhu's approach (2002) Stute \& Zhu (Scandinavian J Statist 29:535-545, 2002), a transformation is not required. Thus, any problems associated with non-parametric regression estimation are avoided. As a result, the MBB method is much easier for users to implement. To illustrate the power of the MBB based tests, a small simulation study is performed. Compared to the approach of Stute \& Zhu (Scandinavian J Statist 29:535-545, 2002), the simulations indicate a slightly improved power of the MBB based method. Finally, both methods are applied to a real data set.},
  language  = {en}
}

@book{DiktaScheer2021,
  author    = {Dikta, Gerhard and Scheer, Marsel},
  title     = {Bootstrap Methods: With Applications in {R}},
  publisher = {Springer},
  address   = {Cham},
  isbn      = {978-3-030-73480-0},
  doi       = {10.1007/978-3-030-73480-0},
  pagetotal = {XVI, 256},
  year      = {2021},
  abstract  = {This book provides a compact introduction to the bootstrap method. In addition to classical results on point estimation and test theory, multivariate linear regression models and generalized linear models are covered in detail. Special attention is given to the use of bootstrap procedures to perform goodness-of-fit tests to validate model or distributional assumptions. In some cases, new methods are presented here for the first time. The text is motivated by practical examples and the implementations of the corresponding algorithms are always given directly in R in a comprehensible form. Overall, R is given great importance throughout. Each chapter includes a section of exercises and, for the more mathematically inclined readers, concludes with rigorous proofs. The intended audience is graduate students who already have a prior knowledge of probability theory and mathematical statistics.},
  language  = {en}
}

@inproceedings{SchmidtsKraftWinkensetal.2021,
  author    = {Schmidts, Oliver and Kraft, Bodo and Winkens, Marvin and Z{\"u}ndorf, Albert},
  title     = {Catalog integration of heterogeneous and volatile product data},
  booktitle = {DATA 2020: Data Management Technologies and Applications},
  pages     = {134--153},
  publisher = {Springer},
  address   = {Cham},
  isbn      = {978-3-030-83013-7},
  doi       = {10.1007/978-3-030-83014-4_7},
  year      = {2021},
  abstract  = {The integration of frequently changing, volatile product data from different manufacturers into a single catalog is a significant challenge for small and medium-sized e-commerce companies. They rely on timely integrating product data to present them aggregated in an online shop without knowing format specifications, concept understanding of manufacturers, and data quality. Furthermore, format, concepts, and data quality may change at any time. Consequently, integrating product catalogs into a single standardized catalog is often a laborious manual task. Current strategies to streamline or automate catalog integration use techniques based on machine learning, word vectorization, or semantic similarity. However, most approaches struggle with low-quality or real-world data. We propose Attribute Label Ranking (ALR) as a recommendation engine to simplify the integration process of previously unknown, proprietary tabular format into a standardized catalog for practitioners. We evaluate ALR by focusing on the impact of different neural network architectures, language features, and semantic similarity. Additionally, we consider metrics for industrial application and present the impact of ALR in production and its limitations.},
  language  = {en}
}

@inproceedings{KohlSchmidtsKloeseretal.2021,
  author    = {Kohl, Philipp and Schmidts, Oliver and Kl{\"o}ser, Lars and Werth, Henri and Kraft, Bodo and Z{\"u}ndorf, Albert},
  title     = {{STAMP 4 NLP} - an agile framework for rapid quality-driven {NLP} applications development},
  booktitle = {Quality of Information and Communications Technology. QUATIC 2021},
  pages     = {156--166},
  publisher = {Springer},
  address   = {Cham},
  isbn      = {978-3-030-85346-4},
  doi       = {10.1007/978-3-030-85347-1_12},
  year      = {2021},
  abstract  = {The progress in natural language processing (NLP) research over the last years, offers novel business opportunities for companies, as automated user interaction or improved data analysis. Building sophisticated NLP applications requires dealing with modern machine learning (ML) technologies, which impedes enterprises from establishing successful NLP projects. Our experience in applied NLP research projects shows that the continuous integration of research prototypes in production-like environments with quality assurance builds trust in the software and shows convenience and usefulness regarding the business goal. We introduce STAMP 4 NLP as an iterative and incremental process model for developing NLP applications. With STAMP 4 NLP, we merge software engineering principles with best practices from data science. Instantiating our process model allows efficiently creating prototypes by utilizing templates, conventions, and implementations, enabling developers and data scientists to focus on the business goals. Due to our iterative-incremental approach, businesses can deploy an enhanced version of the prototype to their software environment after every iteration, maximizing potential business value and trust early and avoiding the cost of successful yet never deployed experiments.},
  language  = {en}
}

@inproceedings{BornheimGriegerBialonski2021,
  author    = {Bornheim, Tobias and Grieger, Niklas and Bialonski, Stephan},
  title     = {{FHAC} at {GermEval} 2021: Identifying {German} toxic, engaging, and fact-claiming comments with ensemble learning},
  booktitle = {Proceedings of the GermEval 2021 Workshop on the Identification of Toxic, Engaging, and Fact-Claiming Comments : 17th Conference on Natural Language Processing KONVENS 2021},
  pages     = {105--111},
  publisher = {Heinrich Heine University},
  address   = {D{\"u}sseldorf},
  doi       = {10.48415/2021/fhw5-x128},
  year      = {2021},
  language  = {en}
}

@incollection{EngelmannShashaSlabu2021,
  author    = {Engelmann, Ulrich M. and Shasha, Carolyn and Slabu, Ioana},
  title     = {Magnetic nanoparticle relaxation in biomedical application: focus on simulating nanoparticle heating},
  booktitle = {Magnetic nanoparticles in human health and medicine},
  pages     = {327--354},
  publisher = {Wiley-Blackwell},
  address   = {Hoboken, New Jersey},
  isbn      = {978-1-119-75467-1},
  year      = {2021},
  language  = {en}
}