@inproceedings{haak-engelmann-2021-ircologne, abstract = {In this paper, we describe the TH K{\"o}ln{'}s submission for the Shared Task on the Identification of Toxic Comments at GermEval 2021. Toxicity is a severe and latent problem in comments in online discussions. Complex language model based methods have shown the most success in identifying toxicity. However, these approaches lack explainability and might be insensitive to domain-specific renditions of toxicity. In the scope of the GermEval 2021 toxic comment classification task (Risch et al., 2021), we employed a simple but promising combination of term-frequency-based classification and rule-based labeling to produce effective but to no lesser degree explainable toxicity predictions.}, added-at = {2022-01-07T14:13:25.000+0100}, address = {Duesseldorf, Germany}, author = {Haak, Fabian and Engelmann, Bj{\"o}rn}, biburl = {https://www.bibsonomy.org/bibtex/2cc11c06c22429db927498ff5bb385a44/irgroup_thkoeln}, booktitle = {Proceedings of the GermEval 2021 Shared Task on the Identification of Toxic, Engaging, and Fact-Claiming Comments}, interhash = {68718fa961d6fdf1429f1e8050f51ae9}, intrahash = {cc11c06c22429db927498ff5bb385a44}, keywords = {2021 bias classification data engelmann haak myown nlp programming snorkel toxic}, month = sep, pages = {47--53}, pdf = {https://aclanthology.org/2021.germeval-1.7.pdf}, publisher = {Association for Computational Linguistics}, timestamp = {2023-10-25T18:04:09.000+0200}, title = {{IRC}ologne at {G}erm{E}val 2021: Toxicity Classification}, url = {https://aclanthology.org/2021.germeval-1.7}, year = 2021 }