% System-description paper for SemEval-2021 Task 5 (Toxic Spans Detection).
% Maintenance notes:
%   - Acronyms in title/booktitle are brace-protected so sentence-casing
%     styles keep their capitalisation.
%   - Event name and dates live in eventtitle/eventdate and the publisher
%     copyright notice in copyright; classic BibTeX styles ignore unknown
%     fields, so none of this is printed as a free-form note.
%   - No series field: the exported value only repeated booktitle.
%   - The percent sign in abstract is escaped so abstract-printing styles
%     do not treat the rest of the line as a LaTeX comment.
@inproceedings{2bc0ab7eeccb4fdb8bffabedce973f2f,
  author     = {Kotyushev, Mikhail and Glazkova, Anna and Morozov, Dmitry},
  title      = {{MIPT-NSU-UTMN} at {SemEval-2021} Task 5: Ensembling Learning with Pre-trained Language Models for Toxic Spans Detection},
  booktitle  = {{SemEval} 2021 -- 15th International Workshop on Semantic Evaluation, Proceedings of the Workshop},
  editor     = {Palmer, Alexis and Schneider, Nathan and Schluter, Natalie and Emerson, Guy and Herbelot, Aurelie and Zhu, Xiaodan},
  publisher  = {Association for Computational Linguistics (ACL)},
  year       = {2021},
  month      = aug,
  pages      = {913--918},
  eventtitle = {15th International Workshop on Semantic Evaluation, {SemEval} 2021},
  eventdate  = {2021-08-05/2021-08-06},
  language   = {English},
  copyright  = {{\textcopyright} 2021 Association for Computational Linguistics.},
  abstract   = {This paper describes our system for SemEval-2021 Task 5 on Toxic Spans Detection. We developed ensemble models using BERT-based neural architectures and post-processing to combine tokens into spans. We evaluated several pre-trained language models using various ensemble techniques for toxic span identification and achieved sizable improvements over our baseline fine-tuned BERT models. Finally, our system obtained a F1-score of 67.55\% on test data.},
}