<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">bsuir</journal-id><journal-title-group><journal-title xml:lang="ru">Доклады БГУИР</journal-title><trans-title-group xml:lang="en"><trans-title>Doklady BGUIR</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1729-7648</issn><issn pub-type="epub">2708-0382</issn><publisher><publisher-name>БГУИР</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.35596/1729-7648-2026-24-2-85-91</article-id><article-id custom-type="elpub" pub-id-type="custom">bsuir-4346</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>Статьи</subject></subj-group></article-categories><title-group><article-title>Сравнение методов оценки семантического сходства текстовых фрагментов</article-title><trans-title-group xml:lang="en"><trans-title>Comparison of Methods for Assessing the Semantic Similarity of Text Fragments</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Крез</surname><given-names>К. С.</given-names></name><name name-style="western" xml:lang="en"><surname>Krez</surname><given-names>K.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Крез Карина Сергеевна, асп., ассист. каф. проектирования информационно-компьютерных систем</p><p>220013, Минск, ул. П. Бровки, 6</p><p>Тел.: +375 29 952-75-56</p></bio><bio xml:lang="en"><p>Krez Karina, Postgraduate, Assistant at the Department of Information and Computer Systems Design</p><p>220013, Minsk, P. Brovki St., 6</p><p>Тel.: +375 29 952-75-56</p></bio><email xlink:type="simple">karinakrez04@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Шнейдеров</surname><given-names>Е. Н.</given-names></name><name name-style="western" xml:lang="en"><surname>Shneiderov</surname><given-names>E.</given-names></name></name-alternatives><bio xml:lang="ru"><p>канд. техн. наук., доц., каф. проектирования информационно-компьютерных систем, проректор по учебной работе</p><p>Минск</p></bio><bio xml:lang="en"><p>Cand. Sci. (Tech.), Associate Professor at the Department of Information and Computer Systems Design</p><p>Minsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Шиш</surname><given-names>П. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Shish</surname><given-names>P.</given-names></name></name-alternatives><bio xml:lang="ru"><p>студент</p><p>Минск</p></bio><bio xml:lang="en"><p>Student</p><p>Minsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Кондратенко</surname><given-names>Е. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Kondratenko</surname><given-names>E.</given-names></name></name-alternatives><bio xml:lang="ru"><p>студент</p><p>Минск</p></bio><bio xml:lang="en"><p>Student</p><p>Minsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Белорусский государственный университет информатики и радиоэлектроники</institution></aff><aff xml:lang="en"><institution>Belarusian State University of Informatics and Radioelectronics</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>08</day><month>05</month><year>2026</year></pub-date><volume>24</volume><issue>2</issue><fpage>85</fpage><lpage>91</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Крез К.С., Шнейдеров Е.Н., Шиш П.А., Кондратенко Е.В., 2026</copyright-statement><copyright-year>2026</copyright-year><copyright-holder xml:lang="ru">Крез К.С., Шнейдеров Е.Н., Шиш П.А., Кондратенко Е.В.</copyright-holder><copyright-holder xml:lang="en">Krez K., Shneiderov E., Shish P., Kondratenko E.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://doklady.bsuir.by/jour/article/view/4346">https://doklady.bsuir.by/jour/article/view/4346</self-uri><abstract><p>В условиях быстрого роста объема текстовых данных появляется потребность в методах, способных эффективно сравнивать фрагменты текста по смыслу, включая случаи перефразирования, синонимизации и перестройки структуры предложений. Одна из актуальных задач – сопоставление результатов методов семантического сравнения на основе различных моделей с человеческим восприятием смысловой близости. В статье рассматривается экспертный метод оценки семантического сходства текстовых фрагментов, основанный на оценках участников анкетирования. Суть метода заключается в формировании интерпретируемой шкалы семантической близости, полученной на основе человеческого восприятия содержания текстов и используемой для анализа согласованности различных методов. Для формирования «человеческой» оценки проведен опрос 138 участников. Сравнительный анализ показал, что различные методы оценки семантического сходства демонстрируют неодинаковую степень согласованности с человеческим восприятием смысловой близости текстов. </p></abstract><trans-abstract xml:lang="en"><p>With the rapid growth of text data, there is a need for methods capable of effectively comparing text fragments by meaning, including cases of paraphrasing, synonymization, and sentence restructuring. One of the pressing challenges is comparing the results of semantic comparison methods based on various models with the human perception of semantic similarity. This article discusses an expert method for assessing the semantic similarity of text fragments based on the assessments of survey participants. The method consists of creating an interpretable semantic similarity scale derived from human perception of text content and used to analyze the consistency of various methods. To develop a “human” assessment, a survey of 138 participants was conducted. A comparative analysis revealed that various semantic similarity assessment methods demonstrate varying degrees of consistency with the human perception of text semantic similarity.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>семантическое сходство</kwd><kwd>обработка естественного языка</kwd><kwd>экспертный метод</kwd><kwd>сравнение текстов</kwd><kwd>шкалирование оценок</kwd><kwd>анкетирование</kwd><kwd>корреляция Пирсона</kwd><kwd>корреляция Спирмена</kwd></kwd-group><kwd-group xml:lang="en"><kwd>semantic similarity</kwd><kwd>natural language processing</kwd><kwd>expert method</kwd><kwd>text comparison</kwd><kwd>rating scaling</kwd><kwd>questionnaire</kwd><kwd>Pearson correlation</kwd><kwd>Spearman correlation</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Devlin J., Chang M.-W., Lee K., Toutanova K. (2019) BERT: Pre-Training of Deep Bidirectional Transformers for Language Understanding. Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (NAACL-HLT 2019). 4171–4186. DOI: 10.18653/v1/N19-1423.</mixed-citation><mixed-citation xml:lang="en">Devlin J., Chang M.-W., Lee K., Toutanova K. (2019) BERT: Pre-Training of Deep Bidirectional Transformers for Language Understanding. Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (NAACL-HLT 2019). 4171–4186. DOI: 10.18653/v1/N19-1423.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Reimers N., Gurevych I. (2019) Sentence-BERT: Sentence Embeddings Using Siamese BERTNetworks. Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP 2019). 3982–3992. DOI: 10.18653/v1/D19-1410.</mixed-citation><mixed-citation xml:lang="en">Reimers N., Gurevych I. (2019) Sentence-BERT: Sentence Embeddings Using Siamese BERTNetworks. Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP 2019). 3982–3992. DOI: 10.18653/v1/D19-1410.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Salton G., Buckley C. (1988) Term-Weighting Approaches in Automatic Text Retrieval. Information Processing &amp; Management. 24 (5), 513–523. DOI: 10.1016/0306-4573(88)90021-0.</mixed-citation><mixed-citation xml:lang="en">Salton G., Buckley C. (1988) Term-Weighting Approaches in Automatic Text Retrieval. Information Processing &amp; Management. 24 (5), 513–523. DOI: 10.1016/0306-4573(88)90021-0.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Gao T., Yao X., Chen D. (2021) SimCSE: Simple Contrastive Learning of Sentence Embeddings. Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing. 6894–6910. DOI: 10.18653/v1/2021.emnlp-main.552.</mixed-citation><mixed-citation xml:lang="en">Gao T., Yao X., Chen D. (2021) SimCSE: Simple Contrastive Learning of Sentence Embeddings. Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing. 6894–6910. DOI: 10.18653/v1/2021.emnlp-main.552.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Feng F., Yang Y., Cer D., Arivazhagan N., Wang W. (2022) Language-Agnostic BERT Sentence Embedding. Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics. 878–891. DOI: 10.18653/v1/2022.acl-long.62.</mixed-citation><mixed-citation xml:lang="en">Feng F., Yang Y., Cer D., Arivazhagan N., Wang W. (2022) Language-Agnostic BERT Sentence Embedding. Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics. 878–891. DOI: 10.18653/v1/2022.acl-long.62.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
