<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">bsuir</journal-id><journal-title-group><journal-title xml:lang="ru">Доклады БГУИР</journal-title><trans-title-group xml:lang="en"><trans-title>Doklady BGUIR</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1729-7648</issn><issn pub-type="epub">2708-0382</issn><publisher><publisher-name>БГУИР</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.35596/1729-7648-2023-21-4-110-117</article-id><article-id custom-type="elpub" pub-id-type="custom">bsuir-3689</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ЭЛЕКТРОНИКА, РАДИОФИЗИКА, РАДИОТЕХНИКА, ИНФОРМАТИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>ELECTRONICS, RADIOPHYSICS, RADIOENGINEERING, INFORMATICS</subject></subj-group></article-categories><title-group><article-title>Комбинированный метод отбора информативных признаков для выявления речевых патологий по голосу</article-title><trans-title-group xml:lang="en"><trans-title>Combined Method for Informative Feature Selection for Speech Pathology Detection</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Лихачёв</surname><given-names>Д. С.</given-names></name><name name-style="western" xml:lang="en"><surname>Likhachov</surname><given-names>D. S.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Лихачёв Денис Сергеевич - кандидат технических наук, доцент, доцент кафедры электронных вычислительных средств.</p><p>220013, Минск, ул. П. Бровки, 6. Тел.: +375 17 293-85-05</p></bio><bio xml:lang="en"><p>Likhachov Denis Sergeevich - Cand. of Sci., Associate Professor, Associate Professor at Computer Engineering De partment.</p><p>220013, Minsk, P. Brovki St., 6. Tel.: +375 17 293-85-05</p></bio><email xlink:type="simple">likhachov@bsuir.by</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Вашкевич</surname><given-names>М. И.</given-names></name><name name-style="western" xml:lang="en"><surname>Vashkevich</surname><given-names>M. I.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Доктор технических наук, доцент, доцент кафедры электронных вычислительных средств.</p><p>220013, Минск, ул. П. Бровки, 6</p></bio><bio xml:lang="en"><p>Maxim I. Vashkevich - Dr. of Sci. (Tech.), Associate Professor at Computer Engineering Department.</p><p>220013, Minsk, P. Brovki St., 6</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Петровский</surname><given-names>Н. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Petrovsky</surname><given-names>N. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Кандидат технических наук, доцент, доцент кафедры электронных вычислительных средств.</p><p>220013, Минск, ул. П. Бровки, 6</p></bio><bio xml:lang="en"><p>Nick A. Petrovsky - Cand. of Sci., Associate Professor, Associate Professor at Computer Engineering De partment.</p><p>220013, Minsk, P. Brovki St., 6</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Азаров</surname><given-names>И. С.</given-names></name><name name-style="western" xml:lang="en"><surname>Azarov</surname><given-names>E. S.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Доктор технических наук, доцент, заведующий кафедрой электронных вычислительных средств.</p><p>220013, Минск, ул. П. Бровки, 6</p></bio><bio xml:lang="en"><p>Elias S. Azarov - Dr. of Sci. (Tech.), Associate Professor, Head of Computer Engineering Department.</p><p>220013, Minsk, P. Brovki St., 6</p></bio><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Белорусский государственный университет информатики и радиоэлектроники</institution></aff><aff xml:lang="en"><institution>Belarusian State University of Informatics and Radioelectronics</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2023</year></pub-date><pub-date pub-type="epub"><day>29</day><month>08</month><year>2023</year></pub-date><volume>21</volume><issue>4</issue><fpage>110</fpage><lpage>117</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Лихачёв Д.С., Вашкевич М.И., Петровский Н.А., Азаров И.С., 2023</copyright-statement><copyright-year>2023</copyright-year><copyright-holder xml:lang="ru">Лихачёв Д.С., Вашкевич М.И., Петровский Н.А., Азаров И.С.</copyright-holder><copyright-holder xml:lang="en">Likhachov D.S., Vashkevich M.I., Petrovsky N.A., Azarov E.S.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://doklady.bsuir.by/jour/article/view/3689">https://doklady.bsuir.by/jour/article/view/3689</self-uri><abstract><p>Задача выявления голосовых патологий отличается малым объемом доступных данных для обучения, вследствие чего системы классификации, использующие малоразмерные данные, являются наиболее актуальными. Предлагается совместное использование методов LASSO (least absolute shrinkage and selection operator) и BSS (backward stepwise selection) в отборе наиболее значимых признаков для задач определения голосовых патологий, в частности бокового амиотрофического склероза. Использованы признаки на основе мел-частотных кепстральных коэффициентов, традиционно применяемые в обработке речевых сигналов, и на основе дискретной оценки огибающей спектра авторегрессионного процесса. Вторые спектральные признаки извлекаются с помощью генеративного метода, предполагающего вычисление дискретного преобразования Фурье последовательности отчетов, сгенерированной с использованием авторегрессионной модели входного голосового сигнала. Последовательность генерируется таким образом, чтобы учесть периодическую природу преобразования Фурье. Это позволяет повысить точность оценки спектра и уменьшить эффект спектральной утечки. Отбор признаков с помощью методов LASSO и BSS позволил повысить эффективность классификации, используя меньшее число признаков, по сравнению с применением только метода LASSO.</p></abstract><trans-abstract xml:lang="en"><p>The task of detecting vocal abnormalities is characterized by a small amount of available data for training, as a consequence of which classification systems that use low-dimensional data are the most relevant. We propose to use LASSO (least absolute shrinkage and selection operator) and BSS (backward stepwise selection) methods together to select the most significant features for the detection of vocal pathologies, in particular amyotrophic lateral sclerosis. Features based on fine-frequency cepstral coefficients, traditionally used in speech signal processing, and features based on discrete estimation of the autoregressive spectrum envelope are used. Spectral features based on the autoregressive process envelope spectrum are extracted using the generative method, which involves calculating a discrete Fourier transform of the report sequence generated using the autoregressive model of the input voice signal. The sequence is generated by the autoregressive model so as to account for the periodic nature of the Fourier transform. This improves the accuracy of the spectrum estimation and reduces the spectral leakage effect. Using LASSO in conjunction with BSS allowed us to improve the classification efficiency using a smaller number of features as compared to using the LASSO method alone.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>анализ голоса</kwd><kwd>генеративный метод</kwd><kwd>авторегрессия</kwd><kwd>машинное обучение</kwd><kwd>спектральные признаки</kwd><kwd>классификация</kwd></kwd-group><kwd-group xml:lang="en"><kwd>voice analysis</kwd><kwd>generative method</kwd><kwd>autoregression</kwd><kwd>machine learning</kwd><kwd>spectral features</kwd><kwd>classification</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Rabiner, L. R. Fundamentals of Speech Recognition / L. R. Rabiner, B. H. Juang // Pearson Education. 1993.</mixed-citation><mixed-citation xml:lang="en">Rabiner L. R., Juang B. H. (1993) Fundamentals of Speech Recognition. Pearson Education.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Benba, A. Discriminating between Patients with Parkinson’s and Neurological Diseases Using Cepstral Analysis / A. Benba, A. Jilbab, A. Hammouch // IEEE Transactions on Neural Systems and Rehabilitation Engineering. 2016. Vol. 24, No 10. P. 1100–1108.</mixed-citation><mixed-citation xml:lang="en">Benba A., Jilbab A., Hammouch A. (2016) Discriminating between Patients with Parkinson’s and Neurological Diseases Using Cepstral Analysis. IEEE Transactions on Neural Systems and Rehabilitation Engineering. 24 (10), 1100–1108.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Vashkevich, M. Classification of ALS Patients Based on Acoustic Analysis of Sustained Vowel Phonations / M. Vashkevich, Y. Rushkevich // Biomedical Signal Processing and Control. 2021. Vol. 65. P. 1–14.</mixed-citation><mixed-citation xml:lang="en">Vashkevich M., Rushkevich Y. (2021) Classification of ALS Patients Based on Acoustic Analysis of Sustained Vowel Phonations. Biomedical Signal Processing and Control. 65, 1–14.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Amyotrophic Lateral Sclerosis / M. C. Kiernan [et al.] // Lancet. 2011. Vol. 377, Iss. 9769. P. 942–955.</mixed-citation><mixed-citation xml:lang="en">Kiernan M. C. (2011) Amyotrophic Lateral Sclerosis. Lancet. 377 (9769), 942–955.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Detection of Bulbar ALS Using a Comprehensive Speech Assessment Battery / Y. Yunusova [et al.] // Proceedings of the International Workshop on Models and Analysis of Vocal Emissions for Biomedical Applications. 2013. P. 217–220</mixed-citation><mixed-citation xml:lang="en">Yunusova Y. (2013) Detection of Bulbar ALS Using a Comprehensive Speech Assessment Battery. Proceedings of the International Workshop on Models and Analysis of Vocal Emissions for Biomedical Applications. 217–220.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Fractal Features for Automatic Detection of Dysarthria / T. Spangler [et al.] // IEEE EMBS International Conference on Biomedical Health Informatics. 2017. P. 437–440.</mixed-citation><mixed-citation xml:lang="en">Spangler T. (2017) Fractal Features for Automatic Detection of Dysarthria. IEEE EMBS International Conference on Biomedical Health Informatics. 437–440.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Малоразмерные спектральные признаки для машинного обучения в задачах анализа и классификации голосового сигнала / Д. С. Лихачёв [и др.] // Информатика. 2023. № 1. С. 102–112. DOI: 10.37661/18160301-2023-20-1-102-112.</mixed-citation><mixed-citation xml:lang="en">Likhachov D. S., Vashkevich M. I., Petrovsky N. A., Azarov E. S. (2023) Small-Size Spectral Features for Machine Learning in Voice Signal Analysis and Classification Tasks. Informatics. (20), 102–112. DOI: 10.37661/1816-0301-2023-20-1-102-112 (in Russian).</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Markel, J. D. Linear Prediction of Speech / J. D. Markel, A. H. Gray. Berlin, New York: Springer-Verlag, 1976. 290 p.</mixed-citation><mixed-citation xml:lang="en">Markel J. D., Gray A. H. (1976) Linear Prediction of Speech. Berlin, New York, Springer-Verlag. 290.</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Вашкевич, М. И. Система анализа и классификации голосового сигнала на основе пертрубационных параметров и кепстрального представления в психоакустических шкалах / М. И. Вашкевич, Д. С. Лихачёв, И. С. Азаров // Доклады БГУИР. 2022. Т. 20, № 4. С. 73–82. DOI: https://doi.org/10.35596/1729-7648-2022-20-1-73-82.</mixed-citation><mixed-citation xml:lang="en">Vashkevich M. I., Likhachov D. S., Azarov E. S. (2022) Voice Analysis and Classification System Based on Perturbation Parameters and Cepstral Presentation in Psychoacoustic Scales. Doklady BGUIR. 20 (1), 73–82. DOI: 10.35596/1729-7648-2022-20-1-73-82 (in Russian).</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Анализ акустических параметров голоса для выявления заболеваний гортани / М. И. Вашкевич [и др.] // Информатика. 2020. № 17. С. 78–86.</mixed-citation><mixed-citation xml:lang="en">Vashkevich M. I., Burak A. A., Kanoika N. S., Daldova V. S. (2020) Analysis of Acoustic Voice Parameters for Larynx Pathology Detection. Informatics. 17 (1), 78–86 (in Russian).</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Flach, P. Machine Learning: the Art and Science of Algorithms that Make Sense of Data / P. Flach. Great Britain: Cambridge University Press, 2012. 416 p.</mixed-citation><mixed-citation xml:lang="en">Flach P. (2012) Machine Learning: the Art and Science of Algorithms that Make Sense of Data. Great Britain, Cambridge University Press Publ. 416.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">An Introduction to Statistical Learning with Applications in R / G. James [et al.]. Springer, 2013. 440 p.</mixed-citation><mixed-citation xml:lang="en">James G., Witten D., Hastie T., Tibshirani R. (2013) An Introduction to Statistical Learning with Applications in R. Springer Publ. 440.</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Kotu, V. Data Science: Concepts and Practice / V. Kotu, B. Deshpande. 2 ed. USA: Morgan Kaufmann Publishers an Imprint of Elsevier, 2019.</mixed-citation><mixed-citation xml:lang="en">Kotu V., Deshpande B. (2019) Data Science: Concepts and Practice. 2 ed. USA, Morgan Kaufmann Publishers an Imprint of Elsevier.</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Voice Database Used in the Article Classification of ALS Patients Based on Acoustic Analysis of Sustained Vowel Phonations [Electronic Resource]. Mode of access: https://github.com/Mak-Sim/Minsk2020_ALS_database. Date of access: 12.05.2023.</mixed-citation><mixed-citation xml:lang="en">Voice Database Used in the Article Classification of ALS Patients Based on Acoustic Analysis of Sustained Vowel Phonations. Available: https://github.com/Mak-Sim/Minsk2020_ALS_database (Accessed 12 May 2023).</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">The Necessity of Leave One Subject Out (LOSO) Cross Validation for EEG Disease Diagnosis / S. Kunjan [et al.] // Brain Informatics. Springer, 2021. P. 558–567.</mixed-citation><mixed-citation xml:lang="en">Kunjan S., Grummett T. S., Pope K. J., Powers D. M. W., Fitzgibbon S. P., Lewis T. W. (2021) The Necessity of Leave One Subject Out (LOSO) Cross Validation for EEG Disease Diagnosis. Brain Informatics. Springer Publ. 558–567.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
