<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">bsuir</journal-id><journal-title-group><journal-title xml:lang="ru">Доклады БГУИР</journal-title><trans-title-group xml:lang="en"><trans-title>Doklady BGUIR</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1729-7648</issn><issn pub-type="epub">2708-0382</issn><publisher><publisher-name>БГУИР</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.35596/1729-7648-2023-21-3-102-110</article-id><article-id custom-type="elpub" pub-id-type="custom">bsuir-3653</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ЭЛЕКТРОНИКА, РАДИОФИЗИКА, РАДИОТЕХНИКА, ИНФОРМАТИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>ELECTRONICS, RADIOPHYSICS, RADIOENGINEERING, INFORMATICS</subject></subj-group></article-categories><title-group><article-title>IТ-диагностика болезни Паркинсона на основе анализа голосовых маркеров и машинного обучения</article-title><trans-title-group xml:lang="en"><trans-title>IT Diagnostics of Parkinson’s Disease Based on the Analysis of Voice Markers and Machine Learning</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Вишняков</surname><given-names>В. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Vishniakou</surname><given-names>U. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Вишняков Владимир Анатольевич, д. т. н., профессор кафедры инфокоммуникационных технологий</p><p>220013, г. Минск, ул. П. Бровки, 6</p><p>Тел.: +375 44 486-71-82</p></bio><bio xml:lang="en"><p>Vishniakou Uladzimir Anatolievich, Dr. of Sci. (Tech.), Professor at the Department of Infocommunication Technologies</p><p>220013, Minsk, P. Brovki St., 6</p><p>Tel.: +375 44 486-71-82</p></bio><email xlink:type="simple">vish@bsuir.by</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Ивэй</surname><given-names>Ся</given-names></name><name name-style="western" xml:lang="en"><surname>YiWei</surname><given-names>Xia</given-names></name></name-alternatives><bio xml:lang="ru"><p>аспирант кафедры инфокоммуникационных технологий</p><p>Минск</p></bio><bio xml:lang="en"><p>Postgraduate at the Department of Infocommunication Technologies</p><p>Minsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Белорусский государственный университет информатики и радиоэлектроники</institution></aff><aff xml:lang="en"><institution>Belarusian State University of Informatics and Radioelectronics</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2023</year></pub-date><pub-date pub-type="epub"><day>22</day><month>06</month><year>2023</year></pub-date><volume>21</volume><issue>3</issue><fpage>102</fpage><lpage>110</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Вишняков В.А., Ивэй С., 2023</copyright-statement><copyright-year>2023</copyright-year><copyright-holder xml:lang="ru">Вишняков В.А., Ивэй С.</copyright-holder><copyright-holder xml:lang="en">Vishniakou U.A., YiWei X.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://doklady.bsuir.by/jour/article/view/3653">https://doklady.bsuir.by/jour/article/view/3653</self-uri><abstract><p>Представлены результаты исследования параметров спектров речевых сигналов с помощью машинного обучения с применением нейронных сетей, проведенного в целях экспериментального подтверждения возможности выполнения оценки этих параметров для выявления болезни Паркинсона на ранних стадиях (IТ-диагностика). В ходе исследования использовали общедоступную базу данных, в которой систематизированы спектры гласных звуков, произнесенных пациентами с болезнью Паркинсона. Примененный метод – бинарная классификация данных. Сначала выполняли предварительную обработку спектра речевых данных, состоявшую в его фильтрации, для удаления из него шумов и устранения присутствующих в нем всплесков и пробелов. Затем определяли параметры обработанного спектра речевых данных: среднее значение, максимум, минимум, пик, вейвлет-коэффициенты, MFCC и TQWT. После этого выбирали объект с помощью алгоритма PCA. Для обучения модели использовали алгоритмы Knn и Random Forest и нейронной сети Байеса. Для нахождения наилучших гиперпараметров модели применяли алгоритм оптимизации Байеса и метод GridSearch. Установлено, что при использовании Knn, Random Forest и нейронной сети Байеса можно обеспечить увеличение точности распознавания болезни Паркинсона на 94,7; 88,16 и 74,74 % соответственно. Аналогичное исследование, проведенное другими учеными, показало, что точность распознавания наборов данных составила всего 86 %.</p></abstract><trans-abstract xml:lang="en"><p>The results of studying the parameters of the spectra of speech signals by machine learning with the use of neural networks are presented. This study was carried out in order to confirm experimentally the possibility of performing an assessment of these parameters for the detection of Parkinson’s disease in the early stages (IT diagnostics). During the study, the public database was used, which systematized the spectra of vowel sounds uttered by patients with Parkinson’s disease. The applied method is binary data classification. In the course of the study, the speech data spectrum was first preprocessed, which consisted of filtering it in order to remove its noise components and eliminate bursts and gaps in it. Then the parameters of the processed spectrum of speech data were determined: average value, maximum and minimum, peak, wavelet coefficients, MFCC and TQWT. After that, the object was selected using the PCA algorithm. The model was trained using the Knn and Random Forest algorithms, as well as the Bayesian neural network. The Bayesian optimization algorithm and the GridSearch method were used to find the best model hyperparameters. It has been established that when using Knn, Random Forest and Bayesian neural network, it is possible to increase the accuracy of recognition of Parkinson’s disease by 94.7; 88.16 and 74.74 %, respectively. A similar study by other scientists showed that the recognition accuracy of data sets was only 86 %.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>машинное обучение</kwd><kwd>нейронные сети</kwd><kwd>бинарная классификация</kwd><kwd>гиперпараметрическая оптимизация</kwd><kwd>дерево решений</kwd><kwd>чувствительность</kwd><kwd>точность</kwd></kwd-group><kwd-group xml:lang="en"><kwd>machine learning</kwd><kwd>neural networks</kwd><kwd>binary classification</kwd><kwd>hyperparameter optimization</kwd><kwd>decision tree</kwd><kwd>sensitivity</kwd><kwd>precision</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Davie C. A. (2008) A Review of Parkinson’s Disease. British Medical Bulletin. 86 (1), 109‒127.</mixed-citation><mixed-citation xml:lang="en">Davie C. A. (2008) A Review of Parkinson’s Disease. British Medical Bulletin. 86 (1), 109‒127.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Braak H., Ghebremedhin E., Rüb U., Bratzke H., Del Tredici K. (2004) Stages in the Development of Parkinson’s Disease-Related Pathology. Cell and Tissue Research. 318 (1), 121‒134.</mixed-citation><mixed-citation xml:lang="en">Braak H., Ghebremedhin E., Rüb U., Bratzke H., Del Tredici K. (2004) Stages in the Development of Parkinson’s Disease-Related Pathology. Cell and Tissue Research. 318 (1), 121‒134.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Upadhya S. S., Cheeran A. N. (2018) Discriminating Parkinson and Healthy People Using Phonation and Cepstral Features of Speech. Computer Science. 143, 197‒202.</mixed-citation><mixed-citation xml:lang="en">Upadhya S. S., Cheeran A. N. (2018) Discriminating Parkinson and Healthy People Using Phonation and Cepstral Features of Speech. Computer Science. 143, 197‒202.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Putri F., Caesarendra W., Pamanasari E. D., Ariyanto M., Setiawan J. D. (2018) Parkinson Disease Detection Based on Voice and EMG Pattern Classification Method for Indonesian Case Study. Journal of Energy, Mechanical, Material, and Manufacturing Engineering. 3 (2), 87‒98.</mixed-citation><mixed-citation xml:lang="en">Putri F., Caesarendra W., Pamanasari E. D., Ariyanto M., Setiawan J. D. (2018) Parkinson Disease Detection Based on Voice and EMG Pattern Classification Method for Indonesian Case Study. Journal of Energy, Mechanical, Material, and Manufacturing Engineering. 3 (2), 87‒98.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Zhang M. L., Zhou Z. H. (2007) ML-KNN: a Lazy Learning Approach to Multi-Label Learning. Pattern Recognition. 40 (7), 2038‒2048.</mixed-citation><mixed-citation xml:lang="en">Zhang M. L., Zhou Z. H. (2007) ML-KNN: a Lazy Learning Approach to Multi-Label Learning. Pattern Recognition. 40 (7), 2038‒2048.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Palimkar P., Shaw R. N., Ghosh A. (2022) Machine Learning Technique to Prognosis Diabetes Disease: Random Forest Classifier Approach. Advanced Computing and Intelligent Technologies. Springer, Singapore. 219–244.</mixed-citation><mixed-citation xml:lang="en">Palimkar P., Shaw R. N., Ghosh A. (2022) Machine Learning Technique to Prognosis Diabetes Disease: Random Forest Classifier Approach. Advanced Computing and Intelligent Technologies. Springer, Singapore. 219–244.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Kareem S. W, Alyousuf F. Q., Ahmad K., Hawezi R., Awla H. (2022) Structure Learning of Bayesian Network: a Review. Qalaai Zanist Journal. 7 (1), 956‒975.</mixed-citation><mixed-citation xml:lang="en">Kareem S. W, Alyousuf F. Q., Ahmad K., Hawezi R., Awla H. (2022) Structure Learning of Bayesian Network: a Review. Qalaai Zanist Journal. 7 (1), 956‒975.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Sakar C. O., Serbes G., Gunduz A., Tunc H. C., Nizam H. (2019) A Comparative Analysis of Speech Signal Processing Algorithms for Parkinson’s Disease Classification and the Use of the Tunable Q-Factor Wavelet Transform. Applied Soft Computing. 74 (4), 255‒263.</mixed-citation><mixed-citation xml:lang="en">Sakar C. O., Serbes G., Gunduz A., Tunc H. C., Nizam H. (2019) A Comparative Analysis of Speech Signal Processing Algorithms for Parkinson’s Disease Classification and the Use of the Tunable Q-Factor Wavelet Transform. Applied Soft Computing. 74 (4), 255‒263.</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Upadhya S. S., Cheeran A. N., Nirmal J. H. (2017) Statistical Comparison of Jitter and Shimmer Voice Features for Healthy and Parkinson Affected Persons. Electrical, Computer and Communication Technologies. IEEE. 1‒6.</mixed-citation><mixed-citation xml:lang="en">Upadhya S. S., Cheeran A. N., Nirmal J. H. (2017) Statistical Comparison of Jitter and Shimmer Voice Features for Healthy and Parkinson Affected Persons. Electrical, Computer and Communication Technologies. IEEE. 1‒6.</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Holmes J. R., Oates M. J., Phyland J. D., Hughes J. A. (2000) Voice Characteristics in the Progression of Parkinson’s Disease. International Journal of Language &amp; Communication Disorders. 35 (3), 407‒418.</mixed-citation><mixed-citation xml:lang="en">Holmes J. R., Oates M. J., Phyland J. D., Hughes J. A. (2000) Voice Characteristics in the Progression of Parkinson’s Disease. International Journal of Language &amp; Communication Disorders. 35 (3), 407‒418.</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Abdurrahman G., Sintawati M. (2020) Implementation of Xgboost for Classification of Parkinson’s Disease. Journal of Physics. 1538 (1), 1‒12.</mixed-citation><mixed-citation xml:lang="en">Abdurrahman G., Sintawati M. (2020) Implementation of Xgboost for Classification of Parkinson’s Disease. Journal of Physics. 1538 (1), 1‒12.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Tsanas A., Little M., McSharry P. E., Ramig L. O. (2010) New Nonlinear Markers and Insights into Speech Signal Degradation for Effective Tracking of Parkinson’s Disease Symptom Severity. NOLTA, Poland. 457–460.</mixed-citation><mixed-citation xml:lang="en">Tsanas A., Little M., McSharry P. E., Ramig L. O. (2010) New Nonlinear Markers and Insights into Speech Signal Degradation for Effective Tracking of Parkinson’s Disease Symptom Severity. NOLTA, Poland. 457–460.</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Erdogdu S. B., Serbes G., Sakar C. O. (2017) Analyzing the Effectiveness of Vocal Features in Early Telediagnosis of Parkinson’s Disease. PloS One. 12 (8), 1‒18.</mixed-citation><mixed-citation xml:lang="en">Erdogdu S. B., Serbes G., Sakar C. O. (2017) Analyzing the Effectiveness of Vocal Features in Early Telediagnosis of Parkinson’s Disease. PloS One. 12 (8), 1‒18.</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Selesnick I. W. (2011) Wavelet Transform with Tunable Q-Factor. IEEE Transactions on Signal Processing. 59 (8), 3560‒3575.</mixed-citation><mixed-citation xml:lang="en">Selesnick I. W. (2011) Wavelet Transform with Tunable Q-Factor. IEEE Transactions on Signal Processing. 59 (8), 3560‒3575.</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Visa S., Ramsay B., Ralescu A. L., Esther van der Knaap (2011) Confusion Matrix-Based Feature Selection. Artificial Intelligence and Cognitive Science. 710 (1), 120‒127.</mixed-citation><mixed-citation xml:lang="en">Visa S., Ramsay B., Ralescu A. L., Esther van der Knaap (2011) Confusion Matrix-Based Feature Selection. Artificial Intelligence and Cognitive Science. 710 (1), 120‒127.</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Maćkiewicz A., Ratajczak W. (1993) Principal Components Analysis (PCA). Computers &amp; Geosciences. 19 (3), 303‒342.</mixed-citation><mixed-citation xml:lang="en">Maćkiewicz A., Ratajczak W. (1993) Principal Components Analysis (PCA). Computers &amp; Geosciences. 19 (3), 303‒342.</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Fawcett T. (2006) An Introduction to ROC Analysis. Pattern Recognition Letters. 27 (8), 861‒874.</mixed-citation><mixed-citation xml:lang="en">Fawcett T. (2006) An Introduction to ROC Analysis. Pattern Recognition Letters. 27 (8), 861‒874.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
