<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">bsuir</journal-id><journal-title-group><journal-title xml:lang="ru">Доклады БГУИР</journal-title><trans-title-group xml:lang="en"><trans-title>Doklady BGUIR</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1729-7648</issn><issn pub-type="epub">2708-0382</issn><publisher><publisher-name>БГУИР</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.35596/1729-7648-2019-123-5-66-71</article-id><article-id custom-type="elpub" pub-id-type="custom">bsuir-1153</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ЭЛЕКТРОНИКА, РАДИОФИЗИКА, РАДИОТЕХНИКА, ИНФОРМАТИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>ELECTRONICS, RADIOPHYSICS, RADIOENGINEERING, INFORMATICS</subject></subj-group></article-categories><title-group><article-title>Сегментация речи на фонетические элементы для систем защиты речевой информации</article-title><trans-title-group xml:lang="en"><trans-title>Segmentation of speech on phonetic elements for systems of speech information protection</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Сейткулов</surname><given-names>Е. Н.</given-names></name><name name-style="western" xml:lang="en"><surname>Seitkulov</surname><given-names>Y. 
N.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Кандидат физико-математических наук, директор НИИ информационной безопасности и криптологии</p></bio><bio xml:lang="en"><p>PhD, director of the institute of information security and cryptology</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Боранбаев</surname><given-names>С. Н.</given-names></name><name name-style="western" xml:lang="en"><surname>Boranbayev</surname><given-names>S. N.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Доктор технических наук, профессор</p></bio><bio xml:lang="en"><p>D.Sci, professor</p></bio><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Потапович</surname><given-names>А. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Patapovich</surname><given-names>A. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Потапович Александр Владимирович - старший научный сотрудник НИЛ 5.3 НИЧ.</p><p>220013, Минск, ул. П. Бровки, 6, тел. +375-29-670-30-40</p></bio><bio xml:lang="en"><p>Patapovich Aleksandr Vladimirovich - researcher of SRL 5.3 of R&amp;D department.</p><p>220013, Minsk, P. Brovka st., 6, tel. +375-29-670-30-40</p></bio><email xlink:type="simple">nil53@bsuir.edu.by</email><xref ref-type="aff" rid="aff-3"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Давыдов</surname><given-names>Г. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Davydau</surname><given-names>H. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Кандидат технических наук, ведущий научный сотрудник НИЛ 5.3 НИЧ.</p><p>220013, Минск, ул. П. 
Бровки, 6</p></bio><bio xml:lang="en"><p>PhD, researcher of SRL 5.3 of R&amp;D department.</p><p>220013, Minsk, P. Brovka st., 6</p></bio><xref ref-type="aff" rid="aff-3"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Евразийский национальный университет им. Л.Н. Гумилева</institution></aff><aff xml:lang="en"><institution>Eurasian national university named after L.N. Gumilyov</institution></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru"><institution>Евразийский национальный университет им. Л.Н. Гумилева</institution></aff><aff xml:lang="en"><institution>Eurasian national university named after L.N. Gumilyov</institution></aff></aff-alternatives><aff-alternatives id="aff-3"><aff xml:lang="ru"><institution>Белорусский государственный университет информатики и радиоэлектроники</institution></aff><aff xml:lang="en"><institution>Belarusian state university of informatics and radioelectronics</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2019</year></pub-date><pub-date pub-type="epub"><day>03</day><month>07</month><year>2019</year></pub-date><volume>0</volume><issue>5</issue><fpage>66</fpage><lpage>71</lpage><permissions><copyright-statement>Copyright © Сейткулов Е.Н., Боранбаев С.Н., Потапович А.В., Давыдов Г.В., 2019</copyright-statement><copyright-year>2019</copyright-year><copyright-holder xml:lang="ru">Сейткулов Е.Н., Боранбаев С.Н., Потапович А.В., Давыдов Г.В.</copyright-holder><copyright-holder xml:lang="en">Seitkulov Y.N., Boranbayev S.N., Patapovich A.V., Davydau H.V.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This 
work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://doklady.bsuir.by/jour/article/view/1153">https://doklady.bsuir.by/jour/article/view/1153</self-uri><abstract><p>Статья посвящена разработке алгоритма сегментации речи на фонетические элементы для синтеза речеподобных сигналов в системах защиты речевой информации. Основное внимание уделяется установлению границ фонетических единиц речи с учетом влияния этого фактора на качество синтезируемой речи компиляционным методом. Рассматриваются особенности установления границ фонем для слитной речи и влияние этого фактора на качество синтезируемой речи по базе фонем. Предлагается для обеспечения качественной синтезируемой речи начало и окончание фонем при сегментации устанавливать при переходе реализации сигнала через ноль, а при синтезе речеподобных сигналов использовать сплайн-функции на границах сегментов фонем.</p></abstract><trans-abstract xml:lang="en"><p>The article is devoted to the development of an algorithm for segmenting speech into phonetic elements for the synthesis of speech-like signals in speech information protection systems. The main attention is paid to establishing the boundaries of phonetic units of speech, taking into account the influence of this factor on the quality of speech synthesized by the compilation method. The features of establishing phoneme boundaries for continuous speech and the influence of this factor on the quality of speech synthesized from a phoneme database are considered. 
To ensure the quality of synthesized speech, it is proposed to set the beginning and end of each phoneme during segmentation at zero crossings of the signal and, when synthesizing speech-like signals, to use spline functions at the boundaries of phoneme segments.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>сегментация речи</kwd><kwd>границы фонем</kwd><kwd>речеподобные сигналы</kwd><kwd>синтез</kwd><kwd>сплайн-функции</kwd></kwd-group><kwd-group xml:lang="en"><kwd>speech segmentation</kwd><kwd>phoneme boundaries</kwd><kwd>speech-like signals</kwd><kwd>synthesis</kwd><kwd>spline functions</kwd></kwd-group><funding-group><funding-statement xml:lang="ru">Работа выполнена при поддержке грантового финансирования КНМОН РК, №АР 05130293</funding-statement></funding-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Sakoe H., Chiba S. Dynamic Programming Algorithm Optimization for Spoken Word Recognition // IEEE Transactions on Acoustics, Speech, and Signal Processing. 1978. Vol. ASSP-26, No. 1. P. 43-49.</mixed-citation><mixed-citation xml:lang="en">Sakoe H., Chiba S. Dynamic Programming Algorithm Optimization for Spoken Word Recognition // IEEE Transactions on Acoustics, Speech, and Signal Processing. 1978. Vol. ASSP-26, No. 1. P. 43-49.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Scharenborg O., Wan V., Ernestus M. Unsupervised speech segmentation: An analysis of the hypothesized phone boundaries // The Journal of the Acoustical Society of America. 2010. Vol. 127, No. 2. P. 1084-1095.</mixed-citation><mixed-citation xml:lang="en">Scharenborg O., Wan V., Ernestus M. Unsupervised speech segmentation: An analysis of the hypothesized phone boundaries // The Journal of the Acoustical Society of America. 2010. Vol. 127, No. 2. P. 
1084-1095.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Gomez J.A., Calvo M. Improvements on automatic speech segmentation at the phonetic level // Materials of 16th Iberoamerican Congress Progress in Pattern Recognition, Image Analysis, Computer Vision and Applications. 2011. P. 557-564.</mixed-citation><mixed-citation xml:lang="en">Gomez J.A., Calvo M. Improvements on automatic speech segmentation at the phonetic level // Materials of 16th Iberoamerican Congress Progress in Pattern Recognition, Image Analysis, Computer Vision and Applications. 2011. P. 557-564.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Berndt D.J., Clifford J. Using Dynamic Time Warping to Find Patterns in Time Series // AAAI Proc. knowledge discovery in databases. 1994. P. 359-370.</mixed-citation><mixed-citation xml:lang="en">Berndt D.J., Clifford J. Using Dynamic Time Warping to Find Patterns in Time Series // AAAI Proc. knowledge discovery in databases. 1994. P. 359-370.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">A Review: Automatic Speech Segmentation / Sakran A.E. [et al.] // International Journal of Computer Science and Mobile Computing. 2017. Vol. 6, No. 4. P. 308-315.</mixed-citation><mixed-citation xml:lang="en">A Review: Automatic Speech Segmentation / Sakran A.E. [et al.] // International Journal of Computer Science and Mobile Computing. 2017. Vol. 6, No. 4. P. 308-315.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Makowski R., Hossa R. Automatic speech signal segmentation based on the innovation adaptive filter // International Journal of Applied Mathematics and Computer Science. 2014. Vol. 24, No. 2. P. 
259-270.</mixed-citation><mixed-citation xml:lang="en">Makowski R., Hossa R. Automatic speech signal segmentation based on the innovation adaptive filter // International Journal of Applied Mathematics and Computer Science. 2014. Vol. 24, No. 2. P. 259-270.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Kamarauskas J. Automatic Segmentation of Phonemes using Artificial Neural Networks // Elektronika ir Elektrotechnika. 2006. Vol. 72, No. 8. P. 39-42.</mixed-citation><mixed-citation xml:lang="en">Kamarauskas J. Automatic Segmentation of Phonemes using Artificial Neural Networks // Elektronika ir Elektrotechnika. 2006. Vol. 72, No. 8. P. 39-42.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Automatic Silence/Unvoiced/Voiced Classification of Bangla Velar Phonemes: New Approach / Syed Akhter Hossain [et al.] // 8th ICCIT. Dhaka, 2005.</mixed-citation><mixed-citation xml:lang="en">Automatic Silence/Unvoiced/Voiced Classification of Bangla Velar Phonemes: New Approach / Syed Akhter Hossain [et al.] // 8th ICCIT. Dhaka, 2005.</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Highly accurate phonetic segmentation using boundary correction models and system fusion / A. Stolcke [et al.] // 2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, 2014. P. 5552-5556.</mixed-citation><mixed-citation xml:lang="en">Highly accurate phonetic segmentation using boundary correction models and system fusion / A. Stolcke [et al.] // 2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, 2014. P. 
5552-5556.</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Method for protecting speech information / H.V. Davydau [et al.] // Doklady BGUIR. 2015. N° 8 (94). P. 107-110.</mixed-citation><mixed-citation xml:lang="en">Method for protecting speech information / H.V. Davydau [et al.] // Doklady BGUIR. 2015. N° 8 (94). P. 107-110.</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Rationale for the method of formation of the combined speech masking signals / Y. Seitkulov [et al.] // IEEE 8th International Conference on Application of Information and Communication Technologies (AICT). Astana, Kazakhstan, 2014.</mixed-citation><mixed-citation xml:lang="en">Rationale for the method of formation of the combined speech masking signals / Y. Seitkulov [et al.] // IEEE 8th International Conference on Application of Information and Communication Technologies (AICT). Astana, Kazakhstan, 2014.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Sorokin V.N. Segmentation of the period of the fundamental tone of a voice source // Acoustical Physics. 2016. Vol. 62, No. 2. P. 244-254.</mixed-citation><mixed-citation xml:lang="en">Sorokin V.N. Segmentation of the period of the fundamental tone of a voice source // Acoustical Physics. 2016. Vol. 62, No. 2. P. 244-254.</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Algorithm of forming speech base units using the method of dynamic programming / Seitkulov Y.N. [et al.] // Journal of Theoretical and Applied Information Technology. 2018. Vol. 96, No. 23. P. 7928-7941.</mixed-citation><mixed-citation xml:lang="en">Algorithm of forming speech base units using the method of dynamic programming / Seitkulov Y.N. [et al.] 
// Journal of Theoretical and Applied Information Technology. 2018. Vol. 96, No. 23. P. 7928-7941.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
