<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">bsuir</journal-id><journal-title-group><journal-title xml:lang="ru">Доклады БГУИР</journal-title><trans-title-group xml:lang="en"><trans-title>Doklady BGUIR</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1729-7648</issn><issn pub-type="epub">2708-0382</issn><publisher><publisher-name>БГУИР</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.35596/1729-7648-2023-21-3-87-95</article-id><article-id custom-type="elpub" pub-id-type="custom">bsuir-3651</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ЭЛЕКТРОНИКА, РАДИОФИЗИКА, РАДИОТЕХНИКА, ИНФОРМАТИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>ELECTRONICS, RADIOPHYSICS, RADIOENGINEERING, INFORMATICS</subject></subj-group></article-categories><title-group><article-title>Формирование обучающей выборки для свёрточных нейронных сетей при реидентификации людей по видеоданным</article-title><trans-title-group xml:lang="en"><trans-title>Training Sample Formation for Convolution Neural Networks to Person Re-Identification from Video</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Игнатьева</surname><given-names>С. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Ihnatsyeva</surname><given-names>S. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Игнатьева Светлана Александровна,</p><p>211440, г. Новополоцк, ул. Блохина, 29</p><p>Тел.: +375 214 42-30-31</p></bio><bio xml:lang="en"><p>Ihnatsyeva Sviatlana Aleksandrovna, Postgraduate at the Department of Computing Systems and Networks</p><p>211440, Novopolotsk, Blokhina St., 29</p><p>Tel.: +375 214 42-30-31</p></bio><email xlink:type="simple">s.ignatieva@pdu.by</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Богуш</surname><given-names>Р. П.</given-names></name><name name-style="western" xml:lang="en"><surname>Bohush</surname><given-names>R. P.</given-names></name></name-alternatives><bio xml:lang="ru"><p>д. т. н., доцент, заведующий кафедрой вычислительных систем и сетей</p><p>Полоцк</p></bio><bio xml:lang="en"><p>Dr. of Sci. (Tech.), Associate Professor, Head of the Department of Computing Systems and Networks</p><p>Polotsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Полоцкий государственный университет имени Евфросинии Полоцкой</institution></aff><aff xml:lang="en"><institution>Euphrosyne Polotskaya State University of Polotsk</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2023</year></pub-date><pub-date pub-type="epub"><day>22</day><month>06</month><year>2023</year></pub-date><volume>21</volume><issue>3</issue><fpage>87</fpage><lpage>95</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Игнатьева С.А., Богуш Р.П., 2023</copyright-statement><copyright-year>2023</copyright-year><copyright-holder xml:lang="ru">Игнатьева С.А., Богуш Р.П.</copyright-holder><copyright-holder xml:lang="en">Ihnatsyeva S.A., Bohush R.P.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://doklady.bsuir.by/jour/article/view/3651">https://doklady.bsuir.by/jour/article/view/3651</self-uri><abstract><p>Для повышения точности работы системы реидентификации людей предлагается комплексный подход при формировании обучающей выборки для свёрточных нейронных сетей, предполагающий использование нового набора изображений, увеличение количества тренировочных примеров за счет существующих баз данных и применение ряда преобразований для повышения их разнообразия. Созданный набор данных PolReID1077 содержит изображения людей, которые были получены во все времена года, что позволит повысить корректность работы систем реидентификации при смене сезонов. ПреимуществомPolReID1077 является также использование видеоданных, полученных при внешнем и внутреннем наблюдении в большом количестве различных мест съемки. Поэтому изображения людей в созданном наборе характеризуются вариабельностью фона, яркостных и цветовых характеристик. Объединение созданного набора с существующими CUHK02, CUHK03, Market-1501, DukeMTMC-ReID и MSMT17 позволило получить 109 772 изображения для обучения. Увеличение разнообразия сформированных примеров достигается за счет применения к ним циклического сдвига, исключения цветности и замещения фрагмента уменьшенной копией другого изображения. Представлены результаты исследований по оценке точности реидентификации для свёрточных нейронных сетей ResNet-50 и DenseNet-121 при их тренировке с использованием предложенного подхода для формирования обучающей выборки.</p></abstract><trans-abstract xml:lang="en"><p>To improve the person re-identification system accuracy, an integrated approach is proposed in the formation of a training sample for convolutional neural networks, which involves the use of a new image dataset, an increase in the training examples number using existing datasets, and the use of a number of transformations to increase their diversity. The created dataset PolReID1077 contains images of people that were obtained in all seasons, which will improve the correct operation of re-identification systems when the seasons change. Another PolReID1077 advantage is the video data use obtained from external and internal surveillance in a large number of different filming locations. Therefore, the people images in the created set are characterized by the variability of the background, brightness and color characteristics. Joining the created dataset with the existing CUHK02, CUHK03, Market-1501, DukeMTMC-ReID and MSMT17 sets made it possible to obtain 109 772 images for training. An increase in the variety of generated examples is achieved by applying a cyclic shift to them, eliminating color and replacing a fragment with a reduced copy of another image. The research results on estimating the accuracy of re-identification for the ResNet-50 and DenseNet-121 convolutional neural networks during their training, using the proposed approach to form a training sample, are presented.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>повторная идентификация людей</kwd><kwd>свёрточные нейронные сети</kwd><kwd>PolReID1077</kwd><kwd>машинное обучение</kwd><kwd>аугментация</kwd></kwd-group><kwd-group xml:lang="en"><kwd>person re-identification</kwd><kwd>convolutional neural networks</kwd><kwd>PolReID1077</kwd><kwd>machine learning</kwd><kwd>augmentation</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Shorten С., Taghi M. K. (2019) A Survey on Image Data Augmentation for Deep Learning. Journal of Big Data. (6), 1–48. DOI: 10.1186/s40537-019-0197-0.</mixed-citation><mixed-citation xml:lang="en">Shorten С., Taghi M. K. (2019) A Survey on Image Data Augmentation for Deep Learning. Journal of Big Data. (6), 1–48. DOI: 10.1186/s40537-019-0197-0.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Chen H., Ihnatsyeva S., Bohush R., Ablameyko S. (2022) Choice of Activation Function in Convolution Neural Network in Video Surveillance Systems. Programming and Computer Software. (5), 312–321. DOI: 10.1134/S0361768822050036.</mixed-citation><mixed-citation xml:lang="en">Chen H., Ihnatsyeva S., Bohush R., Ablameyko S. (2022) Choice of Activation Function in Convolution Neural Network in Video Surveillance Systems. Programming and Computer Software. (5), 312–321. DOI: 10.1134/S0361768822050036.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Wei L., Wang X. (2013) Locally Aligned Feature Transforms Across Views. 2013 IEEE Conference on Computer Vision and Pattern Recognition. 3594–3601. DOI: 10.1109/CVPR.2013.461.</mixed-citation><mixed-citation xml:lang="en">Wei L., Wang X. (2013) Locally Aligned Feature Transforms Across Views. 2013 IEEE Conference on Computer Vision and Pattern Recognition. 3594–3601. DOI: 10.1109/CVPR.2013.461.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Li W., Zhao R., Xiao T., Wang X. (2014) DeepReID: Deep Filter Pairing Neural Network for Person Re-Identification. 2014 IEEE Conference on Computer Vision and Pattern Recognition. 152–159. DOI: 10.1109/CVPR.2014.27.</mixed-citation><mixed-citation xml:lang="en">Li W., Zhao R., Xiao T., Wang X. (2014) DeepReID: Deep Filter Pairing Neural Network for Person Re-Identification. 2014 IEEE Conference on Computer Vision and Pattern Recognition. 152–159. DOI: 10.1109/CVPR.2014.27.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Zheng L., Shen L., Tian L., Wang S., Wang J., Tian Q. (2015) Scalable Person Re-Identification: a Benchmark. 2015 IEEE International Conference on Computer Vision. 1116–1124. DOI: 10.1109/ICCV.2015.133.</mixed-citation><mixed-citation xml:lang="en">Zheng L., Shen L., Tian L., Wang S., Wang J., Tian Q. (2015) Scalable Person Re-Identification: a Benchmark. 2015 IEEE International Conference on Computer Vision. 1116–1124. DOI: 10.1109/ICCV.2015.133.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Ristani E., Solera F., Zou R. S., Cucchiara R., Tomasi C. (2016) Performance Measures and a Data Set for Multi-Target, Multi-Camera Tracking. ECCV Workshops. DOI: 10.1007/978-3-319-48881-3_2.</mixed-citation><mixed-citation xml:lang="en">Ristani E., Solera F., Zou R. S., Cucchiara R., Tomasi C. (2016) Performance Measures and a Data Set for Multi-Target, Multi-Camera Tracking. ECCV Workshops. DOI: 10.1007/978-3-319-48881-3_2.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Wei L., Zhang S., Gao W., Tian Q. (2017) Person Transfer GAN to Bridge Domain Gap for Person Re-Identification. 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. 79–88. DOI: 10.1109/CVPR.2018.00016.</mixed-citation><mixed-citation xml:lang="en">Wei L., Zhang S., Gao W., Tian Q. (2017) Person Transfer GAN to Bridge Domain Gap for Person Re-Identification. 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. 79–88. DOI: 10.1109/CVPR.2018.00016.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Felzenszwalb P., Girshick R., McAllester D., Ramanan D. (2010) Object Detection with Discriminatively Trained Part-Based Models. PAMI. DOI: 10.1109/TPAMI.2009.167.</mixed-citation><mixed-citation xml:lang="en">Felzenszwalb P., Girshick R., McAllester D., Ramanan D. (2010) Object Detection with Discriminatively Trained Part-Based Models. PAMI. DOI: 10.1109/TPAMI.2009.167.</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Gong Y., Zeng Z. (2021) An Effective Data Augmentation for Person Re-Identification. ArXiv, abs/2101.08533. DOI: 10.48550/arXiv.2101.08533.</mixed-citation><mixed-citation xml:lang="en">Gong Y., Zeng Z. (2021) An Effective Data Augmentation for Person Re-Identification. ArXiv, abs/2101.08533. DOI: 10.48550/arXiv.2101.08533.</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Fu D., Chen D., Bao J., Yang H., Yuan L., Zhang L., Li H., Chen D. (2021) Unsupervised Pre-Training for Person Re-Identification. 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. 14745–14754. DOI: 10.1109/CVPR46437.2021.01451.</mixed-citation><mixed-citation xml:lang="en">Fu D., Chen D., Bao J., Yang H., Yuan L., Zhang L., Li H., Chen D. (2021) Unsupervised Pre-Training for Person Re-Identification. 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. 14745–14754. DOI: 10.1109/CVPR46437.2021.01451.</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Cubuk E. D., Zoph B., Shlens J., Le Q. V. (2020) Randaugment: Practical Automated Data Augmentation with a Reduced Search Space. 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops. 3008–3017. DOI: 10.1109/CVPRW50498.2020.00359.</mixed-citation><mixed-citation xml:lang="en">Cubuk E. D., Zoph B., Shlens J., Le Q. V. (2020) Randaugment: Practical Automated Data Augmentation with a Reduced Search Space. 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops. 3008–3017. DOI: 10.1109/CVPRW50498.2020.00359.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Hendrycks D., Mu N., Cubuk E. D., Zoph B., Gilmer J., Lakshminarayanan B. (2019) AugMix: a Simple Data Processing Method to Improve Robustness and Uncertainty. ArXiv, abs/1912.02781. DOI: 10.48550/arXiv.1912.02781.</mixed-citation><mixed-citation xml:lang="en">Hendrycks D., Mu N., Cubuk E. D., Zoph B., Gilmer J., Lakshminarayanan B. (2019) AugMix: a Simple Data Processing Method to Improve Robustness and Uncertainty. ArXiv, abs/1912.02781. DOI: 10.48550/arXiv.1912.02781.</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Zhang H., Cissй M., Dauphin Y., Lopez-Paz D. (2017) Mixup: Beyond Empirical Risk Minimization. ArXiv, abs/1710.09412. DOI: 10.48550/arXiv.1710.09412.</mixed-citation><mixed-citation xml:lang="en">Zhang H., Cissй M., Dauphin Y., Lopez-Paz D. (2017) Mixup: Beyond Empirical Risk Minimization. ArXiv, abs/1710.09412. DOI: 10.48550/arXiv.1710.09412.</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Zhong Z., Zheng L., Kang G., Li S., Yang Y. (2017) Random Erasing Data Augmentation. AAAI Conference on Artificial Intelligence. DOI: 10.1609/AAAI.V34I07.7000.</mixed-citation><mixed-citation xml:lang="en">Zhong Z., Zheng L., Kang G., Li S., Yang Y. (2017) Random Erasing Data Augmentation. AAAI Conference on Artificial Intelligence. DOI: 10.1609/AAAI.V34I07.7000.</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Yun S., Han D., Oh S., Chun S., Choe J., Yoo Y. J. (2019) CutMix: Regularization Strategy to Train Strong Classifiers with Localizable Features. 2019 IEEE/CVF International Conference on Computer Vision. 6022– 6031. DOI: 10.1109/ICCV.2019.00612.</mixed-citation><mixed-citation xml:lang="en">Yun S., Han D., Oh S., Chun S., Choe J., Yoo Y. J. (2019) CutMix: Regularization Strategy to Train Strong Classifiers with Localizable Features. 2019 IEEE/CVF International Conference on Computer Vision. 6022– 6031. DOI: 10.1109/ICCV.2019.00612.</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Xie T., Cheng X., Wang X., Liu M., Deng J., Zhou T., Liu M. (2021) Cut-Thumbnail: a Novel Data Augmentation for Convolutional Neural Network. Proceedings of the 29th ACM International Conference on Multimedia. DOI: 10.1145/3474085.3475302.</mixed-citation><mixed-citation xml:lang="en">Xie T., Cheng X., Wang X., Liu M., Deng J., Zhou T., Liu M. (2021) Cut-Thumbnail: a Novel Data Augmentation for Convolutional Neural Network. Proceedings of the 29th ACM International Conference on Multimedia. DOI: 10.1145/3474085.3475302.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
