<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">ellibs</journal-id><journal-title-group><journal-title xml:lang="ru">Электронные библиотеки</journal-title><trans-title-group xml:lang="en"><trans-title>Russian Digital Libraries Journal</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">1562-5419</issn><publisher><publisher-name>Казанский (Приволжский) федеральный университет</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.26907/1562-5419-2023-26-4-466-482</article-id><article-id custom-type="elpub" pub-id-type="custom">ellibs-384</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>Статьи</subject></subj-group></article-categories><title-group><article-title>Cистема контролируемой генерации лица, построенная с использованием сети StyleGAN2</article-title><trans-title-group xml:lang="en"><trans-title>Controlled Face Generation System using StyleGAN2 Neural Network</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Исангулов</surname><given-names>М. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Isangulov</surname><given-names>M.</given-names></name></name-alternatives><email xlink:type="simple">marathon.our@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Миннеахметов</surname><given-names>Р. Р.</given-names></name><name name-style="western" xml:lang="en"><surname>Minneakhmetov</surname><given-names>R.</given-names></name></name-alternatives><email xlink:type="simple">razil0071999@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Хамеджанов</surname><given-names>А. Р.</given-names></name><name name-style="western" xml:lang="en"><surname>Khamedzhanov</surname><given-names>A.</given-names></name></name-alternatives><email xlink:type="simple">hamedzhanovalmaz@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Хафизьянов</surname><given-names>Т. Р.</given-names></name><name name-style="western" xml:lang="en"><surname>Khafizyanov</surname><given-names>T.</given-names></name></name-alternatives><email xlink:type="simple">hamstertima@gmail.com</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Пашаев</surname><given-names>Э. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Pashaev</surname><given-names>E.</given-names></name></name-alternatives><email xlink:type="simple">emil.p.mail@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Калимуллин</surname><given-names>Э. Р.</given-names></name><name name-style="western" xml:lang="en"><surname>Kalimullin</surname><given-names>E.</given-names></name></name-alternatives><email xlink:type="simple">erik182182@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Казанский (Приволжский) Федеральный университет</institution></aff><aff xml:lang="en"><institution>Kazan (Volga region) Federal University</institution></aff></aff-alternatives><aff xml:lang="ru" id="aff-2"><institution>Казанский (Приволжский) Федеральный университет</institution><country>Russian Federation</country></aff><pub-date pub-type="collection"><year>2023</year></pub-date><pub-date pub-type="epub"><day>28</day><month>08</month><year>2023</year></pub-date><volume>26</volume><issue>4</issue><fpage>466</fpage><lpage>482</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Исангулов М.В., Миннеахметов Р.Р., Хамеджанов А.Р., Хафизьянов Т.Р., Пашаев Э.А., Калимуллин Э.Р., 2023</copyright-statement><copyright-year>2023</copyright-year><copyright-holder xml:lang="ru">Исангулов М.В., Миннеахметов Р.Р., Хамеджанов А.Р., Хафизьянов Т.Р., Пашаев Э.А., Калимуллин Э.Р.</copyright-holder><copyright-holder xml:lang="en">Isangulov M., Minneakhmetov R., Khamedzhanov A., Khafizyanov T., Pashaev E., Kalimullin E.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://ellibs.elpub.ru/jour/article/view/384">https://ellibs.elpub.ru/jour/article/view/384</self-uri><abstract><p>Представлен новый подход к контролируемой генерации лиц, использующий генеративные модели с открытым исходным кодом, включая StyleGAN2 и Гребневую регрессию. Разработана методология, расширяющая возможности StyleGAN2 для контроля характеристик лиц, таких как возраст, раса, пол, выражение лица и атрибуты волос, а также использован обширный набор данных человеческих лиц с аннотациями атрибутов. Лица закодированы в 256-мерном латентном пространстве с использованием кодировщика StyleGAN2, что привело к набору характерных латентных кодов. Применен алгоритм t-SNE для кластеризации этих кодов на основе признаков, продемонстрирована возможность контроля генерации лиц, впоследствии обучены модели регрессии Риджа для каждого измерения латентных кодов с использованием размеченных признаков. При декодировании с использованием StyleGAN2 полученные коды успешно восстанавливали изображения лиц, сохраняя связь с входными признаками. Разработанный подход дает легкий и эффективный способ контролируемой генерации лиц с использованием существующих генеративных моделей, таких как StyleGAN2, и открывает новые возможности для различных областей применения.
</p></abstract><trans-abstract xml:lang="en"><p>A novel approach to supervised face generation using open-source generative models including StyleGAN2 and Ridge Regression is presented. A methodology that extends StyleGAN2 to control facial characteristics such as age, race, gender, facial expression, and hair attributes is developed, and an extensive dataset of human faces with attribute annotations is utilized. The faces were encoded in 256-dimensional latent space using the StyleGAN2 encoder, resulting in a set of characteristic latent codes. We applied the t-SNE algorithm to cluster these feature-based codes, demonstrated the ability to control face generation, and subsequently trained Ridge regression models for each dimension of the latent codes using the labeled features. When decoded using StyleGAN2, the resulting codes successfully reconstructed face images while maintaining the association with the input features. The developed approach provides an easy and efficient way to supervised face generation using existing generative models such as StyleGAN2, and opens up new possibilities for different application areas.
</p></trans-abstract><kwd-group xml:lang="ru"><kwd>машинное обучение</kwd><kwd>генерация лица</kwd><kwd>энкодер</kwd><kwd>декодер</kwd><kwd>скрытые коды</kwd><kwd>отображение признаков</kwd><kwd>гребневая регрессия</kwd></kwd-group><kwd-group xml:lang="en"><kwd>StyleGan</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Xia W., Zhang Y., Yang Y., Xue J.-H., Zhou B., Yang M.-H. GAN Inversion: A Survey. ArXiv210105278 Cs. 2022. URL: http://arxiv.org/abs/2101.05278</mixed-citation><mixed-citation xml:lang="en">Xia W., Zhang Y., Yang Y., Xue J.-H., Zhou B., Yang M.-H. GAN Inversion: A Survey. ArXiv210105278 Cs. 2022. URL: http://arxiv.org/abs/2101.05278</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Bishop C. Pattern Recognition and Machine Learning. Information Science and Statistics. 2006. URL: https://link.springer.com/book/9780387310732</mixed-citation><mixed-citation xml:lang="en">Bishop C. Pattern Recognition and Machine Learning. Information Science and Statistics. 2006. URL: https://link.springer.com/book/9780387310732</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Karras T., Laine S., Aila T. A Style-Based Generator Architecture for Generative Adversarial Networks. ArXiv181204948 Cs Stat. 2019. URL: http://arxiv.org/abs/1812.04948</mixed-citation><mixed-citation xml:lang="en">Karras T., Laine S., Aila T. A Style-Based Generator Architecture for Generative Adversarial Networks. ArXiv181204948 Cs Stat. 2019. URL: http://arxiv.org/abs/1812.04948</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Karras T., Hellsten J et al. Analyzing and Improving the Image Quality of StyleGAN. arXiv:1912.04958 Cs. 2019. URL: https://arxiv.org/pdf/1912.04958.pdf</mixed-citation><mixed-citation xml:lang="en">Karras T., Hellsten J et al. Analyzing and Improving the Image Quality of StyleGAN. arXiv:1912.04958 Cs. 2019. URL: https://arxiv.org/pdf/1912.04958.pdf</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Kryuchkov M., Khanzhina N., Osmakov I., Ulyanov P. CT images GAN-based augmentation with AdaIN for lung nodules detection // Proceedings of SPIE – The International Society for Optical Engineering: 13, Rome, 02–06 November 2020. Rome, 2020. P. 1160526. https://doi.org/10.1117/12.2587940–EDN JYZOEO.</mixed-citation><mixed-citation xml:lang="en">Kryuchkov M., Khanzhina N., Osmakov I., Ulyanov P. CT images GAN-based augmentation with AdaIN for lung nodules detection // Proceedings of SPIE – The International Society for Optical Engineering: 13, Rome, 02–06 November 2020. Rome, 2020. P. 1160526. https://doi.org/10.1117/12.2587940–EDN JYZOEO.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Huang G., Ramesh M., Berg T., Learned-Miller E. Labeled Faces in the Wild: A Database for Studying Face Recognition in Unconstrained Environments. University of Massachusetts, Amherst, Technical Report 07-49. 2018. URL: http://vis-www.cs.umass.edu/lfw/</mixed-citation><mixed-citation xml:lang="en">Huang G., Ramesh M., Berg T., Learned-Miller E. Labeled Faces in the Wild: A Database for Studying Face Recognition in Unconstrained Environments. University of Massachusetts, Amherst, Technical Report 07-49. 2018. URL: http://vis-www.cs.umass.edu/lfw/</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Viola P., Jones M. Robust Real-time Object Detection. Second international workshop on statistical and computational theories of vision. 2001. URL: https://www.cs.cmu.edu/~efros/courses/LBMV07/Papers</mixed-citation><mixed-citation xml:lang="en">Viola P., Jones M. Robust Real-time Object Detection. Second international workshop on statistical and computational theories of vision. 2001. URL: https://www.cs.cmu.edu/~efros/courses/LBMV07/Papers</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Ledig C., Theis L. et al. Photo-realistic single image super-resolution using a generative adversarial network. ArXiv:1609.04802v5 Cs. 2016. URL: https://arxiv.org/pdf/1609.04802v5.pdf</mixed-citation><mixed-citation xml:lang="en">Ledig C., Theis L. et al. Photo-realistic single image super-resolution using a generative adversarial network. ArXiv:1609.04802v5 Cs. 2016. URL: https://arxiv.org/pdf/1609.04802v5.pdf</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Goar V., Kuri M., Kumar R., Senjyu T. Data Compression and Visualization Using PCA and T-SNE. Advances in Information Communication Technology and Computing. 2019. URL: https://www.researchgate.net/publication/344000619_Data_Compression_ and_Visualization_Using_PCA_and_T-SNE</mixed-citation><mixed-citation xml:lang="en">Goar V., Kuri M., Kumar R., Senjyu T. Data Compression and Visualization Using PCA and T-SNE. Advances in Information Communication Technology and Computing. 2019. URL: https://www.researchgate.net/publication/344000619_Data_Compression_ and_Visualization_Using_PCA_and_T-SNE</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Kolo B. Binary and Multiclass Classification. Weatherford Press. 2010. URL: https://www.amazon.com/Binary-Multiclass-Classification-Brian-Kolo/dp/1615800131</mixed-citation><mixed-citation xml:lang="en">Kolo B. Binary and Multiclass Classification. Weatherford Press. 2010. URL: https://www.amazon.com/Binary-Multiclass-Classification-Brian-Kolo/dp/1615800131</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Rawlings J., Pantula S., Dickey D. Polynomial Regression. Applied Regression Analysis. 1998. URL: https://link.springer.com/chapter/10.1007/0-387-22753-9_8</mixed-citation><mixed-citation xml:lang="en">Rawlings J., Pantula S., Dickey D. Polynomial Regression. Applied Regression Analysis. 1998. URL: https://link.springer.com/chapter/10.1007/0-387-22753-9_8</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Козина Н. И., Шиян Н. В., Чалченко М. Р. Современные достижения в области генерации изображений на примере нейронной сети MIDJOURNEY // Сборник материалов XVI-ой международной очно-заочной научно-практической конференции. М.: Научно-издательский центр «Империя», 2023. С. 121–125.</mixed-citation><mixed-citation xml:lang="en">Козина Н. И., Шиян Н. В., Чалченко М. Р. Современные достижения в области генерации изображений на примере нейронной сети MIDJOURNEY // Сборник материалов XVI-ой международной очно-заочной научно-практической конференции. М.: Научно-издательский центр «Империя», 2023. С. 121–125.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
