<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">ellibs</journal-id><journal-title-group><journal-title xml:lang="ru">Электронные библиотеки</journal-title><trans-title-group xml:lang="en"><trans-title>Russian Digital Libraries Journal</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">1562-5419</issn><publisher><publisher-name>Казанский (Приволжский) федеральный университет</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.26907/1562-5419-2020-23-6-1155-1171</article-id><article-id custom-type="elpub" pub-id-type="custom">ellibs-254</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>Статьи</subject></subj-group></article-categories><title-group><article-title>Определение дефектов на стальных листах с использованием сверточных нейронных сетей</article-title><trans-title-group xml:lang="en"><trans-title>Steel Defects Analysis Using CNN (Convolutional Neural Networks)</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Гаскаров</surname><given-names>Р. Д.</given-names></name><name name-style="western" xml:lang="en"><surname>Gaskarov</surname><given-names>R. D.</given-names></name></name-alternatives><email xlink:type="simple">komnatakita@gmail.com</email></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Бирюков</surname><given-names>А. М.</given-names></name><name name-style="western" xml:lang="en"><surname>Biryukov</surname><given-names>A. M.</given-names></name></name-alternatives><email xlink:type="simple">herou.public@gmail.com</email></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Никонов</surname><given-names>А.</given-names></name><name name-style="western" xml:lang="en"><surname>Nikonov</surname><given-names>A. F.</given-names></name></name-alternatives><email xlink:type="simple">nikonowalex@gmail.com</email></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Агниашвили</surname><given-names>Д. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Agniashvili</surname><given-names>D. V.</given-names></name></name-alternatives><email xlink:type="simple">daniilak@gmail.com</email></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Хайрисламов</surname><given-names>Д. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Khayrislamov</surname><given-names>D. A.</given-names></name></name-alternatives><email xlink:type="simple">danilhayrislamov@gmail.com</email></contrib></contrib-group><pub-date pub-type="collection"><year>2020</year></pub-date><pub-date pub-type="epub"><day>28</day><month>12</month><year>2020</year></pub-date><volume>23</volume><issue>6</issue><fpage>1155</fpage><lpage>1171</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Гаскаров Р.Д., Бирюков А.М., Никонов A.А., Агниашвили Д.В., Хайрисламов  Д.А., 2020</copyright-statement><copyright-year>2020</copyright-year><copyright-holder xml:lang="ru">Гаскаров Р.Д., Бирюков А.М., Никонов A.А., Агниашвили Д.В., Хайрисламов  Д.А.</copyright-holder><copyright-holder xml:lang="en">Gaskarov R.D., Biryukov A.M.,  Nikonov A.F.,  Agniashvili D.V., Khayrislamov D.A.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://ellibs.elpub.ru/jour/article/view/254">https://ellibs.elpub.ru/jour/article/view/254</self-uri><abstract><p>Сталь в наши дни является одним из важнейших производственных материалов, который используется повсеместно, от медицины до промышленных отраслей. Своевременное обнаружение и распознавание дефектов на стальных листах после проката – одна из ключевых проблем этого производства с учетом его сложности и необходимости затрат большого количества времени на проведение вручную проверок каждого листа и каждой заготовки. Одними из целей настоящей работы были автоматизация и упрощение данного процесса. Для решения соответствующих задач была использована, в первую очередь, модель сверточной нейронной сети под названием UNet, которая уже зарекомендовала себя как отличный инструмент решения таких задач — при высокой результативности она требует меньшего количества учебных данных. В основе этой модели лежат последовательная, производимая в несколько шагов свертка изображения до приемлемого размера (иными словами, сжатие или кодирование), а затем развертка, восстановление изображения к исходному размеру и соотношению сторон, после чего на выходе будет получена маска изображения с классами элементов, которые необходимо было найти. В дополнение к этой нейронной сети в качестве кодирующего (сворачивающего) слоя была использована другая модель — ResNet34, предварительно обученная на датасете (наборе данных) ImageNet1000. В этой модели также был модифицирован выходной слой — вместо 34 слоев с классами на выходе возвращалось лишь 4, что сократило время обработки и позволило использовать наиболее удачные определения в результатах. Используя данный подход и проведя все необходимые проверки, при подведении итогов, мы получили результат в 94,8% точности определения дефектов на стальных листах.
</p></abstract><trans-abstract xml:lang="en"><p>Steel is one of the most important bulk materials these days. It is used almost everywhere - from medicine to industry. Detecting this material's defects is one of the most challenging problems for industries worldwide. This process is also manual and time-consuming. Through this study we tried to automate this process. A convolutional neural network model UNet was used for this task for more accurate segmentation with less training image data set for our model. The essence of this NN (neural network) is in step-by-step convolution of every image (encoding) and then stretching them to initial resolution, consequently getting a mask of an image with various classes on it. The foremost modification is changing an input image's size to 128x800 px resolution (original images in dataset are 256x1600 px) because of GPU memory size's limitation. Secondly, we used ResNet34 CNN (convolutional neural network) as encoder, which was pre-trained on ImageNet1000 dataset with modified output layer - it shows 4 layers instead of 34. After running tests of this model, we obtained 92.7% accuracy using images of hot-rolled steel sheets.
</p></trans-abstract><kwd-group xml:lang="ru"><kwd>сверточные нейронные сети</kwd><kwd>нейронные сети</kwd><kwd>машинное обучение</kwd><kwd>сталь</kwd><kwd>искусственный интеллект</kwd><kwd>определение дефектов</kwd><kwd>сегментация</kwd><kwd>классификация</kwd></kwd-group><kwd-group xml:lang="en"><kwd>UNet</kwd><kwd>ResNet</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Stavropoulos P. et al. Monitoring and control of manufacturing processes: A review // Procedia CIRP. 2013. V. 8. P. 421–425.</mixed-citation><mixed-citation xml:lang="en">Stavropoulos P. et al. Monitoring and control of manufacturing processes: A review // Procedia CIRP. 2013. V. 8. P. 421–425.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Chao W. and al. Research on Classification of Surface Defects of Hot-rolled Steel Strip Based on Deep Learning // DEStech Transactions on Computer Science and Engineering. 2019. 2nd International Conference on Informatics, Control and Auto-mation (ICA 2019). 2019. P. 362–366.</mixed-citation><mixed-citation xml:lang="en">Chao W. and al. Research on Classification of Surface Defects of Hot-rolled Steel Strip Based on Deep Learning // DEStech Transactions on Computer Science and Engineering. 2019. 2nd International Conference on Informatics, Control and Auto-mation (ICA 2019). 2019. P. 362–366.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Li J. and al. Real-time detection of steel strip surface defects based on im-proved yolo detection network // IFAC-PapersOnLine. 2018. V. 51, No. 21. P. 76–81.</mixed-citation><mixed-citation xml:lang="en">Li J. and al. Real-time detection of steel strip surface defects based on im-proved yolo detection network // IFAC-PapersOnLine. 2018. V. 51, No. 21. P. 76–81.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Zhang Z., Zhang S., Li Q. Online Surface Defects Detection System for Cold-rolled Steel Strip // Recent Patents on Engineering. 2017. V. 11, No. 1. P. 62–67.</mixed-citation><mixed-citation xml:lang="en">Zhang Z., Zhang S., Li Q. Online Surface Defects Detection System for Cold-rolled Steel Strip // Recent Patents on Engineering. 2017. V. 11, No. 1. P. 62–67.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">He K. and al. Mask r-cnn // Proceedings of the IEEE international conference on computer vision, 2017. P. 2961–2969.</mixed-citation><mixed-citation xml:lang="en">He K. and al. Mask r-cnn // Proceedings of the IEEE international conference on computer vision, 2017. P. 2961–2969.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Ren S. and al. Faster r-cnn: Towards real-time object detection with region proposal networks // Advances in Neural Information Processing Systems, 2015. P. 91–99.</mixed-citation><mixed-citation xml:lang="en">Ren S. and al. Faster r-cnn: Towards real-time object detection with region proposal networks // Advances in Neural Information Processing Systems, 2015. P. 91–99.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Shang W. and al. Understanding and improving convolutional neural net-works via concatenated rectified linear units // International Conference on Machine Learning, 2016. P. 2217–2225.</mixed-citation><mixed-citation xml:lang="en">Shang W. and al. Understanding and improving convolutional neural net-works via concatenated rectified linear units // International Conference on Machine Learning, 2016. P. 2217–2225.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Ferguson M.K. and al. Detection and segmentation of manufacturing defects with convolutional neural networks and transfer learning // Smart and Sustainable Manufacturing Systems. 2018. V. 2. arXiv:1808.02518 [cs.CV]</mixed-citation><mixed-citation xml:lang="en">Ferguson M.K. and al. Detection and segmentation of manufacturing defects with convolutional neural networks and transfer learning // Smart and Sustainable Manufacturing Systems. 2018. V. 2. arXiv:1808.02518 [cs.CV]</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Ronneberger O., Fischer P., Brox T. U-net: Convolutional networks for bio-medical image segmentation // International Conference on Medical Image Compu-ting and Computer-Assisted Intervention. Springer, Cham, 2015. P. 234–241.</mixed-citation><mixed-citation xml:lang="en">Ronneberger O., Fischer P., Brox T. U-net: Convolutional networks for bio-medical image segmentation // International Conference on Medical Image Compu-ting and Computer-Assisted Intervention. Springer, Cham, 2015. P. 234–241.</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Wu Z., Shen C., Van Den Hengel A. Wider or deeper: Revisiting the resnet model for visual recognition // Pattern Recognition. 2019. V. 90. P. 119–133.</mixed-citation><mixed-citation xml:lang="en">Wu Z., Shen C., Van Den Hengel A. Wider or deeper: Revisiting the resnet model for visual recognition // Pattern Recognition. 2019. V. 90. P. 119–133.</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">He K. and al. Deep residual learning for image recognition // Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 2016. P. 770–778.</mixed-citation><mixed-citation xml:lang="en">He K. and al. Deep residual learning for image recognition // Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 2016. P. 770–778.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Ronneberger O., Fischer P., Brox T. U-net: Convolutional networks for bio-medical image segmentation // International Conference on Medical Image Compu-ting and Computer-Assisted Intervention. Springer, Cham, 2015. P. 234–241.</mixed-citation><mixed-citation xml:lang="en">Ronneberger O., Fischer P., Brox T. U-net: Convolutional networks for bio-medical image segmentation // International Conference on Medical Image Compu-ting and Computer-Assisted Intervention. Springer, Cham, 2015. P. 234–241.</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Salehi S.S.M., Erdogmus D., Gholipour A. Tversky loss function for image segmentation using 3D fully convolutional deep networks // International Workshop on Machine Learning in Medical Imaging. Springer, Cham, 2017. P. 379–387.</mixed-citation><mixed-citation xml:lang="en">Salehi S.S.M., Erdogmus D., Gholipour A. Tversky loss function for image segmentation using 3D fully convolutional deep networks // International Workshop on Machine Learning in Medical Imaging. Springer, Cham, 2017. P. 379–387.</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Milletari F., Navab N., Ahmadi S.A. V-net: Fully convolutional neural net-works for volumetric medical image segmentation // 2016 Fourth International Con-ference on 3D Vision (3DV). IEEE, 2016. P. 565–571.</mixed-citation><mixed-citation xml:lang="en">Milletari F., Navab N., Ahmadi S.A. V-net: Fully convolutional neural net-works for volumetric medical image segmentation // 2016 Fourth International Con-ference on 3D Vision (3DV). IEEE, 2016. P. 565–571.</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Wang P., Chung A.C.S. Focal dice loss and image dilation for brain tumor segmentation // Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support. Springer, Cham, 2018. P. 119–127.</mixed-citation><mixed-citation xml:lang="en">Wang P., Chung A.C.S. Focal dice loss and image dilation for brain tumor segmentation // Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support. Springer, Cham, 2018. P. 119–127.</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Sudre C.H. and al. Generalised dice overlap as a deep learning loss function for highly unbalanced segmentations // Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support. Springer, Cham, 2017. P. 240–248.</mixed-citation><mixed-citation xml:lang="en">Sudre C.H. and al. Generalised dice overlap as a deep learning loss function for highly unbalanced segmentations // Deep Learning in Medical Image Analysis and Multimodal Learning for Clinical Decision Support. Springer, Cham, 2017. P. 240–248.</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Sitdikov V.D. and al. Application of X-ray Technique to Study the Structure of Ultrafine-Grained Ferritic/Martensitic Steel // J. of Materials Engineering and Per-formance. 2019. V. 28, No. 11. P. 7109–7118.</mixed-citation><mixed-citation xml:lang="en">Sitdikov V.D. and al. Application of X-ray Technique to Study the Structure of Ultrafine-Grained Ferritic/Martensitic Steel // J. of Materials Engineering and Per-formance. 2019. V. 28, No. 11. P. 7109–7118.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
