<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">ellibs</journal-id><journal-title-group><journal-title xml:lang="ru">Электронные библиотеки</journal-title><trans-title-group xml:lang="en"><trans-title>Russian Digital Libraries Journal</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">1562-5419</issn><publisher><publisher-name>Казанский (Приволжский) федеральный университет</publisher-name></publisher></journal-meta><article-meta><article-id custom-type="elpub" pub-id-type="custom">ellibs-713</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>Статьи</subject></subj-group></article-categories><title-group><article-title>Метод автоматической классификации полнотекстовых описаний кернов с использованием словарей</article-title><trans-title-group xml:lang="en"><trans-title>Method for Automatic Classification of Full-Text Descriptions of Cores Using Dictionaries</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Антонов</surname><given-names>Алексей Петрович</given-names></name><name name-style="western" xml:lang="en"><surname>Antonov</surname><given-names>Alexey Petrovich</given-names></name></name-alternatives><email xlink:type="simple">alexey.p.antonov@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Афонин</surname><given-names>Сергей Александрович</given-names></name><name name-style="western" 
xml:lang="en"><surname>Afonin</surname><given-names>Sergey Alexandrovich</given-names></name></name-alternatives><email xlink:type="simple">serg@msu.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Козицын</surname><given-names>Александр Сергеевич</given-names></name><name name-style="western" xml:lang="en"><surname>Kozytsyn</surname><given-names>Alexander Sergeevich</given-names></name></name-alternatives><email xlink:type="simple">alexanderkz@mail.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Староверов</surname><given-names>Владимир Михайлович</given-names></name><name name-style="western" xml:lang="en"><surname>Staroverov</surname><given-names>Vladimir Mikhailovich</given-names></name></name-alternatives><email xlink:type="simple">staroverovvl@yandex.ru</email><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Московский государственный университет имени М. В. 
Ломоносова</institution></aff><aff xml:lang="en"><institution>Lomonosov Moscow State University</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>04</day><month>03</month><year>2026</year></pub-date><volume>29</volume><issue>1</issue><fpage>3</fpage><lpage>23</lpage><permissions><copyright-statement>Copyright © Антонов А.П., Афонин С.А., Козицын А.С., Староверов В.М., 2026</copyright-statement><copyright-year>2026</copyright-year><copyright-holder xml:lang="ru">Антонов А.П., Афонин С.А., Козицын А.С., Староверов В.М.</copyright-holder><copyright-holder xml:lang="en">Antonov A.P., Afonin S.A., Kozytsyn A.S., Staroverov V.M.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://ellibs.elpub.ru/jour/article/view/713">https://ellibs.elpub.ru/jour/article/view/713</self-uri><abstract><p>Использование методов автоматической обработки текстов, в том числе методов классификации полнотекстовых описаний, позволяет достичь существенного снижения трудозатрат при обработке экспериментальных данных. В настоящей работе рассмотрено применение метода автоматической классификации текстов в области обработки и классификации элементов керна и определения литофаций. Литофациями называют одновозрастные геологические тела (отложения), которые по своему составу или строению отличаются от соседних слоев.


При проведении оценки нефтегазового потенциала месторождений требуется выполнять построение карт и схем распространения литофаций. Для этого необходимо осуществить классификацию большого количества полнотекстовых описаний участков керна, выполненных специалистами. Алгоритм, представленный в статье, позволяет на основе заданных правил и словарей провести классификацию с учетом порядка и значимости ключевых слов в предложениях. Преимуществами такого подхода являются возможность различать близкие литофации, возможность использования архивных данных, простота настройки на новые классы, адаптация к русскоязычным описаниям кернов и возможность локального использования без необходимости передавать описания кернов сторонним приложениям.
</p></abstract><trans-abstract xml:lang="en"><p>Automatic text processing methods, including methods for classifying full-text descriptions, can significantly reduce labor costs when processing experimental data. This paper discusses the application of an automatic text classification method to processing and classifying core elements and determining lithofacies. Lithofacies are coeval geological bodies (deposits) that differ in composition or structure from adjacent layers. Assessing the oil and gas potential of fields requires constructing maps and diagrams of lithofacies distribution. This, in turn, requires classifying a large number of full-text descriptions of core sections prepared by specialists. The algorithm presented in this article uses specified rules and dictionaries to perform the classification, taking into account the order and significance of keywords in sentences. The advantages of this approach are the ability to distinguish between similar lithofacies, the ability to use archival data, ease of adjustment to new classes, adaptation to Russian-language core descriptions, and the possibility of local use without the need to transfer core descriptions to third-party applications.
</p></trans-abstract><kwd-group xml:lang="ru"><kwd>классификация текстов</kwd><kwd>литофации</kwd><kwd>словари</kwd><kwd>информационные системы</kwd></kwd-group><kwd-group xml:lang="en"><kwd>text classification</kwd><kwd>lithofacies</kwd><kwd>dictionaries</kwd><kwd>information systems</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Iskusstvennyi intellekt v neftegazovoi industrii Kitaia. URL: https://nntc.pro/tpost/h2hoet4se1-iskusstvennii-intellekt-v-neftegazovoi-i (data obrashcheniia: 11.12.2025)</mixed-citation><mixed-citation xml:lang="en">Iskusstvennyi intellekt v neftegazovoi industrii Kitaia. URL: https://nntc.pro/tpost/h2hoet4se1-iskusstvennii-intellekt-v-neftegazovoi-i (data obrashcheniia: 11.12.2025)</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Antonov A.P., Afonin S.A., Kozitsyn A.S. i dr. Avtomatizirovannoe postroenie realistichnykh litofatsialnykh kart metodami kombinatornoi optimizatsii // Intellektualnye sistemy. Teoriia i prilozheniia. 2024. Vol. 28, № 4. S. 5–20.</mixed-citation><mixed-citation xml:lang="en">Antonov A.P., Afonin S.A., Kozitsyn A.S. i dr. Avtomatizirovannoe postroenie realistichnykh litofatsialnykh kart metodami kombinatornoi optimizatsii // Intellektualnye sistemy. Teoriia i prilozheniia. 2024. Vol. 28, № 4. S. 5–20.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Informatsionnaia sistema ABAI. URL: https://kmge.kz/abai/ (11.12.2025)</mixed-citation><mixed-citation xml:lang="en">Informatsionnaia sistema ABAI. URL: https://kmge.kz/abai/ (11.12.2025)</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Baraboshkin E.E., Panchenko E.A., Demidov A.E. i dr. 
Sistema avtomaticheskogo opisaniia kerna v proizvodstvennom protsesse. Opyt primeneniia // Puti realizatsii neftegazovogo potentsiala Zapadnoi Sibiri: Materialy XXV nauchno-prakticheskoi konferentsii, Khanty-Mansiisk, 23–26 noiabria 2021 goda / Pod redaktsiei E.A. Vtorushinoi, E.E. Oksenoid, S.A. Aleshina, N.N. Zakharchenko, E.V. Oleinik, T.N. Pecherina. Khanty-Mansiisk: Avtonomnoe uchrezhdenie Khanty-Mansiiskogo avtonomnogo okruga – Iugry "Nauchno-analiticheskii tsentr ratsionalnogo nedropolzovaniia im.V.I.Shpilmana", 2022. S. 293–299.</mixed-citation><mixed-citation xml:lang="en">Baraboshkin E.E., Panchenko E.A., Demidov A.E. i dr. Sistema avtomaticheskogo opisaniia kerna v proizvodstvennom protsesse. Opyt primeneniia // Puti realizatsii neftegazovogo potentsiala Zapadnoi Sibiri: Materialy XXV nauchno-prakticheskoi konferentsii, Khanty-Mansiisk, 23–26 noiabria 2021 goda / Pod redaktsiei E.A. Vtorushinoi, E.E. Oksenoid, S.A. Aleshina, N.N. Zakharchenko, E.V. Oleinik, T.N. Pecherina. Khanty-Mansiisk: Avtonomnoe uchrezhdenie Khanty-Mansiiskogo avtonomnogo okruga – Iugry "Nauchno-analiticheskii tsentr ratsionalnogo nedropolzovaniia im.V.I.Shpilmana", 2022. S. 293–299.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Kompleks DHD. URL: https://magazine.neftegaz.ru/articles/tsifrovizatsiya/682038-tsifrovoy-analiz-kerna-v-zadachakh-proektirovaniya-razrabotki-neftyanykh-i-gazovykh-mestorozhdeniy-/ (11.12.2025)</mixed-citation><mixed-citation xml:lang="en">Kompleks DHD. URL: https://magazine.neftegaz.ru/articles/tsifrovizatsiya/682038-tsifrovoy-analiz-kerna-v-zadachakh-proektirovaniya-razrabotki-neftyanykh-i-gazovykh-mestorozhdeniy-/ (11.12.2025)</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Programmnyi kompleks "Tsifrovoi kern". 
URL: https://globalcio.ru/projects/10448/ (11.12.2025)</mixed-citation><mixed-citation xml:lang="en">Programmnyi kompleks "Tsifrovoi kern". URL: https://globalcio.ru/projects/10448/ (11.12.2025)</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Aristov A.I., Zelenin A.V., Katanov Iu.E. Neirosetevoe raspoznavanie teksturnykh osobennostei graficheskikh kernovykh dannykh. Svidetelstvo o registratsii programmy dlia EVM RU 2024615647, 11.03.2024. Zaiavka № 2024614650 11.03.2024.</mixed-citation><mixed-citation xml:lang="en">Aristov A.I., Zelenin A.V., Katanov Iu.E. Neirosetevoe raspoznavanie teksturnykh osobennostei graficheskikh kernovykh dannykh. Svidetelstvo o registratsii programmy dlia EVM RU 2024615647, 11.03.2024. Zaiavka № 2024614650 11.03.2024.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Li H, Wan B, Chu D, Wang R, Ma G, Fu J, Xiao Z. Progressive Geological Modeling and Uncertainty Analysis Using Machine Learning // ISPRS International Journal of Geo-Information. 2023. Vol. 12(3). 97. https://doi.org/10.3390/ijgi12030097</mixed-citation><mixed-citation xml:lang="en">Li H, Wan B, Chu D, Wang R, Ma G, Fu J, Xiao Z. Progressive Geological Modeling and Uncertainty Analysis Using Machine Learning // ISPRS International Journal of Geo-Information. 2023. Vol. 12(3). 97. https://doi.org/10.3390/ijgi12030097</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Khimulia V.V. Primenenie tekhnologii tsifrovogo analiza kerna dlia izucheniia filtratsionno-emkostnykh svoistv i struktury vysokopronitsaemykh porod podzemnykh khranilishch gaza // RJES. 2024. №5. S. 1–15. URL: https://rjes.ru/temp/fddc89c0f81314f3d14bad3446565446.pdf (11.12.2025).</mixed-citation><mixed-citation xml:lang="en">Khimulia V.V. 
Primenenie tekhnologii tsifrovogo analiza kerna dlia izucheniia filtratsionno-emkostnykh svoistv i struktury vysokopronitsaemykh porod podzemnykh khranilishch gaza // RJES. 2024. №5. S. 1–15. URL: https://rjes.ru/temp/fddc89c0f81314f3d14bad3446565446.pdf (11.12.2025).</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Fuentes I., Padarian J., Iwanaga T., Vervoort R.W., 3D Lithological mapping of borehole descriptions using word embeddings // Computers &amp; Geosciences. 2020. Vol. 141. 104516. https://doi.org/10.1016/j.cageo.2020.104516 URL: https://www.sciencedirect.com/science/article/pii/S0098300419306533</mixed-citation><mixed-citation xml:lang="en">Fuentes I., Padarian J., Iwanaga T., Vervoort R.W., 3D Lithological mapping of borehole descriptions using word embeddings // Computers &amp; Geosciences. 2020. Vol. 141. 104516. https://doi.org/10.1016/j.cageo.2020.104516 URL: https://www.sciencedirect.com/science/article/pii/S0098300419306533</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Padarian J., Fuentes I. Word embeddings for application in geosciences: development, evaluation, and examples of soil-related concepts // SOIL. 2019. Vol. 5. P. 177–187. https://doi.org/10.5194/soil-5-177-2019, 2019. URL: https://soil.copernicus.org/articles/5/177/2019/</mixed-citation><mixed-citation xml:lang="en">Padarian J., Fuentes I. Word embeddings for application in geosciences: development, evaluation, and examples of soil-related concepts // SOIL. 2019. Vol. 5. P. 177–187. https://doi.org/10.5194/soil-5-177-2019, 2019. URL: https://soil.copernicus.org/articles/5/177/2019/</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Pennington J., Socher R., Manning C. 
Glove: Global vectors for word representation // Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP). 2014. P. 1532–1543</mixed-citation><mixed-citation xml:lang="en">Pennington J., Socher R., Manning C. Glove: Global vectors for word representation // Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP). 2014. P. 1532–1543</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Katanov Iu.E., Aristov A.I., Iagafarov A.K., Novruzov O.D. Tsifrovoi kern: neirosetevoe raspoznavanie tekstovoi geologo-geofizicheskoi informatsii // Izvestiia vysshikh uchebnykh zavedenii. Neft i gaz. 2023. № 3 (159). S. 35–54.</mixed-citation><mixed-citation xml:lang="en">Katanov Iu.E., Aristov A.I., Iagafarov A.K., Novruzov O.D. Tsifrovoi kern: neirosetevoe raspoznavanie tekstovoi geologo-geofizicheskoi informatsii // Izvestiia vysshikh uchebnykh zavedenii. Neft i gaz. 2023. № 3 (159). S. 35–54.</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Denisov D.V. Analiz metodov mashinnogo obucheniia dlia tematicheskoi klassifikatsii tekstov // Mezhdunarodnyi zhurnal informatsionnykh tekhnologii i energoeffektivnosti. 2024. Vol. 9, № 4(42). S. 5–11.</mixed-citation><mixed-citation xml:lang="en">Denisov D.V. Analiz metodov mashinnogo obucheniia dlia tematicheskoi klassifikatsii tekstov // Mezhdunarodnyi zhurnal informatsionnykh tekhnologii i energoeffektivnosti. 2024. Vol. 9, № 4(42). S. 5–11.</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Kozitsyn A.S. Algoritmy tematicheskogo poiska dannykh v naukometricheskikh sistemakh // Programmnaia inzheneriia. 2022. Vol. 13, № 6. S. 291–300.</mixed-citation><mixed-citation xml:lang="en">Kozitsyn A.S. 
Algoritmy tematicheskogo poiska dannykh v naukometricheskikh sistemakh // Programmnaia inzheneriia. 2022. Vol. 13, № 6. S. 291–300.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
