<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">ellibs</journal-id><journal-title-group><journal-title xml:lang="ru">Электронные библиотеки</journal-title><trans-title-group xml:lang="en"><trans-title>Russian Digital Libraries Journal</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">1562-5419</issn><publisher><publisher-name>Казанский (Приволжский) федеральный университет</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.26907/1562-5419-2025-28-6-1324-1345</article-id><article-id custom-type="elpub" pub-id-type="custom">ellibs-622</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>Статьи</subject></subj-group></article-categories><title-group><article-title>Библиотека научных предметных областей SciLibRu</article-title><trans-title-group xml:lang="en"><trans-title>SciLibRu, the Library of Scientific Subject Domains</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Атаева</surname><given-names>Ольга Муратовна</given-names></name><name name-style="western" xml:lang="en"><surname>Ataeva</surname><given-names>Olga Muratovna</given-names></name></name-alternatives><email xlink:type="simple">OAtaeva@frccsc.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Тучкова</surname><given-names>Наталия Павловна</given-names></name><name name-style="western" 
xml:lang="en"><surname>Tuchkova</surname><given-names>Natalia Pavlovna</given-names></name></name-alternatives><email xlink:type="simple">NTuchkova@frccsc.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Теймуразов</surname><given-names>Кирилл Борисович</given-names></name><name name-style="western" xml:lang="en"><surname>Teymurazov</surname><given-names>Kirill Borisovich</given-names></name></name-alternatives><email xlink:type="simple">KTeymurazov@frccsc.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Абдышов</surname><given-names>Айдин</given-names></name><name name-style="western" xml:lang="en"><surname>Abdyshov</surname><given-names>Aidin</given-names></name></name-alternatives><email xlink:type="simple">abdysovajdin@gmail.com</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Кобук</surname><given-names>Михаил Геннадьевич</given-names></name><name name-style="western" xml:lang="en"><surname>Kobuk</surname><given-names>Mikhail Gennadievich</given-names></name></name-alternatives><email xlink:type="simple">mikhail.kobuk@mail.ru</email><xref ref-type="aff" rid="aff-2"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Федеральный исследовательский центр «Информатика и управление» Российской академии наук</institution></aff><aff xml:lang="en"><institution>Federal Research Center “Computer Science and Control” of the Russian Academy of Sciences</institution></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru"><institution>Московский университет имени С.Ю. Витте</institution></aff><aff xml:lang="en"><institution>S. Y. 
Witte University of Moscow</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>19</day><month>12</month><year>2025</year></pub-date><volume>28</volume><issue>6</issue><fpage>1324</fpage><lpage>1345</lpage><permissions><copyright-statement>Copyright &#x00A9; Атаева О.М., Тучкова Н.П., Теймуразов К.Б., Абдышов А., Кобук М.Г., 2025</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="ru">Атаева О.М., Тучкова Н.П., Теймуразов К.Б., Абдышов А., Кобук М.Г.</copyright-holder><copyright-holder xml:lang="en">Ataeva O.M., Tuchkova N.P., Teymurazov K.B., Abdyshov A., Kobuk M.G.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://ellibs.elpub.ru/jour/article/view/622">https://ellibs.elpub.ru/jour/article/view/622</self-uri><abstract><p>Работа посвящена проблеме интеграции данных для представления научных предметных областей на основе их семантического описания в цифровой библиотеке SciLibRu. В качестве модели данных использованы онтология и граф знаний библиотеки LibMeta. Наполнение библиотеки SciLibRu осуществляется путем добавления данных научных журналов. Показано, как реализованы этапы анализа слабоструктурированных научных публикаций для их встраивания в онтологию библиотеки. 
При прохождении всех этапов предобработки данных формируется датасет, который может быть использован в обучении языковых моделей для запросов в русскоязычных научных предметных областях.


Приложение работы заключается в создании рекомендательных систем для работы с научными русскоязычными журналами.
</p></abstract><trans-abstract xml:lang="en"><p>The work is devoted to the problem of data integration for representing scientific subject areas based on their semantic description in the SciLibRu digital library. The LibMeta library's ontology and knowledge graph are used as the data model. SciLibRu is populated by adding data from scientific journals. The paper demonstrates how the stages of processing semi-structured scientific publications for their integration into the library's ontology are implemented. Completing all data preprocessing stages yields a dataset that can be used to train language models for queries in Russian-language scientific subject areas.
</p></trans-abstract><kwd-group xml:lang="ru"><kwd>прикладная онтология</kwd><kwd>граф знаний</kwd><kwd>источники данных</kwd><kwd>анализ слабоструктурированных научных публикаций</kwd></kwd-group><kwd-group xml:lang="en"><kwd>applied ontology</kwd><kwd>knowledge graph</kwd><kwd>data sources</kwd><kwd>analysis of semi-structured scientific publications</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Serebryakov V.A., Ataeva O.M. Informacionnaya model' otkrytoj personal'noj semanticheskoj biblioteki LibMeta // Nauchnyj servis v seti Internet: trudy XVIII Vserossijskoj nauchnoj konferencii (19–24 sentyabrya 2016 g., g. Novorossijsk). M.: IPM im. M.V. Keldysha, 2016. S. 304–313. URL: http://keldysh.ru/abrau/2016/3.pdf (In Russ.)</mixed-citation><mixed-citation xml:lang="en">Serebryakov V.A., Ataeva O.M. Informacionnaya model' otkrytoj personal'noj semanticheskoj biblioteki LibMeta // Nauchnyj servis v seti Internet: trudy XVIII Vserossijskoj nauchnoj konferencii (19–24 sentyabrya 2016 g., g. Novorossijsk). M.: IPM im. M.V. Keldysha, 2016. S. 304–313. URL: http://keldysh.ru/abrau/2016/3.pdf (In Russ.)</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Rospocher M., Tonelli S., Serafini L., Pianta E. Corpus-based terminological evaluation of ontologies // Applied Ontology. 2012. Vol. 7, No. 4. P. 429–448. https://doi.org/10.3233/AO-2012-0114</mixed-citation><mixed-citation xml:lang="en">Rospocher M., Tonelli S., Serafini L., Pianta E. Corpus-based terminological evaluation of ontologies // Applied Ontology. 2012. Vol. 7, No. 4. P. 429–448. https://doi.org/10.3233/AO-2012-0114</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Ataeva O., Serebryakov V., Tuchkova N. 
Ontological approach to a knowledge graph construction in a semantic library // Lobachevskii J. of Mathematics. 2023. Vol. 44, No. 6. P. 2229–2239. https://doi.org/10.1134/S1995080223060471</mixed-citation><mixed-citation xml:lang="en">Ataeva O., Serebryakov V., Tuchkova N. Ontological approach to a knowledge graph construction in a semantic library // Lobachevskii J. of Mathematics. 2023. Vol. 44, No. 6. P. 2229–2239. https://doi.org/10.1134/S1995080223060471</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Handbook on Ontologies. Editors: Steffen Staab, Rudi Studer, Springer-Verlag Berlin Heidelberg, 2004. https://doi.org/10.1007/978-3-540-24750-0</mixed-citation><mixed-citation xml:lang="en">Handbook on Ontologies. Editors: Steffen Staab, Rudi Studer, Springer-Verlag Berlin Heidelberg, 2004. https://doi.org/10.1007/978-3-540-24750-0</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Ataeva O., Serebryakov V., Tuchkova N. Podhody k organizacii matematicheskih znanij pri formirovaniya predmetnyh tezaurusov razlichnyh razdelov matematiki // CEUR Workshop Proceedings. 2018. Vol. 2260. P. 42–54. https://doi.org/10.20948/abrau-2018-66 (In Russ.)</mixed-citation><mixed-citation xml:lang="en">Ataeva O., Serebryakov V., Tuchkova N. Podhody k organizacii matematicheskih znanij pri formirovaniya predmetnyh tezaurusov razlichnyh razdelov matematiki // CEUR Workshop Proceedings. 2018. Vol. 2260. P. 42–54. https://doi.org/10.20948/abrau-2018-66 (In Russ.)</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Hlomani H., Stacey D. Approaches, methods, metrics, measures, and subjectivity in ontology evaluation: A survey // Semantic Web Journal. 2014. Vol. 1, No. 5. P. 1–11. 
https://www.semantic-web-journal.net/system/files/swj657.pdf</mixed-citation><mixed-citation xml:lang="en">Hlomani H., Stacey D. Approaches, methods, metrics, measures, and subjectivity in ontology evaluation: A survey // Semantic Web Journal. 2014. Vol. 1, No. 5. P. 1–11. https://www.semantic-web-journal.net/system/files/swj657.pdf</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Lozano-Tello A., Gómez-Pérez A. Ontometric: A method to choose the appropriate ontology // Journal of Database Management. 2004. Vol. 15, No. 2. P. 1–18. https://doi.org/10.4018/jdm.2004040101</mixed-citation><mixed-citation xml:lang="en">Lozano-Tello A., Gómez-Pérez A. Ontometric: A method to choose the appropriate ontology // Journal of Database Management. 2004. Vol. 15, No. 2. P. 1–18. https://doi.org/10.4018/jdm.2004040101</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Shrejder Yu.A. Tezaurusy v informatike i teoreticheskoj semantike // Nauchno-tekhnicheskaya informaciya. Ser. 2. 1971. № 3. S. 21–24 (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Shrejder Yu.A. Tezaurusy v informatike i teoreticheskoj semantike // Nauchno-tekhnicheskaya informaciya. Ser. 2. 1971. № 3. S. 21–24 (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Lukashevich N.V. Tezaurusy v zadachah informacionnogo poiska. M.: Izd-vo MGU, 2011. 495 s. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Lukashevich N.V. Tezaurusy v zadachah informacionnogo poiska. M.: Izd-vo MGU, 2011. 495 s. (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Harari F. Teoriya grafov. Per. s angl. i predisl. V.P. Kozyreva. Pod red. G.P. Gavrilova. Izd. 2-e. 
M.: Editorial URSS, 2003. 296 s</mixed-citation><mixed-citation xml:lang="en">Harari F. Teoriya grafov. Per. s angl. i predisl. V.P. Kozyreva. Pod red. G.P. Gavrilova. Izd. 2-e. M.: Editorial URSS, 2003. 296 s</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Barrasa J., Webber J. Building Knowledge Graphs: A Practitioner’s Guide. O'Reilly. 2023. 290 p.</mixed-citation><mixed-citation xml:lang="en">Barrasa J., Webber J. Building Knowledge Graphs: A Practitioner’s Guide. O'Reilly. 2023. 290 p.</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Biswas G., Bezdek J., Oakman R.L. A knowledge-based approach to online document retrieval system design // In Proc. ACM SIGART Int. Symp. Methodol. Intell. Syst. (ISMIS '86), 1986. P. 112–120. https://doi.org/10.1145/12808.12821</mixed-citation><mixed-citation xml:lang="en">Biswas G., Bezdek J., Oakman R.L. A knowledge-based approach to online document retrieval system design // In Proc. ACM SIGART Int. Symp. Methodol. Intell. Syst. (ISMIS '86), 1986. P. 112–120. https://doi.org/10.1145/12808.12821</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Gavrilova T.A., Kudryavcev D.V., Muromcev D.I. Inzheneriya znanij. Modeli i metody: Uchebnik. SPb.: Izdatel'stvo «Lan'», 2016. 324 s. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Gavrilova T.A., Kudryavcev D.V., Muromcev D.I. Inzheneriya znanij. Modeli i metody: Uchebnik. SPb.: Izdatel'stvo «Lan'», 2016. 324 s. (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Pan S. et al. Unifying Large Language Models and Knowledge Graphs: A Roadmap // in IEEE Transactions on Knowledge and Data Engineering. 2024. Vol. 36, No. 7. P. 3580–3599. 
https://doi.org/10.1109/TKDE.2024.3352100</mixed-citation><mixed-citation xml:lang="en">Pan S. et al. Unifying Large Language Models and Knowledge Graphs: A Roadmap // in IEEE Transactions on Knowledge and Data Engineering. 2024. Vol. 36, No. 7. P. 3580–3599. https://doi.org/10.1109/TKDE.2024.3352100</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Luo L. et al. Graph-constrained reasoning: Faithful reasoning on knowledge graphs with large language models // arXiv preprint arXiv:2410.13080. 2024. https://doi.org/10.48550/arXiv.2410.13080</mixed-citation><mixed-citation xml:lang="en">Luo L. et al. Graph-constrained reasoning: Faithful reasoning on knowledge graphs with large language models // arXiv preprint arXiv:2410.13080. 2024. https://doi.org/10.48550/arXiv.2410.13080</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Vinogradov I.M. (Gl. red.). Matematicheskaya enciklopediya (v 5 tomah) M.: Sovetskaya enciklopediya (1977–1985) (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Vinogradov I.M. (Gl. red.). Matematicheskaya enciklopediya (v 5 tomah) M.: Sovetskaya enciklopediya (1977–1985) (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Faddeev L.D. (Gl. red.). Enciklopediya matematicheskoj fiziki. Enciklopediya. M.: Bol'shaya russkaya enciklopediya, 1998. 692 s. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Faddeev L.D. (Gl. red.). Enciklopediya matematicheskoj fiziki. Enciklopediya. M.: Bol'shaya russkaya enciklopediya, 1998. 692 s. (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit18"><label>18</label><citation-alternatives><mixed-citation xml:lang="ru">Ataeva O.M., Tuchkova N.P. 
Adaptation of the language model for mathematical texts in the semantic library // System Informatics. 2025. No. 27. P. 59–75.</mixed-citation><mixed-citation xml:lang="en">Ataeva O.M., Tuchkova N.P. Adaptation of the language model for mathematical texts in the semantic library // System Informatics. 2025. No. 27. P. 59–75.</mixed-citation></citation-alternatives></ref><ref id="cit19"><label>19</label><citation-alternatives><mixed-citation xml:lang="ru">Budzko V.I., Ataeva O.M., Tuchkova N.P. Access automation to information for navigating through semantic library data and integrating the knowledge graph with the language model // Highly Available Systems. 2025. V. 21. No. 2. P. 5−11. https://doi.org/10.18127/j20729472-202502-0. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Budzko V.I., Ataeva O.M., Tuchkova N.P. Access automation to information for navigating through semantic library data and integrating the knowledge graph with the language model // Highly Available Systems. 2025. V. 21. No. 2. P. 5−11. https://doi.org/10.18127/j20729472-202502-0. (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit20"><label>20</label><citation-alternatives><mixed-citation xml:lang="ru">Klyukin A.A., Shirokov A.A. Avtomatizirovannaya sistema podgotovki slabostrukturirovannoj informacii. [Elektronnyj resurs] // Gaudeamus. 2014. Vol. 24, No. 2. URL: https://cyberleninka.ru/article/n/avtomatizirovannaya-sistema-podgotovki-slabostrukturirovannoy-informatsii (date of access: 01.11.2025) (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Klyukin A.A., Shirokov A.A. Avtomatizirovannaya sistema podgotovki slabostrukturirovannoj informacii. [Elektronnyj resurs] // Gaudeamus. 2014. Vol. 24, No. 2. 
URL: https://cyberleninka.ru/article/n/avtomatizirovannaya-sistema-podgotovki-slabostrukturirovannoy-informatsii (date of access: 01.11.2025) (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit21"><label>21</label><citation-alternatives><mixed-citation xml:lang="ru">Kurtyukin S.V. Metod avtomatizirovannogo formirovaniya sbornikov arhivnyh dokumentov [Elektronnyj resurs] // Teoriya i praktika sovremennoj nauki. 2018. №5 (35). URL: https://cyberleninka.ru/article/n/metod-avtomatizirovannogo-formirovaniya-sbornikov-arhivnyh-dokumentov (data obrashcheniya: 01.11.2025).</mixed-citation><mixed-citation xml:lang="en">Kurtyukin S.V. Metod avtomatizirovannogo formirovaniya sbornikov arhivnyh dokumentov [Elektronnyj resurs] // Teoriya i praktika sovremennoj nauki. 2018. №5 (35). URL: https://cyberleninka.ru/article/n/metod-avtomatizirovannogo-formirovaniya-sbornikov-arhivnyh-dokumentov (data obrashcheniya: 01.11.2025).</mixed-citation></citation-alternatives></ref><ref id="cit22"><label>22</label><citation-alternatives><mixed-citation xml:lang="ru">Aho A., Seti R., Ul'man Dzh. Kompilyatory: principy, tekhnologii, instrument. M.: Vil'yams, 2001, 762 s. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Aho A., Seti R., Ul'man Dzh. Kompilyatory: principy, tekhnologii, instrument. M.: Vil'yams, 2001, 762 s. (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit23"><label>23</label><citation-alternatives><mixed-citation xml:lang="ru">Volkova I.A., Vylitok A.A., Rudenko T.V. Formal'nye grammatiki i yazyki. Elementy teorii translyacii : uchebnoe posobie dlya studentov II kursa M.: Izd-vo Mosk. gos. un-ta, 2009. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Volkova I.A., Vylitok A.A., Rudenko T.V. Formal'nye grammatiki i yazyki. Elementy teorii translyacii : uchebnoe posobie dlya studentov II kursa M.: Izd-vo Mosk. gos. un-ta, 2009. 
(In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit24"><label>24</label><citation-alternatives><mixed-citation xml:lang="ru">Gladkij A.V. Formal'nye grammatiki i yazyki. M.: Nauka, Gl. red. fiz.-mat. lit., 1973, 368 s. (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Gladkij A.V. Formal'nye grammatiki i yazyki. M.: Nauka, Gl. red. fiz.-mat. lit., 1973, 368 s. (In Russ.).</mixed-citation></citation-alternatives></ref><ref id="cit25"><label>25</label><citation-alternatives><mixed-citation xml:lang="ru">Bryabrin V.M., Landau I.Ya., Nemenman M.E. O sisteme kodirovaniya dlya personal'nyh EVM // Mikroprocessornye sredstva i sistemy. 1986. № 4. S. 61–64 (In Russ.).</mixed-citation><mixed-citation xml:lang="en">Bryabrin V.M., Landau I.Ya., Nemenman M.E. O sisteme kodirovaniya dlya personal'nyh EVM // Mikroprocessornye sredstva i sistemy. 1986. № 4. S. 61–64 (In Russ.).</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
