<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="en"><front><journal-meta><journal-id journal-id-type="publisher-id">gscience</journal-id><journal-title-group><journal-title xml:lang="en">Mining Science and Technology (Russia)</journal-title><trans-title-group xml:lang="ru"><trans-title>Горные науки и технологии</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">2500-0632</issn><publisher><publisher-name>The National University of Science and Technology MISiIS (NUST MISIS)</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.17073/2500-0632-2025-05-416</article-id><article-id custom-type="elpub" pub-id-type="custom">gscience-974</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>GEOLOGY OF MINERAL DEPOSITS</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ГЕОЛОГИЯ МЕСТОРОЖДЕНИЙ ПОЛЕЗНЫХ ИСКОПАЕМЫХ</subject></subj-group></article-categories><title-group><article-title>From visual diagnostics to deep learning: automatic mineral identification in polished section images</article-title><trans-title-group xml:lang="ru"><trans-title>От визуальной диагностики к глубокому обучению: автоматическое определение минералов на фотографиях аншлифов</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-8500-7193</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Коршунов</surname><given-names>Д. М.</given-names></name><name name-style="western" xml:lang="en"><surname>Korshunov</surname><given-names>D. M.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Дмитрий Михайлович Коршунов – кандидат геолого-минералогических наук, старший научный сотрудник</p><p>г. Москва</p></bio><bio xml:lang="en"><p>Dmitrii M. Korshunov – Cand. Sci. (Geol. and Miner.), Senior Researcher</p><p>Moscow</p></bio><email xlink:type="simple">dmit0korsh@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-4217-7141</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Хвостиков</surname><given-names>А. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Khvostikov</surname><given-names>A. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Александр Владимирович Хвостиков – кандидат физико-математических наук, научный сотрудник лаборатории математических методов обработки изображений факультета вычислительной математики и кибернетики</p><p>г. Москва</p><p> Scopus ID 57188856261</p></bio><bio xml:lang="en"><p>Alexander V. Khvostikov – Cand. Sci. (Phys. and Math.), Senior Researcher of the Laboratory of Mathematical Methods for Image Processing, Faculty of Computational Mathematics and Cybernetics (CMC)</p><p>Moscow</p><p>Scopus ID 57188856261</p></bio><email xlink:type="simple">khvostikov@cs.msu.ru</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0003-0814-3997</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Николаев</surname><given-names>Г. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Nikolaev</surname><given-names>G. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Глеб Витальевич Николаев – студент магистратуры факультета вычислительной математики и кибернетики</p><p>г. Москва</p></bio><bio xml:lang="en"><p>Gleb V. Nikolaev – M.Sc. Student, Faculty of Computational Mathematics and Cybernetics (CMC)</p><p>Moscow</p></bio><email xlink:type="simple">nickolaev.gleb03@gmail.com</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-3299-2545</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Сорокин</surname><given-names>Д. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Sorokin</surname><given-names>D. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Дмитрий Васильевич Сорокин – кандидат физико-математических наук, старший научный сотрудник лаборатории математических методов обработки изображений факультета вычислительной математики и кибернетики</p><p>г. Москва</p></bio><bio xml:lang="en"><p>Dmitry V. Sorokin – Cand. Sci. (Phys. and Math.), Senior Researcher of the Laboratory of Mathematical Methods for Image Processing, Faculty of Computational Mathematics and Cybernetics</p><p>Moscow</p></bio><email xlink:type="simple">dsorokin@cs.msu.ru</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0007-0936-4088</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Индычко</surname><given-names>О. И.</given-names></name><name name-style="western" xml:lang="en"><surname>Indychko</surname><given-names>O. I.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Олеся Игоревна Индычко – аспирант факультета вычислительной математики и кибернетики</p><p>г. Москва</p></bio><bio xml:lang="en"><p>Olesya I. Indychko – PhD-Student, Faculty of Computational Mathematics and Cybernetics (CMC)</p><p>Moscow</p></bio><email xlink:type="simple">olesyaindychko@gmail.com</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-0133-7185</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Богуславский</surname><given-names>М. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Boguslavskii</surname><given-names>M. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Михаил Александрович Богуславский – кандидат геолого-минералогических наук, доцент кафедры геологии, геохимии и экономики полезных ископаемых геологического факультета</p><p>г. Москва</p><p>ResearcherID V-4671-2017</p></bio><bio xml:lang="en"><p>Mikhail A. Boguslavskii – Cand. Sci. (Geol. and Miner.), Associate Professor of the Department of Geology, Geochemistry and Mineral Economics, Faculty of Geology</p><p>Moscow</p><p>ResearcherID V-4671-2017</p></bio><email xlink:type="simple">mboguslavskiy@yandex.ru</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-9910-4501</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Крылов</surname><given-names>А. С.</given-names></name><name name-style="western" xml:lang="en"><surname>Krylov</surname><given-names>A. S.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Андрей Серджевич Крылов – доктор физико-математических наук, профессор, заведующий лабораторией математических методов обработки изображений факультета факультета вычислительной математики и кибернетики</p><p>г. Москва</p><p>Scopus ID 7202280261</p><p>ResearcherID B-9651-2014</p></bio><bio xml:lang="en"><p>Andrey S. Krylov – Dr. Sci. (Phys. and Math.), Professor, Head of the Laboratory of Mathematical Methods for Image Processing, Faculty of Computational Mathematics and Cybernetics</p><p>Moscow</p><p>Scopus ID 7202280261</p><p>ResearcherID B-9651-2014</p></bio><email xlink:type="simple">kryl@cs.msu.ru</email><xref ref-type="aff" rid="aff-2"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru">Геологический институт РАН<country>Россия</country></aff><aff xml:lang="en">Geological Institute of the Russian Academy of Sciences (GIN RAS)<country>Russian Federation</country></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru">Московский государственный университет имени М. В. Ломоносова<country>Россия</country></aff><aff xml:lang="en">Lomonosov Moscow State University<country>Russian Federation</country></aff></aff-alternatives><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>13</day><month>10</month><year>2025</year></pub-date><volume>10</volume><issue>3</issue><fpage>232</fpage><lpage>244</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Korshunov D.M., Khvostikov A.V., Nikolaev G.V., Sorokin D.V., Indychko O.I., Boguslavskii M.A., Krylov A.S., 2025</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="ru">Коршунов Д.М., Хвостиков А.В., Николаев Г.В., Сорокин Д.В., Индычко О.И., Богуславский М.А., Крылов А.С.</copyright-holder><copyright-holder xml:lang="en">Korshunov D.M., Khvostikov A.V., Nikolaev G.V., Sorokin D.V., Indychko O.I., Boguslavskii M.A., Krylov A.S.</copyright-holder><license license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://mst.misis.ru/jour/article/view/974">https://mst.misis.ru/jour/article/view/974</self-uri><abstract><p>Studying mineralogical composition of ores is a fundamental step in the exploration of new deposits, as it allows determining the forms in which useful components are found, the processes of ore formation, and the potential recoverability of valuable elements. The mineral associations, textures, and structures of ores not only provide key information about the geology of a deposit, but also determine the choice of beneficiation methods. Despite the development of modern analytical tools and existing solutions for automatic mineral diagnosis, such as those based on the SEM-EDS method, optical microscopy remains the most accessible means of quantitative mineralogical analysis. However, it remains labor-intensive and requires highly skilled specialists. In addition, its visual nature limits the accuracy and reproducibility of results, creating a need for more effective approaches. One promising area is the automation of ore mineral identification based on images of polished sections. The aim of the work was to develop and validate a universal segmentation model based on deep learning. In the course of the research, related problems were also solved, including the creation of an open LumenStone dataset, the development of color adaptation methods, joint analysis of PPL and XPL images, panorama construction, and the development of a fast annotation method. The work applied convolutional neural network architectures, color correction and joint image processing algorithms, as well as an original sampling method that compensates for class imbalance. The proposed segmentation model demonstrated high accuracy (IoU up to 0.88, PA up to 0.96) for nine minerals. The obtained results confirmed the effectiveness of integrating deep learning and modern image processing algorithms in mineralogical analysis systems and laid the foundation for further development of digital methods in automated petrography.</p></abstract><trans-abstract xml:lang="ru"><p>Изучение минерального состава руд является основополагающим этапом при разведке новых месторождений, поскольку именно оно позволяет определить формы нахождения полезных компонентов, процессы рудообразования и потенциальную извлекаемость ценных элементов. Минеральная ассоциация, текстуры и структуры руд не только дают ключевые сведения о геологии месторождения, но и определяют выбор методов обогащения. Несмотря на развитие современной аналитической базы и существующие решения автоматической диагностики минералов, например, на основе СЭМ-EDS метода, оптическая микроскопия является самым доступным средством количественного минералогического анализа. Однако она остаётся трудоемкой и требует высокой квалификации специалиста. А её визуальный характер ограничивает точность и воспроизводимость результатов, что создает необходимость в разработке более эффективных подходов. Одним из перспективных направлений является автоматизация идентификации рудных минералов по фотоизображениям аншлифов. Целью работы являлась разработка и валидация универсальной сегментационной модели на основе глубокого обучения. В процессе исследования также были решены сопутствующие задачи, включая формирование открытого набора данных LumenStone, разработку методов цветовой адаптации, совместного анализа PPL- и XPL-изображений, построения панорам и разработки метода быстрой разметки. В работе были применены свёрточные нейросетевые архитектуры, алгоритмы коррекции цвета и совместной обработки изображений, а также оригинальный метод семплирования, компенсирующий дисбаланс классов. Предложенная модель сегментации продемонстрировала высокую точность (IoU до 0,88, PA до 0,96) по девяти минералам. Полученные результаты подтвердили эффективность интеграции глубокого обучения и современных алгоритмов обработки изображений для задач минералогического анализа и заложили основу для дальнейшего развития цифровых методов в автоматизированной петрографии.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>минералогия</kwd><kwd>минераграфия</kwd><kwd>цифровая петрография</kwd><kwd>автоматические методы анализа изображений</kwd><kwd>сегментация</kwd><kwd>глубокое обучение</kwd><kwd>цветовая адаптация</kwd><kwd>панорамные изображения</kwd></kwd-group><kwd-group xml:lang="en"><kwd>mineralogy</kwd><kwd>mineragraphy</kwd><kwd>digital petrography</kwd><kwd>automatic image analysis methods</kwd><kwd>segmentation</kwd><kwd>deep learning</kwd><kwd>color adaptation</kwd><kwd>panoramic images</kwd></kwd-group><funding-group xml:lang="ru"><funding-statement>Исследование выполнено за счет гранта Российского научного фонда (проект № 24-21-00061).</funding-statement></funding-group><funding-group xml:lang="en"><funding-statement>This research was supported by the Russian Science Foundation (project no. 24-21-00061).</funding-statement></funding-group></article-meta></front><body><sec><title>From visual diagnostics to deep learning: automatic mineral identification in polished section images</title></sec><sec><title>Introduction</title><p>Studying mineralogical composition of ores is a fundamental step in the exploration of new deposits, as it allows determining the forms in which useful components are found, the processes of ore formation, and the potential recoverability of valuable elements. The mineral associations, textures, and structures of ores not only provide key information about the geology of a deposit, but also determine the choice of beneficiation methods.</p><p>Despite the development of modern analytical tools and existing solutions for automatic mineral diagnosis, such as those based on the SEM-EDS method [1, 2], optical microscopy remains the most accessible means of quantitative mineralogical analysis. However, it remains labor-intensive and requires highly skilled specialists. In addition, its visual nature limits the accuracy and reproducibility of results, creating a need for more effective approaches.</p><p>A promising area is the automation of ore mineral identification based on photographs of polished sections. This approach not only reduces span time, but also minimizes subjective errors associated with visual diagnostics and enables the implementation of accurate statistical analysis methods. The aim of this work is to describe our experience in developing a segmentation model for automatic detection of minerals in photographs of polished sections and solving a number of related problems that arose during the research. The paper systematically outlines the main problems encountered by the authors and the solutions they propose.</p></sec><sec><title>Current state of the problem</title><p>The first attempts to create tools for the automatic diagnostics of ore minerals under a microscope were made in the second half of the 20th century [3, 4]. At that time, spectrophotometers were used to measure the color of minerals, in particular, a mineral type was interpreted based on the absorption spectra of light in the visible range. Due to its low accuracy, this method was not widely used. More advanced methods of automatic mineral identification were developed in the second half of the 1990s and were based on the analysis of photographs of polished sections under a microscope [5, 6].</p><p>Attempts were made to automatically analyze mineral associations using cluster analysis in order to find patterns between different objects in photographs [<xref ref-type="bibr" rid="cit7">7</xref>]. Special mention should be made of the attempt by the authors [<xref ref-type="bibr" rid="cit8">8</xref>] to compile a digital atlas of all minerals and to identify the minerals themselves using a dendrogram based on a digital questionnaire.</p><p>To date, existing classical solutions (without the use of deep learning) for automatic mineral identification can be divided into two main groups:</p><p>Both approaches have significant limitations. Methods that use color and reflectivity are unable to distinguish between minerals with similar optical properties. Statistical methods, in turn, require recalibration for each new geological object, making their application "situational" and limited. This is well illustrated in [<xref ref-type="bibr" rid="cit12">12</xref>], which shows the features of applying this principle to separate copper ore into three minerals and three lithological types at a specific deposit.</p><p>It is worth noting that there are also highly specialized solutions available in the form of extensions for popular image analysis software packages such as Fiji/ImageJ. For example, [<xref ref-type="bibr" rid="cit13">13</xref>] describes a method for automatic determining  hematite grade, size, and intergrowth types in ore using this software. The problem with such solutions is that they solve a narrow, specific problem and lack the necessary level of versatility.</p><p>The most effective way to overcome the shortcomings of the classical methods and achieve fundamentally better results in the automatic analysis of such images is to use trainable deep models (e.g., convolutional neural networks) that are capable of extracting complex hierarchical features from images, taking into account not only local textures and shapes, but also global relationships between image fragments. Instead of manually selecting color and statistical characteristics, such models – whether traditional convolutional neural networks (CNN) [13–15], modern transformers with a self-attention mechanism [<xref ref-type="bibr" rid="cit16">16</xref>], or hybrid architectures (e.g., Mamba [<xref ref-type="bibr" rid="cit17">17</xref>]) – learn to identify the distinctive morphological and structural-textural features of each mineral.</p><p>For instance, convolutional neural networks were used to detect surface defects and examine polishing quality of metal products [18, 19] and to analyze carbon distribution in cast iron based on microphotographs of rough workpiece surfaces [<xref ref-type="bibr" rid="cit20">20</xref>]. In [<xref ref-type="bibr" rid="cit21">21</xref>], a method is presented for separating hematite and quartz in iron ore polished sections, with the determining their size classes to optimize the feed for a processing plant. It is also worth noting a number of works devoted to the assessment and classification of the dimensionality of individual mineral individuals [22, 23], as well as the analysis and typification of the morphology of intergrowths in a system with known mineral associations [24, 25]. The segmentation model proposed in these works achieved 98% accuracy in predicting iron ore quality and hematite recoverability, highlighting the potential of deep models in solving industrial problems.</p><p>In [<xref ref-type="bibr" rid="cit14">14</xref>], the effectiveness of deep convolutional networks for three-dimensional mineral identification and free grain analysis was demonstrated, and in [<xref ref-type="bibr" rid="cit26">26</xref>], the authors showed that combined analysis of optical micrographs using CNN improves the accuracy of mineral content estimation in charge. In [<xref ref-type="bibr" rid="cit15">15</xref>], the authors improved the methods of feature downsampling, classifying rocks more accurately based on polished section images.</p><p>It is worth noting that applying modern deep learning approaches facilitates transition from image fragment classification [<xref ref-type="bibr" rid="cit27">27</xref>] to full semantic segmentation, which allows for accurate pixel-level segmentation (decomposition) of images by mineral, see [17, 26] and [14, 28]. At the same time, works [14, 29] demonstrated the fundamental feasibility of creating high-quality ore mineral segmentation models with high identification accuracy (&gt; 0.8 by the IoU metric).</p><p>The main advantage of using deep trainable neural networks when working with images of ore samples is their ability to take into account the context of an image and adapt to the variability of mineral associations. Most importantly, it allows reliable differentiation even between minerals with very similar characteristics (pyrite–marcasite, covellite–chalcocite, etc.) without the need for permanent recalibration of the algorithm for new samples, unlike other computer vision methods. However, there are still relatively few studies devoted directly to the diagnostics of mineral species using such approaches. Deep learning models can also be used in conjunction with domain adaptation methods, which allow the segmentation model to be retrained on "new" images – taken with different equipment or under different lighting conditions, and thus maintain high performance even with significant variations in input data. Extensive reviews on domain adaptation [<xref ref-type="bibr" rid="cit14">14</xref>] and examples of successful application in semantic segmentation of geological and satellite images [30, 31] confirm that this approach provides versatility and stability in a wide variety of conditions. The fundamental feature of most deep learning methods is the need for complete image annotation for training. This is often a very labor-intensive process, but the use of specialized weak supervision methods, which appear to the user as annotation the image with of rough strokes (ScribbleSup [<xref ref-type="bibr" rid="cit32">32</xref>], ScribbleSeg [<xref ref-type="bibr" rid="cit33">33</xref>]) or clicks [<xref ref-type="bibr" rid="cit34">34</xref>], allows in many cases to significantly speed up the collection and preparation of training data.</p><p>To build a reliable system based on deep learning, the following fundamental problems must be solved, which are discussed in detail in this paper:</p></sec><sec><title>Research Materials and Techniques</title><p>This study used a collection of polished sections provided by the Department of Geology, Geochemistry, and Mineral Resources of the Faculty of Geology at Lomonosov Moscow State University. A Carl Zeiss AxioScope 40 polarizing microscope with a Canon PowerShot G10 camera was used to obtain images of the polished sections. All photos were taken with a magnification of ×50 and have a resolution of 3396×2547 pixels.</p><p>The main drawback of existing solutions that use deep neural network models in the considered problems of analyzing photos of polished sections [23, 35], according to the authors, are the proprietary image sets used and the proprietary code base, which makes it impossible to compare the methods being developed. Therefore, all annotated (indexed) image sets created as part of the work are presented as a single open dataset LumenStone1, and the software implementation of all developed methods is published as a petroscope2 library with open source code for the Python 3 programming language.</p><p>The LumenStone image dataset contains several subsets focused on solving various image analysis problems for polished sections. The main subsets are S1, S2, and S3, which are aimed at the problem of mineral segmentation (automatic identification) and are formed taking into account mineral associations and mineral properties:</p><p>Pixel masks of the corresponding minerals were created for all images of the datasets using Supervisely and Adobe Photoshop software. The masks are necessary for training and testing deep learning models.</p><p>It should be noted that due to natural reasons (frequency of occurrence in nature), the collected set of images has a significant minerals imbalance (the percentage ratio is given in Table 1). This fact is an additional complication for the development of methods for automatic mineral segmentation and must be taken into account.</p><p>The authors also collected additional subsets of images necessary for solving related problems:</p><p>To solve the problem of simultaneous analysis of anisotropic mineral photographs in PPL and XPL, "rotated" photographs of a single field of view were taken with the microscope stage rotation increment of 5 and 15° and additionally included in LumenStone S3.</p><p>Table 1</p><p>Distribution of minerals on labeled photographs of polished sectionsin the LumenStone S1, S2, and S3 sets for solving segmentation problems(the distribution when divided into training and test datasets is provided in square brackets)</p><p>1 LumenStone Dataset. URL: <ext-link xlink:href="https://imaging.cs.msu.ru/en/research/geology/lumenstone" ext-link-type="uri">https://imaging.cs.msu.ru/en/research/geology/lumenstone</ext-link></p><p>2 GitHub. URL: <ext-link xlink:href="https://github.com/xubiker/petroscope" ext-link-type="uri">https://github.com/xubiker/petroscope</ext-link></p></sec><sec><title>Problems and their solutions (discussion)</title><p>The descriptions of the problems in the field of image processing and analysis that are to be considered the complex problem of automatic mineral identification in microscopic images of polished sections and the approaches proposed by the authors to solve these problems are given below.</p></sec><sec><title>1. Neural network methods for mineral segmentation</title><p>In this work, we consider convolutional neural networks to solve segmentation problems. Transformer-based alternatives, although promising, remain excessively resource-intensive for standard laboratory conditions [<xref ref-type="bibr" rid="cit36">36</xref>]. Despite the good generalization ability of convolutional neural networks, they are quite sensitive to class imbalance in training dataset [37, 38], which is characteristic of the collected data (Table 1). Furthermore, neural network methods cannot be directly applied to high-resolution images due to hardware limitations. To mitigate these shortcomings, we proposed a specialized method for sampling the training sample collection during the training process, which extracts small fragments from images (patches) and acts as a data balancer.</p><p>The objective of the developed sampling method is to equalize the distribution of mineral classes fed into a neural network during training. For each pair "training image – mineral type," a matrix containing the extracted area of a selected mineral at each point in the case of selecting a patch centered at that point is calculated. The resulting set of matrices is used as probability maps when selecting patches for training. For instance, at each sampling iteration, for the mineral that is currently the least represented, 1) an image from the training dataset is selected (proportional to the content of this mineral), 2) the center of the patch is selected in accordance with the previously calculated probability maps, 3) the patch is extracted, and 4) the information about the representation of minerals in the used data is updated. With moderate patch sizes (256–384 px), this method allows for a significant equalization of the distribution of minerals in the LumenStone S1, S2, and S3 sets that has a positive effect on the training speed of segmentation models and on the final segmentation quality metrics.</p><p>When developing neural network models for mineral segmentation, we reviewed and investigated a number of convolutional architectures, ranging from the traditional UNet [<xref ref-type="bibr" rid="cit40">40</xref>] and its modification ResUNet [<xref ref-type="bibr" rid="cit29">29</xref>] to more modern PSPNet [<xref ref-type="bibr" rid="cit41">41</xref>] and UPerNet [<xref ref-type="bibr" rid="cit42">42</xref>]. The advantage of the latter lies in the ability to analyze images at different scales, correctly identify both small and very large objects simultaneously, and take into account local and global context that significantly improves the quality of segmentation based on the available data.</p><p>To evaluate the quality of segmentation in this work, IoU (Intersection over Union) metric was used [<xref ref-type="bibr" rid="cit43">43</xref>]. IoU is a key metric in object detection and segmentation that measures the overlap between predicted and ground truth boxes). This is one of the simplest and most common methods of geometric evaluation of segmentation when reference labeling is available. The metric takes values from the range [0, 1], where 1 corresponds to a complete match between the predicted and reference labelings (ideal case), and 0 corresponds to no intersections between the predicted and reference segmentation annotation. An IoU value greater than 0.7 is usually considered satisfactory, although this depends, of course, on the subject area.</p><p>In our case, training the PSPNet neural network with the ResNet18 encoder on the LumenStone S1 and S2 datasets, together with the class-balanced sampling method described above, allowed segmenting nine minerals and a generalized class of nonmetallic minerals with very high quality (the average IoU value on the test set was 0.88). The training uses a cross-entropy loss function, random augmentations (rotation, slight changes in scale, brightness, and color), an Adam optimizer with an initial learning rate of 0.001 and a decrease upon reaching a plateau. The training took approximately 3 hours using a Nvidia A6000 GPU. An example of applying the trained mineral segmentation model to an image from a test set is shown in Fig. 1.</p><p>Fig. 1. Example of a polished section image segmentation with the trained PSPNet model: a – image; b – error map (correctly recognized areas are highlighted in green, segmentation errors are highlighted in red); c – mineral mask (expert annotation); d – model prediction</p></sec><sec><title>2. Adaptive methods for image calibration and preprocessing</title><p>One of the main problems encountered by the authors when working with primary data is high sensitivity of segmentation models to the color palette of images. Differences in color characteristics between training images and real images lead to a significant deterioration in the quality of mineral identification. The color and brightness characteristics of images are determined by many factors: microscope parameters, camera settings, lighting, etc.</p><p>A solution to this problem is to use automatic color correction based on the color difference between the received image and a known reference (e.g., [<xref ref-type="bibr" rid="cit44">44</xref>]).</p><p>We proposed the method for correcting color distortions in [<xref ref-type="bibr" rid="cit45">45</xref>]. The main idea is to construct a transition matrix (Color Correction Matrix, CCM) [<xref ref-type="bibr" rid="cit46">46</xref>] between the color spaces of a distorted and reference images (images from the training set are taken as reference).</p><p>The process includes extracting the averaged colors of minerals and the background using partial labeling, linearizing colors through gamma correction (γ = 2.2), and calculating the affine transformation. The minimization problem is solved in LAB space, using the sum of the squares of color differences calculated using the CIEDE2000 formula [<xref ref-type="bibr" rid="cit47">47</xref>] as a loss function. The work uses a 4x3 matrix with initial approximation initialization based on the "white balance" method [<xref ref-type="bibr" rid="cit46">46</xref>]. The final step is to transform the distorted image through matrix multiplication by the previously calculated color correction matrix.</p><p>The proposed method allows preserving color differences that are critical for mineral identification (Fig. 2), while minimizing the influence of lighting changes and equipment settings. The algorithm supports two operating modes: an individual correction for each image and a "calibration" mode for a series of images, where the correction matrix is calculated once and applied to the entire group. The method does not require any prior training, and processing a single image takes less than 10 seconds on an Intel Xeon Gold 6226R CPU.</p><p>Fig. 2. An example of how the proposed color calibration method works: a – original image taken with alternative equipment; b – reference image;c – initial image after applying the method</p></sec><sec><title>3. Methods for joint processing of heterogeneous images</title><p>Many minerals are identified not only by their color and reflectivity, but also by the presence or absence of anisotropic properties. Anisotropy manifests itself in the ability of minerals to "fade" in doubly polarized light (crossed nicols) when the optical axes of a mineral coincide with the direction of the microscope polarizers. This property is a key to distinguishing minerals with similar reflectance and color parameters. For example, pyrite (isotropic) and marcasite (anisotropic) have similar optical characteristics but differ in the manifestation of anisotropy. Similarly, pyrite and arsenopyrite, although they have slightly different reflectivity and color, can also be reliably separated based on the manifestation of anisotropy by arsenopyrite.</p><p>We developed a neural network segmentation method that uses XPL and PPL images as additional input data for the segmentation neural network to improve the accuracy of mineral segmentation [<xref ref-type="bibr" rid="cit48">48</xref>]. The key step in this method is to align images taken at different angles of rotation with the reference PPL image. For this purpose, SIFT algorithms [<xref ref-type="bibr" rid="cit49">49</xref>] were used to detect stable key points in images, and RANSAC algorithm [<xref ref-type="bibr" rid="cit50">50</xref>] was used to calculate the affine transformation between images based on the found matches. Thus, all images were referred to a single coordinate system (Fig. 3). Then XPL images referred to a single coordinate system were used as additional input channels for a neural network based on the architecture proposed earlier by the authors [<xref ref-type="bibr" rid="cit29">29</xref>]. The used hyperparameters are described in [<xref ref-type="bibr" rid="cit29">29</xref>], and the model training time is approximately 6 hours with the use of a NVidia A6000 GPU.</p><p>Fig. 3. Alignment of XPL images of arsenopyrite:top row – images of arsenopyrite in different orientations; bottom row – images of arsenopyrite in different orientations after alignment. Four different orientations out of 24 are presented for each image with anisotropic minerals.</p></sec><sec><title>4. Methods for creating panoramic images</title><p>The average polished section area is several square centimeters, with typical ×50 magnification. Under such conditions, only a small part of a polished section, measuring a few square millimeters, is visible in each photograph. The use of photographs covering a large area of a sample would allow more accurate information to be obtained about the distribution of minerals in a sample and their relative positions, which would have a positive effect on the quality of the analysis.</p><p>Scanning electron microscopes (SEM) can be used to obtain large images in geology, but such equipment is very expensive, structural and textural features may be lost due to the nature of the method, and the identification of mineral phases requires additional effort. Therefore, like other researchers [<xref ref-type="bibr" rid="cit51">51</xref>], we have opted for software stitching series of overlapping images into a single panorama.</p><p>Currently, there are many examples of software for automatic stitching disparate photos into a single panoramic image. These include Adobe Photoshop, Fiji/ImageJ, and many others. However, using third-party software has a number of disadvantages. Powerful tools such as Adobe Photoshop can overly transform a panorama (unnaturally change colors, remove important details, mistaking them for artifacts of stitching). Integrating a third-party implementation into your system is tricky, and it also makes it impossible to make the changes needed to the algorithm to fit the specifics of the problem you're trying to solve.</p><p>We developed our own algorithm for stitching photographs into a panoramic image of the surface of a polished section [<xref ref-type="bibr" rid="cit52">52</xref>] (Fig. 4). The algorithm consists of two main stages: image alignment and further post-processing to improve visual perception. At the first stage, with the use of calibration images, geometric distortions of images are corrected using the Brown–Conrady model [<xref ref-type="bibr" rid="cit53">53</xref>], and photometric distortions are corrected using flat field compensation [<xref ref-type="bibr" rid="cit54">54</xref>]. Then, using the LoFTR neural network [<xref ref-type="bibr" rid="cit55">55</xref>], common key points are found in images that have overlapping areas. These are used to calculate perspective transformations (homographies) for pairs of adjacent images using RANSAC [<xref ref-type="bibr" rid="cit50">50</xref>], after which all images are transformed into the coordinates of a single image (reference image). Finally, global panorama optimization is performed to minimize the alignment errors. The result of this stage is a preliminary panorama, a collage. The second stage involves improving the initial panorama. The differences in exposure between images are compensated. The seams between images are masked by constructing the least noticeable seam using the graphcut method [<xref ref-type="bibr" rid="cit56">56</xref>], taking into account the differences in color and gradients of neighboring pixels. The final step is to blend the images near the joints of the panorama tiles to remove any remaining stitching artifacts. The LumenStone P1 dataset, compiled for the panorama construction, was used to test the algorithm. The method does not require prior training, and the processing speed for a single panorama consisting of 25 images at an Intel Xeon Gold 6226R CPU is approximately 5 minutes.</p><p>Fig. 4. Illustration of the developed method for constructing panoramas: on the left, several images of the same polished section, taken with overlap; on the right, the constructed panorama</p></sec><sec><title>5. Additional methods for processing and analyzing images of polished sections</title><p>The application of deep learning methods for mineral segmentation in images requires accurate annotation of a large number of images, which is a labor-intensive process. To simplify the annotation process and create a segmentation model capable of recognizing the main ore minerals, the authors are developing a method of accelerated interactive annotation using superpixel clustering based on the SLIC [<xref ref-type="bibr" rid="cit57">57</xref>] and Felzenswalb [<xref ref-type="bibr" rid="cit58">58</xref>] methods. A geologist roughly annotates minerals with strokes, labeling entire areas of an image with the label of a particular mineral based on the scribble data and the superpixel map. The user adjusts the method's predictions until the final annotation is obtained. A distinctive feature of this approach is multi-scale clustering, which allows to quickly label both large homogeneous areas and small fragments, automatically breaking large clusters into smaller ones as needed.</p><p>One can also reduce the labor costs of data annotating by extending the training set with partially annotated data. The main idea behind this approach is to highlight areas of uncertainty (lack of confidence) in the trained segmentation model on images. The authors suggest highlighting areas of uncertainty in images [<xref ref-type="bibr" rid="cit59">59</xref>] using a hyperbolic radius [<xref ref-type="bibr" rid="cit60">60</xref>] that reduces the scope of annotation to 5–10% of the original image (Fig. 5).</p><p>Fig. 5. The result of uncertainty area assessment method:a – original image; b – prediction of segmentation model uncertainty areas;c – areas for manual labeling</p><p>The final stage after recognizing and segmenting all minerals in the images is the statistical analysis of an image. It is responsible for conducting quantitative analysis to assess the areal ratio of mineral phases and their particle size analysis with separating fractions by size class for each mineral. This stage is currently under development.</p><p>Findings</p><p>The result of the authors' research into the automatic analysis of microscopic images of geological polished sections to determine mineral composition was the creation of an open image dataset dataset called LumenStone and a number of algorithms and methods that solve the main problems encountered:</p><p>1. Neural network methods for mineral segmentation</p><p>A convolutional neural network model for mineral segmentation and a special method for sampling training data have been developed, allowing the existing class imbalance to be neutralized. The accuracy of mineral segmentation according to the IoU metric was as follows: non-metallic minerals – 0.912, bornite – 0.938, chalcopyrite – 0.899, galena – 0.905, magnetite – 0.650, pentlandite – 0.790, pyrrhotite – 0.928, pyrite – 0.964, sphalerite – 0.922, tennantite – 0.882. The overall pixel accuracy (PA) of the segmentation was 0.96. The differences in mineral identification results can be explained by the difference in the size of the training sets used for LumenStone S1 and LumenStone S2.</p><p>2. Adaptive methods for image calibration and preprocessing</p><p>An algorithm has been developed for adapting images of polished sections obtained under different shooting conditions using partial user annotation. Pixel segmentation accuracy for distorted images increased from 0.29 (before) to 0.87 after adaptation using annotation covering approximately 30–35% of the image.</p><p>3. Methods for joint processing of heterogeneous images</p><p>The developed algorithm for segmenting anisotropic minerals using additional rotated XPL images improved the quality of anisotropic mineral segmentation by 3–12%. It has been shown that the best results can be achieved by using 6 additional rotated images.</p><p>4. Methods for creating panoramic images</p><p>A method for constructing panoramic microscopic images of polished sections has been developed. The root mean square error of alignment of panorama tiles from 25 images was 0.5–0.6 px. The resulting panoramas have a resolution of 12000×8000 pixels and can be used for automatic mineral segmentation. The implemented method does not have the disadvantages of less specialized solutions such as Adobe Photoshop, Fiji, and Panorama Studio.</p><p>5. Additional methods for processing and analyzing images of polished sections</p><p>A prototype method for interactive annotation of polished section images has been developed, which significantly speeds up the process of preparing data for training segmentation models. A method for automatically searching for areas of uncertainty has also been developed, allowing image annotation to be prioritized and significantly reducing the scope of annotation required.</p></sec><sec><title>Conclusion</title><p>This paper presents the authors' experience in developing a set of methods for the automatic analysis of images of polished sections for the identification of ore minerals. The developed segmentation method based on a convolutional neural network is capable of identifying nine ore minerals (with correct distinguishing between ore minerals and non-metallic phases) with an IoU accuracy = 0.88 and PA = 0.96. The potential of using additional information from XPL images to increase the accuracy of anisotropic mineral identification was demonstrated.</p><p>The developed methods of interactive annotation and image adaptation significantly accelerate and improve the training and use of segmentation models on new data. It is worth noting the method developed by the authors for obtaining panoramic images of polished sections, which allows detailed images of the entire surface of polished sections to be obtained in high resolution without expensive equipment. Unlike existing software solutions, this method does not distort the final panorama that has a positive effect on the segmentation results. Working with large-format images opens up new possibilities for the automatic analysis of images of polished sections.</p><p>The results obtained justify the need for further development of the area under consideration and form the basis for the creation of an intelligent quantitative assessment system capable not only of identifying minerals and calculating their areal fractions and performing particle-size analysis by size class, but also determining the types of minerals intergrowths. The implementation of this methodology will open up new possibilities in digital petrography, enabling fast, economical, and reproducible mineralogical analysis on optical microscopes in reflected light. Ultimately, this will enable the formation of unified criteria for analyzing the structural and textural characteristics of mineral associations for genesis comparison of different deposits.</p><p>Currently, the authors are integrating most of the methods and algorithms described in this paper into their PathScribe software platform [<xref ref-type="bibr" rid="cit61">61</xref>]. This platform is a cloud-based client-server solution with cross-platform clients for working with ultra-high-resolution images and is designed for universal use in both scientific and educational applications. The authors hope that the ability to work with panoramic images of polished sections using convenient tools for annotation and fully automatic analysis will be useful for geologists of various specializations.</p><p> </p></sec></body><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">De Castro B., Benzaazoua M., Chopard A., et al. Automated mineralogical characterization using optical microscopy: Review and recommendations. Minerals Engineering. 2022;189:107896. https://doi.org/10.1016/j.mineng.2022.107896</mixed-citation><mixed-citation xml:lang="en">De Castro B., Benzaazoua M., Chopard A., et al. Automated mineralogical characterization using optical microscopy: Review and recommendations. Minerals Engineering. 2022;189:107896. https://doi.org/10.1016/j.mineng.2022.107896</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Duncan P., Gavyn K. R. Unlocking the applications of automated mineral analysis. Geology Today. 2011;27(6):226–235. https://doi.org/10.1111/j.1365-2451.2011.00818.x</mixed-citation><mixed-citation xml:lang="en">Duncan P., Gavyn K. R. Unlocking the applications of automated mineral analysis. Geology Today. 2011;27(6):226–235. https://doi.org/10.1111/j.1365-2451.2011.00818.x</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Юшко С. А. Методы лабораторных исследований руд. М.: Недра; 1984. 389 с.</mixed-citation><mixed-citation xml:lang="en">Yushko S. A. Methods of laboratory ore research. Moscow: Nedra; 1984. 389 p. (In Russ.)</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Craig J. R., Vaughan D. J. Ore microscopy and ore petrography. Manchester: A Wiley-interscience Publication; 1994. 446 p.</mixed-citation><mixed-citation xml:lang="en">Craig J. R., Vaughan D. J. Ore microscopy and ore petrography. Manchester: A Wiley-interscience Publication; 1994. 446 p.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Bonifazi G. Digital multispectral techniques and automated image analysis procedures for industrial ore modelling. Minerals Engineering. 1995;8(7):779–794. https://doi.org/10.1016/0892-6875(95)00039-S</mixed-citation><mixed-citation xml:lang="en">Bonifazi G. Digital multispectral techniques and automated image analysis procedures for industrial ore modelling. Minerals Engineering. 1995;8(7):779–794. https://doi.org/10.1016/0892-6875(95)00039-S</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Marschallinger R. Automatic mineral classification in the macroscopic scale. Computers &amp; Geosciences. 1997;23(1):119–126. https://doi.org/10.1016/S0098-3004(96)00074-X</mixed-citation><mixed-citation xml:lang="en">Marschallinger R. Automatic mineral classification in the macroscopic scale. Computers &amp; Geosciences. 1997;23(1):119–126. https://doi.org/10.1016/S0098-3004(96)00074-X</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Berry R., Walters S.G., McMahon C. Automated mineral identification by optical microscopy. In: Ninth International Congress for Applied Mineralogy. Brisbane, Australia, 8–10 September 2008. Brisbane: QLD; 2008. Pp. 91–94.</mixed-citation><mixed-citation xml:lang="en">Berry R., Walters S.G., McMahon C. Automated mineral identification by optical microscopy. In: Ninth International Congress for Applied Mineralogy. Brisbane, Australia, 8–10 September 2008. Brisbane: QLD; 2008. Pp. 91–94.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Shoji T., Keneda H. An interactive system to assist mineral identification in ore microscopy. Mathematical Geology. 1994;26:961–972. https://doi.org/10.1007/BF02083424</mixed-citation><mixed-citation xml:lang="en">Shoji T., Keneda H. An interactive system to assist mineral identification in ore microscopy. Mathematical Geology. 1994;26:961–972. https://doi.org/10.1007/BF02083424</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">López-Benito A., Catalina J. C., Alarcón D., et al. Automated ore microscopy based on multispectral measurements of specular reflectance. I–A comparative study of some supervised classification techniques. Minerals Engineering. 2020;146:106136. https://doi.org/10.1016/j.mineng.2019.106136</mixed-citation><mixed-citation xml:lang="en">López-Benito A., Catalina J. C., Alarcón D., et al. Automated ore microscopy based on multispectral measurements of specular reflectance. I–A comparative study of some supervised classification techniques. Minerals Engineering. 2020;146:106136. https://doi.org/10.1016/j.mineng.2019.106136</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Berrezueta E., Ordóñez-Casado B., Bonilla W., Banda R., Castroviejo R., Carrión P., Puglla S. Ore petrography using optical image analysis: application to Zaruma-Portovelo deposit (Ecuador). Geosciences. 2016;6(2):30. https://doi.org/10.3390/geosciences6020030</mixed-citation><mixed-citation xml:lang="en">Berrezueta E., Ordóñez-Casado B., Bonilla W., Banda R., Castroviejo R., Carrión P., Puglla S. Ore petrography using optical image analysis: application to Zaruma-Portovelo deposit (Ecuador). Geosciences. 2016;6(2):30. https://doi.org/10.3390/geosciences6020030</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Köse C., Alp I., İkibaş C. Statistical methods for segmentation and quantification of minerals in ore microscopy. Minerals Engineering. 2012;30:19–32. https://doi.org/10.1016/j.mineng.2012.01.008</mixed-citation><mixed-citation xml:lang="en">Köse C., Alp I., İkibaş C. Statistical methods for segmentation and quantification of minerals in ore microscopy. Minerals Engineering. 2012;30:19–32. https://doi.org/10.1016/j.mineng.2012.01.008</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Krawczykowska A., Trybalski K., Krawczykowski D. The application of modern techniques and measurement devices for identification of copper ore types and their properties. Archives of Mining Sciences. 2013;58(2):433–448. https://doi.org/10.2478/amsc-2013-0029</mixed-citation><mixed-citation xml:lang="en">Krawczykowska A., Trybalski K., Krawczykowski D. The application of modern techniques and measurement devices for identification of copper ore types and their properties. Archives of Mining Sciences. 2013;58(2):433–448. https://doi.org/10.2478/amsc-2013-0029</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Iglesias J. C. A, Augusto K. S, Gomes O. D. F. M., et al. Automatic characterization of iron ore by digital microscopy and image analysis. Journal of Materials Research and Technology. 2018;7(3):376–380. https://doi.org/10.1016/j.jmrt.2018.06.014</mixed-citation><mixed-citation xml:lang="en">Iglesias J. C. A, Augusto K. S, Gomes O. D. F. M., et al. Automatic characterization of iron ore by digital microscopy and image analysis. Journal of Materials Research and Technology. 2018;7(3):376–380. https://doi.org/10.1016/j.jmrt.2018.06.014</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Tang K., Chen J., Zhou H., Liu J. Deep convolutional neural network for 3D mineral identification and liberation analysis. Minerals Engineering. 2022;183:107592. https://doi.org/10.1016/j.mineng.2022.107592</mixed-citation><mixed-citation xml:lang="en">Tang K., Chen J., Zhou H., Liu J. Deep convolutional neural network for 3D mineral identification and liberation analysis. Minerals Engineering. 2022;183:107592. https://doi.org/10.1016/j.mineng.2022.107592</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Zhou Z., Yuan H., Cai X. Rock Thin section image identification based on convolutional neural networks of adaptive and second-order pooling methods. Mathematics. 2023;11(5):1245. https://doi.org/10.3390/math11051245</mixed-citation><mixed-citation xml:lang="en">Zhou Z., Yuan H., Cai X. Rock Thin section image identification based on convolutional neural networks of adaptive and second-order pooling methods. Mathematics. 2023;11(5):1245. https://doi.org/10.3390/math11051245</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Kirillov A., Mintun E., Ravi N., et al. Segment anything. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. 2023;4015–4026. https://doi.org/10.48550/arXiv.2304.02643</mixed-citation><mixed-citation xml:lang="en">Kirillov A., Mintun E., Ravi N., et al. Segment anything. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. 2023;4015–4026. https://doi.org/10.48550/arXiv.2304.02643</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Hatamizadeh A., Kautz J. Mambavision: A hybrid mamba-transformer vision backbone. arXiv preprint arXiv: 2407.08083. 2024. https://doi.org/10.48550/arXiv.2407.08083</mixed-citation><mixed-citation xml:lang="en">Hatamizadeh A., Kautz J. Mambavision: A hybrid mamba-transformer vision backbone. arXiv preprint arXiv: 2407.08083. 2024. https://doi.org/10.48550/arXiv.2407.08083</mixed-citation></citation-alternatives></ref><ref id="cit18"><label>18</label><citation-alternatives><mixed-citation xml:lang="ru">Liu M. W., Lin Y. H., Lo Y. C., et al. Defect Detection of grinded and polished workpieces using faster R-CNN. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 2021. Pp. 1290–1296. https://doi.org/10.1109/AIM46487.2021.9517664</mixed-citation><mixed-citation xml:lang="en">Liu M. W., Lin Y. H., Lo Y. C., et al. Defect Detection of grinded and polished workpieces using faster R-CNN. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. 2021. Pp. 1290–1296. https://doi.org/10.1109/AIM46487.2021.9517664</mixed-citation></citation-alternatives></ref><ref id="cit19"><label>19</label><citation-alternatives><mixed-citation xml:lang="ru">Zhongliang L. V., Zhenyu Lu., Kewen Xia., et al. LAACNet: Lightweight adaptive activation convolution network-based defect detection on polished metal surfaces. Engineering Applications of Artificial Intelligence. 2024;133(E):108482. https://doi.org/10.1016/j.engappai.2024.108482</mixed-citation><mixed-citation xml:lang="en">Zhongliang L. V., Zhenyu Lu., Kewen Xia., et al. LAACNet: Lightweight adaptive activation convolution network-based defect detection on polished metal surfaces. Engineering Applications of Artificial Intelligence. 2024;133(E):108482. https://doi.org/10.1016/j.engappai.2024.108482</mixed-citation></citation-alternatives></ref><ref id="cit20"><label>20</label><citation-alternatives><mixed-citation xml:lang="ru">Sivkova T., Gusev A., Syropyatov A. Technology for cast iron microstructure analysis in SIAMS software using neural networks. In: Proceedings of the 31th International Conference on Computer Graphics and Vision. September 27–30, 2021, Nizhny Novgorod, Russia. 2021;2:772–780.</mixed-citation><mixed-citation xml:lang="en">Sivkova T., Gusev A., Syropyatov A. Technology for cast iron microstructure analysis in SIAMS software using neural networks. In: Proceedings of the 31th International Conference on Computer Graphics and Vision. September 27–30, 2021, Nizhny Novgorod, Russia. 2021;2:772–780.</mixed-citation></citation-alternatives></ref><ref id="cit21"><label>21</label><citation-alternatives><mixed-citation xml:lang="ru">Amaral B., Soares A.K., Iglesias J.C.Á., Caldas T.D.P., Santos R.B.M., Paciornik S. Instance segmentation of quartz in iron ore optical microscopy images by deep learning. Minerals Engineering. 2024;211:108681. https://doi.org/10.1016/j.mineng.2024.108681</mixed-citation><mixed-citation xml:lang="en">Amaral B., Soares A.K., Iglesias J.C.Á., Caldas T.D.P., Santos R.B.M., Paciornik S. Instance segmentation of quartz in iron ore optical microscopy images by deep learning. Minerals Engineering. 2024;211:108681. https://doi.org/10.1016/j.mineng.2024.108681</mixed-citation></citation-alternatives></ref><ref id="cit22"><label>22</label><citation-alternatives><mixed-citation xml:lang="ru">Maitre J., Bouchard K., Bédard L.P. Mineral grains recognition using computer vision and machine learning. Computers &amp; Geosciences. 2019;130:84–93. https://doi.org/10.1016/j.cageo.2019.05.009</mixed-citation><mixed-citation xml:lang="en">Maitre J., Bouchard K., Bédard L.P. Mineral grains recognition using computer vision and machine learning. Computers &amp; Geosciences. 2019;130:84–93. https://doi.org/10.1016/j.cageo.2019.05.009</mixed-citation></citation-alternatives></ref><ref id="cit23"><label>23</label><citation-alternatives><mixed-citation xml:lang="ru">Song Y., Huang Z., Shen C., et al. Deep learning-based automated image segmentation for concrete petrographic analysis. Cement and Concrete Research. 2020;135:106118. https://doi.org/10.1016/j.cemconres.2020.106118</mixed-citation><mixed-citation xml:lang="en">Song Y., Huang Z., Shen C., et al. Deep learning-based automated image segmentation for concrete petrographic analysis. Cement and Concrete Research. 2020;135:106118. https://doi.org/10.1016/j.cemconres.2020.106118</mixed-citation></citation-alternatives></ref><ref id="cit24"><label>24</label><citation-alternatives><mixed-citation xml:lang="ru">Donskoi E., Hapugoda S., Manuel J. R., et al. Automated optical image analysis of iron ore sinter. Minerals. 2021;11(6):562. https://doi.org/10.3390/min11060562</mixed-citation><mixed-citation xml:lang="en">Donskoi E., Hapugoda S., Manuel J. R., et al. Automated optical image analysis of iron ore sinter. Minerals. 2021;11(6):562. https://doi.org/10.3390/min11060562</mixed-citation></citation-alternatives></ref><ref id="cit25"><label>25</label><citation-alternatives><mixed-citation xml:lang="ru">Donskoi E., Poliakov A. Advances in optical image analysis textural segmentation in ironmaking. Applied Sciences. 2020;10(18):6242. https://doi.org/10.3390/app10186242</mixed-citation><mixed-citation xml:lang="en">Donskoi E., Poliakov A. Advances in optical image analysis textural segmentation in ironmaking. Applied Sciences. 2020;10(18):6242. https://doi.org/10.3390/app10186242</mixed-citation></citation-alternatives></ref><ref id="cit26"><label>26</label><citation-alternatives><mixed-citation xml:lang="ru">Santoro L., Lezzerini M., Aquino A., et al. A novel method for evaluation of ore minerals based on optical microscopy and image analysis: preliminary results. Minerals. 2022;12(11):1348. https://doi.org/10.3390/min12111348</mixed-citation><mixed-citation xml:lang="en">Santoro L., Lezzerini M., Aquino A., et al. A novel method for evaluation of ore minerals based on optical microscopy and image analysis: preliminary results. Minerals. 2022;12(11):1348. https://doi.org/10.3390/min12111348</mixed-citation></citation-alternatives></ref><ref id="cit27"><label>27</label><citation-alternatives><mixed-citation xml:lang="ru">Su C., Wang Y., Zhu J., Zhang X. C. Rock classification in petrographic thin section images based on concatenated convolutional neural networks. Earth Science Informatics. 2020;13:1477–1484. https://doi.org/10.1007/s12145-020-00505-1</mixed-citation><mixed-citation xml:lang="en">Su C., Wang Y., Zhu J., Zhang X. C. Rock classification in petrographic thin section images based on concatenated convolutional neural networks. Earth Science Informatics. 2020;13:1477–1484. https://doi.org/10.1007/s12145-020-00505-1</mixed-citation></citation-alternatives></ref><ref id="cit28"><label>28</label><citation-alternatives><mixed-citation xml:lang="ru">Tang H., Wang H., Wang L., et al. An improved mineral image recognition method based on deep learning. JOM. 2023;75:2590–2602. https://doi.org/10.1007/s11837-023-05792-9</mixed-citation><mixed-citation xml:lang="en">Tang H., Wang H., Wang L., et al. An improved mineral image recognition method based on deep learning. JOM. 2023;75:2590–2602. https://doi.org/10.1007/s11837-023-05792-9</mixed-citation></citation-alternatives></ref><ref id="cit29"><label>29</label><citation-alternatives><mixed-citation xml:lang="ru">Khvostikov A. V., Korshunov D. M., Krylov A. S., Boguslavskii M. A. Automatic identification of minerals in images of polished sections. The International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences. 2021;XLIV-2/W1-2021:113–118. https://doi.org/10.5194/isprs-archives-XLIV-2-W1-2021-113-2021</mixed-citation><mixed-citation xml:lang="en">Khvostikov A. V., Korshunov D. M., Krylov A. S., Boguslavskii M. A. Automatic identification of minerals in images of polished sections. The International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences. 2021;XLIV-2/W1-2021:113–118. https://doi.org/10.5194/isprs-archives-XLIV-2-W1-2021-113-2021</mixed-citation></citation-alternatives></ref><ref id="cit30"><label>30</label><citation-alternatives><mixed-citation xml:lang="ru">Chen H., Zhang H., Yang G. A., Zhang L. Mutual information domain adaptation network for remotely sensed semantic segmentation. In: IEEE Transactions on Geoscience and Remote Sensing. 2022;60:1–16. https://doi.org/10.1109/TGRS.2022.3203910</mixed-citation><mixed-citation xml:lang="en">Chen H., Zhang H., Yang G. A., Zhang L. Mutual information domain adaptation network for remotely sensed semantic segmentation. In: IEEE Transactions on Geoscience and Remote Sensing. 2022;60:1–16. https://doi.org/10.1109/TGRS.2022.3203910</mixed-citation></citation-alternatives></ref><ref id="cit31"><label>31</label><citation-alternatives><mixed-citation xml:lang="ru">Nasim M. K., Tannistha M., Shrivastava A., Singh T. Seismic facies analysis: a deep domain adaptation approach. In: IEEE Transactions on Geoscience and Remote Sensing. 2020;60:1–16. https://doi.org/10.1109/TGRS.2022.3151883</mixed-citation><mixed-citation xml:lang="en">Nasim M. K., Tannistha M., Shrivastava A., Singh T. Seismic facies analysis: a deep domain adaptation approach. In: IEEE Transactions on Geoscience and Remote Sensing. 2020;60:1–16. https://doi.org/10.1109/TGRS.2022.3151883</mixed-citation></citation-alternatives></ref><ref id="cit32"><label>32</label><citation-alternatives><mixed-citation xml:lang="ru">Lin D., Dai J., Jia J., et al. Scribblesup: Scribble-supervised convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Las Vegas, NV, USA; 2016. Pp. 3159–3167. https://doi.org/10.1109/CVPR.2016.344</mixed-citation><mixed-citation xml:lang="en">Lin D., Dai J., Jia J., et al. Scribblesup: Scribble-supervised convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Las Vegas, NV, USA; 2016. Pp. 3159–3167. https://doi.org/10.1109/CVPR.2016.344</mixed-citation></citation-alternatives></ref><ref id="cit33"><label>33</label><citation-alternatives><mixed-citation xml:lang="ru">Chen X., Cheung Y. S. J., Lim S. N., Zhao H. ScribbleSeg: Scribble-based interactive image segmentation. arXiv preprint arXiv: 2303.11320. 2023. https://doi.org/10.48550/arXiv.2303.11320</mixed-citation><mixed-citation xml:lang="en">Chen X., Cheung Y. S. J., Lim S. N., Zhao H. ScribbleSeg: Scribble-based interactive image segmentation. arXiv preprint arXiv: 2303.11320. 2023. https://doi.org/10.48550/arXiv.2303.11320</mixed-citation></citation-alternatives></ref><ref id="cit34"><label>34</label><citation-alternatives><mixed-citation xml:lang="ru">Cheng B., Parkhi O., Kirillov A. Pointly-supervised instance segmentation. In: IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). New Orleans, LA, USA; 2022. Pp. 2617–2626. https://doi.org/10.1109/CVPR52688.2022.00264</mixed-citation><mixed-citation xml:lang="en">Cheng B., Parkhi O., Kirillov A. Pointly-supervised instance segmentation. In: IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). New Orleans, LA, USA; 2022. Pp. 2617–2626. https://doi.org/10.1109/CVPR52688.2022.00264</mixed-citation></citation-alternatives></ref><ref id="cit35"><label>35</label><citation-alternatives><mixed-citation xml:lang="ru">Tang H., He. L., Huang B, et al. Segmentation and labeling of polished section images based on deep learning. Mining, Metallurgy &amp; Exploration. 2025;42:1053–1063. https://doi.org/10.1007/s42461-025-01205-4</mixed-citation><mixed-citation xml:lang="en">Tang H., He. L., Huang B, et al. Segmentation and labeling of polished section images based on deep learning. Mining, Metallurgy &amp; Exploration. 2025;42:1053–1063. https://doi.org/10.1007/s42461-025-01205-4</mixed-citation></citation-alternatives></ref><ref id="cit36"><label>36</label><citation-alternatives><mixed-citation xml:lang="ru">Tabani H., Balasubramaniam A., Marzbanet S., et al. Improving the efficiency of transformers for resource-constrained devices. In: 24th Euromicro Conference on Digital System Design (DSD). Palermo, Italy; 2021. Pp. 449–456. https://doi.org/10.1109/DSD53832.2021.00074</mixed-citation><mixed-citation xml:lang="en">Tabani H., Balasubramaniam A., Marzbanet S., et al. Improving the efficiency of transformers for resource-constrained devices. In: 24th Euromicro Conference on Digital System Design (DSD). Palermo, Italy; 2021. Pp. 449–456. https://doi.org/10.1109/DSD53832.2021.00074</mixed-citation></citation-alternatives></ref><ref id="cit37"><label>37</label><citation-alternatives><mixed-citation xml:lang="ru">Bressan P. O., Junior J. M. Martins J. A. C., et al. Semantic segmentation with labeling uncertainty and class imbalance. International Journal of Applied Earth Observation and Geoinformation. 2022;108:102690. https://doi.org/10.1016/j.jag.2022.102690</mixed-citation><mixed-citation xml:lang="en">Bressan P. O., Junior J. M. Martins J. A. C., et al. Semantic segmentation with labeling uncertainty and class imbalance. International Journal of Applied Earth Observation and Geoinformation. 2022;108:102690. https://doi.org/10.1016/j.jag.2022.102690</mixed-citation></citation-alternatives></ref><ref id="cit38"><label>38</label><citation-alternatives><mixed-citation xml:lang="ru">Li Z., Kamnitsas K., Glocker B. Analyzing overfitting underclass imbalance in neural networks for image segmentation. In: IEEE Transactions on Medical Imaging. 2021;40(3):1065–1077. https://doi.org/10.1109/TMI.2020.3046692</mixed-citation><mixed-citation xml:lang="en">Li Z., Kamnitsas K., Glocker B. Analyzing overfitting underclass imbalance in neural networks for image segmentation. In: IEEE Transactions on Medical Imaging. 2021;40(3):1065–1077. https://doi.org/10.1109/TMI.2020.3046692</mixed-citation></citation-alternatives></ref><ref id="cit39"><label>39</label><citation-alternatives><mixed-citation xml:lang="ru">Kochkarev A., Khvosticov A., Korshunov D., Boguslavskii M. Data balancing method for training segmentation neural networks. In: Proceedings of the 30th International Conference on Computer Graphics and Machine Vision (GraphiCon 2020). Saint Petersburg, Russia, 22–25 September. Saint Petersburg: Ceur Workshop Proceedings; 2020.</mixed-citation><mixed-citation xml:lang="en">Kochkarev A., Khvosticov A., Korshunov D., Boguslavskii M. Data balancing method for training segmentation neural networks. In: Proceedings of the 30th International Conference on Computer Graphics and Machine Vision (GraphiCon 2020). Saint Petersburg, Russia, 22–25 September. Saint Petersburg: Ceur Workshop Proceedings; 2020.</mixed-citation></citation-alternatives></ref><ref id="cit40"><label>40</label><citation-alternatives><mixed-citation xml:lang="ru">Ronneberger O., Fischer P., Brox T. U-Net: Convolutional networks for biomedical image segmentation. B: Navab N. Medical Image Computing and Computer-Assisted Intervention – MICCAI 2015. Cham: Springer; 2015. Pp. 234–41. https://doi.org/10.1007/978-3-319-24574-4_28</mixed-citation><mixed-citation xml:lang="en">Ronneberger O., Fischer P., Brox T. U-Net: Convolutional networks for biomedical image segmentation. B: Navab N. Medical Image Computing and Computer-Assisted Intervention – MICCAI 2015. Cham: Springer; 2015. Pp. 234–41. https://doi.org/10.1007/978-3-319-24574-4_28</mixed-citation></citation-alternatives></ref><ref id="cit41"><label>41</label><citation-alternatives><mixed-citation xml:lang="ru">Zhao H., Shi J., Qi X., et al. Pyramid scene parsing network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Honolulu, HI, USA; 2017. Pp. 2881–2890. https://doi.org/10.1109/CVPR.2017.660</mixed-citation><mixed-citation xml:lang="en">Zhao H., Shi J., Qi X., et al. Pyramid scene parsing network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Honolulu, HI, USA; 2017. Pp. 2881–2890. https://doi.org/10.1109/CVPR.2017.660</mixed-citation></citation-alternatives></ref><ref id="cit42"><label>42</label><citation-alternatives><mixed-citation xml:lang="ru">Xiao T., Liu Y., Zhou B., et al. Unified perceptual parsing for scene understanding. In: Ferrari V., Hebert M., Sminchisescu C., Weiss Y. (eds.) Computer Vision – ECCV 2018. ECCV 2018. Lecture Notes in Computer Science. Vol 11209. Springer, Cham; 2018. Pp. 418–434. https://doi.org/10.1007/978-3-030-01228-1_26</mixed-citation><mixed-citation xml:lang="en">Xiao T., Liu Y., Zhou B., et al. Unified perceptual parsing for scene understanding. In: Ferrari V., Hebert M., Sminchisescu C., Weiss Y. (eds.) Computer Vision – ECCV 2018. ECCV 2018. Lecture Notes in Computer Science. Vol 11209. Springer, Cham; 2018. Pp. 418–434. https://doi.org/10.1007/978-3-030-01228-1_26</mixed-citation></citation-alternatives></ref><ref id="cit43"><label>43</label><citation-alternatives><mixed-citation xml:lang="ru">Rezatofighi H., Tsoi N., Gwak J., et al. Generalized intersection over union: A metric and a loss for bounding box regression. In: Proceedings of the IEEE. 2019. Pp. 658–666. https://doi.org/10.48550/arXiv.1902.09630</mixed-citation><mixed-citation xml:lang="en">Rezatofighi H., Tsoi N., Gwak J., et al. Generalized intersection over union: A metric and a loss for bounding box regression. In: Proceedings of the IEEE. 2019. Pp. 658–666. https://doi.org/10.48550/arXiv.1902.09630</mixed-citation></citation-alternatives></ref><ref id="cit44"><label>44</label><citation-alternatives><mixed-citation xml:lang="ru">Reinhard E., Adhikhmin M., Gooch B., Shirley P. Color transfer between images. In: IEEE Computer Graphics and Applications. 2001;21(5):34-41. https://doi.org/10.1109/38.946629</mixed-citation><mixed-citation xml:lang="en">Reinhard E., Adhikhmin M., Gooch B., Shirley P. Color transfer between images. In: IEEE Computer Graphics and Applications. 2001;21(5):34-41. https://doi.org/10.1109/38.946629</mixed-citation></citation-alternatives></ref><ref id="cit45"><label>45</label><citation-alternatives><mixed-citation xml:lang="ru">Indychko O. I., Khvostikov A. V., Korshunov D. M., Boguslavskii M. A. Color adaptation in images of polished sections of geological specimens. Computational Mathematics and Modeling. 2022;33:487–500. https://doi.org/10.1007/s10598-023-09588-z</mixed-citation><mixed-citation xml:lang="en">Indychko O. I., Khvostikov A. V., Korshunov D. M., Boguslavskii M. A. Color adaptation in images of polished sections of geological specimens. Computational Mathematics and Modeling. 2022;33:487–500. https://doi.org/10.1007/s10598-023-09588-z</mixed-citation></citation-alternatives></ref><ref id="cit46"><label>46</label><citation-alternatives><mixed-citation xml:lang="ru">Wolf S. Color correction matrix for digital still and video imaging systems. Washington, D.C.: National Telecommunications and Information Administration; 2003. 28 p.</mixed-citation><mixed-citation xml:lang="en">Wolf S. Color correction matrix for digital still and video imaging systems. Washington, D.C.: National Telecommunications and Information Administration; 2003. 28 p.</mixed-citation></citation-alternatives></ref><ref id="cit47"><label>47</label><citation-alternatives><mixed-citation xml:lang="ru">Sharma G., Wu W., Dalal E. N. The CIEDE2000 color-difference formula: Implementation notes, supplementary test data, and mathematical observations. Color Research &amp; Application. 2005;30(1):21–30. https://doi.org/10.1002/col.20070</mixed-citation><mixed-citation xml:lang="en">Sharma G., Wu W., Dalal E. N. The CIEDE2000 color-difference formula: Implementation notes, supplementary test data, and mathematical observations. Color Research &amp; Application. 2005;30(1):21–30. https://doi.org/10.1002/col.20070</mixed-citation></citation-alternatives></ref><ref id="cit48"><label>48</label><citation-alternatives><mixed-citation xml:lang="ru">Razzhivina D. I., Korshunov D. M., Boguslavskiy M. A., et al. Registration and segmentation of PPL and XPL images of geological polished sections containing anisotropic minerals. Computational Mathematics and Modeling. 2024;34:16–26. https://doi.org/10.1007/s10598-024-09592-x</mixed-citation><mixed-citation xml:lang="en">Razzhivina D. I., Korshunov D. M., Boguslavskiy M. A., et al. Registration and segmentation of PPL and XPL images of geological polished sections containing anisotropic minerals. Computational Mathematics and Modeling. 2024;34:16–26. https://doi.org/10.1007/s10598-024-09592-x</mixed-citation></citation-alternatives></ref><ref id="cit49"><label>49</label><citation-alternatives><mixed-citation xml:lang="ru">Lowe D. G. Distinctive image features from scale invariant keypoints. International Journal of Computer Vision. 2004;60:91–110. https://doi.org/10.1023/B:VISI.0000029664.99615.94</mixed-citation><mixed-citation xml:lang="en">Lowe D. G. Distinctive image features from scale invariant keypoints. International Journal of Computer Vision. 2004;60:91–110. https://doi.org/10.1023/B:VISI.0000029664.99615.94</mixed-citation></citation-alternatives></ref><ref id="cit50"><label>50</label><citation-alternatives><mixed-citation xml:lang="ru">Fischler M. A., Bolles R. C. Random sample consensus: a paradigm for model fitting with applications to image analysis and automated cartography. Communications of the ACM. 1981;24(6):381–395.</mixed-citation><mixed-citation xml:lang="en">Fischler M. A., Bolles R. C. Random sample consensus: a paradigm for model fitting with applications to image analysis and automated cartography. Communications of the ACM. 1981;24(6):381–395.</mixed-citation></citation-alternatives></ref><ref id="cit51"><label>51</label><citation-alternatives><mixed-citation xml:lang="ru">Ro S.-H., Kim S.-H. An image stitching algorithm for the mineralogical analysis. Minerals Engineering. 2021:169;106968. https://doi.org/10.1016/j.mineng.2021.106968</mixed-citation><mixed-citation xml:lang="en">Ro S.-H., Kim S.-H. An image stitching algorithm for the mineralogical analysis. Minerals Engineering. 2021:169;106968. https://doi.org/10.1016/j.mineng.2021.106968</mixed-citation></citation-alternatives></ref><ref id="cit52"><label>52</label><citation-alternatives><mixed-citation xml:lang="ru">Nikolaev G., Korshunov D., Khvostikov A. Automatic stitching of panoramas for geological images of polished sections. ISPRS Annals of the Photogrammetry, Remote Sensing and Spatial Information Sciences. 2024;X-2/W1-2024:39–46. https://doi.org/10.5194/isprs-annals-X-2-W1-2024-39-2024</mixed-citation><mixed-citation xml:lang="en">Nikolaev G., Korshunov D., Khvostikov A. Automatic stitching of panoramas for geological images of polished sections. ISPRS Annals of the Photogrammetry, Remote Sensing and Spatial Information Sciences. 2024;X-2/W1-2024:39–46. https://doi.org/10.5194/isprs-annals-X-2-W1-2024-39-2024</mixed-citation></citation-alternatives></ref><ref id="cit53"><label>53</label><citation-alternatives><mixed-citation xml:lang="ru">Brown D. C. Decentering distortion of lenses. Photogrammetric Engineering. 1966:32(3);444–462.</mixed-citation><mixed-citation xml:lang="en">Brown D. C. Decentering distortion of lenses. Photogrammetric Engineering. 1966:32(3);444–462.</mixed-citation></citation-alternatives></ref><ref id="cit54"><label>54</label><citation-alternatives><mixed-citation xml:lang="ru">Seibert J. A., Boone J. M., Lindfors K. K. Flat-field correction technique for digital detectors. In: Proceedings of SPIE, Medical Imaging 1998: Physics of Medical Imaging. 1998:3336;348–354. https://doi.org/10.1117/12.317034</mixed-citation><mixed-citation xml:lang="en">Seibert J. A., Boone J. M., Lindfors K. K. Flat-field correction technique for digital detectors. In: Proceedings of SPIE, Medical Imaging 1998: Physics of Medical Imaging. 1998:3336;348–354. https://doi.org/10.1117/12.317034</mixed-citation></citation-alternatives></ref><ref id="cit55"><label>55</label><citation-alternatives><mixed-citation xml:lang="ru">Sun J., Shen Z., Wang Y., et al. LoFTR: Detector-free local feature matching with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). 2021. Pp. 8922–8931. https://doi.org/10.48550/arXiv.2104.00680</mixed-citation><mixed-citation xml:lang="en">Sun J., Shen Z., Wang Y., et al. LoFTR: Detector-free local feature matching with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). 2021. Pp. 8922–8931. https://doi.org/10.48550/arXiv.2104.00680</mixed-citation></citation-alternatives></ref><ref id="cit56"><label>56</label><citation-alternatives><mixed-citation xml:lang="ru">Boykov Y., Kolmogorov V. An experimental comparison of min-cut/max-flow algorithms for energy minimization in vision. In: IEEE Transactions on Pattern Analysis and Machine Intelligence. 2004;26(9):1124–1137. https://doi.org/10.1109/TPAMI.2004.60</mixed-citation><mixed-citation xml:lang="en">Boykov Y., Kolmogorov V. An experimental comparison of min-cut/max-flow algorithms for energy minimization in vision. In: IEEE Transactions on Pattern Analysis and Machine Intelligence. 2004;26(9):1124–1137. https://doi.org/10.1109/TPAMI.2004.60</mixed-citation></citation-alternatives></ref><ref id="cit57"><label>57</label><citation-alternatives><mixed-citation xml:lang="ru">Achanta R., Shaji A., Smith K., et al. SLIC superpixels compared to state-of-the-art superpixel methods. In: IEEE Transactions on Pattern Analysis and Machine Intelligence. 2012;34(11):2274–2282. https://doi.org/10.1109/TPAMI.2012.120</mixed-citation><mixed-citation xml:lang="en">Achanta R., Shaji A., Smith K., et al. SLIC superpixels compared to state-of-the-art superpixel methods. In: IEEE Transactions on Pattern Analysis and Machine Intelligence. 2012;34(11):2274–2282. https://doi.org/10.1109/TPAMI.2012.120</mixed-citation></citation-alternatives></ref><ref id="cit58"><label>58</label><citation-alternatives><mixed-citation xml:lang="ru">Felzenszwalb P. F., Huttenlocher D. P. Efficient graph-based image segmentation. International Journal of Computer Vision. 2004:59;167–181. https://doi.org/10.1023/B:VISI.0000022288.19776.77</mixed-citation><mixed-citation xml:lang="en">Felzenszwalb P. F., Huttenlocher D. P. Efficient graph-based image segmentation. International Journal of Computer Vision. 2004:59;167–181. https://doi.org/10.1023/B:VISI.0000022288.19776.77</mixed-citation></citation-alternatives></ref><ref id="cit59"><label>59</label><citation-alternatives><mixed-citation xml:lang="ru">Indychko O., Korshunov D., Khvostikov A. Using uncertainty to expand training sets for mineral segmentation in geological images. The International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences. 2025. In press.</mixed-citation><mixed-citation xml:lang="en">Indychko O., Korshunov D., Khvostikov A. Using uncertainty to expand training sets for mineral segmentation in geological images. The International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences. 2025. In press.</mixed-citation></citation-alternatives></ref><ref id="cit60"><label>60</label><citation-alternatives><mixed-citation xml:lang="ru">Franco L., Mandica P., Kallidromitis K., et al. Hyperbolic Active Learning for Semantic Segmentation under Domain Shift. In: Proceedings of the 41st International Conference on Machine Learning. 2024. https://doi.org/10.48550/arXiv.2306.11180</mixed-citation><mixed-citation xml:lang="en">Franco L., Mandica P., Kallidromitis K., et al. Hyperbolic Active Learning for Semantic Segmentation under Domain Shift. In: Proceedings of the 41st International Conference on Machine Learning. 2024. https://doi.org/10.48550/arXiv.2306.11180</mixed-citation></citation-alternatives></ref><ref id="cit61"><label>61</label><citation-alternatives><mixed-citation xml:lang="ru">Khvostikov A., Ippolitov V., Krylov A., et al. PathScribe: new software to work with whole slide histological images for education and research. In: Proceedings of the 2023 8th International Conference on Biomedical Imaging, Signal Processing. Singapore: ACM; 2023. Pp. 63–70. https://doi.org/10.1145/3634875.3634884</mixed-citation><mixed-citation xml:lang="en">Khvostikov A., Ippolitov V., Krylov A., et al. PathScribe: new software to work with whole slide histological images for education and research. In: Proceedings of the 2023 8th International Conference on Biomedical Imaging, Signal Processing. Singapore: ACM; 2023. Pp. 63–70. https://doi.org/10.1145/3634875.3634884</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
