<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">vestifm</journal-id><journal-title-group><journal-title xml:lang="ru">Известия Национальной академии наук Беларуси. Серия физико-математических наук</journal-title><trans-title-group xml:lang="en"><trans-title>Proceedings of the National Academy of Sciences of Belarus. Physics and Mathematics Series</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1561-2430</issn><issn pub-type="epub">2524-2415</issn><publisher><publisher-name>The Republican Unitary Enterprise Publishing House "Belaruskaya Navuka"</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.29235/1561-2430-2025-61-3-253-264</article-id><article-id custom-type="elpub" pub-id-type="custom">vestifm-853</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ИНФОРМАТИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>INFORMATICS</subject></subj-group></article-categories><title-group><article-title>Метод обнаружения объектов на изображениях дистанционного зондирования Земли ABS-YOLO на основе улучшенного YOLOv11</article-title><trans-title-group xml:lang="en"><trans-title>A remote sensing image object detection method ABS-YOLO based on improved YOLOv11</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0003-6976-5386</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Сяньи</surname><given-names>Ву</given-names></name><name name-style="western" xml:lang="en"><surname>Xianyi</surname><given-names>Wu</given-names></name></name-alternatives><bio xml:lang="ru"><p>Ву Сяньи – аспирант</p><p>пр. Независимости, 4, 220030, Минск</p></bio><bio xml:lang="en"><p>Wu Xianyi – Postgraduate Student</p><p>4, Nezavisimosti Ave., 220030, Minsk</p></bio><email xlink:type="simple">tigerv5872@gmail.com</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-9404-1206</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Абламейко</surname><given-names>С. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Ablameyko</surname><given-names>S. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Абламейко Сергей Владимирович – академик Национальной академии наук Беларуси, доктор технических наук, профессор</p><p>ул. Сурганова, 6, 220012, Минск</p></bio><bio xml:lang="en"><p>Sergey V. Ablameyko – Academician of the National Academy of Sciences of Belarus, Dr. Sc. (Engineering), Professor</p><p>6, Surganov Str., 220012, Minsk</p><p> </p></bio><email xlink:type="simple">ablameyko@yandex.by</email><xref ref-type="aff" rid="aff-2"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Белорусский государственный университет</institution></aff><aff xml:lang="en"><institution>Belarusian State University</institution></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru"><institution>Объединенный институт проблем информатики Национальной академии наук Беларуси</institution></aff><aff xml:lang="en"><institution>United Institute of Informatics Problems of the National Academy of Sciences of Belarus</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>14</day><month>10</month><year>2025</year></pub-date><volume>61</volume><issue>3</issue><fpage>253</fpage><lpage>264</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Сяньи В., Абламейко С.В., 2025</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="ru">Сяньи В., Абламейко С.В.</copyright-holder><copyright-holder xml:lang="en">Xianyi W., Ablameyko S.V.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://vestifm.belnauka.by/jour/article/view/853">https://vestifm.belnauka.by/jour/article/view/853</self-uri><abstract><p>Исследуется задача обнаружения объектов на изображениях дистанционного зондирования Земли, что важно для сельскохозяйственного мониторинга, городского планирования, раннего предупреждения о стихийных бедствиях и др. Из-за различных размеров объектов, сложного фона и плотного распределения мелких объектов на изображениях дистанционного зондирования часто возникают проблемы, связанные с высоким процентом пропущенных объектов и недостаточной точностью определения их координат. В связи с этим предлагается усовершенствованный метод для YOLOv11 – ABS-YOLO, который значительно повышает производительность обнаружения объектов за счет интеграции усредненной свертки (AConv), двунаправленной пирамиды взвешенных признаков (BiFPN) и механизма внимания Swin Transformer. Экспериментальные результаты показывают, что по сравнению с YOLOv11 предложенный метод обнаружения объектов ABS-YOLO с AConv, BiFPN и Swin Transformer достигает увеличения оценок mAP50 на 3,9 % и mAP50-95 на 2,6 % на наборе данных NWPU VHR-10 со значительным улучшением в точности и показателях полноты. Данный метод позволяет достичь баланса между эффективностью и точностью обнаружения объектов дистанционного зондирования благодаря предложенным усовершенствованиям.</p></abstract><trans-abstract xml:lang="en"><p>The problem of object detection in Earth remote sensing images is studied, which is important for agricultural monitoring, urban planning, early warning of natural disasters, etc. Due to the different sizes of objects, complex background, and dense distribution of small objects in remote sensing images, problems such as high percentage of missed objects and insufficient accuracy of their coordinates often arise. In this regard, an improved method for YOLOv11, ABS-YOLO, is proposed, which significantly improves the performance of object detection by integrating Averaged Convolution (AConv), Bidirectional Weighted Feature Pyramid (BiFPN), and Swin Transformer attention mechanism. Experimental results show that, compared with YOLOv11, the proposed object detection method ABS-YOLO with AConv, BiFPN, and Swin Transformer achieves 3.9 % increase in mAP50 estimations and 2.6 % increase in mAP50-95 on the NWPU VHR-10 dataset with significant improvement in precision and recall rates. This method allows achieving a balance between efficiency and accuracy of remote sensing object detection due to the proposed improvements.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>YOLOv11</kwd><kwd>Swin Transformer</kwd><kwd>изображение дистанционного зондирования</kwd><kwd>обнаружение объектов</kwd></kwd-group><kwd-group xml:lang="en"><kwd>YOLOv11</kwd><kwd>Swin Transformer</kwd><kwd>remote sensing image</kwd><kwd>object detection</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Velastegui-Montoya A., Montalván-Burbano N., Carrión-Mero P., Rivera-Torres H., Sadeck L., Adami M. Google Earth Engine: A Global Analysis and Future Trends. Remote Sensing, 2023, vol. 15, no. 14, art. ID 3675. https://doi.org/10.3390/rs15143675</mixed-citation><mixed-citation xml:lang="en">Velastegui-Montoya A., Montalván-Burbano N., Carrión-Mero P., Rivera-Torres H., Sadeck L., Adami M. Google Earth Engine: A Global Analysis and Future Trends. Remote Sensing, 2023, vol. 15, no. 14, art. ID 3675. https://doi.org/10.3390/rs15143675</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Liu H., Gong P., Wang J., Wang X., Ning G., Xu B. Production of global daily seamless data cubes and quantification of global land cover change from 1985 to 2020 – iMap World 1.0. Remote Sensing of Environment, 2021, vol. 258, art. ID 112364. https://doi.org/10.1016/j.rse.2021.112364</mixed-citation><mixed-citation xml:lang="en">Liu H., Gong P., Wang J., Wang X., Ning G., Xu B. Production of global daily seamless data cubes and quantification of global land cover change from 1985 to 2020 – iMap World 1.0. Remote Sensing of Environment, 2021, vol. 258, art. ID 112364. https://doi.org/10.1016/j.rse.2021.112364</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Zhang L. P., Shen H. F. Progress and future of remote sensing data fusion. Journal of Remote Sensing, 2016, vol. 20, no. 5, pp. 1050–1061. https://doi.org/10.11834/jrs.20166243</mixed-citation><mixed-citation xml:lang="en">Zhang L. P., Shen H. F. Progress and future of remote sensing data fusion. Journal of Remote Sensing, 2016, vol. 20, no. 5, pp. 1050–1061. https://doi.org/10.11834/jrs.20166243</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Dalal N., Triggs B. Histograms of oriented gradients for human detection. Proceedings of the 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR’05), 2005, vol. 1, pp. 886–893. https://doi.org/10.1109/CVPR.2005.177</mixed-citation><mixed-citation xml:lang="en">Dalal N., Triggs B. Histograms of oriented gradients for human detection. Proceedings of the 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR’05), 2005, vol. 1, pp. 886–893. https://doi.org/10.1109/CVPR.2005.177</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Lowe D. G. Object recognition from local scale-invariant features. Proceedings of the Seventh IEEE International Conference on Computer Vision, 1999, vol. 2, pp. 1150–1157. https://doi.org/10.1109/ICCV.1999.790410</mixed-citation><mixed-citation xml:lang="en">Lowe D. G. Object recognition from local scale-invariant features. Proceedings of the Seventh IEEE International Conference on Computer Vision, 1999, vol. 2, pp. 1150–1157. https://doi.org/10.1109/ICCV.1999.790410</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Maturana D., Mery D., Soto Á. Face recognition with local binary patterns, spatial pyramid histograms and naive Bayes nearest neighbor classification. Proceedings of the 2009 International Conference of the Chilean Computer Science Society, 2009, pp. 125–132. https://doi.org/10.1109/SCCC.2009.21</mixed-citation><mixed-citation xml:lang="en">Maturana D., Mery D., Soto Á. Face recognition with local binary patterns, spatial pyramid histograms and naive Bayes nearest neighbor classification. Proceedings of the 2009 International Conference of the Chilean Computer Science Society, 2009, pp. 125–132. https://doi.org/10.1109/SCCC.2009.21</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Girshick R., Donahue J., Darrell T., Malik J. Rich feature hierarchies for accurate object detection and semantic segmentation. Arxiv [Preprint], 2014. Available at: https://arxiv.org/abs/1311.2524. https://doi.org/10.48550/arXiv.1311.2524</mixed-citation><mixed-citation xml:lang="en">Girshick R., Donahue J., Darrell T., Malik J. Rich feature hierarchies for accurate object detection and semantic segmentation. Arxiv [Preprint], 2014. Available at: https://arxiv.org/abs/1311.2524. https://doi.org/10.48550/arXiv.1311.2524</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Girshick R. Fast R-CNN. Arxiv [Preprint], 2015. Available at: https://arxiv.org/abs/1504.08083. https://doi.org/10.48550/arXiv.1504.08083</mixed-citation><mixed-citation xml:lang="en">Girshick R. Fast R-CNN. Arxiv [Preprint], 2015. Available at: https://arxiv.org/abs/1504.08083. https://doi.org/10.48550/arXiv.1504.08083</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Ren S., He K., Girshick R., Sun J. Faster R-CNN: Towards real-time object detection with region proposal networks. Arxiv [Preprint], 2016. Available at: https://arxiv.org/abs/1506.01497. https://doi.org/10.48550/arXiv.1506.01497</mixed-citation><mixed-citation xml:lang="en">Ren S., He K., Girshick R., Sun J. Faster R-CNN: Towards real-time object detection with region proposal networks. Arxiv [Preprint], 2016. Available at: https://arxiv.org/abs/1506.01497. https://doi.org/10.48550/arXiv.1506.01497</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Redmon J., Divvala S., Girshick R., Farhadi A. You only look once: Unified, real-time object detection. Arxiv [Preprint], 2016. Available at: https://arxiv.org/abs/1506.02640. https://doi.org/10.48550/arXiv.1506.02640</mixed-citation><mixed-citation xml:lang="en">Redmon J., Divvala S., Girshick R., Farhadi A. You only look once: Unified, real-time object detection. Arxiv [Preprint], 2016. Available at: https://arxiv.org/abs/1506.02640. https://doi.org/10.48550/arXiv.1506.02640</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Liu W., Anguelov D., Erhan D., Szegedy C., Reed S., Fu C.-Y., Berg A. C. SSD: Single Shot MultiBox Detector. Computer Vision – ECCV 2016. ECCV 2016. Lecture Notes in Computer Science, vol 9905. Springer, 2016, pp. 21–37. https://doi.org/10.1007/978-3-319-46448-0_2</mixed-citation><mixed-citation xml:lang="en">Liu W., Anguelov D., Erhan D., Szegedy C., Reed S., Fu C.-Y., Berg A. C. SSD: Single Shot MultiBox Detector. Computer Vision – ECCV 2016. ECCV 2016. Lecture Notes in Computer Science, vol 9905. Springer, 2016, pp. 21–37. https://doi.org/10.1007/978-3-319-46448-0_2</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Zhang Y., Ye M., Zhu G., Liu Y., Guo P., Yan J. FFCA-YOLO for small object detection in remote sensing images. IEEE Transactions on Geoscience and Remote Sensing, 2024, vol. 62, pp. 1–15. https://doi.org/10.1109/TGRS.2024.3363057</mixed-citation><mixed-citation xml:lang="en">Zhang Y., Ye M., Zhu G., Liu Y., Guo P., Yan J. FFCA-YOLO for small object detection in remote sensing images. IEEE Transactions on Geoscience and Remote Sensing, 2024, vol. 62, pp. 1–15. https://doi.org/10.1109/TGRS.2024.3363057</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Yi H., Liu B., Zhao B., Liu E. Small object detection algorithm based on improved YOLOv8 for remote sensing. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing, 2024, vol. 17, pp. 1734–1747. https://doi.org/10.1109/JSTARS.2023.3339235</mixed-citation><mixed-citation xml:lang="en">Yi H., Liu B., Zhao B., Liu E. Small object detection algorithm based on improved YOLOv8 for remote sensing. IEEE Journal of Selected Topics in Applied Earth Observations and Remote Sensing, 2024, vol. 17, pp. 1734–1747. https://doi.org/10.1109/JSTARS.2023.3339235</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Wu T., Dong Y. YOLO-SE: Improved YOLOv8 for Remote Sensing Object Detection and Recognition. Applied Sciences, 2023, vol. 13, no. 24, art. ID 12977. https://doi.org/10.3390/app132412977</mixed-citation><mixed-citation xml:lang="en">Wu T., Dong Y. YOLO-SE: Improved YOLOv8 for Remote Sensing Object Detection and Recognition. Applied Sciences, 2023, vol. 13, no. 24, art. ID 12977. https://doi.org/10.3390/app132412977</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Wang X., Gao H., Jia Z., Li Z. BL-YOLOv8: An Improved Road Defect Detection Model Based on YOLOv8. Sensors, 2023, vol. 23, no. 20, art. ID 8361. https://doi.org/10.3390/s23208361</mixed-citation><mixed-citation xml:lang="en">Wang X., Gao H., Jia Z., Li Z. BL-YOLOv8: An Improved Road Defect Detection Model Based on YOLOv8. Sensors, 2023, vol. 23, no. 20, art. ID 8361. https://doi.org/10.3390/s23208361</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Soudeep S., Jahin M. A., Mridha M. F. Interpretable dynamic graph neural networks for small occluded object detection and tracking. Arxiv [Preprint], 2025. Available at: https://arxiv.org/abs/2411.17251. https://doi.org/10.48550/arXiv.2411.17251</mixed-citation><mixed-citation xml:lang="en">Soudeep S., Jahin M. A., Mridha M. F. Interpretable dynamic graph neural networks for small occluded object detection and tracking. Arxiv [Preprint], 2025. Available at: https://arxiv.org/abs/2411.17251. https://doi.org/10.48550/arXiv.2411.17251</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Khanam R., Hussain M. YOLOv11: An overview of the key architectural enhancements. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2410.17725. https://doi.org/10.48550/arXiv.2410.17725</mixed-citation><mixed-citation xml:lang="en">Khanam R., Hussain M. YOLOv11: An overview of the key architectural enhancements. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2410.17725. https://doi.org/10.48550/arXiv.2410.17725</mixed-citation></citation-alternatives></ref><ref id="cit18"><label>18</label><citation-alternatives><mixed-citation xml:lang="ru">Tan M., Pang R., Le Q. V. EfficientDet: Scalable and efficient object detection. Arxiv [Preprint], 2020. Available at: https://arxiv.org/abs/1911.09070. https://doi.org/10.48550/arXiv.1911.09070</mixed-citation><mixed-citation xml:lang="en">Tan M., Pang R., Le Q. V. EfficientDet: Scalable and efficient object detection. Arxiv [Preprint], 2020. Available at: https://arxiv.org/abs/1911.09070. https://doi.org/10.48550/arXiv.1911.09070</mixed-citation></citation-alternatives></ref><ref id="cit19"><label>19</label><citation-alternatives><mixed-citation xml:lang="ru">Lin T.-Y., Dollár P., Girshick R., He K., Hariharan B., Belongie S. Feature pyramid networks for object detection. Arxiv [Preprint], 2017. Available at: https://arxiv.org/abs/1612.03144. https://doi.org/10.48550/arXiv.1612.03144</mixed-citation><mixed-citation xml:lang="en">Lin T.-Y., Dollár P., Girshick R., He K., Hariharan B., Belongie S. Feature pyramid networks for object detection. Arxiv [Preprint], 2017. Available at: https://arxiv.org/abs/1612.03144. https://doi.org/10.48550/arXiv.1612.03144</mixed-citation></citation-alternatives></ref><ref id="cit20"><label>20</label><citation-alternatives><mixed-citation xml:lang="ru">Liu S., Qi L., Qin H., Shi J., Jia J. Path aggregation network for instance segmentation. Arxiv [Preprint], 2018. Available at: https://arxiv.org/abs/1803.01534. https://doi.org/10.48550/arXiv.1803.01534</mixed-citation><mixed-citation xml:lang="en">Liu S., Qi L., Qin H., Shi J., Jia J. Path aggregation network for instance segmentation. Arxiv [Preprint], 2018. Available at: https://arxiv.org/abs/1803.01534. https://doi.org/10.48550/arXiv.1803.01534</mixed-citation></citation-alternatives></ref><ref id="cit21"><label>21</label><citation-alternatives><mixed-citation xml:lang="ru">Ghiasi G., Lin T.-Y., Pang R., Le Q. V. NAS-FPN: Learning scalable feature pyramid architecture for object detection. Arxiv [Preprint], 2019. Available at: https://arxiv.org/abs/1904.07392. https://doi.org/10.48550/arXiv.1904.07392</mixed-citation><mixed-citation xml:lang="en">Ghiasi G., Lin T.-Y., Pang R., Le Q. V. NAS-FPN: Learning scalable feature pyramid architecture for object detection. Arxiv [Preprint], 2019. Available at: https://arxiv.org/abs/1904.07392. https://doi.org/10.48550/arXiv.1904.07392</mixed-citation></citation-alternatives></ref><ref id="cit22"><label>22</label><citation-alternatives><mixed-citation xml:lang="ru">Liu Z., Lin Y., Cao Y., Hu H., Wei Y., Zhang Z., Lin S., Guo B. Swin Transformer: Hierarchical vision transformer using shifted windows. Arxiv [Preprint], 2021. Available at: https://arxiv.org/abs/2103.14030. https://doi.org/10.48550/arXiv.2103.14030</mixed-citation><mixed-citation xml:lang="en">Liu Z., Lin Y., Cao Y., Hu H., Wei Y., Zhang Z., Lin S., Guo B. Swin Transformer: Hierarchical vision transformer using shifted windows. Arxiv [Preprint], 2021. Available at: https://arxiv.org/abs/2103.14030. https://doi.org/10.48550/arXiv.2103.14030</mixed-citation></citation-alternatives></ref><ref id="cit23"><label>23</label><citation-alternatives><mixed-citation xml:lang="ru">Su H., Wei S., Yan M., Wang C., Shi J., Zhang X. Object detection and instance segmentation in remote sensing imagery based on precise Mask R-CNN. IGARSS 2019 – 2019 IEEE International Geoscience and Remote Sensing Symposium, 2019, pp. 1454–1457. https://doi.org/10.1109/IGARSS.2019.8898573</mixed-citation><mixed-citation xml:lang="en">Su H., Wei S., Yan M., Wang C., Shi J., Zhang X. Object detection and instance segmentation in remote sensing imagery based on precise Mask R-CNN. IGARSS 2019 – 2019 IEEE International Geoscience and Remote Sensing Symposium, 2019, pp. 1454–1457. https://doi.org/10.1109/IGARSS.2019.8898573</mixed-citation></citation-alternatives></ref><ref id="cit24"><label>24</label><citation-alternatives><mixed-citation xml:lang="ru">Su H., Wei S., Liu S., Liang J., Wang C., Shi J., Zhang X. HQ-ISNet: High-Quality Instance Segmentation for Remote Sensing Imagery. Remote Sensing, 2020, vol. 12, no. 6, pp. 989. https://doi.org/10.3390/rs12060989</mixed-citation><mixed-citation xml:lang="en">Su H., Wei S., Liu S., Liang J., Wang C., Shi J., Zhang X. HQ-ISNet: High-Quality Instance Segmentation for Remote Sensing Imagery. Remote Sensing, 2020, vol. 12, no. 6, pp. 989. https://doi.org/10.3390/rs12060989</mixed-citation></citation-alternatives></ref><ref id="cit25"><label>25</label><citation-alternatives><mixed-citation xml:lang="ru">Khanam R., Hussain M. What is YOLOv5: A deep look into the internal features of the popular object detector. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2407.20892. https://doi.org/10.48550/arXiv.2407.20892</mixed-citation><mixed-citation xml:lang="en">Khanam R., Hussain M. What is YOLOv5: A deep look into the internal features of the popular object detector. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2407.20892. https://doi.org/10.48550/arXiv.2407.20892</mixed-citation></citation-alternatives></ref><ref id="cit26"><label>26</label><citation-alternatives><mixed-citation xml:lang="ru">Li C., Li L., Jiang H., Weng K., Geng Y., Li L., Ke Z. [et al.]. YOLOv6: A single-stage object detection framework for industrial applications. Arxiv [Preprint], 2022. Available at: https://arxiv.org/abs/2209.02976. https://doi.org/10.48550/arXiv.2209.02976</mixed-citation><mixed-citation xml:lang="en">Li C., Li L., Jiang H., Weng K., Geng Y., Li L., Ke Z. [et al.]. YOLOv6: A single-stage object detection framework for industrial applications. Arxiv [Preprint], 2022. Available at: https://arxiv.org/abs/2209.02976. https://doi.org/10.48550/arXiv.2209.02976</mixed-citation></citation-alternatives></ref><ref id="cit27"><label>27</label><citation-alternatives><mixed-citation xml:lang="ru">Jocher G., Qiu J., Chaurasia A. Ultralytics YOLO (Version 8.0.0) [Computer software]. 2023. Available at: https:// github.com/ultralytics/ultralytics</mixed-citation><mixed-citation xml:lang="en">Jocher G., Qiu J., Chaurasia A. Ultralytics YOLO (Version 8.0.0) [Computer software]. 2023. Available at: https:// github.com/ultralytics/ultralytics</mixed-citation></citation-alternatives></ref><ref id="cit28"><label>28</label><citation-alternatives><mixed-citation xml:lang="ru">Wang A., Chen H., Liu L., Chen K., Lin Z., Han J., Ding G. YOLOv10: Real-time end-to-end object detection. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2405.14458. https://doi.org/10.48550/arXiv.2405.14458</mixed-citation><mixed-citation xml:lang="en">Wang A., Chen H., Liu L., Chen K., Lin Z., Han J., Ding G. YOLOv10: Real-time end-to-end object detection. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2405.14458. https://doi.org/10.48550/arXiv.2405.14458</mixed-citation></citation-alternatives></ref><ref id="cit29"><label>29</label><citation-alternatives><mixed-citation xml:lang="ru">Ouyang D., He S., Zhang G., Luo M., Guo H., Zhan J., Huang Z. Efficient multi-scale attention module with cross-spatial learning. ICASSP 2023 – 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, 2023, pp. 1–5. https://doi.org/10.1109/ICASSP49357.2023.10096516</mixed-citation><mixed-citation xml:lang="en">Ouyang D., He S., Zhang G., Luo M., Guo H., Zhan J., Huang Z. Efficient multi-scale attention module with cross-spatial learning. ICASSP 2023 – 2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). IEEE, 2023, pp. 1–5. https://doi.org/10.1109/ICASSP49357.2023.10096516</mixed-citation></citation-alternatives></ref><ref id="cit30"><label>30</label><citation-alternatives><mixed-citation xml:lang="ru">Yang L., Zhang R.-Y., Li L., Xie X. SimAM: A simple, parameter-free attention module for convolutional neural networks. Proceedings of the 38th International Conference on Machine Learning, PMLR, 2021, vol. 139, pp. 11863–11874. Available at: https://proceedings.mlr.press/v139/yang21o.html</mixed-citation><mixed-citation xml:lang="en">Yang L., Zhang R.-Y., Li L., Xie X. SimAM: A simple, parameter-free attention module for convolutional neural networks. Proceedings of the 38th International Conference on Machine Learning, PMLR, 2021, vol. 139, pp. 11863–11874. Available at: https://proceedings.mlr.press/v139/yang21o.html</mixed-citation></citation-alternatives></ref><ref id="cit31"><label>31</label><citation-alternatives><mixed-citation xml:lang="ru">Chen Z., Lu S. CAF-YOLO: A Robust framework for multi-scale lesion detection in biomedical imagery. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2408.01897. https://doi.org/10.48550/arXiv.2408.01897</mixed-citation><mixed-citation xml:lang="en">Chen Z., Lu S. CAF-YOLO: A Robust framework for multi-scale lesion detection in biomedical imagery. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2408.01897. https://doi.org/10.48550/arXiv.2408.01897</mixed-citation></citation-alternatives></ref><ref id="cit32"><label>32</label><citation-alternatives><mixed-citation xml:lang="ru">Xu S., Zheng S., Xu W., Xu R., Wang C., Zhang J., Teng X., Li A., Guo L. HCF-Net: Hierarchical context fusion net work for infrared small object detection. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2403.10778. https://doi.org/10.48550/arXiv.2403.10778</mixed-citation><mixed-citation xml:lang="en">Xu S., Zheng S., Xu W., Xu R., Wang C., Zhang J., Teng X., Li A., Guo L. HCF-Net: Hierarchical context fusion net work for infrared small object detection. Arxiv [Preprint], 2024. Available at: https://arxiv.org/abs/2403.10778. https://doi.org/10.48550/arXiv.2403.10778</mixed-citation></citation-alternatives></ref><ref id="cit33"><label>33</label><citation-alternatives><mixed-citation xml:lang="ru">He K., Gkioxari G., Dollár P., Girshick R. Mask R-CNN. Arxiv [Preprint], 2018. Available at: https://arxiv.org/abs/1703.06870. https://doi.org/10.48550/arXiv.1703.06870</mixed-citation><mixed-citation xml:lang="en">He K., Gkioxari G., Dollár P., Girshick R. Mask R-CNN. Arxiv [Preprint], 2018. Available at: https://arxiv.org/abs/1703.06870. https://doi.org/10.48550/arXiv.1703.06870</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
