Article(id=1251480535583899932, tenantId=1146029695717560320, journalId=1251234078029037663, issueId=1251480531381207309, articleNumber=null, orderNo=null, doi=10.11887/j.issn.1001-2486.24090041, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1727452800000, receivedDateStr=2024-09-28, revisedDate=null, revisedDateStr=null, acceptedDate=null, acceptedDateStr=null, onlineDate=1776305811067, onlineDateStr=2026-04-16, pubDate=1766851200000, pubDateStr=2025-12-28, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1776305811067, onlineIssueDateStr=2026-04-16, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1776305811067, creator=13701087609, updateTime=1776305811067, updator=13701087609, issue=Issue{id=1251480531381207309, tenantId=1146029695717560320, journalId=1251234078029037663, year='2025', volume='47', issue='6', pageStart='1', pageEnd='306', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1776305810065, creator=13701087609, updateTime=1776305899308, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1251480905865446141, tenantId=1146029695717560320, journalId=1251234078029037663, issueId=1251480531381207309, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1251480905865446142, tenantId=1146029695717560320, journalId=1251234078029037663, issueId=1251480531381207309, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=224, endPage=234, ext={EN=ArticleExt(id=1251480535869112610, articleId=1251480535583899932, tenantId=1146029695717560320, journalId=1251234078029037663, 
language=EN, title=Multi-scale learning algorithm for infrared UAV target detection, columnId=1251480534468211258, journalTitle=Journal of National University of Defense Technology, columnName=Control Science and Engineering·Information and Communication Engineering·Electronic Science and Technology, runingTitle=null, highlight=null, articleAbstract=
The issues of small UAV (unmanned aerial vehicle) target size, limited pixel coverage in images, weak texture detail information, and the difficulty in effectively extracting infrared UAV target features, which lead to low detection accuracy, were addressed by proposing a multi-scale learning-based target detection algorithm. A multi-scale feature fusion structure was constructed in the neck network of the model, and a multi-scale feature learning module was introduced. Features from both deep and shallow networks were cascaded to capture target features at multiple scales, enriching the semantic and feature information of the feature map, which significantly improved the detection accuracy of small UAV targets. During training, SIoU was used in place of CIoU loss, minimizing the network model's loss and enhancing the regression accuracy. Experimental results demonstrate that, compared to other infrared small target detection algorithms and mainstream methods, the proposed approach effectively improves the detection accuracy of UAV targets and meets the detection accuracy requirements for UAV target detection in practical applications.
, correspAuthors=Shudong YUAN, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Zhen ZUO, Shudong YUAN, Can LI, Honghe HUANG), CN=ArticleExt(id=1251480543116870059, articleId=1251480535583899932, tenantId=1146029695717560320, journalId=1251234078029037663, language=CN, title=多尺度学习的红外无人机目标检测算法, columnId=1251480534619206204, journalTitle=国防科技大学学报, columnName=控制科学与工程·信息与通信工程·电子科学与技术, runingTitle=null, highlight=null, articleAbstract=
针对无人机目标体积小、在图像中所占像素少、纹理细节信息弱、算法难以有效提取红外无人机目标特征导致检测精度较低等问题,提出多尺度学习的目标检测算法。通过在模型的颈部网络中构造多尺度特征融合结构,引入多尺度特征学习模块,将深层网络和浅层网络的特征进行级联,获取目标在多个尺度上的特征,丰富特征图的语义信息和特征信息,显著提高了算法对小型无人机目标的检测精度。在训练过程中使用SIoU代替CIoU损失函数,使网络模型在训练过程中损失最小化,提高了回归精度。实验结果表明,与其他红外小目标、主流检测算法相比,所提方法能有效提高无人机目标的检测精度,在实际应用中可以满足探测无人机目标的检测精度需求。
, correspAuthors=袁书东, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=r+2ncTUsWv2bYK/wGEBFkg==, magXml=Zlj3B+f1JFKghecy+OM1Bg==, pdfUrl=null, pdf=5QDd1QuDu6U13RYg+EY7uw==, pdfFileSize=3940979, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=zD+NTRIBysvqLnOQBV6lmw==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=7BiW4mPH4P4AquzpdmkWgw==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=左震, 袁书东, 李灿, 黄泓赫)}, authors=[Author(id=1251480543485968840, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=z.zuo@nudt.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251480543590826446, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480543485968840, language=EN, stringName=Zhen ZUO, firstName=Zhen, middleName=null, lastName=ZUO, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251480543687295443, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480543485968840, language=CN, stringName=左震, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=国防科技大学 智能科学学院,湖南 长沙 410073, bio={"content":"
左震(1982—),男,安徽安庆人,副研究员,博士,硕士生导师,E-mail:z.zuo@nudt.edu.cn
"}, bioImg=null, bioContent=
左震(1982—),男,安徽安庆人,副研究员,博士,硕士生导师,E-mail:z.zuo@nudt.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251480543364334015, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, xref=null, ext=[AuthorCompanyExt(id=1251480543381111232, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China), AuthorCompanyExt(id=1251480543389499841, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=国防科技大学 智能科学学院,湖南 长沙 410073)])]), Author(id=1251480543783764443, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=yuanshudong21@nudt.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1251480543913787878, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480543783764443, language=EN, stringName=Shudong YUAN, firstName=Shudong, middleName=null, lastName=YUAN, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251480544006062573, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480543783764443, language=CN, stringName=袁书东, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=国防科技大学 智能科学学院,湖南 长沙 410073, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251480543364334015, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, xref=null, ext=[AuthorCompanyExt(id=1251480543381111232, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China), AuthorCompanyExt(id=1251480543389499841, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=国防科技大学 智能科学学院,湖南 长沙 410073)])]), Author(id=1251480544089948659, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251480544312246780, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480544089948659, language=EN, stringName=Can LI, firstName=Can, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251480544404521473, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, 
authorId=1251480544089948659, language=CN, stringName=李灿, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=国防科技大学 智能科学学院,湖南 长沙 410073, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251480543364334015, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, xref=null, ext=[AuthorCompanyExt(id=1251480543381111232, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China), AuthorCompanyExt(id=1251480543389499841, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=国防科技大学 智能科学学院,湖南 长沙 410073)])]), Author(id=1251480544475824647, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251480544626819598, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480544475824647, language=EN, stringName=Honghe HUANG, firstName=Honghe, middleName=null, lastName=HUANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 
410073, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251480544723288598, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, authorId=1251480544475824647, language=CN, stringName=黄泓赫, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=国防科技大学 智能科学学院,湖南 长沙 410073, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251480543364334015, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, xref=null, ext=[AuthorCompanyExt(id=1251480543381111232, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China), AuthorCompanyExt(id=1251480543389499841, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=国防科技大学 智能科学学院,湖南 长沙 410073)])])], keywords=[Keyword(id=1251480544899449377, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, orderNo=1, keyword=infrared imagery), Keyword(id=1251480545117553193, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, orderNo=2, keyword=detecting UAV), Keyword(id=1251480545243382319, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, orderNo=3, keyword=multi-scale learning), Keyword(id=1251480545369211445, tenantId=1146029695717560320, 
journalId=1251234078029037663, articleId=1251480535583899932, language=CN, orderNo=1, keyword=红外图像), Keyword(id=1251480545465680446, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, orderNo=2, keyword=探测无人机), Keyword(id=1251480545574732359, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, orderNo=3, keyword=多尺度学习)], refs=[Reference(id=1251480551660667728, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2022, volume=2022, issue=1, pageStart=4065734, pageEnd=null, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=ZHAI H Q, ZHANG Y, journalName=Journal of Robotics, refType=null, unstructuredReference=
ZHAI H Q,
ZHANG Y.Target detection of low-altitude UAV based on improved YOLOv3 network[J].
Journal of Robotics,
2022,
2022(1):4065734., articleTitle=Target detection of low-altitude UAV based on improved YOLOv3 network, refAbstract=null), Reference(id=1251480551748748119, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2024, volume=21, issue=null, pageStart=6001105, pageEnd=null, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=WANG MM, ZHANG B, journalName=IEEE Geoscience and Remote Sensing Letters, refType=null, unstructuredReference=
WANG MM,
ZHANG B.Contrastive learning and similarity feature fusion for UAV image target detection[J].
IEEE Geoscience and Remote Sensing Letters,
2024,
21:6001105., articleTitle=Contrastive learning and similarity feature fusion for UAV image target detection, refAbstract=null), Reference(id=1251480551845217120, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=139, issue=null, pageStart=109451, pageEnd=null, url=null, language=null, rfNumber=[3], rfOrder=2, authorNames=SUNKARA R, LUO T, journalName=Pattern Recognition, refType=null, unstructuredReference=
SUNKARA R,
LUO T.YOGA:deep object detection in the wild with lightweight feature learning and multiscale attention[J].
Pattern Recognition,
2023,
139:109451., articleTitle=YOGA:deep object detection in the wild with lightweight feature learning and multiscale attention, refAbstract=null), Reference(id=1251480551979434857, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=12, issue=4, pageStart=898, pageEnd=null, url=null, language=null, rfNumber=[4], rfOrder=3, authorNames=XU C, ZHANG Q, MEI L Y, journalName=Electronics, refType=null, unstructuredReference=
XU C,
ZHANG Q,
MEI L Y,
et al.Dense multiscale feature learning transformer embedding cross-shaped attention for road damage detection[J].
Electronics,
2023,
12(4):898., articleTitle=Dense multiscale feature learning transformer embedding cross-shaped attention for road damage detection, refAbstract=null), Reference(id=1251480552054932335, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=24, issue=7, pageStart=7717, pageEnd=7725, url=null, language=null, rfNumber=[5], rfOrder=4, authorNames=YANG L, ZHONG J H, ZHANG Y, journalName=IEEE Transactions on Intelligent Transportation Systems, refType=null, unstructuredReference=
YANG L,
ZHONG J H,
ZHANG Y,
et al.An improving faster-RCNN with multi-attention ResNet for small target detection in intelligent autonomous transport with 6G[J].
IEEE Transactions on Intelligent Transportation Systems,
2023,
24(7):7717-7725., articleTitle=An improving faster-RCNN with multi-attention ResNet for small target detection in intelligent autonomous transport with 6G, refAbstract=null), Reference(id=1251480552172372856, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=9196, pageEnd=9205, url=null, language=null, rfNumber=[6], rfOrder=5, authorNames=WANG K X, LIEW J H, ZOU Y T, journalName=null, refType=null, unstructuredReference=
WANG K X,
LIEW J H,
ZOU Y T,
et al.PANet:few-shot image semantic segmentation with prototype alignment[C]//Proceedings of the IEEE/CVF International Conference on Computer Vision (ICCV),
2019:9196-9205., articleTitle=PANet:few-shot image semantic segmentation with prototype alignment, refAbstract=null), Reference(id=1251480552306590595, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=7029, pageEnd=7038, url=null, language=null, rfNumber=[7], rfOrder=6, authorNames=GHIASI G, LIN T Y, LE Q V, journalName=null, refType=null, unstructuredReference=
GHIASI G,
LIN T Y,
LE Q V.NAS-FPN:learning scalable feature pyramid architecture for object detection[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR),
2019:7029-7038., articleTitle=NAS-FPN:learning scalable feature pyramid architecture for object detection, refAbstract=null), Reference(id=1251480552398865290, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2019, volume=33, issue=1, pageStart=9259, pageEnd=9266, url=null, language=null, rfNumber=[8], rfOrder=7, authorNames=ZHAO Q J, SHENG T, WANG Y T, journalName=Proceedings of the AAAI Conference on Artificial Intelligence, refType=null, unstructuredReference=
ZHAO Q J,
SHENG T,
WANG Y T,
et al.M2Det:a single-shot object detector based on multi-level feature pyramid network[J].
Proceedings of the AAAI Conference on Artificial Intelligence,
2019,
33(1):9259-9266., articleTitle=M2Det:a single-shot object detector based on multi-level feature pyramid network, refAbstract=null), Reference(id=1251480552533083028, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2022, volume=123, issue=null, pageStart=104107, pageEnd=null, url=null, language=null, rfNumber=[9], rfOrder=8, authorNames=YU C, LIU Y P, WU S H, journalName=Infrared Physics &Technology, refType=null, unstructuredReference=
YU C,
LIU Y P,
WU S H,
et al.Infrared small target detection based on multiscale local contrast learning networks[J].
Infrared Physics &Technology,
2022,
123:104107., articleTitle=Infrared small target detection based on multiscale local contrast learning networks, refAbstract=null), Reference(id=1251480552612774808, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=45, issue=7, pageStart=746, pageEnd=754, url=null, language=null, rfNumber=[10], rfOrder=9, authorNames=李向荣, 孙立辉, journalName=红外技术, refType=null, unstructuredReference=李向荣, 孙立辉.融合注意力机制的多尺度红外目标检测[J].
红外技术,
2023,
45(7):746-754., articleTitle=融合注意力机制的多尺度红外目标检测, refAbstract=null), Reference(id=1251480552730215332, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=45, issue=7, pageStart=746, pageEnd=754, url=null, language=null, rfNumber=[10], rfOrder=10, authorNames=LI X R, SUN L H, journalName=Infrared Technology, refType=null, unstructuredReference=
LI X R,
SUN L H.Multiscale infrared target detection based on attention mechanism[J].
Infrared Technology,
2023,
45(7):746-754.(in Chinese), articleTitle=Multiscale infrared target detection based on attention mechanism, refAbstract=null), Reference(id=1251480552826684335, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=59, issue=8, pageStart=227, pageEnd=238, url=null, language=null, rfNumber=[11], rfOrder=11, authorNames=张朝阳, 张上, 王恒涛, journalName=计算机工程与应用, refType=null, unstructuredReference=张朝阳, 张上, 王恒涛,
等.多尺度下遥感小目标多头注意力检测[J].
计算机工程与应用,
2023,
59(8):227-238., articleTitle=多尺度下遥感小目标多头注意力检测, refAbstract=null), Reference(id=1251480552923153335, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=59, issue=8, pageStart=227, pageEnd=238, url=null, language=null, rfNumber=[11], rfOrder=12, authorNames=ZHANG Z Y, ZHANG S, WANG H T, journalName=Computer Engineering and Applications, refType=null, unstructuredReference=
ZHANG Z Y,
ZHANG S,
WANG H T,
et al.Multi-head attention detection of small targets in remote sensing at multiple scales[J].
Computer Engineering and Applications,
2023,
59(8):227-238.(in Chinese), articleTitle=Multi-head attention detection of small targets in remote sensing at multiple scales, refAbstract=null), Reference(id=1251480553028010945, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2020, volume=34, issue=7, pageStart=12993, pageEnd=13000, url=null, language=null, rfNumber=[12], rfOrder=13, authorNames=ZHENG Z H, WANG P, LIU W, journalName=Proceedings of the AAAI Conference on Artificial Intelligence, refType=null, unstructuredReference=
ZHENG Z H,
WANG P,
LIU W,
et al.Distance-IoU loss:faster and better learning for bounding box regression[J].
Proceedings of the AAAI Conference on Artificial Intelligence,
2020,
34(7):12993-13000., articleTitle=Distance-IoU loss:faster and better learning for bounding box regression, refAbstract=null), Reference(id=1251480553111897035, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2024-04-02, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[13], rfOrder=14, authorNames=GEVORGYAN Z, journalName=null, refType=null, unstructuredReference=
GEVORGYAN Z. SIoU loss:more powerful learning for bounding box regression[EB/OL].(2022-05-25)[
2024-04-02].
https://arxiv.org/abs/2205.12740., articleTitle=SIoU loss:more powerful learning for bounding box regression, refAbstract=null), Reference(id=1251480553220948945, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2020, volume=5, issue=3, pageStart=291, pageEnd=302, url=null, language=null, rfNumber=[14], rfOrder=15, authorNames=回丙伟, 宋志勇, 范红旗, journalName=中国科学数据, refType=null, unstructuredReference=回丙伟, 宋志勇, 范红旗,
等.地/空背景下红外图像弱小飞机目标检测跟踪数据集[J].
中国科学数据,
2020,
5(3):291-302., articleTitle=地/空背景下红外图像弱小飞机目标检测跟踪数据集, refAbstract=null), Reference(id=1251480553325806554, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2020, volume=5, issue=3, pageStart=291, pageEnd=302, url=null, language=null, rfNumber=[14], rfOrder=16, authorNames=HUI B W, SONG Z Y, FAN H Q, journalName=China Scientific Data, refType=null, unstructuredReference=
HUI B W,
SONG Z Y,
FAN H Q,
et al.A dataset for infrared detection and tracking of dim-small aircraft targets under ground/air background[J].
China Scientific Data,
2020,
5(3):291-302.(in Chinese), articleTitle=A dataset for infrared detection and tracking of dim-small aircraft targets under ground/air background, refAbstract=null), Reference(id=1251480553443247076, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2010, volume=43, issue=6, pageStart=2145, pageEnd=2156, url=null, language=null, rfNumber=[15], rfOrder=17, authorNames=BAI X Z, ZHOU F G, journalName=Pattern Recognition, refType=null, unstructuredReference=
BAI X Z,
ZHOU F G.Analysis of new top-hat transformation and the application for infrared dim small target detection[J].
Pattern Recognition,
2010,
43(6):2145-2156., articleTitle=Analysis of new top-hat transformation and the application for infrared dim small target detection, refAbstract=null), Reference(id=1251480553573270514, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2016, volume=58, issue=null, pageStart=216, pageEnd=226, url=null, language=null, rfNumber=[16], rfOrder=18, authorNames=WEI Y T, YOU X G, LI H, journalName=Pattern Recognition, refType=null, unstructuredReference=
WEI Y T,
YOU X G,
LI H.Multiscale patch-based contrast measure for small infrared target detection[J].
Pattern Recognition,
2016,
58:216-226., articleTitle=Multiscale patch-based contrast measure for small infrared target detection, refAbstract=null), Reference(id=1251480553657156604, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=32, issue=null, pageStart=364, pageEnd=376, url=null, language=null, rfNumber=[17], rfOrder=19, authorNames=WU X, HONG D F, CHANUSSOT J, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
WU X,
HONG D F,
CHANUSSOT J.UIU-Net:U-Net in UNet for infrared small object detection[J].
IEEE Transactions on Image Processing,
2023,
32:364-376., articleTitle=UIU-Net:U-Net in UNet for infrared small object detection, refAbstract=null), Reference(id=1251480553787179014, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=32, issue=null, pageStart=1745, pageEnd=1758, url=null, language=null, rfNumber=[18], rfOrder=20, authorNames=LI B Y, XIAO C, WANG L G, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
LI B Y,
XIAO C,
WANG L G,
et al.Dense nested attention network for infrared small target detection[J].
IEEE Transactions on Image Processing,
2023,
32:1745-1758., articleTitle=Dense nested attention network for infrared small target detection, refAbstract=null), Reference(id=1251480553904619540, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2022, volume=19, issue=null, pageStart=7506205, pageEnd=null, url=null, language=null, rfNumber=[19], rfOrder=21, authorNames=HOU Q Y, ZHANG L W, TAN F J, journalName=IEEE Geoscience and Remote Sensing Letters, refType=null, unstructuredReference=
HOU Q Y,
ZHANG L W,
TAN F J,
et al.ISTDU-Net:infrared small-target detection U-Net[J].
IEEE Geoscience and Remote Sensing Letters,
2022,
19:7506205., articleTitle=ISTDU-Net:infrared small-target detection U-Net, refAbstract=null), Reference(id=1251480554038837280, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=5439, pageEnd=5448, url=null, language=null, rfNumber=[20], rfOrder=22, authorNames=TIAN Z, SHEN C H, WANG X L, journalName=null, refType=null, unstructuredReference=
TIAN Z,
SHEN C H,
WANG X L,
et al.BoxInst:high-performance instance segmentation with box annotations[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR),
2021:5439-5448., articleTitle=BoxInst:high-performance instance segmentation with box annotations, refAbstract=null), Reference(id=1251480554147889196, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=282, pageEnd=298, url=null, language=null, rfNumber=[21], rfOrder=23, authorNames=TIAN Z, SHEN C H, CHEN H, journalName=null, refType=null, unstructuredReference=
TIAN Z,
SHEN C H,
CHEN H.Conditional convolutions for instance segmentation[C]//Proceedings of the European Conference on Computer Vision,
2020:282-298., articleTitle=Conditional convolutions for instance segmentation, refAbstract=null), Reference(id=1251480554248552506, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2022, volume=44, issue=2, pageStart=1108, pageEnd=1121, url=null, language=null, rfNumber=[22], rfOrder=24, authorNames=BOLYA D, ZHOU C, XIAO F Y, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
BOLYA D,
ZHOU C,
XIAO F Y,
et al.YOLACT++better real-time instance segmentation[J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2022,
44 (2):1108-1121., articleTitle=YOLACT++better real-time instance segmentation, refAbstract=null), Reference(id=1251480554349215813, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2024-04-06, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[23], rfOrder=25, authorNames=HE K M, GKIOXARI G, DOLLÁR P, journalName=null, refType=null, unstructuredReference=
HE K M,
GKIOXARI G,
DOLLÁR P,
et al.Mask R-CNN[EB/OL].(2017-03-20)[
2024-04-06].
https://arxiv.org/abs/1703.06870., articleTitle=Mask R-CNN, refAbstract=null), Reference(id=1251480554449879117, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=7464, pageEnd=7475, url=null, language=null, rfNumber=[24], rfOrder=26, authorNames=WANG C Y, BOCHKOVSKIY A, LIAO H M, journalName=null, refType=null, unstructuredReference=
WANG C Y,
BOCHKOVSKIY A,
LIAO H M.YOLOv7:trainable bag-of-freebies sets new state-of-the-art for real-time object detectors[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR),
2023:7464-7475., articleTitle=YOLOv7:trainable bag-of-freebies sets new state-of-the-art for real-time object detectors, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1251480543364334015, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, xref=null, ext=[AuthorCompanyExt(id=1251480543381111232, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Intelligence Science and Technology, National University of Defense Technology, Changsha 410073, China), AuthorCompanyExt(id=1251480543389499841, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, companyId=1251480543364334015, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=国防科技大学 智能科学学院,湖南 长沙 410073)])], figs=[ArticleFig(id=1251480547202122332, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Fig.1, caption=
IRSDD-YOLOv8 network structure, figureFileSmall=E6mrDeSRykVlwH0P14dlGQ==, figureFileBig=zD+NTRIBysvqLnOQBV6lmw==, tableContent=null), ArticleFig(id=1251480547290202721, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=图1, caption=
IRSDD-YOLOv8网络结构, figureFileSmall=E6mrDeSRykVlwH0P14dlGQ==, figureFileBig=zD+NTRIBysvqLnOQBV6lmw==, tableContent=null), ArticleFig(id=1251480547541860983, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Fig.2, caption=
Comparison of feature fusion structures, figureFileSmall=QA5707J2KbWsciNOvPAEyA==, figureFileBig=HMVQmKASz1JkKujijMLw2g==, tableContent=null), ArticleFig(id=1251480547642524290, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=图2, caption=
特征融合结构的比较, figureFileSmall=QA5707J2KbWsciNOvPAEyA==, figureFileBig=HMVQmKASz1JkKujijMLw2g==, tableContent=null), ArticleFig(id=1251480547759964813, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Fig.3, caption=
Multi-scale feature learning module, figureFileSmall=MKNXuJiqHL5j7lhzcUuEog==, figureFileBig=BTgikODC9fRkaB0ot5SsmA==, tableContent=null), ArticleFig(id=1251480547856433812, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=图3, caption=
多尺度特征学习模块, figureFileSmall=MKNXuJiqHL5j7lhzcUuEog==, figureFileBig=BTgikODC9fRkaB0ot5SsmA==, tableContent=null), ArticleFig(id=1251480547978068639, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Fig.4, caption=
IRSDD-YOLOv8 and other algorithmic detection results, figureFileSmall=5ou7LzmwITUmEcPCKVey0Q==, figureFileBig=pE20QqMQXDX3PwhMqklNVw==, tableContent=null), ArticleFig(id=1251480548187783852, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=图4, caption=
IRSDD-YOLOv8及其他算法检测结果, figureFileSmall=5ou7LzmwITUmEcPCKVey0Q==, figureFileBig=pE20QqMQXDX3PwhMqklNVw==, tableContent=null), ArticleFig(id=1251480548284252850, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Fig.5, caption=
Example of feature extraction from the multi-scale feature learning module, figureFileSmall=SMZPeNUR0LlNiZB4Z/NtaA==, figureFileBig=xNM2V53k3bqvRGSlChHetg==, tableContent=null), ArticleFig(id=1251480548380721850, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=图5, caption=
多尺度特征学习模块的目标特征提取示例, figureFileSmall=SMZPeNUR0LlNiZB4Z/NtaA==, figureFileBig=xNM2V53k3bqvRGSlChHetg==, tableContent=null), ArticleFig(id=1251480548468802245, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Fig.6, caption=
Segmentation loss and precision-recall curves for ablation experiments, figureFileSmall=GcHGFL5eK6Ehn68Rcm+ghQ==, figureFileBig=+KvMVaCbLoGkhuC6B8aRzQ==, tableContent=null), ArticleFig(id=1251480548586242767, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=图6, caption=
消融实验的分割损失与精度-召回曲线, figureFileSmall=GcHGFL5eK6Ehn68Rcm+ghQ==, figureFileBig=+KvMVaCbLoGkhuC6B8aRzQ==, tableContent=null), ArticleFig(id=1251480548691100379, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.1, caption=
Number of images in the SIDD training and test sets
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模拟场景 | 训练集 | 测试集 | 总计 |
|---|---|---|---|
| 城市 | 874 | 219 | 1093 |
| 山地 | 1720 | 431 | 2151 |
| 海面 | 570 | 143 | 713 |
| 天空 | 624 | 156 | 780 |
| 总计 | 3788 | 949 | 4737 |
), ArticleFig(id=1251480548804346596, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表1, caption=
SIDD训练集和测试集中的图像数量
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模拟场景 | 训练集 | 测试集 | 总计 |
|---|---|---|---|
| 城市 | 874 | 219 | 1093 |
| 山地 | 1720 | 431 | 2151 |
| 海面 | 570 | 143 | 713 |
| 天空 | 624 | 156 | 780 |
| 总计 | 3788 | 949 | 4737 |
), ArticleFig(id=1251480548921787113, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.2, caption=
Hardware and software environment configuration
, figureFileSmall=null, figureFileBig=null, tableContent=
| 项目 | 配置 |
|---|---|
| 硬件 | GPU:NVIDIA GeForce RTX3060 |
| | CPU:AMD Ryzen 7 5800H |
| 软件 | 系统:Ubuntu18.04 |
| | 版本:CUDA11.1 |
), ArticleFig(id=1251480549035033329, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表2, caption=
软硬件环境配置
, figureFileSmall=null, figureFileBig=null, tableContent=
| 项目 | 配置 |
|---|---|
| 硬件 | GPU:NVIDIA GeForce RTX3060 |
| | CPU:AMD Ryzen 7 5800H |
| 软件 | 系统:Ubuntu18.04 |
| | 版本:CUDA11.1 |
), ArticleFig(id=1251480549131502330, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.3, caption=
Detection results of infrared small target algorithms in different scenarios
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法评价指标 | 检测算法 | 城市场景 | 山地场景 | 海面场景 | 天空场景 |
|---|---|---|---|---|---|
| μIoU | top-hat | 0.010 | 0.006 | 0.110 | 0.097 |
| | MPCM | 0.027 | 0.001 | 0.004 | 0.034 |
| | UIU-Net | 0.136 | 0.125 | 0.288 | 0.504 |
| | DNANet | 0.364 | 0.062 | 0.114 | 0.464 |
| | ISTDU-Net | 0.608 | 0.367 | 0.480 | 0.586 |
| | YOLOv8n-seg | 0.812 | 0.728 | 0.649 | 0.837 |
| | IRSDD-YOLOv8 | 0.824 | 0.752 | 0.665 | 0.839 |
| nIoU | top-hat | 0.010 | 0.013 | 0.134 | 0.172 |
| | MPCM | 0.028 | 0.001 | 0.005 | 0.043 |
| | UIU-Net | 0.322 | 0.200 | 0.402 | 0.595 |
| | DNANet | 0.366 | 0.062 | 0.114 | 0.468 |
| | ISTDU-Net | 0.571 | 0.336 | 0.475 | 0.573 |
| | YOLOv8n-seg | 0.820 | 0.742 | 0.639 | 0.804 |
| | IRSDD-YOLOv8 | 0.831 | 0.770 | 0.653 | 0.806 |
), ArticleFig(id=1251480549240554243, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表3, caption=
在不同场景下红外小目标算法的检测结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法评价指标 | 检测算法 | 城市场景 | 山地场景 | 海面场景 | 天空场景 |
|---|---|---|---|---|---|
| μIoU | top-hat | 0.010 | 0.006 | 0.110 | 0.097 |
| | MPCM | 0.027 | 0.001 | 0.004 | 0.034 |
| | UIU-Net | 0.136 | 0.125 | 0.288 | 0.504 |
| | DNANet | 0.364 | 0.062 | 0.114 | 0.464 |
| | ISTDU-Net | 0.608 | 0.367 | 0.480 | 0.586 |
| | YOLOv8n-seg | 0.812 | 0.728 | 0.649 | 0.837 |
| | IRSDD-YOLOv8 | 0.824 | 0.752 | 0.665 | 0.839 |
| nIoU | top-hat | 0.010 | 0.013 | 0.134 | 0.172 |
| | MPCM | 0.028 | 0.001 | 0.005 | 0.043 |
| | UIU-Net | 0.322 | 0.200 | 0.402 | 0.595 |
| | DNANet | 0.366 | 0.062 | 0.114 | 0.468 |
| | ISTDU-Net | 0.571 | 0.336 | 0.475 | 0.573 |
| | YOLOv8n-seg | 0.820 | 0.742 | 0.639 | 0.804 |
| | IRSDD-YOLOv8 | 0.831 | 0.770 | 0.653 | 0.806 |
), ArticleFig(id=1251480549337023247, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.4, caption=
Detection results of mainstream detection algorithms in different scenarios
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法评价指标 | 检测算法 | 城市场景 | 山地场景 | 海面场景 | 天空场景 |
|---|---|---|---|---|---|
| mAP@0.5:0.95 | BoxInst | 0.197 | — | — | 0.395 |
| | CondInst | 0.565 | 0.284 | 0.292 | 0.673 |
| | Mask R-CNN | 0.629 | 0.416 | 0.463 | 0.711 |
| | YOLACT++ | 0.423 | 0.177 | 0.163 | 0.561 |
| | YOLOv7 | 0.440 | 0.269 | 0.335 | 0.580 |
| | YOLOv5n-seg | 0.473 | 0.245 | 0.342 | 0.572 |
| | YOLOv8n-seg | 0.477 | 0.253 | 0.337 | 0.591 |
| | IRSDD-YOLOv8 | 0.511 | 0.309 | 0.352 | 0.606 |
| mAP@0.5 | BoxInst | 0.538 | 0.013 | — | 0.806 |
| | CondInst | 0.936 | 0.731 | 0.819 | 0.977 |
| | Mask R-CNN | 0.937 | 0.749 | 0.933 | 0.987 |
| | YOLACT++ | 0.902 | 0.625 | 0.445 | 0.958 |
| | YOLOv7 | 0.877 | 0.746 | 0.930 | 0.974 |
| | YOLOv5n-seg | 0.936 | 0.689 | 0.886 | 0.966 |
| | YOLOv8n-seg | 0.927 | 0.664 | 0.829 | 0.957 |
| | IRSDD-YOLOv8 | 0.939 | 0.785 | 0.902 | 0.965 |
| FPS | BoxInst | 9.60 | 10.26 | 8.97 | 9.06 |
| | CondInst | 9.60 | 10.35 | 8.86 | 8.91 |
| | Mask R-CNN | 3.97 | 4.04 | 4.04 | 4.03 |
| | YOLACT++ | 10.77 | 11.93 | 9.42 | 9.74 |
| | YOLOv7 | 16.28 | 20.79 | 13.82 | 14.61 |
| | YOLOv5n-seg | 35.55 | 49.73 | 25.32 | 26.01 |
| | YOLOv8n-seg | 28.07 | 45.48 | 22.08 | 21.44 |
| | IRSDD-YOLOv8 | 29.01 | 38.06 | 19.32 | 22.50 |
), ArticleFig(id=1251480549450269461, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表4, caption=
在不同场景下主流检测算法的检测结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法评价指标 | 检测算法 | 城市场景 | 山地场景 | 海面场景 | 天空场景 |
|---|---|---|---|---|---|
| mAP@0.5:0.95 | BoxInst | 0.197 | — | — | 0.395 |
| | CondInst | 0.565 | 0.284 | 0.292 | 0.673 |
| | Mask R-CNN | 0.629 | 0.416 | 0.463 | 0.711 |
| | YOLACT++ | 0.423 | 0.177 | 0.163 | 0.561 |
| | YOLOv7 | 0.440 | 0.269 | 0.335 | 0.580 |
| | YOLOv5n-seg | 0.473 | 0.245 | 0.342 | 0.572 |
| | YOLOv8n-seg | 0.477 | 0.253 | 0.337 | 0.591 |
| | IRSDD-YOLOv8 | 0.511 | 0.309 | 0.352 | 0.606 |
| mAP@0.5 | BoxInst | 0.538 | 0.013 | — | 0.806 |
| | CondInst | 0.936 | 0.731 | 0.819 | 0.977 |
| | Mask R-CNN | 0.937 | 0.749 | 0.933 | 0.987 |
| | YOLACT++ | 0.902 | 0.625 | 0.445 | 0.958 |
| | YOLOv7 | 0.877 | 0.746 | 0.930 | 0.974 |
| | YOLOv5n-seg | 0.936 | 0.689 | 0.886 | 0.966 |
| | YOLOv8n-seg | 0.927 | 0.664 | 0.829 | 0.957 |
| | IRSDD-YOLOv8 | 0.939 | 0.785 | 0.902 | 0.965 |
| FPS | BoxInst | 9.60 | 10.26 | 8.97 | 9.06 |
| | CondInst | 9.60 | 10.35 | 8.86 | 8.91 |
| | Mask R-CNN | 3.97 | 4.04 | 4.04 | 4.03 |
| | YOLACT++ | 10.77 | 11.93 | 9.42 | 9.74 |
| | YOLOv7 | 16.28 | 20.79 | 13.82 | 14.61 |
| | YOLOv5n-seg | 35.55 | 49.73 | 25.32 | 26.01 |
| | YOLOv8n-seg | 28.07 | 45.48 | 22.08 | 21.44 |
| | IRSDD-YOLOv8 | 29.01 | 38.06 | 19.32 | 22.50 |
), ArticleFig(id=1251480549546738461, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.5, caption=
Experimental results of adding C2f quantities in different layers
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验组别 | 不同数量的C2f [n1,n2] | mAP@0.5:0.95 | mAP@0.5 |
|---|---|---|---|
| exp(1) | [1,1] | 0.281 | 0.745 |
| exp(2) | [1,2] | 0.270 | 0.733 |
| exp(3) | [1,3] | 0.276 | 0.751 |
| exp(4) | [2,1] | 0.278 | 0.742 |
| exp(5) | [3,2] | 0.286 | 0.744 |
| exp(6) | [3,3] | 0.282 | 0.758 |
), ArticleFig(id=1251480549634818851, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表5, caption=
在不同层中添加C2f数量的实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验组别 | 不同数量的C2f [n1,n2] | mAP@0.5:0.95 | mAP@0.5 |
|---|---|---|---|
| exp(1) | [1,1] | 0.281 | 0.745 |
| exp(2) | [1,2] | 0.270 | 0.733 |
| exp(3) | [1,3] | 0.276 | 0.751 |
| exp(4) | [2,1] | 0.278 | 0.742 |
| exp(5) | [3,2] | 0.286 | 0.744 |
| exp(6) | [3,3] | 0.282 | 0.758 |
), ArticleFig(id=1251480549752259370, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.6, caption=
Experimental results of adding different submodules (mountain scenario)
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验组别 | MSFLM | SimAM | SIoU | mAP@0.5:0.95 | mAP@0.5 |
|---|---|---|---|---|---|
| 消融实验1 | | | | 0.253 | 0.664 |
| 消融实验2 | √ | | | 0.282 | 0.758 |
| 消融实验3 | √ | √ | | 0.270 | 0.763 |
| 消融实验4 | √ | √ | √ | 0.309 | 0.785 |
), ArticleFig(id=1251480549848728371, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表6, caption=
添加不同子模块的实验结果(山地场景)
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验组别 | MSFLM | SimAM | SIoU | mAP@0.5:0.95 | mAP@0.5 |
|---|---|---|---|---|---|
| 消融实验1 | | | | 0.253 | 0.664 |
| 消融实验2 | √ | | | 0.282 | 0.758 |
| 消融实验3 | √ | √ | | 0.270 | 0.763 |
| 消融实验4 | √ | √ | √ | 0.309 | 0.785 |
), ArticleFig(id=1251480549949391672, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=EN, label=Tab.7, caption=
Comparison of detection accuracy of algorithms on the actual collection dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 检测算法 | mAP@0.5 | mAP@0.5:0.95 |
|---|---|---|
| YOLOv5n-seg | 0.832 | 0.341 |
| YOLOv8n-seg | 0.922 | 0.373 |
| IRSDD-YOLOv8 | 0.940 | 0.425 |
), ArticleFig(id=1251480550045860673, tenantId=1146029695717560320, journalId=1251234078029037663, articleId=1251480535583899932, language=CN, label=表7, caption=
算法在实采数据集上的检测精度对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 检测算法 | mAP@0.5 | mAP@0.5:0.95 |
|---|---|---|
| YOLOv5n-seg | 0.832 | 0.341 |
| YOLOv8n-seg | 0.922 | 0.373 |
| IRSDD-YOLOv8 | 0.940 | 0.425 |
)], attaches=null, journal=Journal(id=1251231494090305632, delFlag=0, nameCn=国防科技大学学报, nameEn=Journal of National Niversity of Defense Technology, nameHistory1=null, nameHistory2=null, issn=1001-2486, eissn=, cn=43-1067/T, coden=null, periodic=双月刊, language=CN, oaType=1, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=, officePhone=, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=h+HgOUssQ5XqPoD980XNIA==, journalPrice=null, startedYear=null, abbrevIsoEn=Journal of National Niversity of Defense Technology, journalRemark=null, publicationField=null, createdTime=1776246434950, updatedTime=1776251967711, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=J, firstLetterEn=J, subjectCode=Engineering, subjectName=工程, subjectCodeEn=Engineering, subjectNameEn=null, picCn=h+HgOUssQ5XqPoD980XNIA==, picEn=hJx8onaXftcX9VtGkHdjDA==, jcr=null, cjcr=null, exts=[JournalExt(id=1251254700306285546, language=CN, name=国防科技大学学报, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1776251967741, updatedTime=1776251967741, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://journal.nudt.edu.cn/gfkjdxxb/author/login, submissionEditorUrl=http://journal.nudt.edu.cn/gfkjdxxb/editor/login, submissionReviewUrl=http://journal.nudt.edu.cn/gfkjdxxb/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1251254700356617195, language=EN, name=Journal of National Niversity of Defense Technology, nameHistory1=null, nameHistory2=null, 
managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1776251967753, updatedTime=1776251967753, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://journal.nudt.edu.cn/gfkjdxxb/author/login, submissionEditorUrl=http://journal.nudt.edu.cn/gfkjdxxb/editor/login, submissionReviewUrl=http://journal.nudt.edu.cn/gfkjdxxb/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1251234078029037663, websiteList=[Website(id=1251257283485843500, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1251234078029037663, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/gfkjdxxb/CN, language=CN, createTime=1776252583619, createBy=18614031015, updateTime=1776253414371, updateBy=18614031015, name=国防科技大学学报-中文, tplId=1146099689490845704, title=国防科技大学学报, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1251260875290653228, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=articleTextType, value=kx, createTime=1776253439972, updateTime=1776253439972, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875273876009, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=banner, value=null, createTime=1776253439968, updateTime=1776253439968, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875311624751, tenantId=1146029695717560320, journalId=null, journalGroupId=null, 
siteId=1251257283485843500, code=grayFlag, value=0, createTime=1776253439977, updateTime=1776253439977, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875261293096, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=logo, value=https://castjournals.cast.org.cn/joweb/gfkjdxxb/CN/file/pic?fileId=WpHzMFTSHy8AuOKzUbYrdw==, createTime=1776253439965, updateTime=1776253439965, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875382927921, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=minRunFlag, value=0, createTime=1776253439994, updateTime=1776253439994, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875286458923, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/gfkjdxxb/CN/file/pic, createTime=1776253439971, updateTime=1776253439971, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875320013360, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=silenceFlag, value=0, createTime=1776253439979, updateTime=1776253439979, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875278070314, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1776253439969, updateTime=1776253439969, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875299041837, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283485843500, code=themeColor, value=null, createTime=1776253439974, updateTime=1776253439974, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260875303236142, tenantId=1146029695717560320, journalId=null, journalGroupId=null, 
siteId=1251257283485843500, code=themeStyle, value=null, createTime=1776253439975, updateTime=1776253439975, creator=18614031015, updator=18614031015)]), Website(id=1251257283599089718, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1251234078029037663, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/gfkjdxxb/EN, language=EN, createTime=1776252583646, createBy=18614031015, updateTime=1776253409915, updateBy=18614031015, name=国防科技大学学报-英文, tplId=1146101810881728533, title=Journal of National Niversity of Defense Technology, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1251260846312210678, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=articleTextType, value=kx, createTime=1776253433063, updateTime=1776253433063, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846232518899, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=banner, value=null, createTime=1776253433044, updateTime=1776253433044, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846396096761, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=grayFlag, value=0, createTime=1776253433083, updateTime=1776253433083, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846219935986, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=logo, value=https://castjournals.cast.org.cn/joweb/gfkjdxxb/EN/file/pic?fileId=WpHzMFTSHy8AuOKzUbYrdw==, createTime=1776253433041, updateTime=1776253433041, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846442234107, 
tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=minRunFlag, value=0, createTime=1776253433094, updateTime=1776253433094, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846282850549, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/gfkjdxxb/EN/file/pic, createTime=1776253433056, updateTime=1776253433056, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846417068282, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=silenceFlag, value=0, createTime=1776253433088, updateTime=1776253433088, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846257684724, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1776253433050, updateTime=1776253433050, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846337376503, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=themeColor, value=null, createTime=1776253433070, updateTime=1776253433070, creator=18614031015, updator=18614031015), WebsiteProps(id=1251260846362542328, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283599089718, code=themeStyle, value=null, createTime=1776253433075, updateTime=1776253433075, creator=18614031015, updator=18614031015)])], journalTitle=国防科技大学学报, weixinUrl=null, journalUrl=http://journal.nudt.edu.cn/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Journal of National Niversity of Defense Technology, journalPhotoCn=h+HgOUssQ5XqPoD980XNIA==, journalPhotoEn=hJx8onaXftcX9VtGkHdjDA==, journalFirstLetter=J, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, 
jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/gfkjdxxb/CN/10.11887/j.issn.1001-2486.24090041, detailUrlEn=https://castjournals.cast.org.cn/joweb/gfkjdxxb/EN/10.11887/j.issn.1001-2486.24090041, pdfUrlCn=https://castjournals.cast.org.cn/joweb/gfkjdxxb/CN/PDF/10.11887/j.issn.1001-2486.24090041, pdfUrlEn=https://castjournals.cast.org.cn/joweb/gfkjdxxb/EN/PDF/10.11887/j.issn.1001-2486.24090041, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)