Article(id=1149773874725871618, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149773869357167407, articleNumber=null, orderNo=null, doi=10.12404/j.issn.1671-1815.2404266, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1717689600000, receivedDateStr=2024-06-07, revisedDate=1736956800000, revisedDateStr=2025-01-16, acceptedDate=null, acceptedDateStr=null, onlineDate=1752057053500, onlineDateStr=2025-07-09, pubDate=1746633600000, pubDateStr=2025-05-08, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1752057053500, onlineIssueDateStr=2025-07-09, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1752057053500, creator=13701087609, updateTime=1752057053500, updator=13701087609, issue=Issue{id=1149773869357167407, tenantId=1146029695717560320, journalId=1146123166801305609, year='2025', volume='25', issue='13', pageStart='5273', pageEnd='5704', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=0, createTime=1752057052207, creator=13701087609, updateTime=1768456769392, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1218559268744253990, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149773869357167407, language=EN, specialIssueTitle=, coverIllustrator=, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1218559268744253991, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149773869357167407, language=CN, specialIssueTitle=, coverIllustrator=, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=5527, endPage=5534, ext={EN=ArticleExt(id=1149773875606675465, articleId=1149773874725871618, tenantId=1146029695717560320, 
journalId=1146123166801305609, language=EN, title=Small Target Detection Algorithm in Aerial Images Based on Improved RT-DETR, columnId=1156262729162810294, journalTitle=Science Technology and Engineering, columnName=Papers·Automation and Computational Technology, runingTitle=null, highlight=null, articleAbstract=
An algorithm has been proposed to detect small targets in unmanned aerial vehicle(UAV) aerial images. The algorithm is based on an improved real-time detection Transformer (RT-DETR) and aims to address the challenges posed by complex backgrounds and a large number of small target samples. To enhance the feature fusion network, a dedicated feature fusion structure for small targets has been incorporated, utilizing rich location information from the shallow feature map to improve the network's ability to detect small targets. Furthermore, the last residual block in the BackBone has been removed to prevent an increase in additional parameters. Additionally, the MCP Block, a reconstructed BasicBlock structure in the backbone network, has been designed, which includes a multi-channel feature partial convolution module (MCPConv) to reduce redundancy in channel features and enhance the acquisition of multi-scale detail features. Moreover, a location encoding mechanism with learning ability has been introduced to obtain more accurate and expressive location information. The normalized weighted deviation(NWD) and mean precision-driven IoU(MPDIoU) positioning loss functions have been incorporated to accelerate the convergence speed of the model and reduce sensitivity to position deviation. Experimental results on the VisDrone2019-DET dataset demonstrate that the improved model reduces parameters by 62% compared to the original model, increases mAP50 by 3.9%, and improves FPS by 17%. The improved model exhibits superior detection performance compared to other mainstream detection models.
, correspAuthors=Wei-dong LI, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Zi-qi ZHAO, Wei-dong LI, Xiao-juan LI), CN=ArticleExt(id=1149773893034008895, articleId=1149773874725871618, tenantId=1146029695717560320, journalId=1146123166801305609, language=CN, title=基于改进实时Transformer的航拍图像小目标检测算法, columnId=1156262729783567290, journalTitle=科学技术与工程, columnName=论文·自动化技术、计算机技术, runingTitle=null, highlight=null, articleAbstract=
针对无人机航拍图像中背景复杂、小目标样本多,难以提取有效特征等问题,提出一种改进实时Transformer(real-time detection Transformer,RT-DETR)的无人机航拍小目标检测算法。首先,在特征融合网络中增加针对微小目标的特征融合结构,利用浅层特征图中丰富的位置信息来增强网络对小目标的检测能力,同时为了防止额外参数的增加,去除主干网络中最后一个残差结构;其次,设计一种多通道特征部分卷积模块(multichannel partial convolution,MCPConv),基于此重新构造了主干网络中的BasicBlock结构,命名为MCP Block,减少通道特征冗余,提升多尺度细节特征的获取能力;引入具有学习能力的位置编码,获取更精确、更具表达能力的位置信息;最后引入归一化加权偏差(normalized weighted deviation,NWD)和平均精度驱动交并比(mean precision-driven IoU,MPDIoU)定位损失函数,降低对位置偏差的敏感性,加快模型收敛速度。实验结果表明,在VisDrone2019-DET数据集上,改进后的模型较原始模型参数量降低了62%,检测精度mAP50提升了3.9%,且FPS较改进前提升了17%,对比其他主流检测模型具有更好的检测效果。
, correspAuthors=李卫东, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=SYBFEtmVmfVNN9RYK0lJ4w==, magXml=1Od40VZhuAovQUBaC315MA==, pdfUrl=null, pdf=edBDfUZkiUL+Z3QtnUhbgQ==, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=fo9deKWXZkRyNpAm7SG9tg==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=赵子琪, 李卫东, 李晓娟)}, authors=[Author(id=1175114407483949601, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=583982413@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1175114407559447074, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, authorId=1175114407483949601, language=EN, stringName=Zi-qi ZHAO, firstName=Zi-qi, middleName=null, lastName=ZHAO, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1175114407685276197, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, authorId=1175114407483949601, language=CN, stringName=赵子琪, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062, bio={"content":"
赵子琪(2000—),男,汉族,河北石家庄人,硕士研究生。研究方向:图像处理、目标检测。E-mail:583982413@qq.com。
"}, bioImg=null, bioContent=
赵子琪(2000—),男,汉族,河北石家庄人,硕士研究生。研究方向:图像处理、目标检测。E-mail:583982413@qq.com。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1175114407324566041, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=1, ext=[AuthorCompanyExt(id=1175114407328760345, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407337148954, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062)])]), Author(id=1175114407848854054, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=14263859@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1175114407974683178, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, authorId=1175114407848854054, language=EN, stringName=Wei-dong LI, firstName=Wei-dong, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, *, address=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China
2 Hebei Cross border E-commerce Technology Innovation Center, Shijiazhuang 050062, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1175114408041792044, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, authorId=1175114407848854054, language=CN, stringName=李卫东, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, *, address=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062
2 河北省跨境电商技术创新中心, 石家庄 050062, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1175114407324566041, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=1, ext=[AuthorCompanyExt(id=1175114407328760345, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407337148954, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062)]), AuthorCompany(id=1175114407383286299, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=2, ext=[AuthorCompanyExt(id=1175114407391674909, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407383286299, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 Hebei Cross border E-commerce Technology Innovation Center, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407400063518, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407383286299, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 河北省跨境电商技术创新中心, 石家庄 050062)])]), Author(id=1175114408125678127, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1175114408331199026, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, authorId=1175114408125678127, language=EN, stringName=Xiao-juan LI, firstName=Xiao-juan, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China
2 Hebei Cross border E-commerce Technology Innovation Center, Shijiazhuang 050062, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1175114408410890805, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, authorId=1175114408125678127, language=CN, stringName=李晓娟, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062
2 河北省跨境电商技术创新中心, 石家庄 050062, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1175114407324566041, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=1, ext=[AuthorCompanyExt(id=1175114407328760345, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407337148954, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062)]), AuthorCompany(id=1175114407383286299, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=2, ext=[AuthorCompanyExt(id=1175114407391674909, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407383286299, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 Hebei Cross border E-commerce Technology Innovation Center, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407400063518, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407383286299, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 河北省跨境电商技术创新中心, 石家庄 050062)])])], keywords=[Keyword(id=1175114408553497145, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, orderNo=1, keyword=small object detection), Keyword(id=1175114408662549051, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, orderNo=2, keyword=RT-DETR), Keyword(id=1175114408733852220, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, orderNo=3, keyword=multi channel partial convolution), Keyword(id=1175114408788378174, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, orderNo=4, keyword=learned position embedding), Keyword(id=1175114408863875648, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, orderNo=1, keyword=小目标检测), Keyword(id=1175114409002287680, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, orderNo=2, keyword=RT-DETR), Keyword(id=1175114409140699715, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, orderNo=3, keyword=多通道部分卷积), Keyword(id=1175114409199419971, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, orderNo=4, keyword=可学习位置编码)], refs=[Reference(id=1175114411695030910, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=580, pageEnd=587, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=Girshick R, Donahue J, Darrell T, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Girshick R,
Donahue J,
Darrell T, et al. Rich feature hierarchies for accurate object detection and semantic segmentation[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Columbus: IEEE,
2014: 580-587., articleTitle=Rich feature hierarchies for accurate object detection and semantic segmentation, refAbstract=null), Reference(id=1175114411774722689, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=779, pageEnd=788, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=Redmon J, Divvala S, Girshick R, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Redmon J,
Divvala S,
Girshick R, et al. You only look once: unified, real-time object detection[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Las Vegas: IEEE,
2016: 779-788., articleTitle=You only look once: unified, real-time object detection, refAbstract=null), Reference(id=1175114411862803074, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=18, pageStart=7726, pageEnd=7732, url=null, language=null, rfNumber=[3], rfOrder=2, authorNames=桑雨, 李立权, 李铁, journalName=科学技术与工程, refType=null, unstructuredReference=桑雨, 李立权, 李铁. 轻量化YOLOv7-tiny的遥感图像小目标检测[J].
科学技术与工程,
2024,
24(18): 7726-7732., articleTitle=轻量化YOLOv7-tiny的遥感图像小目标检测, refAbstract=null), Reference(id=1175114411950883461, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=18, pageStart=7726, pageEnd=7732, url=null, language=null, rfNumber=[3], rfOrder=3, authorNames=Sang Yu, Li Liquan, Li Tie, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Sang Yu,
Li Liquan,
Li Tie, et al. Lightweight YOLOv7-tiny for remote sensing image small target detection[J].
Science Technology and Engineering,
2024,
24(18): 7726-7732., articleTitle=Lightweight YOLOv7-tiny for remote sensing image small target detection, refAbstract=null), Reference(id=1175114412059935368, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=1, pageStart=274, pageEnd=282, url=null, language=null, rfNumber=[4], rfOrder=4, authorNames=刘晋川, 黎向锋, 刘安旭, journalName=科学技术与工程, refType=null, unstructuredReference=刘晋川, 黎向锋, 刘安旭, 等. 改进RetinaNet的无人机小目标检测[J].
科学技术与工程,
2023,
23(1): 274-282., articleTitle=改进RetinaNet的无人机小目标检测, refAbstract=null), Reference(id=1175114412177375883, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=1, pageStart=274, pageEnd=282, url=null, language=null, rfNumber=[4], rfOrder=5, authorNames=Liu Jinchuan, Li Xiangfeng, Liu Anxu, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Liu Jinchuan,
Li Xiangfeng,
Liu Anxu, et al. Improved RetinaNet for unmanned aerial vehicle small target detection[J].
Science Technology and Engineering,
2023,
23(1): 274-282., articleTitle=Improved RetinaNet for unmanned aerial vehicle small target detection, refAbstract=null), Reference(id=1175114412319982224, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2020, volume=20, issue=27, pageStart=11185, pageEnd=11191, url=null, language=null, rfNumber=[5], rfOrder=6, authorNames=吴稳稳, 吴晓红, 刘强, journalName=科学技术与工程, refType=null, unstructuredReference=吴稳稳, 吴晓红, 刘强, 等. 基于全局注意力的多级特征融合目标检测算法[J].
科学技术与工程,
2020,
20(27): 11185-11191., articleTitle=基于全局注意力的多级特征融合目标检测算法, refAbstract=null), Reference(id=1175114412403868306, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2020, volume=20, issue=27, pageStart=11185, pageEnd=11191, url=null, language=null, rfNumber=[5], rfOrder=7, authorNames=Wu Wenwen, Wu Xiaohong, Liu Qiang, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Wu Wenwen,
Wu Xiaohong,
Liu Qiang, et al. Multi-level feature fusion object detection algorithm based on global attention[J].
Science Technology and Engineering,
2020,
20(27): 11185-11191., articleTitle=Multi-level feature fusion object detection algorithm based on global attention, refAbstract=null), Reference(id=1175114412542280340, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=9, pageStart=3533, pageEnd=3542, url=null, language=null, rfNumber=[6], rfOrder=8, authorNames=康传利, 张思瑶, 李玄皓, journalName=科学技术与工程, refType=null, unstructuredReference=康传利, 张思瑶, 李玄皓, 等. 高斯Wasserstein距离改进轻量YOLOv7模型的遥感影像道路交叉口检测[J].
科学技术与工程,
2024,
24(9): 3533-3542., articleTitle=高斯Wasserstein距离改进轻量YOLOv7模型的遥感影像道路交叉口检测, refAbstract=null), Reference(id=1175114412605194902, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=9, pageStart=3533, pageEnd=3542, url=null, language=null, rfNumber=[6], rfOrder=9, authorNames=Kang Chuanli, Zhang Siyao, Li Xuanhao, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Kang Chuanli,
Zhang Siyao,
Li Xuanhao, et al. Gaussian Wasserstein distance improvement of lightweight YOLOv7 model for remote sensing image road intersection detection[J].
Science Technology and Engineering,
2024,
24(9): 3533-3542., articleTitle=Gaussian Wasserstein distance improvement of lightweight YOLOv7 model for remote sensing image road intersection detection, refAbstract=null), Reference(id=1175114412722635418, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[7], rfOrder=10, authorNames=Tan M, Le Q, journalName=ArXiv, refType=null, unstructuredReference=
Tan M,
Le Q. Efficientnet: rethinking model scaling for convolutional neural networks[J].
ArXiv,
2019: 1905.11946., articleTitle=Efficientnet: rethinking model scaling for convolutional neural networks, refAbstract=null), Reference(id=1175114412873630361, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=213, pageEnd=229, url=null, language=null, rfNumber=[8], rfOrder=11, authorNames=Carion N, Massa F, Synnaeve G, journalName=European Conference on Computer Vision, refType=null, unstructuredReference=
Carion N,
Massa F,
Synnaeve G, et al. End-to-end object detection with transformers[C]//
European Conference on Computer Vision. Cham: Springer International Publishing,
2020: 213-229., articleTitle=End-to-end object detection with transformers, refAbstract=null), Reference(id=1175114413079151259, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[9], rfOrder=12, authorNames=Zhu X, Su W, Lu L, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Zhu X,
Su W,
Lu L, et al. Deformable detr: deformable transformers for end-to-end object detection[J].
ArXiv Preprint ArXiv,
2020: 2010.04159., articleTitle=Deformable detr: deformable transformers for end-to-end object detection, refAbstract=null), Reference(id=1175114413272089243, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=764, pageEnd=773, url=null, language=null, rfNumber=[10], rfOrder=13, authorNames=Dai J, Qi H, Xiong Y, journalName=Proceedings of the IEEE International Conference on Computer Vision, refType=null, unstructuredReference=
Dai J,
Qi H,
Xiong Y, et al. Deformable convolutional networks[C]//
Proceedings of the IEEE International Conference on Computer Vision. Venice: IEEE,
2017: 764-773., articleTitle=Deformable convolutional networks, refAbstract=null), Reference(id=1175114413410501277, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=3651, pageEnd=3660, url=null, language=null, rfNumber=[11], rfOrder=14, authorNames=Meng D, Chen X, Fan Z, journalName=Proceedings of the IEEE/CVF International Conference on Computer Vision, refType=null, unstructuredReference=
Meng D,
Chen X,
Fan Z, et al. Conditional detr for fast training convergence[C]//
Proceedings of the IEEE/CVF International Conference on Computer Vision. Montreal: IEEE,
2021: 3651-3660., articleTitle=Conditional detr for fast training convergence, refAbstract=null), Reference(id=1175114413532136094, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2022, volume=36, issue=3, pageStart=2567, pageEnd=2575, url=null, language=null, rfNumber=[12], rfOrder=15, authorNames=Wang Y, Zhang X, Yang T, journalName=Proceedings of the AAAI Conference on Artificial Intelligence, refType=null, unstructuredReference=
Wang Y,
Zhang X,
Yang T, et al. Anchor DETR: query design for Transformer-based detector[C]//
Proceedings of the AAAI Conference on Artificial Intelligence. New York: AAAI,
2022,
36(3): 2567-2575., articleTitle=Anchor DETR: query design for Transformer-based detector, refAbstract=null), Reference(id=1175114413641187999, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[13], rfOrder=16, authorNames=Liu S, Li F, Zhang H, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Liu S,
Li F,
Zhang H, et al. DAB-DETR: dynamic anchor boxes are better queries for DETR[J].
ArXiv Preprint ArXiv,
2022: 2201.12329., articleTitle=DAB-DETR: dynamic anchor boxes are better queries for DETR, refAbstract=null), Reference(id=1175114413725074081, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2022, volume=46, issue=4, pageStart=13619, pageEnd=13627, url=null, language=null, rfNumber=[14], rfOrder=17, authorNames=Li F, Zhang H, Liu S, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Li F,
Zhang H,
Liu S, et al. DN-DETR: accelerate DETR training by introducing query denoising[J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2022,
46(4): 13619-13627., articleTitle=DN-DETR: accelerate DETR training by introducing query denoising, refAbstract=null), Reference(id=1175114413876069027, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[15], rfOrder=18, authorNames=Zhang H, Li F, Liu S, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Zhang H,
Li F,
Liu S, et al. Dino: DETR with improved denoising anchor boxes for end-to-end object detection[J].
ArXiv Preprint ArXiv,
2022: 2203.03605., articleTitle=Dino: DETR with improved denoising anchor boxes for end-to-end object detection, refAbstract=null), Reference(id=1175114414027063973, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[16], rfOrder=19, authorNames=Lü W, Xu S, Zhao Y, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Lü W,
Xu S,
Zhao Y, et al. DETRs beat yolos on real-time object detection[J].
ArXiv Preprint ArXiv,
2023: 2304.08069., articleTitle=DETRs beat yolos on real-time object detection, refAbstract=null), Reference(id=1175114414148698791, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=740, pageEnd=755, url=null, language=null, rfNumber=[17], rfOrder=20, authorNames=Lin T Y, Maire M, Belongie S, journalName=Computer Vision-ECCV 2014: 13th European Conference, refType=null, unstructuredReference=
Lin T Y,
Maire M,
Belongie S, et al. Microsoft COCO: common objects in context[C]//
Computer Vision-ECCV 2014: 13th European Conference. Zurich: Springer International Publishing,
2014: 740-755., articleTitle=Microsoft COCO: common objects in context, refAbstract=null), Reference(id=1175114414404551337, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[18], rfOrder=21, authorNames=Wang J, Xu C, Yang W, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Wang J,
Xu C,
Yang W, et al. A normalized Gaussian Wasserstein distance for tiny object detection[J].
ArXiv Preprint ArXiv,
2021: 2110.13389., articleTitle=A normalized Gaussian Wasserstein distance for tiny object detection, refAbstract=null), Reference(id=1175114414501020330, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[19], rfOrder=22, authorNames=Siliang M, Yong X, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Siliang M,
Yong X. Mpdiou: a loss for efficient and accurate bounding box regression[J].
ArXiv Preprint ArXiv,
2023: 2307.07662., articleTitle=Mpdiou: a loss for efficient and accurate bounding box regression, refAbstract=null), Reference(id=1175114414614266540, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=770, pageEnd=778, url=null, language=null, rfNumber=[20], rfOrder=23, authorNames=He K, Zhang X, Ren S, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
He K,
Zhang X,
Ren S, et al. Deep residual learning for image recognition[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Chengdu: IEEE,
2016: 770-778., articleTitle=Deep residual learning for image recognition, refAbstract=null), Reference(id=1175114414677181102, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2012, volume=null, issue=null, pageStart=25, pageEnd=null, url=null, language=null, rfNumber=[21], rfOrder=24, authorNames=Krizhevsky A, Sutskever I, Hinton G E, journalName=Advances in Neural Information Processing Systems, refType=null, unstructuredReference=
Krizhevsky A,
Sutskever I,
Hinton G E. ImageNet classification with deep convolutional neural networks[J].
Advances in Neural Information Processing Systems,
2012, 25., articleTitle=ImageNet classification with deep convolutional neural networks, refAbstract=null), Reference(id=1175114414941422256, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[22], rfOrder=25, authorNames=Sifre L, Mallat S, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Sifre L,
Mallat S. Rigid-motion scattering for texture classification[J].
ArXiv Preprint ArXiv,
2014: 1403.1687., articleTitle=Rigid-motion scattering for texture classification, refAbstract=null), Reference(id=1175114415092417202, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=12021, pageEnd=12031, url=null, language=null, rfNumber=[23], rfOrder=26, authorNames=Chen J, Kao S, He H, journalName=Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Chen J,
Kao S,
He H, et al. Run, don't walk: chasing higher FLOPS for faster neural networks[C]//
Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Vancouver: IEEE,
2023: 12021-12031., articleTitle=Run, don't walk: chasing higher FLOPS for faster neural networks, refAbstract=null), Reference(id=1175114415193080500, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=1314, pageEnd=1324, url=null, language=null, rfNumber=[24], rfOrder=27, authorNames=Howard A, Sandler M, Chu G, journalName=Proceedings of the IEEE/CVF International Conference on Computer Vision, refType=null, unstructuredReference=
Howard A,
Sandler M,
Chu G, et al. Searching for MobileNetV3[C]//
Proceedings of the IEEE/CVF International Conference on Computer Vision. Seoul: IEEE,
2019: 1314-1324., articleTitle=Searching for MobileNetV3, refAbstract=null), Reference(id=1175114415360852660, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=6848, pageEnd=6856, url=null, language=null, rfNumber=[25], rfOrder=28, authorNames=Zhang X, Zhou X, Lin M, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Zhang X,
Zhou X,
Lin M, et al. ShuffleNet: an extremely efficient convolutional neural network for mobile devices[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Salt Lake City: IEEE,
2018: 6848-6856., articleTitle=ShuffleNet: an extremely efficient convolutional neural network for mobile devices, refAbstract=null), Reference(id=1175114415478293174, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=1580, pageEnd=1589, url=null, language=null, rfNumber=[26], rfOrder=29, authorNames=Han K, Wang Y, Tian Q, journalName=Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Han K,
Wang Y,
Tian Q, et al. GhostNet: more features from cheap operations[C]//
Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle: IEEE,
2020: 1580-1589., articleTitle=GhostNet: more features from cheap operations, refAbstract=null), Reference(id=1175114415553790648, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[27], rfOrder=30, authorNames=Tan M, Le Q, journalName=ArXiv, refType=null, unstructuredReference=
Tan M,
Le Q. EfficientNet: rethinking model scaling for convolutional neural networks[J].
ArXiv,
2019: 1905.11946., articleTitle=EfficientNet: rethinking model scaling for convolutional neural networks, refAbstract=null), Reference(id=1175114415700591289, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[28], rfOrder=31, authorNames=Zhang Q, Jiang Z, Lu Q, journalName=ArXiv Preprint ArXiv, refType=null, unstructuredReference=
Zhang Q,
Jiang Z,
Lu Q, et al. Split to be slim: an overlooked redundancy in Vanilla convolution[J].
ArXiv Preprint ArXiv,
2020: 2006.12085., articleTitle=Split to be slim: an overlooked redundancy in Vanilla convolution, refAbstract=null)], funds=[Fund(id=1175114411300766327, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, awardId=SZX2020034, language=CN, fundingSource=河北省省级科技计划(SZX2020034), fundOrder=null, country=null), Fund(id=1175114411443372665, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, awardId=BJK2022041, language=CN, fundingSource=河北省高等学校科学研究计划(BJK2022041), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1175114407324566041, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=1, ext=[AuthorCompanyExt(id=1175114407328760345, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Management Science and Information Engineering, Hebei University of Economics and Business, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407337148954, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407324566041, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 河北经贸大学管理科学与信息工程学院, 石家庄 050062)]), AuthorCompany(id=1175114407383286299, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, xref=2, ext=[AuthorCompanyExt(id=1175114407391674909, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407383286299, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 Hebei Cross border E-commerce Technology Innovation Center, Shijiazhuang 050062, China), AuthorCompanyExt(id=1175114407400063518, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, companyId=1175114407383286299, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 河北省跨境电商技术创新中心, 石家庄 050062)])], figs=[ArticleFig(id=1175114409388163659, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Fig.1, caption=
Improved RT-DETR model structure, figureFileSmall=K3XwWYNeOWgoqB6villyZA==, figureFileBig=Ch3bN5pVs+3Wrvdw3wE8lw==, tableContent=null), ArticleFig(id=1175114409446883916, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=图1, caption=
改进RT-DETR算法模型结构, figureFileSmall=K3XwWYNeOWgoqB6villyZA==, figureFileBig=Ch3bN5pVs+3Wrvdw3wE8lw==, tableContent=null), ArticleFig(id=1175114409513992783, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Fig.2, caption=
Model structure comparison, figureFileSmall=cPNoqzbaf2tmb1jKuEM04g==, figureFileBig=DMG940CKfqwVtaxLWvtLXA==, tableContent=null), ArticleFig(id=1175114409618850386, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=图2, caption=
模型结构对比图, figureFileSmall=cPNoqzbaf2tmb1jKuEM04g==, figureFileBig=DMG940CKfqwVtaxLWvtLXA==, tableContent=null), ArticleFig(id=1175114409753068118, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Fig.3, caption=
Multichannel partial convolution, figureFileSmall=17KV/nIoqo6paP+JiUr++Q==, figureFileBig=qNf06OOwuF35cyHfs5HyNg==, tableContent=null), ArticleFig(id=1175114409832759895, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=图3, caption=
MCPConv, figureFileSmall=17KV/nIoqo6paP+JiUr++Q==, figureFileBig=qNf06OOwuF35cyHfs5HyNg==, tableContent=null), ArticleFig(id=1175114409916645978, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Fig.4, caption=
Comparison of Basic Block and MCP Block design, figureFileSmall=qiUBZslDv0Vq8VAQvRwLdA==, figureFileBig=n0PSeqUSPhlT4P0R6g6xgw==, tableContent=null), ArticleFig(id=1175114410004726364, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=图4, caption=
Basic Block 与MCP Block设计对比, figureFileSmall=qiUBZslDv0Vq8VAQvRwLdA==, figureFileBig=n0PSeqUSPhlT4P0R6g6xgw==, tableContent=null), ArticleFig(id=1175114410134749791, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Fig.5, caption=
Comparison between the improved model and the original model, figureFileSmall=mippP/sKgC6Fu4ecPF5R+w==, figureFileBig=Dnwg8CQZMciNWTEgJQqzhQ==, tableContent=null), ArticleFig(id=1175114410252190306, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=图5, caption=
改进后的模型与原模型检测效果对比, figureFileSmall=mippP/sKgC6Fu4ecPF5R+w==, figureFileBig=Dnwg8CQZMciNWTEgJQqzhQ==, tableContent=null), ArticleFig(id=1175114410336076389, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Table 1, caption=
Model performance comparison
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 参数量/$10^{6}$ | 计算量 | 准确率/% | 召回率/% | mAP50/% | mAP50:95/% | FPS/(帧·s$^{-1}$) |
| RT-DETR | 19.9 | 57.3 | 55.4 | 37.6 | 36.6 | 21.0 | 60 |
| 方法一 | 18.6 | 78.8 | 55.2 | 40.3 | 39.3 | 23.2 | 46 |
| 方法二 | 7.9 | 69.4 | 56.2 | 39.9 | 39.1 | 23.1 | 61 |
), ArticleFig(id=1175114410411573864, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=表1, caption=
模型效果对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 参数量/$10^{6}$ | 计算量 | 准确率/% | 召回率/% | mAP50/% | mAP50:95/% | FPS/(帧·s$^{-1}$) |
| RT-DETR | 19.9 | 57.3 | 55.4 | 37.6 | 36.6 | 21.0 | 60 |
| 方法一 | 18.6 | 78.8 | 55.2 | 40.3 | 39.3 | 23.2 | 46 |
| 方法二 | 7.9 | 69.4 | 56.2 | 39.9 | 39.1 | 23.1 | 61 |
), ArticleFig(id=1175114410537402986, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Table 2, caption=
Ablation experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 序号 | 方法 | 参数量/$10^{6}$ | 计算量 | 准确率/% | 召回率/% | mAP50/% | mAP50:95/% | FPS/(帧·s$^{-1}$) |
| — | RT-DETR | 19.9 | 57.3 | 55.4 | 37.6 | 36.6 | 21.0 | 60 |
| A | RT-DETR+MCP Block | 16.8 | 49.8 | 54.5 | 38.6 | 37.5 | 21.8 | 58 |
| B | RT-DETR+AIFI-LPE | 20.0 | 57.3 | 55.5 | 38.8 | 37.8 | 22.0 | 63 |
| C | RT-DETR+NWD-MPDIoU | 19.9 | 57.3 | 55.6 | 38.2 | 37.5 | 21.7 | 59 |
| D | RT-DETR+多尺度特征 | 7.9 | 69.4 | 56.2 | 39.9 | 39.1 | 23.1 | 61 |
| E | A+B | 16.9 | 49.8 | 56.2 | 39.1 | 38.0 | 22.1 | 60 |
| F | A+B+C | 16.9 | 49.8 | 56.0 | 39.4 | 38.5 | 22.4 | 61 |
| 本文 | A+B+C+D | 7.5 | 63.2 | 57.7 | 41.8 | 40.5 | 23.7 | 70 |
), ArticleFig(id=1175114410738729581, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=表2, caption=
消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 序号 | 方法 | 参数量/$10^{6}$ | 计算量 | 准确率/% | 召回率/% | mAP50/% | mAP50:95/% | FPS/(帧·s$^{-1}$) |
| — | RT-DETR | 19.9 | 57.3 | 55.4 | 37.6 | 36.6 | 21.0 | 60 |
| A | RT-DETR+MCP Block | 16.8 | 49.8 | 54.5 | 38.6 | 37.5 | 21.8 | 58 |
| B | RT-DETR+AIFI-LPE | 20.0 | 57.3 | 55.5 | 38.8 | 37.8 | 22.0 | 63 |
| C | RT-DETR+NWD-MPDIoU | 19.9 | 57.3 | 55.6 | 38.2 | 37.5 | 21.7 | 59 |
| D | RT-DETR+多尺度特征 | 7.9 | 69.4 | 56.2 | 39.9 | 39.1 | 23.1 | 61 |
| E | A+B | 16.9 | 49.8 | 56.2 | 39.1 | 38.0 | 22.1 | 60 |
| F | A+B+C | 16.9 | 49.8 | 56.0 | 39.4 | 38.5 | 22.4 | 61 |
| 本文 | A+B+C+D | 7.5 | 63.2 | 57.7 | 41.8 | 40.5 | 23.7 | 70 |
), ArticleFig(id=1175114410944250479, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=EN, label=Table 3, caption=
Comparative Experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 参数量/$10^{6}$ | 计算量 | 准确率/% | 召回率/% | mAP50/% | mAP50:95/% | FPS/(帧·s$^{-1}$) |
| YOLOv5-m | 25.0 | 64.2 | 48.5 | 35.3 | 34.1 | 19.8 | 112 |
| YOLOv5-l | 53.1 | 135.0 | 48.4 | 37.1 | 35.5 | 20.8 | 99 |
| YOLOv8-m | 25.9 | 79.3 | 48.1 | 36.0 | 34.4 | 20.0 | 108 |
| YOLOv8-L | 43.6 | 165.7 | 49.2 | 36.8 | 35.3 | 20.7 | 101 |
| 本文 | 7.5 | 63.2 | 57.7 | 41.8 | 40.5 | 23.7 | 70 |
), ArticleFig(id=1175114411023942257, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149773874725871618, language=CN, label=表3, caption=
对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 参数量/$10^{6}$ | 计算量 | 准确率/% | 召回率/% | mAP50/% | mAP50:95/% | FPS/(帧·s$^{-1}$) |
| YOLOv5-m | 25.0 | 64.2 | 48.5 | 35.3 | 34.1 | 19.8 | 112 |
| YOLOv5-l | 53.1 | 135.0 | 48.4 | 37.1 | 35.5 | 20.8 | 99 |
| YOLOv8-m | 25.9 | 79.3 | 48.1 | 36.0 | 34.4 | 20.0 | 108 |
| YOLOv8-L | 43.6 | 165.7 | 49.2 | 36.8 | 35.3 | 20.7 | 101 |
| 本文 | 7.5 | 63.2 | 57.7 | 41.8 | 40.5 | 23.7 | 70 |
)], attaches=null, journal=Journal(id=1146119176004939786, delFlag=0, nameCn=科学技术与工程, nameEn=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, issn=1671-1815, eissn=, cn=11-4688/T, coden=null, periodic=4, language=CN, oaType=是, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=UKU/O7GSka5polgCTkbIIw==, journalPrice=null, startedYear=null, abbrevIsoEn=Sci Technol Eng, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1754445529766, createdBy=null, updatedBy=13701087609, firstLetterCn=S, firstLetterEn=S, subjectCode=Natural Sciences, subjectName=自然科学, subjectCodeEn=Natural Sciences, subjectNameEn=null, picCn=UKU/O7GSka5polgCTkbIIw==, picEn=5hwlULoNwcbj3xUmVi9MAQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1159791870395564357, language=CN, name=科学技术与工程, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529793, updatedTime=1754445529793, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=http://www.stae.com.cn/jsygc/site/menus/20090429150146001, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1159791870441701702, language=EN, name=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, 
managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529804, updatedTime=1754445529804, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1146123166801305609, websiteList=[Website(id=1148243202391400884, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/CN, language=CN, createTime=1751692112777, createBy=18614031015, updateTime=1753520965431, updateBy=18614031015, name=科学技术与工程-中文站点, tplId=1146099689490845704, title=科学技术与工程, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148622798802673703, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=articleTextType, value=kx, createTime=1751782615614, updateTime=1751782615614, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798781702180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=banner, value=null, createTime=1751782615609, updateTime=1751782615609, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798769119267, tenantId=1146029695717560320, journalId=null, 
journalGroupId=null, siteId=1148243202391400884, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1751782615606, updateTime=1751782615606, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798794285094, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782615612, updateTime=1751782615612, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798790090789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782615611, updateTime=1751782615611, creator=18614031015, updator=18614031015)]), Website(id=1155914124811976731, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/EN, language=EN, createTime=1753521003206, createBy=18614031015, updateTime=1753521003206, updateBy=18614031015, name=科学技术与工程-英文站点, tplId=1146101810881728533, title=Science Technology and Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155914371227308235, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=articleTextType, value=kx, createTime=1753521061952, updateTime=1753521061952, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371210531016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=banner, value=null, 
createTime=1753521061947, updateTime=1753521061947, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371202142407, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1753521061945, updateTime=1753521061945, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371223113930, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753521061950, updateTime=1753521061950, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371218919625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753521061949, updateTime=1753521061949, creator=18614031015, updator=18614031015)])], journalTitle=科学技术与工程, weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Science Technology and Engineering, journalPhotoCn=UKU/O7GSka5polgCTkbIIw==, journalPhotoEn=5hwlULoNwcbj3xUmVi9MAQ==, journalFirstLetter=S, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/10.12404/j.issn.1671-1815.2404266, detailUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/10.12404/j.issn.1671-1815.2404266, 
pdfUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/PDF/10.12404/j.issn.1671-1815.2404266, pdfUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/PDF/10.12404/j.issn.1671-1815.2404266, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)