Article(id=1149774733274739464, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149774724923880044, articleNumber=null, orderNo=null, doi=10.12404/j.issn.1671-1815.2403743, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1716220800000, receivedDateStr=2024-05-21, revisedDate=1737475200000, revisedDateStr=2025-01-22, acceptedDate=null, acceptedDateStr=null, onlineDate=1752057258194, onlineDateStr=2025-07-09, pubDate=1745769600000, pubDateStr=2025-04-28, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1752057258194, onlineIssueDateStr=2025-07-09, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1752057258194, creator=13701087609, updateTime=1752057258194, updator=13701087609, issue=Issue{id=1149774724923880044, tenantId=1146029695717560320, journalId=1146123166801305609, year='2025', volume='25', issue='12', pageStart='4827', pageEnd='5272', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=0, createTime=1752057256203, creator=13701087609, updateTime=1768456746933, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1218559174552764785, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149774724923880044, language=EN, specialIssueTitle=, coverIllustrator=, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1218559174552764786, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149774724923880044, language=CN, specialIssueTitle=, coverIllustrator=, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=5093, endPage=5102, ext={EN=ArticleExt(id=1149774733547369230, articleId=1149774733274739464, tenantId=1146029695717560320, journalId=1146123166801305609, language=EN, title=Ship Target Detection Algorithm Based on Improved YOLOv8, columnId=1156262729162810294, journalTitle=Science Technology and Engineering, columnName=Papers·Automation and Computational Technology, runingTitle=null, highlight=null, articleAbstract=
An improved DGA-YOLOv8 offshore ship target detection algorithm was proposed to tackle the issues of low accuracy and single ship detection categories that are present in traditional ship target detection algorithms. Firstly, the network was adapted to include deformable convolution, which expanded the model's receptive field. Learnable offsets were introduced, allowing the model to adaptively adjust the size and shape of the receptive field in response to the actual shape of the object, ensuring that the convolution area can precisely cover the contour of the ship object. Secondly, the incorporation of a GAM(global attention mechanism) attention mechanism enabled the network to effectively emphasize the key features of ship targets, thereby enhancing the target recognition capability. The experimental results demonstrate that the improved algorithm achieves accuracy and average accuracy mean (mAP) of 96.4% and 92.2%, respectively. An frames per second(FPS) of 43.55 is recorded, indicating not only an enhancement in accuracy but also the maintenance of a certain detection speed, thus fulfilling the requirements for real-time detection. When compared with other mainstream algorithms, such as faster region-based convolutional neural network(Faster R-CNN) and YOLOv5s, YOLOv10. The results show that the proposed algorithm exhibits higher average accuracy and significant superior classification performance.
, correspAuthors=Qing-hua LIU, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Cong-xin DONG, Qing-hua LIU), CN=ArticleExt(id=1149774768183931054, articleId=1149774733274739464, tenantId=1146029695717560320, journalId=1146123166801305609, language=CN, title=基于改进YOLOv8的船只目标检测算法, columnId=1156262729783567290, journalTitle=科学技术与工程, columnName=论文·自动化技术、计算机技术, runingTitle=null, highlight=null, articleAbstract=
针对传统船只目标检测算法的精度较低、船只检测类别单一等问题,提出一种改进的DGA-YOLOv8海上船只目标检测算法。首先,网络采用可变形卷积扩大模型的感受野,通过引入可学习偏移量,使模型能够根据物体实际形状自适应调整感受野大小和形状,确保卷积区域能够精确覆盖船只物体的轮廓。其次,引入GAM(global attention mechanism)注意力机制,使网络能够有效突出船只目标的关键特征,提高目标识别能力。实验结果表明:改进后算法的精确度和平均精度均值(mAP)达到96.4%和92.2%,FPS(frame per second)为43.55,在提升精度的同时也保证了一定的检测速度,满足了实时性检测的需求。同时与其他主流算法对比,其中包括Faster R-CNN(faster region-based convolutional neural network)、YOLOv5s和YOLOv10等。结果表明:所提算法具有更高的平均精度和更显著的分类效果。
, correspAuthors=刘庆华, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=SVAb4IYpLpw3/xDlQg2b9g==, magXml=/rcdrASDYDpHfiQoeBbPYg==, pdfUrl=null, pdf=PrkhN6WQloPR4d4HLVkORA==, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=4EB6j+wDuf1nCXC3/FKhpA==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=董从鑫, 刘庆华)}, authors=[Author(id=1180089380308926665, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=2440701788@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1180089380376035531, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, authorId=1180089380308926665, language=EN, stringName=Cong-xin DONG, firstName=Cong-xin, middleName=null, lastName=DONG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=Information and Communication College, Guilin University of Electronic and Technology, Guilin 541010, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1180089380430561484, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, authorId=1180089380308926665, language=CN, stringName=董从鑫, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=桂林电子科技大学信息与通信学院, 桂林 541010, bio={"content":"
董从鑫(2001—),男,汉族,广西贺州人,硕士研究生。研究方向:目标检测。E-mail:2440701788@qq.com。
"}, bioImg=null, bioContent=
董从鑫(2001—),男,汉族,广西贺州人,硕士研究生。研究方向:目标检测。E-mail:2440701788@qq.com。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1180089380233429189, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, xref=null, ext=[AuthorCompanyExt(id=1180089380241817798, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, companyId=1180089380233429189, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=Information and Communication College, Guilin University of Electronic and Technology, Guilin 541010, China), AuthorCompanyExt(id=1180089380250206407, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, companyId=1180089380233429189, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=桂林电子科技大学信息与通信学院, 桂林 541010)])]), Author(id=1180089380493476046, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=qhliu@guet.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1180089380560584912, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, authorId=1180089380493476046, language=EN, stringName=Qing-hua LIU, firstName=Qing-hua, middleName=null, lastName=LIU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=Information and Communication College, Guilin University of Electronic and Technology, Guilin 541010, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1180089380627693777, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, authorId=1180089380493476046, language=CN, stringName=刘庆华, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=桂林电子科技大学信息与通信学院, 桂林 541010, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1180089380233429189, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, xref=null, ext=[AuthorCompanyExt(id=1180089380241817798, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, companyId=1180089380233429189, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=Information and Communication College, Guilin University of Electronic and Technology, Guilin 541010, China), AuthorCompanyExt(id=1180089380250206407, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, companyId=1180089380233429189, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=桂林电子科技大学信息与通信学院, 桂林 541010)])])], keywords=[Keyword(id=1180089380761911506, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, orderNo=1, keyword=YOLOv8), Keyword(id=1180089380820631763, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, orderNo=2, keyword=ship target detection), Keyword(id=1180089380879352020, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, orderNo=3, keyword=deformable convolution), Keyword(id=1180089380938072277, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, orderNo=4, keyword=attention mechanism), Keyword(id=1180089380992598230, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, orderNo=1, keyword=YOLOv8), Keyword(id=1180089381047124183, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, orderNo=2, keyword=船只目标检测), Keyword(id=1180089381114233048, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, orderNo=3, keyword=可变形卷积), Keyword(id=1180089381177147609, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, orderNo=4, keyword=注意力机制)], refs=[Reference(id=1180089383735673085, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2022, volume=22, issue=25, pageStart=11241, pageEnd=11249, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=徐慧智, 宋爱秋, 武笑宇, journalName=科学技术与工程, refType=null, unstructuredReference=徐慧智, 宋爱秋, 武笑宇. 基于均匀设计的船舶目标检测深度学习模型训练方法研究[J].
科学技术与工程,
2022,
22(25): 11241-11249., articleTitle=基于均匀设计的船舶目标检测深度学习模型训练方法研究, refAbstract=null), Reference(id=1180089383798587646, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2022, volume=22, issue=25, pageStart=11241, pageEnd=11249, url=null, language=null, rfNumber=[1], rfOrder=1, authorNames=Xu Huizhi, Song Aiqiu, Wu Xiaoyu, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Xu Huizhi,
Song Aiqiu,
Wu Xiaoyu. Research on training method of deep learning to ship target detection based on uniform design[J].
Science Technology and Engineering,
2022,
22(25): 11241-11249., articleTitle=Research on training method of deep learning to ship target detection based on uniform design, refAbstract=null), Reference(id=1180089383853113599, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2019, volume=49, issue=S2, pageStart=185, pageEnd=191, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=石洪基, 郎海涛, 宋棋, journalName=中国海洋大学学报(自然科学版), refType=null, unstructuredReference=石洪基, 郎海涛, 宋棋, 等. 基于改进区域卷积神经网络的SAR图像船只检测方法[J].
中国海洋大学学报(自然科学版),
2019,
49(S2): 185-191., articleTitle=基于改进区域卷积神经网络的SAR图像船只检测方法, refAbstract=null), Reference(id=1180089383916028160, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2019, volume=49, issue=S2, pageStart=185, pageEnd=191, url=null, language=null, rfNumber=[2], rfOrder=3, authorNames=Shi Hongji, Lang Haitao, Song Qi, journalName=Journal of Ocean University of China(Natural Science Edition), refType=null, unstructuredReference=
Shi Hongji,
Lang Haitao,
Song Qi, et al. Ship detection method in SAR images based on improved regional convolutional neural network[J].
Journal of Ocean University of China(Natural Science Edition),
2019,
49(S2): 185-191., articleTitle=Ship detection method in SAR images based on improved regional convolutional neural network, refAbstract=null), Reference(id=1180089383962165505, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2022, volume=46, issue=4, pageStart=22, pageEnd=27, url=null, language=null, rfNumber=[3], rfOrder=4, authorNames=王程丽, 赵静, 杨攀攀, journalName=移动通信, refType=null, unstructuredReference=王程丽, 赵静, 杨攀攀, 等. 基于迁移学习的小样本SAR船只目标识别[J].
移动通信,
2022,
46(4): 22-27., articleTitle=基于迁移学习的小样本SAR船只目标识别, refAbstract=null), Reference(id=1180089384020885762, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2022, volume=46, issue=4, pageStart=22, pageEnd=27, url=null, language=null, rfNumber=[3], rfOrder=5, authorNames=Wang Chengli, Zhao Jing, Yang Panpan, journalName=Mobile Communications, refType=null, unstructuredReference=
Wang Chengli,
Zhao Jing,
Yang Panpan, et al. Smallsample SAR ship target recognition based on transfer learning[J].
Mobile Communications,
2022,
46(4): 22-27., articleTitle=Smallsample SAR ship target recognition based on transfer learning, refAbstract=null), Reference(id=1180089384087994627, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2021, volume=10, issue=6, pageStart=885, pageEnd=894, url=null, language=null, rfNumber=[4], rfOrder=6, authorNames=刘方坚, 李媛, journalName=雷达学报, refType=null, unstructuredReference=刘方坚, 李媛. 基于视觉显著性的 SAR 遥感图像 NanoDet 舰船检测方法[J].
雷达学报,
2021,
10(6): 885-894., articleTitle=基于视觉显著性的 SAR 遥感图像 NanoDet 舰船检测方法, refAbstract=null), Reference(id=1180089384146714884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2021, volume=10, issue=6, pageStart=885, pageEnd=894, url=null, language=null, rfNumber=[4], rfOrder=7, authorNames=Liu Fangjian, Li Yuan, journalName=Radar Journal, refType=null, unstructuredReference=
Liu Fangjian,
Li Yuan. NanoDet ship detection method for SAR remote sensing images based on visual saliency[J].
Radar Journal,
2021,
10(6): 885-894., articleTitle=NanoDet ship detection method for SAR remote sensing images based on visual saliency, refAbstract=null), Reference(id=1180089384205435141, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=17, pageStart=7205, pageEnd=7213, url=null, language=null, rfNumber=[5], rfOrder=8, authorNames=宣以国, 余成波, 蒋启超, journalName=科学技术与工程, refType=null, unstructuredReference=宣以国, 余成波, 蒋启超, 等. 基于改进YOLOv7的道路裂缝和坑洞检测算法[J].
科学技术与工程,
2024,
24(17): 7205-7213., articleTitle=基于改进YOLOv7的道路裂缝和坑洞检测算法, refAbstract=null), Reference(id=1180089384268349702, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=17, pageStart=7205, pageEnd=7213, url=null, language=null, rfNumber=[5], rfOrder=9, authorNames=Xuan Yiguo, Yu Chengbo, Jiang Qichao, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Xuan Yiguo,
Yu Chengbo,
Jiang Qichao, et al. Improved YOLOv7 road crack and pothole detection algorithm[J].
Science Technology and Engineering,
2024,
24(17): 7205-7213., articleTitle=Improved YOLOv7 road crack and pothole detection algorithm, refAbstract=null), Reference(id=1180089384339652871, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=580, pageEnd=587, url=null, language=null, rfNumber=[6], rfOrder=10, authorNames=Girshick R, Donahue J, Darrell T, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Girshick R,
Donahue J,
Darrell T, et al. Rich feature hierarchies for accurate object detection and semantic segmentation[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. New York: IEEE,
2014: 580-587., articleTitle=Rich feature hierarchies for accurate object detection and semantic segmentation, refAbstract=null), Reference(id=1180089384402567432, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=1440, pageEnd=1448, url=null, language=null, rfNumber=[7], rfOrder=11, authorNames=Girshick R, journalName=Proceedings of the IEEE International Conference on Computer Vision, refType=null, unstructuredReference=
Girshick R. Fast R-CNN[C]//
Proceedings of the IEEE International Conference on Computer Vision. New York: IEEE,
2015: 1440-1448., articleTitle=Fast R-CNN, refAbstract=null), Reference(id=1180089384461287689, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2016, volume=39, issue=6, pageStart=1137, pageEnd=1149, url=null, language=null, rfNumber=[8], rfOrder=12, authorNames=Ren S, He K, Girshick R, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Ren S,
He K,
Girshick R, et al. Faster R-CNN: towards real-time object detection with region proposal networks[J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2016,
39(6): 1137-1149., articleTitle=Faster R-CNN: towards real-time object detection with region proposal networks, refAbstract=null), Reference(id=1180089384520007946, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=779, pageEnd=788, url=null, language=null, rfNumber=[9], rfOrder=13, authorNames=Redmon J, Divvala S, Girshick R, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Redmon J,
Divvala S,
Girshick R, et al. You only look once: unified, real-time object detection[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. New York: IEEE,
2016: 779-788., articleTitle=You only look once: unified, real-time object detection, refAbstract=null), Reference(id=1180089384582922507, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=7263, pageEnd=7271, url=null, language=null, rfNumber=[10], rfOrder=14, authorNames=Redmon J, Farhadi A, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Redmon J,
Farhadi A. YOLO9000: better, faster, stronger[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. New York: IEEE,
2017: 7263-7271., articleTitle=YOLO9000: better, faster, stronger, refAbstract=null), Reference(id=1180089384641642764, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[11], rfOrder=15, authorNames=Redmon J, Farhadi A, journalName=arXiv Preprint, refType=null, unstructuredReference=
Redmon J,
Farhadi A. YOLOv3: an incremental improvement[J].
arXiv Preprint,
2018: arXiv: 1804.02767., articleTitle=YOLOv3: an incremental improvement, refAbstract=null), Reference(id=1180089384700363021, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[12], rfOrder=16, authorNames=Bochkovskiy A, Wang C Y, Liao H Y M, journalName=arXiv Preprint, refType=null, unstructuredReference=
Bochkovskiy A,
Wang C Y,
Liao H Y M. YOLOv4: optimal speed and accuracy of object detection[J].
arXiv Preprint,
2020: arXiv: 2004.10934., articleTitle=YOLOv4: optimal speed and accuracy of object detection, refAbstract=null), Reference(id=1180089384767471886, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=7464, pageEnd=7475, url=null, language=null, rfNumber=[13], rfOrder=17, authorNames=Wang C Y, Bochkovskiy A, Liao H Y M, journalName=Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Wang C Y,
Bochkovskiy A,
Liao H Y M. YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors[C]//
Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. New York: IEEE,
2023: 7464-7475., articleTitle=YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors, refAbstract=null), Reference(id=1180089384830386447, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2023, volume=38, issue=1, pageStart=37, pageEnd=43, url=null, language=null, rfNumber=[14], rfOrder=18, authorNames=李静, 鲜林, 王海江, journalName=成都信息工程大学学报, refType=null, unstructuredReference=李静, 鲜林, 王海江. 基于YOLOv3的船只检测算法研究[J].
成都信息工程大学学报,
2023,
38(1): 37-43., articleTitle=基于YOLOv3的船只检测算法研究, refAbstract=null), Reference(id=1180089384889106704, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2023, volume=38, issue=1, pageStart=37, pageEnd=43, url=null, language=null, rfNumber=[14], rfOrder=19, authorNames=Li Jing, Xian Lin, Wang Haijiang, journalName=Journal of Chengdu University of Information Technology, refType=null, unstructuredReference=
Li Jing,
Xian Lin,
Wang Haijiang. Research on ship detection algorithm based on YOLOv3[J].
Journal of Chengdu University of Information Technology,
2023,
38(1): 37-43., articleTitle=Research on ship detection algorithm based on YOLOv3, refAbstract=null), Reference(id=1180089384952021265, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=483, pageEnd=487, url=null, language=null, rfNumber=[15], rfOrder=20, authorNames=Liu T, Zhou B, Zhao Y, journalName=2021 6th International Conference on Automation, Control and Robotics Engineering(CACRE), refType=null, unstructuredReference=
Liu T,
Zhou B,
Zhao Y, et al. Ship detection algorithm based on improved YOLOv5[C]//
2021 6th International Conference on Automation, Control and Robotics Engineering(CACRE). New York: IEEE,
2021: 483-487., articleTitle=Ship detection algorithm based on improved YOLOv5, refAbstract=null), Reference(id=1180089385010741522, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=222, pageEnd=227, url=null, language=null, rfNumber=[16], rfOrder=21, authorNames=Wang B, Han B, Yang L, journalName=2021 6th International Conference on Transportation Information and Safety(ICTIS), refType=null, unstructuredReference=
Wang B,
Han B,
Yang L. Accurate real-time ship target detection using YOLOv4[C]//
2021 6th International Conference on Transportation Information and Safety(ICTIS). NewYork: IEEE,
2021: 222-227., articleTitle=Accurate real-time ship target detection using YOLOv4, refAbstract=null), Reference(id=1180089385086238995, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=659, pageEnd=665, url=null, language=null, rfNumber=[17], rfOrder=22, authorNames=Zhang J, journalName=International Conference on Mechatronic Engineering and Artificial Intelligence, refType=null, unstructuredReference=
Zhang J. Ship target detection based on CBAM-YOLOv8[C]//
International Conference on Mechatronic Engineering and Artificial Intelligence. Shanghai: SPIE,
2024: 659-665., articleTitle=Ship target detection based on CBAM-YOLOv8, refAbstract=null), Reference(id=1180089385149153556, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=764, pageEnd=773, url=null, language=null, rfNumber=[18], rfOrder=23, authorNames=Dai J, Qi H, Xiong Y, journalName=Proceedings of the IEEE International Conference on Computer Vision, refType=null, unstructuredReference=
Dai J,
Qi H,
Xiong Y, et al. Deformable convolutional networks[C]//
Proceedings of the IEEE International Conference on Computer Vision. New York: IEEE,
2017: 764-773., articleTitle=Deformable convolutional networks, refAbstract=null), Reference(id=1180089385207873813, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[19], rfOrder=24, authorNames=Liu Y, Shao Z, Hoffmann N, journalName=arXiv Preprint, refType=null, unstructuredReference=
Liu Y,
Shao Z,
Hoffmann N. Global attention mechanism: retain information to enhance channel-spatial interactions[J].
arXiv Preprint,
2021: arXiv: 2112.05561., articleTitle=Global attention mechanism: retain information to enhance channel-spatial interactions, refAbstract=null), Reference(id=1180089385258205462, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=558, pageEnd=573, url=null, language=null, rfNumber=[20], rfOrder=25, authorNames=Bolya D, Foley S, Hays J, journalName=Computer Vision-ECCV 2020: 16th European Conference, refType=null, unstructuredReference=
Bolya D,
Foley S,
Hays J, et al. Tide: a general toolbox for identifying object detection errors[C]//
Computer Vision-ECCV 2020: 16th European Conference. Glasgow: Springer International Publishing,
2020: 558-573., articleTitle=Tide: a general toolbox for identifying object detection errors, refAbstract=null), Reference(id=1180089385312731415, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=7132, pageEnd=7141, url=null, language=null, rfNumber=[21], rfOrder=26, authorNames=Hu J, Shen L, Sun G, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Hu J,
Shen L,
Sun G. Squeeze-and-excitation networks[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. New York: IEEE,
2018: 7132-7141., articleTitle=Squeeze-and-excitation networks, refAbstract=null), Reference(id=1180089385375645976, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=11534, pageEnd=11542, url=null, language=null, rfNumber=[22], rfOrder=27, authorNames=Wang Q, Wu B, Zhu P, journalName=Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Wang Q,
Wu B,
Zhu P, et al. ECA-Net: efficient channel attention for deep convolutional neural networks[C]//
Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. New York: IEEE,
2020: 11534-11542., articleTitle=ECA-Net: efficient channel attention for deep convolutional neural networks, refAbstract=null), Reference(id=1180089385434366233, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=3, pageEnd=19, url=null, language=null, rfNumber=[23], rfOrder=28, authorNames=Woo S, Park J, Lee J Y, journalName=Proceedings of the European Conference on Computer Vision(ECCV), refType=null, unstructuredReference=
Woo S,
Park J,
Lee J Y, et al. CBAM: convolutional block attention module[C]//
Proceedings of the European Conference on Computer Vision(ECCV). New York: IEEE,
2018: 3-19., articleTitle=CBAM: convolutional block attention module, refAbstract=null)], funds=[Fund(id=1180089383601455356, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, awardId=桂科AA21077008, language=CN, fundingSource=广西创新驱动发展专项(桂科AA21077008), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1180089380233429189, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, xref=null, ext=[AuthorCompanyExt(id=1180089380241817798, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, companyId=1180089380233429189, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=Information and Communication College, Guilin University of Electronic and Technology, Guilin 541010, China), AuthorCompanyExt(id=1180089380250206407, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, companyId=1180089380233429189, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=桂林电子科技大学信息与通信学院, 桂林 541010)])], figs=[ArticleFig(id=1180089381344919770, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.1, caption=
Network structure of DGA-YOLOv8, figureFileSmall=QC5KRQIjzsk0cpEq3KtaNA==, figureFileBig=JXVOkKkN/p+vCh4MkbKW5Q==, tableContent=null), ArticleFig(id=1180089381407834331, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图1, caption=
DGA-YOLOv8网络结构 Backbone为骨干网络;Conv为卷积;C2f为跨阶段双分支特征融合模块;C2f_DCN为本文设计模块,其中DCN为可变形卷积网络;GAM为全局注意力机制;SPPF为空间金字塔池化快速模块;Neck为颈部网络;Concat为拼接;Upsample为上采样;Head为头部网络;Detect为检测模块;Conv2d为二维卷积;Box_Loss为锚框损失;Cls_Loss为类别损失;BatchNorm2d为2维批量归一化;SiLU为激活函数;Split为分割;DCN_Bottleneck为本文设计模块,其中Bottleneck为瓶颈模块;Deformable Conv为可变形卷积;shortcut=True为使用残差连接;MaxPool2d为2维最大值池化
, figureFileSmall=QC5KRQIjzsk0cpEq3KtaNA==, figureFileBig=JXVOkKkN/p+vCh4MkbKW5Q==, tableContent=null), ArticleFig(id=1180089381529469148, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.2, caption=
Traditional convolution and deformable convolution sampling processes, figureFileSmall=5TD0Ypwgo2++JnMvIb6DAQ==, figureFileBig=A3lxrymauerzc6+p54U4jw==, tableContent=null), ArticleFig(id=1180089381592383709, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图2, caption=
传统卷积与可变形卷积采样过程, figureFileSmall=5TD0Ypwgo2++JnMvIb6DAQ==, figureFileBig=A3lxrymauerzc6+p54U4jw==, tableContent=null), ArticleFig(id=1180089381680464094, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.3, caption=
C2f_DCN module, figureFileSmall=91lGwksPDj1WYH7VvC12Qw==, figureFileBig=OK4ikRLv3LnSrqj0qg1lfA==, tableContent=null), ArticleFig(id=1180089381743378655, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图3, caption=
C2f_DCN模块, figureFileSmall=91lGwksPDj1WYH7VvC12Qw==, figureFileBig=OK4ikRLv3LnSrqj0qg1lfA==, tableContent=null), ArticleFig(id=1180089381797904608, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.4, caption=
DCN_Bottleneck structure, figureFileSmall=+FIvzloMbi8OLXxKfDUP2g==, figureFileBig=9JOWdBZAO+dpgd1SEAw/oQ==, tableContent=null), ArticleFig(id=1180089381865013473, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图4, caption=
DCN_Bottleneck结构, figureFileSmall=+FIvzloMbi8OLXxKfDUP2g==, figureFileBig=9JOWdBZAO+dpgd1SEAw/oQ==, tableContent=null), ArticleFig(id=1180089381932122338, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.5, caption=
GAM attention module, figureFileSmall=kUq8OIu6XNmzhzzCYu7rlw==, figureFileBig=WP4VBSyb96zqyA748GQ3fw==, tableContent=null), ArticleFig(id=1180089381990842595, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图5, caption=
GAM注意力模块 Input features为输入特征;Channel Attention为通道注意力;Spatial Attention为空间注意力;Output features为输出特征
, figureFileSmall=kUq8OIu6XNmzhzzCYu7rlw==, figureFileBig=WP4VBSyb96zqyA748GQ3fw==, tableContent=null), ArticleFig(id=1180089382066340068, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.6, caption=
Channel attention module, figureFileSmall=iQGPLvgHPVT/sE3cokB+9g==, figureFileBig=TfF/7zLf9YFAH3is9YKwrA==, tableContent=null), ArticleFig(id=1180089382129254629, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图6, caption=
通道注意力模块 permutation为维度转换;MLP为多层感知机;reverse permutation为维度反转换;Sigmoid为激活函数
, figureFileSmall=iQGPLvgHPVT/sE3cokB+9g==, figureFileBig=TfF/7zLf9YFAH3is9YKwrA==, tableContent=null), ArticleFig(id=1180089382187974886, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.7, caption=
Spatial attention module, figureFileSmall=9fHQUV6dCFGNBkvDEVeMMg==, figureFileBig=vcNrr1RJPOQc1BHnfA5ttg==, tableContent=null), ArticleFig(id=1180089382259278055, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图7, caption=
空间注意力模块 Conv为卷积
, figureFileSmall=9fHQUV6dCFGNBkvDEVeMMg==, figureFileBig=vcNrr1RJPOQc1BHnfA5ttg==, tableContent=null), ArticleFig(id=1180089382309609704, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.8, caption=
TIDE error type definition, figureFileSmall=46KvQj8H3vNshBSaKHPbFg==, figureFileBig=M23FEwemhm/xoXhanxKSmQ==, tableContent=null), ArticleFig(id=1180089382368329961, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图8, caption=
TIDE错误类型定义 分类错误(Cls)表示定位正确,但分类错误;定位错误(Loc)表示分类正确,但定位错误;分类和定位错误(Cls+Loc)表示分类和定位均错误;重复检测错误(Duplicate)表示多次检测到目标物体;背景错误(Bkgd)表示将背景检测为目标物体;未检测错误(Missed)表示未检测到目标物体
, figureFileSmall=46KvQj8H3vNshBSaKHPbFg==, figureFileBig=M23FEwemhm/xoXhanxKSmQ==, tableContent=null), ArticleFig(id=1180089382431244522, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.9, caption=
Training process analysis, figureFileSmall=Q+lWd7P7s62mZ3GafHavDA==, figureFileBig=e4xQtyGEJdifGgF69NXglw==, tableContent=null), ArticleFig(id=1180089382485770475, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图9, caption=
训练过程分析, figureFileSmall=Q+lWd7P7s62mZ3GafHavDA==, figureFileBig=e4xQtyGEJdifGgF69NXglw==, tableContent=null), ArticleFig(id=1180089382536102124, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.10, caption=
Comparison of detection result, figureFileSmall=AaAMrwgEg+Czqgrv4r6XAg==, figureFileBig=igNJU+6xCMdK2yJyqI5G8Q==, tableContent=null), ArticleFig(id=1180089382586433773, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图10, caption=
检测结果对比 绿色框为TP;蓝色框为FP;红色框为FN
, figureFileSmall=AaAMrwgEg+Czqgrv4r6XAg==, figureFileBig=igNJU+6xCMdK2yJyqI5G8Q==, tableContent=null), ArticleFig(id=1180089382640959726, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Fig.11, caption=
Comparison of heat map effects, figureFileSmall=lQSEnts/HQajtEer4gBi8Q==, figureFileBig=nHdeAkhV8wJiTUtzO1HIsg==, tableContent=null), ArticleFig(id=1180089382699679983, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=图11, caption=
热力图效果对比, figureFileSmall=lQSEnts/HQajtEer4gBi8Q==, figureFileBig=nHdeAkhV8wJiTUtzO1HIsg==, tableContent=null), ArticleFig(id=1180089382754205936, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Table 1, caption=
Experimental environment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 配置 |
| 图像大小 | 640×640 |
| 迭代次数 | 200 |
| 批量大小 | 16 |
| 优化器 | SGD |
| 初始学习率 | 0.01 |
| 学习率衰减因子 | 0.01 |
| 权重衰减 | 0.000 5 |
| 动量 | 0.937 |
), ArticleFig(id=1180089382821314801, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=表1, caption=
实验环境
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 配置 |
| 图像大小 | 640×640 |
| 迭代次数 | 200 |
| 批量大小 | 16 |
| 优化器 | SGD |
| 初始学习率 | 0.01 |
| 学习率衰减因子 | 0.01 |
| 权重衰减 | 0.000 5 |
| 动量 | 0.937 |
), ArticleFig(id=1180089382880035058, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Table 2, caption=
Dataset distribution
, figureFileSmall=null, figureFileBig=null, tableContent=
| 船只类型 | 训练集/张 | 验证集/张 | 总计/张 |
| 矿砂船 | 1 508 | 168 | 1 676 |
| 散装货船 | 1 325 | 148 | 1 473 |
| 普通货船 | 1 188 | 133 | 1 321 |
| 集装箱货船 | 1 052 | 117 | 1 169 |
| 渔船 | 1 154 | 129 | 1 283 |
| 客运船 | 378 | 43 | 421 |
| 邮轮 | 795 | 89 | 884 |
| 大型货轮 | 1 513 | 169 | 1 682 |
| 帆船 | 202 | 23 | 225 |
| 其他类型 | 858 | 89 | 947 |
| 总计 | 9 973 | 1 108 | 11 081 |
), ArticleFig(id=1180089382942949619, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=表2, caption=
数据集分布
, figureFileSmall=null, figureFileBig=null, tableContent=
| 船只类型 | 训练集/张 | 验证集/张 | 总计/张 |
| 矿砂船 | 1 508 | 168 | 1 676 |
| 散装货船 | 1 325 | 148 | 1 473 |
| 普通货船 | 1 188 | 133 | 1 321 |
| 集装箱货船 | 1 052 | 117 | 1 169 |
| 渔船 | 1 154 | 129 | 1 283 |
| 客运船 | 378 | 43 | 421 |
| 邮轮 | 795 | 89 | 884 |
| 大型货轮 | 1 513 | 169 | 1 682 |
| 帆船 | 202 | 23 | 225 |
| 其他类型 | 858 | 89 | 947 |
| 总计 | 9 973 | 1 108 | 11 081 |
), ArticleFig(id=1180089383010058484, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Table 3, caption=
Module ablation experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| YOLOv8n | C2f_DCN | GAM | 准确 率/% | 召回 率/% | mAP@0.5/ % | mAP@0.5: 0.95/% |
| √ | — | — | 93.1 | 86.1 | 91.8 | 73.1 |
| √ | √ | — | 94.7 | 86.3 | 91.4 | 73.1 |
| √ | — | √ | 95.4 | 87.4 | 91.4 | 73.5 |
| √ | √ | √ | 96.4 | 87.3 | 92.2 | 74.1 |
), ArticleFig(id=1180089383093944565, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=表3, caption=
模块消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| YOLOv8n | C2f_DCN | GAM | 准确 率/% | 召回 率/% | mAP@0.5/ % | mAP@0.5: 0.95/% |
| √ | — | — | 93.1 | 86.1 | 91.8 | 73.1 |
| √ | √ | — | 94.7 | 86.3 | 91.4 | 73.1 |
| √ | — | √ | 95.4 | 87.4 | 91.4 | 73.5 |
| √ | √ | √ | 96.4 | 87.3 | 92.2 | 74.1 |
), ArticleFig(id=1180089383165247734, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Table 4, caption=
Comparison of TIDE results
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | Cls | Loc | Both | Duplicate | Bkg | Missed | FP | FN |
| YOLOv8 | 1.57 | 1.39 | 0.12 | 0.17 | 1.15 | 0.58 | 5.56 | 2.28 |
| DGA-YOLOv8 | 1.60 | 1.19 | 0.14 | 0.18 | 1.10 | 0.65 | 5.53 | 2.08 |
| 提升 | +0.03 | -0.20 | +0.02 | +0.01 | -0.05 | +0.07 | -0.03 | -0.20 |
), ArticleFig(id=1180089383232356599, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=表4, caption=
TIDE结果对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | Cls | Loc | Both | Duplicate | Bkg | Missed | FP | FN |
| YOLOv8 | 1.57 | 1.39 | 0.12 | 0.17 | 1.15 | 0.58 | 5.56 | 2.28 |
| DGA-YOLOv8 | 1.60 | 1.19 | 0.14 | 0.18 | 1.10 | 0.65 | 5.53 | 2.08 |
| 提升 | +0.03 | -0.20 | +0.02 | +0.01 | -0.05 | +0.07 | -0.03 | -0.20 |
), ArticleFig(id=1180089383291076856, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Table 5, caption=
Comparison of different attention mechanisms
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 准确率/ % | 召回率/ % | mAP@0.5/ % | mAP@0.5:0.95/ % |
| YOLOv8n | 93.1 | 86.1 | 91.8 | 73.1 |
| +SE | 95.5 | 86.7 | 90.9 | 71.7 |
| +ECA | 93.9 | 84.9 | 91.1 | 72.5 |
| +CBAM | 92.9 | 87.2 | 91.4 | 72.6 |
| +GAM | 95.4 | 87.4 | 91.4 | 73.5 |
), ArticleFig(id=1180089383345602809, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=表5, caption=
不同注意力机制比较
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 准确率/ % | 召回率/ % | mAP@0.5/ % | mAP@0.5:0.95/ % |
| YOLOv8n | 93.1 | 86.1 | 91.8 | 73.1 |
| +SE | 95.5 | 86.7 | 90.9 | 71.7 |
| +ECA | 93.9 | 84.9 | 91.1 | 72.5 |
| +CBAM | 92.9 | 87.2 | 91.4 | 72.6 |
| +GAM | 95.4 | 87.4 | 91.4 | 73.5 |
), ArticleFig(id=1180089383408517370, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=EN, label=Table 6, caption=
Comparison experiment of different algorithms
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 准确率/ % | 召回率/ % | mAP@0.5/ % | FPS | 体积/ MB |
| Faster R-CNN | 86.5 | 77.7 | 86.9 | 8.00 | 108.00 |
| YOLOv3 | 93.1 | 86.4 | 90.4 | 6.33 | 235.00 |
| YOLOv5s | 92.4 | 89.7 | 90.2 | 27.77 | 13.80 |
| YOLOv7-tiny | 92.1 | 85.3 | 91.0 | 38.81 | 11.70 |
| YOLOv8n | 93.1 | 86.1 | 91.8 | 43.11 | 5.98 |
| CBAM-YOLOv8[17] | 91.6 | 87.8 | 91.1 | 52.18 | 7.00 |
| YOLOv9s | 95.3 | 87.6 | 91.1 | 24.13 | 19.30 |
| YOLOv10n | 95.5 | 85.9 | 90.6 | 65.79 | 5.53 |
| DGA-YOLOv8 | 96.4 | 87.3 | 92.2 | 43.55 | 10.60 |
), ArticleFig(id=1180089383467237627, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149774733274739464, language=CN, label=表6, caption=
不同算法对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 准确率/ % | 召回率/ % | mAP@0.5/ % | FPS | 体积/ MB |
| Faster R-CNN | 86.5 | 77.7 | 86.9 | 8.00 | 108.00 |
| YOLOv3 | 93.1 | 86.4 | 90.4 | 6.33 | 235.00 |
| YOLOv5s | 92.4 | 89.7 | 90.2 | 27.77 | 13.80 |
| YOLOv7-tiny | 92.1 | 85.3 | 91.0 | 38.81 | 11.70 |
| YOLOv8n | 93.1 | 86.1 | 91.8 | 43.11 | 5.98 |
| CBAM-YOLOv8[17] | 91.6 | 87.8 | 91.1 | 52.18 | 7.00 |
| YOLOv9s | 95.3 | 87.6 | 91.1 | 24.13 | 19.30 |
| YOLOv10n | 95.5 | 85.9 | 90.6 | 65.79 | 5.53 |
| DGA-YOLOv8 | 96.4 | 87.3 | 92.2 | 43.55 | 10.60 |
)], attaches=null, journal=Journal(id=1146119176004939786, delFlag=0, nameCn=科学技术与工程, nameEn=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, issn=1671-1815, eissn=, cn=11-4688/T, coden=null, periodic=4, language=CN, oaType=是, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=UKU/O7GSka5polgCTkbIIw==, journalPrice=null, startedYear=null, abbrevIsoEn=Sci Technol Eng, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1754445529766, createdBy=null, updatedBy=13701087609, firstLetterCn=S, firstLetterEn=S, subjectCode=Natural Sciences, subjectName=自然科学, subjectCodeEn=Natural Sciences, subjectNameEn=null, picCn=UKU/O7GSka5polgCTkbIIw==, picEn=5hwlULoNwcbj3xUmVi9MAQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1159791870395564357, language=CN, name=科学技术与工程, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529793, updatedTime=1754445529793, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=http://www.stae.com.cn/jsygc/site/menus/20090429150146001, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1159791870441701702, language=EN, name=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529804, updatedTime=1754445529804, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1146123166801305609, websiteList=[Website(id=1148243202391400884, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/CN, language=CN, createTime=1751692112777, createBy=18614031015, updateTime=1753520965431, updateBy=18614031015, name=科学技术与工程-中文站点, tplId=1146099689490845704, title=科学技术与工程, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148622798802673703, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=articleTextType, value=kx, createTime=1751782615614, updateTime=1751782615614, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798781702180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=banner, value=null, createTime=1751782615609, updateTime=1751782615609, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798769119267, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1751782615606, updateTime=1751782615606, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798794285094, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782615612, updateTime=1751782615612, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798790090789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782615611, updateTime=1751782615611, creator=18614031015, updator=18614031015)]), Website(id=1155914124811976731, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/EN, language=EN, createTime=1753521003206, createBy=18614031015, updateTime=1753521003206, updateBy=18614031015, name=科学技术与工程-英文站点, tplId=1146101810881728533, title=Science Technology and Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155914371227308235, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=articleTextType, value=kx, createTime=1753521061952, updateTime=1753521061952, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371210531016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=banner, value=null, createTime=1753521061947, updateTime=1753521061947, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371202142407, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1753521061945, updateTime=1753521061945, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371223113930, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753521061950, updateTime=1753521061950, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371218919625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753521061949, updateTime=1753521061949, creator=18614031015, updator=18614031015)])], journalTitle=科学技术与工程, weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Science Technology and Engineering, journalPhotoCn=UKU/O7GSka5polgCTkbIIw==, journalPhotoEn=5hwlULoNwcbj3xUmVi9MAQ==, journalFirstLetter=S, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/10.12404/j.issn.1671-1815.2403743, detailUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/10.12404/j.issn.1671-1815.2403743, pdfUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/PDF/10.12404/j.issn.1671-1815.2403743, pdfUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/PDF/10.12404/j.issn.1671-1815.2403743, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)