Article(id=1251893512128639586, tenantId=1146029695717560320, journalId=1251234473337991274, issueId=1251893504037831074, articleNumber=null, orderNo=null, doi=10.3969/j.issn.1003-3114.2025.05.015, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1747065600000, receivedDateStr=2025-05-13, revisedDate=null, revisedDateStr=null, acceptedDate=null, acceptedDateStr=null, onlineDate=1776404272348, onlineDateStr=2026-04-17, pubDate=1758124800000, pubDateStr=2025-09-18, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1776404272348, onlineIssueDateStr=2026-04-17, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1776404272348, creator=13701087609, updateTime=1776404272348, updator=13701087609, issue=Issue{id=1251893504037831074, tenantId=1146029695717560320, journalId=1251234473337991274, year='2025', volume='51', issue='5', pageStart='877', pageEnd='1134', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1776404270419, creator=13701087609, updateTime=1776404832543, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1251895861849043019, tenantId=1146029695717560320, journalId=1251234473337991274, issueId=1251893504037831074, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1251895861849043020, tenantId=1146029695717560320, journalId=1251234473337991274, issueId=1251893504037831074, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=1025, endPage=1035, ext={EN=ArticleExt(id=1251893512413852269, articleId=1251893512128639586, tenantId=1146029695717560320, 
journalId=1251234473337991274, language=EN, title=Enhanced Estimation Algorithm Based on YOLOv8n-Pose Key Point Features, columnId=1251893508886446519, journalTitle=Radio Communications Technology, columnName=Special Topic:Frontiers in Intelligent Communication, Storage, and Information Processing Technologies, runingTitle=null, highlight=null, articleAbstract=
Existing key point detection algorithms tend to suffer from reduced detection precision, missed detections, or misaligned key points in scenarios with varying lighting conditions and dense crowds with overlapping figures. To address this issue, an improved LBW-YOLOv8n-Pose algorithm for multi-person pose estimation in complex environments is proposed based on YOLOv8n-Pose. By introducing the Large Separable Kernel Attention (LSKA) in the Spatial Pyramid Pooling-Fast (SPPF) layer of the feature extraction backbone network, the algorithm enhances the image feature representation and perception capabilities. A weighted Bidirectional Feature Pyramid Network (BiFPN) is incorporated in the neck network for reconstruction to improve the multi-scale feature fusion effect. Additionally, an improved Wise-IoU loss function is adopted to accelerate the model's convergence speed and enhance its robustness in complex scenarios. Experimental results show that the improved model achieves precision, recall, and average detection precision of 85.7%, 76.8%, and 81.7% respectively on the MS-COCO2017 human key point dataset, representing significant improvements over the original model. Moreover, it can more accurately and effectively detect key point information of multiple people in complex situations.
, correspAuthors=Bo HU, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Xiantao YIN, Bo HU, Sizhao LI), CN=ArticleExt(id=1251893522446627814, articleId=1251893512128639586, tenantId=1146029695717560320, journalId=1251234473337991274, language=CN, title=基于YOLOv8n-Pose关键点特征增强估计算法, columnId=1251893509079384505, journalTitle=无线电通信技术, columnName=专题:智能通信、存储与信息处理技术前沿, runingTitle=null, highlight=null, articleAbstract=
现有关键点检测算法在光照变化、人员密集交叉遮挡等情况下,易导致检测精度降低、漏检或关键点检测错位的问题。针对该问题,提出基于YOLOv8n-Pose改进的LBW-YOLOv8n-Pose复杂环境多人人体姿态估计算法。通过在特征提取主干网络的快速空间金字塔池化(Spatial Pyramid Pooling-Fast,SPPF)层引入大核可分离注意力(Large Separable Kernel Attention,LSKA),增强图像特征表达能力和感知能力。在颈部网络引入加权双向特征金字塔网络(Bidirectional Feature Pyramid Network,BiFPN)进行重构,提高多尺度特征融合效果,并采用改进的Wise-IoU损失函数,提升模型收敛速度与复杂场景下的鲁棒性。实验结果表明,改进后模型在MS-COCO2017人体关键点数据集上精确率、召回率、平均精度值分别达到85.7%、76.8%、81.7%,相比原模型均有明显提升,且能更精准、有效地检测复杂情况下多人人体关键点信息。
, correspAuthors=胡波, authorNote=null, correspAuthorsNote=
胡波 男,(1980—),硕士,副教授。主要研究方向:嵌入式系统、AI、模糊系统。
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=YaRp40qKX1ivDbnIV9ksjQ==, magXml=q4f2P6EMdlxpbbaYemHIVA==, pdfUrl=null, pdf=YlukcumegG3AEqApopgWew==, pdfFileSize=14692998, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=er0TL6twC5Oq796QyLKqYA==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=AaPjtGpSNMENpUBAPqokRQ==, mapNumber=null, authorCompany=null, fund=null, authors=
殷贤涛 男,(1998—),硕士研究生。主要研究方向:嵌入式系统、AI。
李思照 男,(1982—),博士,副教授。主要研究方向:AI芯片、新型存储架构。
, authorsList=殷贤涛, 胡波, 李思照)}, authors=[Author(id=1251895520919240941, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251895521061847284, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, authorId=1251895520919240941, language=EN, stringName=Xiantao YIN, firstName=Xiantao, middleName=null, lastName=YIN, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1.School of Big Data and Computer Science, Guizhou Normal University, Guiyang 550025, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251895521162510588, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, authorId=1251895520919240941, language=CN, stringName=殷贤涛, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1.贵州师范大学 大数据与计算机科学学院,贵州 贵阳 550025, bio={"content":"
殷贤涛 男,(1998—),硕士研究生。主要研究方向:嵌入式系统、AI。
"}, bioImg=null, bioContent=
殷贤涛 男,(1998—),硕士研究生。主要研究方向:嵌入式系统、AI。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251895520554336470, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, xref=1., ext=[AuthorCompanyExt(id=1251895520566919383, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520554336470, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.School of Big Data and Computer Science, Guizhou Normal University, Guiyang 550025, China), AuthorCompanyExt(id=1251895520587890905, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520554336470, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.贵州师范大学 大数据与计算机科学学院,贵州 贵阳 550025)])]), Author(id=1251895521246396676, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1251895521342865674, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, authorId=1251895521246396676, language=EN, stringName=Bo HU, firstName=Bo, middleName=null, lastName=HU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, *, address=
1.School of Big Data and Computer Science, Guizhou Normal University, Guiyang 550025, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251895521435140369, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, authorId=1251895521246396676, language=CN, stringName=胡波, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, *, address=
1.贵州师范大学 大数据与计算机科学学院,贵州 贵阳 550025, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251895520554336470, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, xref=1., ext=[AuthorCompanyExt(id=1251895520566919383, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520554336470, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.School of Big Data and Computer Science, Guizhou Normal University, Guiyang 550025, China), AuthorCompanyExt(id=1251895520587890905, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520554336470, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.贵州师范大学 大数据与计算机科学学院,贵州 贵阳 550025)])]), Author(id=1251895521544192282, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251895521628078368, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, authorId=1251895521544192282, language=EN, stringName=Sizhao LI, firstName=Sizhao, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2.College of Computer Science and Technology, Harbin Engineering University, Harbin 150001, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251895521758101797, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, authorId=1251895521544192282, language=CN, stringName=李思照, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2.哈尔滨工程大学 计算机科学与技术学院,黑龙江 哈尔滨 150001, bio={"content":"
李思照 男,(1982—),博士,副教授。主要研究方向:AI芯片、新型存储架构。
"}, bioImg=null, bioContent=
李思照 男,(1982—),博士,副教授。主要研究方向:AI芯片、新型存储架构。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251895520759857381, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, xref=2., ext=[AuthorCompanyExt(id=1251895520768245990, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520759857381, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2.College of Computer Science and Technology, Harbin Engineering University, Harbin 150001, China), AuthorCompanyExt(id=1251895520776634599, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520759857381, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2.哈尔滨工程大学 计算机科学与技术学院,黑龙江 哈尔滨 150001)])])], keywords=[Keyword(id=1251895522018148657, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, orderNo=1, keyword=pose estimation), Keyword(id=1251895522143977784, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, orderNo=2, keyword=attention mechanism), Keyword(id=1251895522253029693, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, orderNo=3, keyword=YOLOv8n-Pose), Keyword(id=1251895522366275908, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, orderNo=1, keyword=姿态估计), Keyword(id=1251895522479522122, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, orderNo=2, keyword=注意力机制), Keyword(id=1251895522609545553, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, orderNo=3, keyword=YOLOv8n-Pose)], refs=[Reference(id=1251895527353303569, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=56, issue=4, pageStart=11, pageEnd=20, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=王珂, 陈启腾, 陈伟, journalName=郑州大学学报(理学版), refType=null, unstructuredReference=王珂,陈启腾,陈伟,
等.基于深度学习的二维人体姿态估计综述[J].
郑州大学学报(理学版),
2024,
56(4):11-20., articleTitle=基于深度学习的二维人体姿态估计综述, refAbstract=null), Reference(id=1251895527470744089, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=1653, pageEnd=1660, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=TOSHEV A, SZEGEDY C, journalName=null, refType=null, unstructuredReference=
TOSHEV A,
SZEGEDY C. DeepPose:Human Pose Estimation via Deep Neural Networks[C]//Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Columbus:IEEE,
2014:1653-1660., articleTitle=DeepPose:Human Pose Estimation via Deep Neural Networks, refAbstract=null), Reference(id=1251895527575601695, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=7291, pageEnd=7299, url=null, language=null, rfNumber=[3], rfOrder=2, authorNames=CAO Z, SIMON T, WEI S E, journalName=null, refType=null, unstructuredReference=
CAO Z,
SIMON T,
WEI S E,
et al. Realtime Multi-person 2D Pose Estimation Using Part Affinity Fields[C]//Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Honolulu:IEEE,
2017:7291-7299., articleTitle=Realtime Multi-person 2D Pose Estimation Using Part Affinity Fields, refAbstract=null), Reference(id=1251895527680459302, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=5386, pageEnd=5395, url=null, language=null, rfNumber=[4], rfOrder=3, authorNames=CHENG B W, XIAO B D, WANG J, journalName=null, refType=null, unstructuredReference=
CHENG B W,
XIAO B D,
WANG J,
et al. HigherHRNet:Scale-aware Representation Learning for Bottom-up Human Pose Estimation[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle:IEEE,
2020:5386-5395., articleTitle=HigherHRNet:Scale-aware Representation Learning for Bottom-up Human Pose Estimation, refAbstract=null), Reference(id=1251895527764345386, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2022, volume=45, issue=6, pageStart=7157, pageEnd=7173, url=null, language=null, rfNumber=[5], rfOrder=4, authorNames=FANG H S, LI J F, TANG H Y, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
FANG H S,
LI J F,
TANG H Y,
et al. Alphapose:Wholebody Regional Multi-person Pose Estimation and Tracking in Real-time[J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2022,
45(6):7157-7173., articleTitle=Alphapose:Wholebody Regional Multi-person Pose Estimation and Tracking in Real-time, refAbstract=null), Reference(id=1251895529341403698, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2017, volume=39, issue=6, pageStart=1137, pageEnd=1149, url=null, language=null, rfNumber=[6], rfOrder=5, authorNames=REN S Q, HE K M, GIRSHICK R, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
REN S Q,
HE K M,
GIRSHICK R,
et al. Faster R-CNN:Towards Real-time Object Detection with Region Proposal Networks[J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2017,
39(6):1137-1149., articleTitle=Faster R-CNN:Towards Real-time Object Detection with Region Proposal Networks, refAbstract=null), Reference(id=1251895529437872697, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=21, pageEnd=37, url=null, language=null, rfNumber=[7], rfOrder=6, authorNames=LIU W, ANGUELOV D, ERHAN D, journalName=null, refType=null, unstructuredReference=
LIU W,
ANGUELOV D,
ERHAN D,
et al. SSD: Single Shot Multibox Detector[C]//European Conference on Computer Vision. Amsterdam:Springer International Publishing,
2016:21-37., articleTitle=SSD: Single Shot Multibox Detector, refAbstract=null), Reference(id=1251895529572090438, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=779, pageEnd=788, url=null, language=null, rfNumber=[8], rfOrder=7, authorNames=REDMON J, DIVVALA S, GIRSHICK R, journalName=null, refType=null, unstructuredReference=
REDMON J,
DIVVALA S,
GIRSHICK R,
et al. You Only Look Once:Unified,Real-time Object Detection[C]//Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Las Vegas:IEEE,
2016:779-788., articleTitle=You Only Look Once:Unified,Real-time Object Detection, refAbstract=null), Reference(id=1251895529714696785, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025, volume=19, issue=3, pageStart=682, pageEnd=692, url=null, language=null, rfNumber=[9], rfOrder=8, authorNames=傅裕, 高树辉, journalName=计算机科学与探索, refType=null, unstructuredReference=傅裕,高树辉.改进YOLOv8s-Pose多人姿态估计轻量化模型研究[J].
计算机科学与探索,
2025,
19(3):682-692., articleTitle=改进YOLOv8s-Pose多人姿态估计轻量化模型研究, refAbstract=null), Reference(id=1251895529853108826, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025, volume=42, issue=3, pageStart=270, pageEnd=277, url=null, language=null, rfNumber=[10], rfOrder=9, authorNames=闻举, 伊力哈木·亚尔买买提, journalName=计算机仿真, refType=null, unstructuredReference=闻举,伊力哈木·亚尔买买提.针对太极动作的轻量级人体姿态估计[J].
计算机仿真,
2025,
42(3):270-277., articleTitle=针对太极动作的轻量级人体姿态估计, refAbstract=null), Reference(id=1251895529941189216, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=2637, pageEnd=2646, url=null, language=null, rfNumber=[11], rfOrder=10, authorNames=MAJI D, NAGORI S, MATHEW M, journalName=null, refType=null, unstructuredReference=
MAJI D,
NAGORI S,
MATHEW M,
et al. YOLO-Pose:Enhancing YOLO for Multi Person Pose Estimation Using Object Keypoint Similarity Loss[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition.New Orleans:IEEE,
2022:2637-2646., articleTitle=YOLO-Pose:Enhancing YOLO for Multi Person Pose Estimation Using Object Keypoint Similarity Loss, refAbstract=null), Reference(id=1251895530037658214, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=2117, pageEnd=2125, url=null, language=null, rfNumber=[12], rfOrder=11, authorNames=LIN T Y, DOLLAR P, GIRSHICK R, journalName=null, refType=null, unstructuredReference=
LIN T Y,
DOLLAR P,
GIRSHICK R,
et al. Feature Pyramid Networks for Object Detection[C]//Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Honolulu:IEEE,
2017:2117-2125., articleTitle=Feature Pyramid Networks for Object Detection, refAbstract=null), Reference(id=1251895530150904428, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=8759, pageEnd=8768, url=null, language=null, rfNumber=[13], rfOrder=12, authorNames=LIU S, QI L, QIN H F, journalName=null, refType=null, unstructuredReference=
LIU S,
QI L,
QIN H F,
et al. Path Aggregation Network for Instance Segmentation[C]//Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Salt Lake City:IEEE,
2018:8759-8768., articleTitle=Path Aggregation Network for Instance Segmentation, refAbstract=null), Reference(id=1251895530259956340, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=18, issue=null, pageStart=1355857, pageEnd=null, url=null, language=null, rfNumber=[14], rfOrder=13, authorNames=YUAN Z J, SHAO P W, LI J R, journalName=Frontiers in Neurorobotics, refType=null, unstructuredReference=
YUAN Z J,
SHAO P W,
LI J R,
et al. YOLOv8-ACU:Improved YOLOv8-Pose for Facial Acupoint Detection[J].
Frontiers in Neurorobotics,
2024,
18:1355857., articleTitle=YOLOv8-ACU:Improved YOLOv8-Pose for Facial Acupoint Detection, refAbstract=null), Reference(id=1251895530385785464, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=60, issue=17, pageStart=203, pageEnd=215, url=null, language=null, rfNumber=[15], rfOrder=14, authorNames=高民, 陈高华, 古佳欣, journalName=计算机工程与应用, refType=null, unstructuredReference=高民,陈高华,古佳欣,
等.FLM-YOLOv8:一种轻量级的口罩佩戴检测算法[J].
计算机工程与应用,
2024,
60(17):203-215., articleTitle=FLM-YOLOv8:一种轻量级的口罩佩戴检测算法, refAbstract=null), Reference(id=1251895530473865852, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2023, volume=9, issue=4, pageStart=733, pageEnd=752, url=null, language=null, rfNumber=[16], rfOrder=15, authorNames=GUO M H, LU C Z, LIU Z N, journalName=Computational Visual Media, refType=null, unstructuredReference=
GUO M H,
LU C Z,
LIU Z N,
et al. Visual Attention Network[J].
Computational Visual Media,
2023,
9(4):733-752., articleTitle=Visual Attention Network, refAbstract=null), Reference(id=1251895530574529155, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=236, issue=null, pageStart=121352, pageEnd=null, url=null, language=null, rfNumber=[17], rfOrder=16, authorNames=LAU K W, PO L M, REHMAN Y A U, journalName=Expert Systems with Applications, refType=null, unstructuredReference=
LAU K W,
PO L M,
REHMAN Y A U. Large Separable Kernel Attention:Rethinking the Large Kernel Attention Design in CNN[J].
Expert Systems with Applications,
2024,
236:121352., articleTitle=Large Separable Kernel Attention:Rethinking the Large Kernel Attention Design in CNN, refAbstract=null), Reference(id=1251895530683581064, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[18], rfOrder=17, authorNames=王伊萌, journalName=基于感受野的多层级特征融合交通标志检测算法研究, refType=null, unstructuredReference=王伊萌.
基于感受野的多层级特征融合交通标志检测算法研究[D].西安:长安大学,
2024., articleTitle=null, refAbstract=null), Reference(id=1251895530784244366, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=60, issue=9, pageStart=79, pageEnd=89, url=null, language=null, rfNumber=[19], rfOrder=18, authorNames=史涛, 崔杰, 李松, journalName=计算机工程与应用, refType=null, unstructuredReference=史涛,崔杰,李松.优化改进YOLOv8实现实时无人机车辆检测的算法[J].
计算机工程与应用,
2024,
60(9):79-89., articleTitle=优化改进YOLOv8实现实时无人机车辆检测的算法, refAbstract=null), Reference(id=1251895530918462098, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025, volume=25, issue=5, pageStart=1405, pageEnd=null, url=null, language=null, rfNumber=[20], rfOrder=19, authorNames=WANG Y, OUYANG C, PENG H, journalName=Sensors, refType=null, unstructuredReference=
WANG Y,
OUYANG C,
PENG H,
et al. YOLO-ALW:An Enhanced High-precision Model for Chili Maturity Detection[J].
Sensors,
2025,
25(5):1405., articleTitle=YOLO-ALW:An Enhanced High-precision Model for Chili Maturity Detection, refAbstract=null), Reference(id=1251895531044291224, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=20, pageStart=6506, pageEnd=null, url=null, language=null, rfNumber=[21], rfOrder=20, authorNames=ZHOU Q, WANG Z, ZHONG Y W, journalName=Sensors, refType=null, unstructuredReference=
ZHOU Q,
WANG Z,
ZHONG Y W,
et al. Efficient Optimized YOLOv8 Model with Extended Vision[J].
Sensors,
2024,
24(20):6506., articleTitle=Efficient Optimized YOLOv8 Model with Extended Vision, refAbstract=null), Reference(id=1251895531170120353, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=13, pageStart=4088, pageEnd=null, url=null, language=null, rfNumber=[22], rfOrder=21, authorNames=WANG C J, WANG Y F, journalName=Sensors, refType=null, unstructuredReference=
WANG C J,
WANG Y F. SLGA-YOLO: A Lightweight Castings Surface Defect Detection Method Based on Fusion-enhanced Attention Mechanism and Self-architecture[J].
Sensors,
2024,
24(13):4088., articleTitle=SLGA-YOLO: A Lightweight Castings Surface Defect Detection Method Based on Fusion-enhanced Attention Mechanism and Self-architecture, refAbstract=null), Reference(id=1251895531237229224, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=14, issue=1, pageStart=429, pageEnd=null, url=null, language=null, rfNumber=[23], rfOrder=22, authorNames=LI N, YE T R, ZHOU Z H, journalName=Applied Sciences, refType=null, unstructuredReference=
LI N,
YE T R,
ZHOU Z H,
et al. Enhanced YOLOv8 with BiFPN-SimAM for Precise Defect Detection in Miniature Capacitors[J].
Applied Sciences,
2024,
14(1):429., articleTitle=Enhanced YOLOv8 with BiFPN-SimAM for Precise Defect Detection in Miniature Capacitors, refAbstract=null), Reference(id=1251895531337892527, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=10781, pageEnd=10790, url=null, language=null, rfNumber=[24], rfOrder=23, authorNames=TAN M, PANG R, LE Q V, journalName=null, refType=null, unstructuredReference=
TAN M,
PANG R,
LE Q V. Efficientdet:Scalable and Efficient Object Detection[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle:IEEE,
2020:10781-10790., articleTitle=Efficientdet:Scalable and Efficient Object Detection, refAbstract=null), Reference(id=1251895531417584309, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025, volume=62, issue=2, pageStart=441, pageEnd=455, url=null, language=null, rfNumber=[25], rfOrder=24, authorNames=王新蕾, 廖晨旭, 王硕, journalName=激光与光电子学进展, refType=null, unstructuredReference=王新蕾,廖晨旭,王硕,
等.面向鱼眼摄像头目标检测的轻量级网络[J].
激光与光电子学进展,
2025,
62(2):441-455., articleTitle=面向鱼眼摄像头目标检测的轻量级网络, refAbstract=null), Reference(id=1251895531505664701, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2020, volume=34, issue=7, pageStart=12993, pageEnd=13000, url=null, language=null, rfNumber=[26], rfOrder=25, authorNames=ZHENG Z H, WANG P, LIU W, journalName=null, refType=null, unstructuredReference=
ZHENG Z H,
WANG P,
LIU W,
et al. Distance-IoU Loss:Faster and Better Learning for Bounding Box Regression[C]//Proceedings of the AAAI Conference on Artificial Intelligence. Palo Alto:AAAI Press,
2020,
34(7):12993-13000., articleTitle=Distance-IoU Loss:Faster and Better Learning for Bounding Box Regression, refAbstract=null), Reference(id=1251895531618910915, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025, volume=36, issue=5, pageStart=1054, pageEnd=1064, url=null, language=null, rfNumber=[27], rfOrder=26, authorNames=罗亮, 郎霄, 祖国庆, journalName=中国机械工程, refType=null, unstructuredReference=罗亮,郎霄,祖国庆,
等.一种基于改进YOLOv8n的气缸套缺陷检测方法[J].
中国机械工程,
2025,
36(5):1054-1064., articleTitle=一种基于改进YOLOv8n的气缸套缺陷检测方法, refAbstract=null), Reference(id=1251895531702797001, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=15, issue=5, pageStart=737, pageEnd=null, url=null, language=null, rfNumber=[28], rfOrder=27, authorNames=YAO J S, SONG B, CHEN X Y, journalName=Forests, refType=null, unstructuredReference=
YAO J S,
SONG B,
CHEN X Y,
et al. Pine-YOLO: A Method for Detecting Pine Wilt Disease in Unmanned Aerial Vehicle Remote Sensing Images[J].
Forests,
2024,
15(5):737., articleTitle=Pine-YOLO: A Method for Detecting Pine Wilt Disease in Unmanned Aerial Vehicle Remote Sensing Images, refAbstract=null), Reference(id=1251895531853791952, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025, volume=51, issue=1, pageStart=196, pageEnd=209, url=null, language=null, rfNumber=[29], rfOrder=28, authorNames=张朝阳, 张上, 胡益民, journalName=无线电通信技术, refType=null, unstructuredReference=张朝阳,张上,胡益民,
等.动态聚焦多维注意力遥感弱小目标检测[J].
无线电通信技术,
2025,
51(1):196-209., articleTitle=动态聚焦多维注意力遥感弱小目标检测, refAbstract=null), Reference(id=1251895531975426772, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025-05-12, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[30], rfOrder=29, authorNames=TONG Z J, CHEN Y H, XU Z W, journalName=null, refType=null, unstructuredReference=
TONG Z J,
CHEN Y H,
XU Z W,
et al. Wise-IoU:Bounding Box Regression Loss with Dynamic Focusing Mechanism[EB/OL]. (2023-01-24)[
2025-05-12].
https://arxiv.org/abs/2301.10051., articleTitle=Wise-IoU:Bounding Box Regression Loss with Dynamic Focusing Mechanism, refAbstract=null), Reference(id=1251895532050924250, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=19, pageStart=8267, pageEnd=null, url=null, language=null, rfNumber=[31], rfOrder=30, authorNames=RAN X S, HE S, LI R, journalName=Sensors, refType=null, unstructuredReference=
RAN X S,
HE S,
LI R. Research on Fatigued-driving Detection Method by Integrating Lightweight YOLOv5s and Facial 3D Keypoints[J].
Sensors,
2023,
23(19):8267., articleTitle=Research on Fatigued-driving Detection Method by Integrating Lightweight YOLOv5s and Facial 3D Keypoints, refAbstract=null), Reference(id=1251895532134810335, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=5694, pageEnd=5703, url=null, language=null, rfNumber=[32], rfOrder=31, authorNames=MA X Y, DAI X L, BAI Y F, journalName=null, refType=null, unstructuredReference=
MA X Y,
DAI X L,
BAI Y F,
et al. Rewrite the Stars[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle: IEEE,
2024:5694-5703., articleTitle=Rewrite the Stars, refAbstract=null), Reference(id=1251895532214502115, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=12021, pageEnd=12031, url=null, language=null, rfNumber=[33], rfOrder=32, authorNames=CHEN J R, KAO S H, HE H, journalName=null, refType=null, unstructuredReference=
CHEN J R,
KAO S H,
HE H,
et al. Run,Don't Walk:Chasing Higher FLOPS for Faster Neural Networks[C]//Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Vancouver: IEEE,
2023:12021-12031., articleTitle=Run,Don't Walk:Chasing Higher FLOPS for Faster Neural Networks, refAbstract=null), Reference(id=1251895533791560428, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2022, volume=35, issue=null, pageStart=4203, pageEnd=4217, url=null, language=null, rfNumber=[34], rfOrder=33, authorNames=YANG J W, LI C Y, DAI X Y, journalName=Advances in Neural Information Processing Systems, refType=null, unstructuredReference=
YANG J W,
LI C Y,
DAI X Y,
et al. Focal Modulation Networks[J].
Advances in Neural Information Processing Systems,
2022,
35:4203-4217., articleTitle=Focal Modulation Networks, refAbstract=null), Reference(id=1251895533900612339, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=1, pageStart=8861446, pageEnd=null, url=null, language=null, rfNumber=[35], rfOrder=34, authorNames=LI L H, ZHAO S W, SUN R Z, journalName=Computational Intelligence and Neuroscience, refType=null, unstructuredReference=
LI L H,
ZHAO S W,
SUN R Z,
et al. AFI-Net:Attention-guided Feature Integration Network for RGBD Saliency Detection[J].
Computational Intelligence and Neuroscience,
2021(1):8861446., articleTitle=AFI-Net:Attention-guided Feature Integration Network for RGBD Saliency Detection, refAbstract=null), Reference(id=1251895533984498424, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=21, issue=3, pageStart=62, pageEnd=null, url=null, language=null, rfNumber=[36], rfOrder=35, authorNames=LI H L, LI J, WEI H B, journalName=Journal of Real-time Image Processing, refType=null, unstructuredReference=
LI H L,
LI J,
WEI H B,
et al. Slim-neck by GSConv:A Lightweight-design for Real-time Detector Architectures[J].
Journal of Real-time Image Processing,
2024,
21(3):62., articleTitle=Slim-neck by GSConv:A Lightweight-design for Real-time Detector Architectures, refAbstract=null), Reference(id=1251895534131299070, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025-05-12, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[37], rfOrder=36, authorNames=XU X Z, JIANG Y Q, CHEN W H, journalName=null, refType=null, unstructuredReference=
XU X Z,
JIANG Y Q,
CHEN W H,
et al. DAMO-YOLO:A Report on Real-time Object Detection Design[EB/OL]. (2022-11-23)[
2025-05-12].
https://arxiv.org/abs/2211.15444., articleTitle=DAMO-YOLO:A Report on Real-time Object Detection Design, refAbstract=null), Reference(id=1251895534219379459, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2025-04-15, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[38], rfOrder=37, authorNames=LI C Y, LI L L, GENG Y F, journalName=null, refType=null, unstructuredReference=
LI C Y,
LI L L,
GENG Y F,
et al. YOLOv6 v3.0: A Full-scale Reloading[EB/OL]. (2023-01-13)[
2025-04-15].
https://arxiv.org/abs/2301.05586., articleTitle=YOLOv6 v3.0: A Full-scale Reloading, refAbstract=null), Reference(id=1251895534299071242, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, doi=null, pmid=null, pmcid=null, year=2024, volume=147, issue=null, pageStart=105057, pageEnd=null, url=null, language=null, rfNumber=[39], rfOrder=38, authorNames=KANG M, TING C M, TING F F, journalName=Image and Vision Computing, refType=null, unstructuredReference=
KANG M,
TING C M,
TING F F,
et al. ASF-YOLO:A Novel YOLO Model with Attentional Scale Sequence Fusion for Cell Instance Segmentation[J].
Image and Vision Computing,
2024,
147:105057., articleTitle=ASF-YOLO:A Novel YOLO Model with Attentional Scale Sequence Fusion for Cell Instance Segmentation, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1251895520554336470, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, xref=1., ext=[AuthorCompanyExt(id=1251895520566919383, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520554336470, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.School of Big Data and Computer Science, Guizhou Normal University, Guiyang 550025, China), AuthorCompanyExt(id=1251895520587890905, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520554336470, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.贵州师范大学 大数据与计算机科学学院,贵州 贵阳 550025)]), AuthorCompany(id=1251895520759857381, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, xref=2., ext=[AuthorCompanyExt(id=1251895520768245990, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520759857381, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2.College of Computer Science and Technology, Harbin Engineering University, Harbin 150001, China), AuthorCompanyExt(id=1251895520776634599, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, companyId=1251895520759857381, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2.哈尔滨工程大学 计算机科学与技术学院,黑龙江 哈尔滨 150001)])], figs=[ArticleFig(id=1251895522890563935, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 1, caption=
Improved network structure of YOLOv8n-Pose, figureFileSmall=ZlMpyEui6Ek186WeIQFBAg==, figureFileBig=er0TL6twC5Oq796QyLKqYA==, tableContent=null), ArticleFig(id=1251895522982838627, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图1, caption=
YOLOv8n-Pose改进网络结构, figureFileSmall=ZlMpyEui6Ek186WeIQFBAg==, figureFileBig=er0TL6twC5Oq796QyLKqYA==, tableContent=null), ArticleFig(id=1251895523096084841, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 2, caption=
Improved SPPF structure, figureFileSmall=H7rCBlG0IB/fOEg5Vvcbcg==, figureFileBig=D1rQNcPWY1d1tbzjihFXEQ==, tableContent=null), ArticleFig(id=1251895523192553839, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图2, caption=
改进的SPPF结构, figureFileSmall=H7rCBlG0IB/fOEg5Vvcbcg==, figureFileBig=D1rQNcPWY1d1tbzjihFXEQ==, tableContent=null), ArticleFig(id=1251895523280634228, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 3, caption=
Principle of LKA large kernel convolution decomposition, figureFileSmall=pbXMg+Gc69rOZK7duH6PEA==, figureFileBig=Nos8mnMGr8+ukjV6fjm1HQ==, tableContent=null), ArticleFig(id=1251895524891246972, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图3, caption=
LKA大核卷积分解原理, figureFileSmall=pbXMg+Gc69rOZK7duH6PEA==, figureFileBig=Nos8mnMGr8+ukjV6fjm1HQ==, tableContent=null), ArticleFig(id=1251895525000298880, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 4, caption=
LSKA convolution separation calculation principle, figureFileSmall=NP2QV9+/QnqPsKy79gI5TQ==, figureFileBig=48DCrCRDdaU3Xr0xYJKzsQ==, tableContent=null), ArticleFig(id=1251895525084184966, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图4, caption=
LSKA卷积分离计算原理, figureFileSmall=NP2QV9+/QnqPsKy79gI5TQ==, figureFileBig=48DCrCRDdaU3Xr0xYJKzsQ==, tableContent=null), ArticleFig(id=1251895525168071051, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 5, caption=
BiFPN network structure, figureFileSmall=RTot2X66x9ExS/XikwgDNA==, figureFileBig=PMJFyvINPbW8jN+E6oXo9Q==, tableContent=null), ArticleFig(id=1251895525285511572, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图5, caption=
BiFPN网络结构, figureFileSmall=RTot2X66x9ExS/XikwgDNA==, figureFileBig=PMJFyvINPbW8jN+E6oXo9Q==, tableContent=null), ArticleFig(id=1251895525373591960, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 6, caption=
Comparison of the experimental data of the model, figureFileSmall=D36wVKAVj6OAwXvPuEgxfQ==, figureFileBig=0t9p/7dTvnMqgcT6izGwHQ==, tableContent=null), ArticleFig(id=1251895525503615389, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图6, caption=
模型对比实验数据, figureFileSmall=D36wVKAVj6OAwXvPuEgxfQ==, figureFileBig=0t9p/7dTvnMqgcT6izGwHQ==, tableContent=null), ArticleFig(id=1251895525595890086, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 7, caption=
Comparison effect diagram of visualization heat map, figureFileSmall=kCFvaazl4j617KTZvGnaSg==, figureFileBig=Syz3jHPZjkmGLqHvBPJJHw==, tableContent=null), ArticleFig(id=1251895525776245161, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图7, caption=
可视化热力图对比效果, figureFileSmall=kCFvaazl4j617KTZvGnaSg==, figureFileBig=Syz3jHPZjkmGLqHvBPJJHw==, tableContent=null), ArticleFig(id=1251895525881102767, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Fig. 8, caption=
Comparison effect of models, figureFileSmall=ZrjYBHO45nbmfd224ZKsxA==, figureFileBig=bdp5qECrYjKVKv6Ent8lTA==, tableContent=null), ArticleFig(id=1251895525964988851, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=图8, caption=
模型对比效果, figureFileSmall=ZrjYBHO45nbmfd224ZKsxA==, figureFileBig=bdp5qECrYjKVKv6Ent8lTA==, tableContent=null), ArticleFig(id=1251895526074040762, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Tab. 1, caption=
Experimental environment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 名称 | 配置 |
|---|---|
| 操作系统 | Windows 10 |
| 内存/GB | 767 |
| CPU | Intel(R)Xeon(R)Gold 6342 |
| GPU | NVIDIA RTX A6000(47 GB) |
| 开发环境 | PyTorch 1.10.1,CUDA 11.3 |
), ArticleFig(id=1251895526157926843, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=表1, caption=
实验环境
, figureFileSmall=null, figureFileBig=null, tableContent=
| 名称 | 配置 |
|---|---|
| 操作系统 | Windows 10 |
| 内存/GB | 767 |
| CPU | Intel(R)Xeon(R)Gold 6342 |
| GPU | NVIDIA RTX A6000(47 GB) |
| 开发环境 | PyTorch 1.10.1,CUDA 11.3 |
), ArticleFig(id=1251895526237618623, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Tab. 2, caption=
Comparison of ablation experiment results
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验 | SPPF-LSKA | BiFPN | Wise-IoU | P/% | R/% | mAP@0.5/% | mAP@0.5:0.95/% | Params/M |
|---|---|---|---|---|---|---|---|---|
| 1 | × | × | × | 83.8 | 74.1 | 79.5 | 49.2 | 3.3 |
| 2 | √ | × | × | 85.2 | 74.4 | 80.1 | 49.9 | 3.5 |
| 3 | √ | √ | × | 84.6 | 75.3 | 81.3 | 50.9 | 4.0 |
| 4 | √ | √ | √ | 85.7 | 76.8 | 81.7 | 51.1 | 4.0 |
), ArticleFig(id=1251895526342476229, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=表2, caption=
消融实验结果对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验 | SPPF-LSKA | BiFPN | Wise-IoU | P/% | R/% | mAP@0.5/% | mAP@0.5:0.95/% | Params/M |
|---|---|---|---|---|---|---|---|---|
| 1 | × | × | × | 83.8 | 74.1 | 79.5 | 49.2 | 3.3 |
| 2 | √ | × | × | 85.2 | 74.4 | 80.1 | 49.9 | 3.5 |
| 3 | √ | √ | × | 84.6 | 75.3 | 81.3 | 50.9 | 4.0 |
| 4 | √ | √ | √ | 85.7 | 76.8 | 81.7 | 51.1 | 4.0 |
), ArticleFig(id=1251895526459916748, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Tab. 3, caption=
Comparative experiment of feature extraction backbone network
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | Params/M | P/% | R/% | mAP@0.5/% | *mAP@0.5:0.95/% | GFLOPs |
|---|---|---|---|---|---|---|
| YOLOv8n-Pose | 3.3 | 83.9 | 74.0 | 79.3 | 49.3 | 9.3 |
| YOLOv8n-StarNet-Pose | 2.5 | 82.9 | 72.9 | 78.1 | 47.0 | 7.6 |
| YOLOv8n-FastNet-Pose | 4.4 | 84.0 | 76.0 | 80.7 | 50.1 | 11.8 |
| YOLOv8n-FocalModulation-Pose | 3.4 | 84.2 | 74.5 | 79.9 | 50.0 | 9.4 |
| YOLOv8n-AFI-Pose | 3.2 | 84.8 | 74.2 | 80.2 | 49.6 | 9.2 |
| YOLOv8n-Pose+SPPF_LSKA | 3.5 | 85.2 | 74.4 | 80.4 | 49.9 | 9.5 |
), ArticleFig(id=1251895526573162961, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=表3, caption=
特征提取骨干网络对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | Params/M | P/% | R/% | mAP@0.5/% | *mAP@0.5:0.95/% | GFLOPs |
|---|---|---|---|---|---|---|
| YOLOv8n-Pose | 3.3 | 83.9 | 74.0 | 79.3 | 49.3 | 9.3 |
| YOLOv8n-StarNet-Pose | 2.5 | 82.9 | 72.9 | 78.1 | 47.0 | 7.6 |
| YOLOv8n-FastNet-Pose | 4.4 | 84.0 | 76.0 | 80.7 | 50.1 | 11.8 |
| YOLOv8n-FocalModulation-Pose | 3.4 | 84.2 | 74.5 | 79.9 | 50.0 | 9.4 |
| YOLOv8n-AFI-Pose | 3.2 | 84.8 | 74.2 | 80.2 | 49.6 | 9.2 |
| YOLOv8n-Pose+SPPF_LSKA | 3.5 | 85.2 | 74.4 | 80.4 | 49.9 | 9.5 |
), ArticleFig(id=1251895526678020569, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Tab. 4, caption=
Comparison experiment of feature fusion networks
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | P/% | R/% | mAP@0.5/% | mAP@0.5:0.95/% | Params/M | 权重/M |
|---|---|---|---|---|---|---|
| SlimNeck[36] | 82.7 | 73.7 | 78.1 | 46.4 | 3.1 | 6.5 |
| RepGFPN[37] | 83.8 | 74.0 | 79.6 | 49.0 | 3.5 | 7.5 |
| EfficientRepBiPAN[38] | 82.1 | 73.6 | 78.2 | 47.2 | 3.0 | 6.4 |
| ASF[39] | 82.8 | 75.0 | 79.6 | 49.5 | 3.3 | 7.0 |
| BiFPN | 83.6 | 76.1 | 81.1 | 50.9 | 3.7 | 7.8 |
), ArticleFig(id=1251895526770295267, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=表4, caption=
特征融合网络对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | P/% | R/% | mAP@0.5/% | mAP@0.5:0.95/% | Params/M | 权重/M |
|---|---|---|---|---|---|---|
| SlimNeck[36] | 82.7 | 73.7 | 78.1 | 46.4 | 3.1 | 6.5 |
| RepGFPN[37] | 83.8 | 74.0 | 79.6 | 49.0 | 3.5 | 7.5 |
| EfficientRepBiPAN[38] | 82.1 | 73.6 | 78.2 | 47.2 | 3.0 | 6.4 |
| ASF[39] | 82.8 | 75.0 | 79.6 | 49.5 | 3.3 | 7.0 |
| BiFPN | 83.6 | 76.1 | 81.1 | 50.9 | 3.7 | 7.8 |
), ArticleFig(id=1251895526862569961, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Tab. 5, caption=
Comparative experiments of mainstream models
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 图像大小/pixel | Params/M | mAP@0.5/% |
|---|---|---|---|
| YOLOv5s6-Pose | 640×640 | 15.0 | 84.3 |
| YOLOx-Pose-tiny | 416×416 | 6.0 | 79.3 |
| YOLOv7-W6-Pose | 960×960 | 80.0 | 94.0 |
| YOLOv8n-Pose | 640×640 | 3.2 | 79.5 |
| 本文模型 | 640×640 | 4.0 | 81.7 |
), ArticleFig(id=1251895526963233265, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=表5, caption=
主流模型对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 图像大小/pixel | Params/M | mAP@0.5/% |
|---|---|---|---|
| YOLOv5s6-Pose | 640×640 | 15.0 | 84.3 |
| YOLOx-Pose-tiny | 416×416 | 6.0 | 79.3 |
| YOLOv7-W6-Pose | 960×960 | 80.0 | 94.0 |
| YOLOv8n-Pose | 640×640 | 3.2 | 79.5 |
| 本文模型 | 640×640 | 4.0 | 81.7 |
), ArticleFig(id=1251895527076479478, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=EN, label=Tab. 6, caption=
Model generalization experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | P | R | mAP@0.5 | mAP@0.5:0.95 |
|---|---|---|---|---|
| YOLOv8n-Pose | 85.3 | 80.0 | 83.8 | 46.4 |
| YOLOv11n-Pose | 85.0 | 80.0 | 83.8 | 45.9 |
| YOLOv12n-Pose | 84.5 | 79.0 | 82.3 | 43.9 |
| 本文模型 | 85.2 | 81.6 | 84.4 | 47.3 |
), ArticleFig(id=1251895527147782653, tenantId=1146029695717560320, journalId=1251234473337991274, articleId=1251893512128639586, language=CN, label=表6, caption=
模型泛化实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | P | R | mAP@0.5 | mAP@0.5:0.95 |
|---|---|---|---|---|
| YOLOv8n-Pose | 85.3 | 80.0 | 83.8 | 46.4 |
| YOLOv11n-Pose | 85.0 | 80.0 | 83.8 | 45.9 |
| YOLOv12n-Pose | 84.5 | 79.0 | 82.3 | 43.9 |
| 本文模型 | 85.2 | 81.6 | 84.4 | 47.3 |
)], attaches=null, journal=Journal(id=1251231494887223395, delFlag=0, nameCn=无线电通信技术, nameEn=Radio Communications Technology, nameHistory1=null, nameHistory2=null, issn=1003-3114, eissn=, cn=13-1099/TN, coden=null, periodic=1, language=CN, oaType=1, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=, officePhone=, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=veWCdfK9mJVXm/uFgI4wQA==, journalPrice=null, startedYear=null, abbrevIsoEn=Radio Communications Technology, journalRemark=null, publicationField=null, createdTime=1776246435141, updatedTime=1776397604574, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=R, firstLetterEn=R, subjectCode=Engineering, subjectName=工程, subjectCodeEn=Engineering, subjectNameEn=null, picCn=veWCdfK9mJVXm/uFgI4wQA==, picEn=OSQVHuARoHUd1TQ4ONLQrQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1251865545604285354, language=CN, name=无线电通信技术, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1776397604609, updatedTime=1776397604609, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://wxdt.cbpt.cnki.net/index.aspx?t=1, submissionEditorUrl=https://wxdt.cbpt.cnki.net/index.aspx?t=3, submissionReviewUrl=https://wxdt.cbpt.cnki.net/index.aspx?t=2, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1251865545646228395, language=EN, name=Radio Communications Technology, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, 
officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1776397604619, updatedTime=1776397604619, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://wxdt.cbpt.cnki.net/index.aspx?t=1, submissionEditorUrl=https://wxdt.cbpt.cnki.net/index.aspx?t=3, submissionReviewUrl=https://wxdt.cbpt.cnki.net/index.aspx?t=2, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1251234473337991274, websiteList=[Website(id=1251257283515203650, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1251234473337991274, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/wxdtxjs/CN, language=CN, createTime=1776252583627, createBy=18614031015, updateTime=1776253691546, updateBy=18614031015, name=无线电通信技术-中文, tplId=1146099689490845704, title=无线电通信技术, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1251262047678313076, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=articleTextType, value=kx, createTime=1776253719491, updateTime=1776253719491, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047653147249, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=banner, value=null, createTime=1776253719485, updateTime=1776253719485, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047707673207, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=grayFlag, value=0, createTime=1776253719498, updateTime=1776253719498, 
creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047644758640, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=logo, value=https://castjournals.cast.org.cn/joweb/wxdtxjs/CN/file/pic?fileId=sk5LMh+QbAm+98l18HjovQ==, createTime=1776253719483, updateTime=1776253719483, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047720256121, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=minRunFlag, value=0, createTime=1776253719501, updateTime=1776253719501, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047669924467, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/wxdtxjs/CN/file/pic, createTime=1776253719489, updateTime=1776253719489, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047716061816, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=silenceFlag, value=0, createTime=1776253719500, updateTime=1776253719500, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047661535858, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1776253719487, updateTime=1776253719487, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047682507381, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=themeColor, value=null, createTime=1776253719492, updateTime=1776253719492, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262047690895990, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283515203650, code=themeStyle, value=null, createTime=1776253719494, updateTime=1776253719494, 
creator=18614031015, updator=18614031015)]), Website(id=1251257283607478339, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1251234473337991274, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/wxdtxjs/EN, language=EN, createTime=1776252583648, createBy=18614031015, updateTime=1776253687916, updateBy=18614031015, name=无线电通信技术-英文, tplId=1146101810881728533, title=Radio Communications Technology, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1251262071707484468, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=articleTextType, value=kx, createTime=1776253725220, updateTime=1776253725220, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071690707249, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=banner, value=null, createTime=1776253725216, updateTime=1776253725216, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071724261687, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=grayFlag, value=0, createTime=1776253725224, updateTime=1776253725224, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071682318640, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=logo, value=https://castjournals.cast.org.cn/joweb/wxdtxjs/EN/file/pic?fileId=sk5LMh+QbAm+98l18HjovQ==, createTime=1776253725214, updateTime=1776253725214, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071732650297, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=minRunFlag, value=0, 
createTime=1776253725226, updateTime=1776253725226, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071703290163, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/wxdtxjs/EN/file/pic, createTime=1776253725219, updateTime=1776253725219, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071728455992, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=silenceFlag, value=0, createTime=1776253725225, updateTime=1776253725225, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071694901554, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1776253725217, updateTime=1776253725217, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071711678773, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=themeColor, value=null, createTime=1776253725221, updateTime=1776253725221, creator=18614031015, updator=18614031015), WebsiteProps(id=1251262071720067382, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251257283607478339, code=themeStyle, value=null, createTime=1776253725223, updateTime=1776253725223, creator=18614031015, updator=18614031015)])], journalTitle=无线电通信技术, weixinUrl=null, journalUrl=https://wxdt.cbpt.cnki.net/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Radio Communications Technology, journalPhotoCn=veWCdfK9mJVXm/uFgI4wQA==, journalPhotoEn=OSQVHuARoHUd1TQ4ONLQrQ==, journalFirstLetter=R, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, 
totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/wxdtxjs/CN/10.3969/j.issn.1003-3114.2025.05.015, detailUrlEn=https://castjournals.cast.org.cn/joweb/wxdtxjs/EN/10.3969/j.issn.1003-3114.2025.05.015, pdfUrlCn=https://castjournals.cast.org.cn/joweb/wxdtxjs/CN/PDF/10.3969/j.issn.1003-3114.2025.05.015, pdfUrlEn=https://castjournals.cast.org.cn/joweb/wxdtxjs/EN/PDF/10.3969/j.issn.1003-3114.2025.05.015, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)