Article(id=1149781961000051646, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149781952959574654, articleNumber=null, orderNo=null, doi=10.12404/j.issn.1671-1815.2402441, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=research-article, receivedDate=1712332800000, receivedDateStr=2024-04-06, revisedDate=1733414400000, revisedDateStr=2024-12-06, acceptedDate=null, acceptedDateStr=null, onlineDate=1752058981417, onlineDateStr=2025-07-09, pubDate=1743091200000, pubDateStr=2025-03-28, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1752058981417, onlineIssueDateStr=2025-07-09, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1752058981417, creator=13701087609, updateTime=1752058981417, updator=13701087609, issue=Issue{id=1149781952959574654, tenantId=1146029695717560320, journalId=1146123166801305609, year='2025', volume='25', issue='9', pageStart='3529', pageEnd='3967', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=0, createTime=1752058979501, creator=13701087609, updateTime=1776333392421, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1251596220226027613, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149781952959574654, language=EN, specialIssueTitle=, coverIllustrator=, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1251596220226027614, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1149781952959574654, language=CN, specialIssueTitle=, coverIllustrator=, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=3778, endPage=3787, ext={EN=ArticleExt(id=1149781961205572543, articleId=1149781961000051646, tenantId=1146029695717560320, journalId=1146123166801305609, language=EN, title=Small and Medium-sized Obstacle Detection Methods in Intelligent Driving Scenarios, columnId=1156262729162810294, journalTitle=Science Technology and Engineering, columnName=Papers·Automation and Computational Technology, runingTitle=null, highlight=null, articleAbstract=
Aiming at the problems such as small and medium-sized obstacles on the road are prone to miss detection, small target obstacles are difficult to detect, and the number of model parameters is large in smart driving scenarios, the obstacle target detection algorithm with improved YOLOv8n was proposed. Distribution shifting convolution (DSConv) was used in the backbone network to replace floating point operation with integer operation, reducing the amount of redundant computation, and maintaining the accuracy by imitating the original convolution layer by quantization and distribution shifting. By adding small target detection layer, the feature information of small target can be captured better and the scale characteristics of small target can be adapted. Combined with SimAM parameterless attention mechanism, SPPF-SimAM module was introduced to improve the quality and diversity of feature representation, and the detection accuracy was improved without increasing the number of parameters. By combining ghost-shuffle convolution (GSConv) and VoV-GSCSP modules, the neck feature fusion network was lightweight, reducing the number of parameters and calculation of the model. The experimental results show that the accuracy, recall, and mean average precision of the improved model are improved by 1.6%, 8.0%, and 6.2%, respectively. The number of parameters is reduced by 6.7% compared with the original model, and the proposed algorithm effectively improves the detection accuracy of small and medium-sized obstacles in smart driving scenarios, and achieves a better balance between the detection performance and the model lightweighting.
, correspAuthors=Xin-yuan NAN, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Xiao-yu LONG, Xin-yuan NAN), CN=ArticleExt(id=1149781993971475440, articleId=1149781961000051646, tenantId=1146029695717560320, journalId=1146123166801305609, language=CN, title=智能驾驶场景下的中小型障碍物检测方法, columnId=1156262729783567290, journalTitle=科学技术与工程, columnName=论文·自动化技术、计算机技术, runingTitle=null, highlight=null, articleAbstract=
针对智能驾驶场景下路面中小型障碍物易发生漏检、小目标障碍物难检测、模型参数量大等问题,提出了改进YOLOv8n的障碍物目标检测算法。在主干网络中融入分布移位卷积(distribution shifting convolution,DSConv),将浮点运算替换为整数运算,减少了冗余计算量,通过量化和分布移位的方式模仿原始卷积层,维持了准确率;通过添加小目标检测层,更好地捕捉小目标的特征信息,适配小目标的尺度特征;结合SimAM无参数注意力机制,引入SPPF-SimAM模块,提高特征表示的质量与多样性,在不增加参数量的情况下实现了检测精度的提升;通过组合鬼影混洗卷积(ghost-shuffle convolution,GSConv)和VoV-GSCSP模块的方式轻量化颈部特征融合网络,降低了模型的参数量和计算量。实验结果表明,改进后模型的准确率、召回率、平均精度均值相较于原始模型分别提升了1.6%、8.0%、6.2%,参数量降低了6.7%,所提算法有效提升了智能驾驶场景下中小型障碍物的检测精度,并且在检测性能与模型轻量化之间达到较好的平衡。
, correspAuthors=南新元, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=Nxp6AX12snMDpbxKN79g8w==, magXml=jhE60zYt3Tdt5NFKdt7YOw==, pdfUrl=null, pdf=MXtah3yFi03XwM1eI0wBLA==, pdfFileSize=8212545, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=/K8xPS9Kj3ruaXqii8vtFw==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=Isu36LHNjQutlcULPixHzA==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=龙小羽, 南新元)}, authors=[Author(id=1251249353340436784, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=874480489@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251249353428517175, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, authorId=1251249353340436784, language=EN, stringName=Xiao-yu LONG, firstName=Xiao-yu, middleName=null, lastName=LONG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=School of Electrical Engineering, Xinjiang University, Urumqi 830017, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251249353508208957, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, authorId=1251249353340436784, language=CN, stringName=龙小羽, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=新疆大学电气工程学院, 乌鲁木齐 830017, bio={"content":"
龙小羽(2000—),女,汉族,新疆和静人,硕士研究生。研究方向:深度学习、目标检测。E-mail:874480489@qq.com。
"}, bioImg=null, bioContent=
龙小羽(2000—),女,汉族,新疆和静人,硕士研究生。研究方向:深度学习、目标检测。E-mail:874480489@qq.com。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251249353264939303, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, xref=null, ext=[AuthorCompanyExt(id=1251249353269133608, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, companyId=1251249353264939303, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Electrical Engineering, Xinjiang University, Urumqi 830017, China), AuthorCompanyExt(id=1251249353277522217, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, companyId=1251249353264939303, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=新疆大学电气工程学院, 乌鲁木齐 830017)])]), Author(id=1251249353613066564, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=xynan@xju.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1251249353764061514, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, authorId=1251249353613066564, language=EN, stringName=Xin-yuan NAN, firstName=Xin-yuan, middleName=null, lastName=NAN, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=School of Electrical Engineering, Xinjiang University, Urumqi 830017, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251249353956999508, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, authorId=1251249353613066564, language=CN, stringName=南新元, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=新疆大学电气工程学院, 乌鲁木齐 830017, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251249353264939303, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, xref=null, ext=[AuthorCompanyExt(id=1251249353269133608, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, companyId=1251249353264939303, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Electrical Engineering, Xinjiang University, Urumqi 830017, China), AuthorCompanyExt(id=1251249353277522217, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, companyId=1251249353264939303, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=新疆大学电气工程学院, 乌鲁木齐 830017)])])], keywords=[Keyword(id=1251249355697635687, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, orderNo=1, keyword=obstacle detection), Keyword(id=1251249355861213551, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, orderNo=2, keyword=YOLOv8n), Keyword(id=1251249355953488248, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, orderNo=3, keyword=intelligent driving), Keyword(id=1251249356041568640, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, orderNo=4, keyword=small target detection), Keyword(id=1251249356154814858, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, orderNo=5, keyword=attention mechanism), Keyword(id=1251249356255478165, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, orderNo=1, keyword=障碍物检测), Keyword(id=1251249356343558558, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, orderNo=2, keyword=YOLOv8n), Keyword(id=1251249356448416168, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, orderNo=3, keyword=智能驾驶), Keyword(id=1251249356637159861, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, orderNo=4, keyword=小目标检测), Keyword(id=1251249356754600388, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, orderNo=5, keyword=注意力机制)], refs=[Reference(id=1251249363008308200, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=58, issue=15, pageStart=68, pageEnd=77, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=茅智慧, 朱佳利, 吴鑫, journalName=计算机工程与应用, refType=null, unstructuredReference=茅智慧, 朱佳利, 吴鑫,
等. 基于YOLO的自动驾驶目标检测研究综述[J].
计算机工程与应用,
2022,
58(15): 68-77., articleTitle=基于YOLO的自动驾驶目标检测研究综述, refAbstract=null), Reference(id=1251249363121554420, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=58, issue=15, pageStart=68, pageEnd=77, url=null, language=null, rfNumber=[1], rfOrder=1, authorNames=Mao Zhihui, Zhu Jiali, Wu Xin, journalName=Computer Engineering and Applications, refType=null, unstructuredReference=
Mao Zhihui,
Zhu Jiali,
Wu Xin,
et al. Review of YOLO based target detection for autonomous driving[J].
Computer Engineering and Applications,
2022,
58(15): 68-77., articleTitle=Review of YOLO based target detection for autonomous driving, refAbstract=null), Reference(id=1251249364677641217, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=2102, pageEnd=null, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=Breitenstein J, Termöhlen J A, Lipinski D, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Breitenstein J,
Termöhlen J A,
Lipinski D,
et al. Corner cases for visual perception in automated driving: some guidance on detection approaches[J].
ArXiv Preprint,
2021: 2102.05897., articleTitle=Corner cases for visual perception in automated driving: some guidance on detection approaches, refAbstract=null), Reference(id=1251249364849606670, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[3], rfOrder=3, authorNames=Gupta K, Javed S A, Gandhi V, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Gupta K,
Javed S A,
Gandhi V,
et al. Mergenet: a deep net architecture for small obstacle discovery[J].
ArXiv Preprint,
2018: 1803.06508., articleTitle=Mergenet: a deep net architecture for small obstacle discovery, refAbstract=null), Reference(id=1251249365021573144, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2019, volume=47, issue=S1, pageStart=213, pageEnd=216, url=null, language=null, rfNumber=[4], rfOrder=4, authorNames=俞骏威, 张黎明, 陈凯, journalName=同济大学学报(自然科学版), refType=null, unstructuredReference=俞骏威, 张黎明, 陈凯,
等. 基于道路消失点的远距离路面微小障碍物检测[J].
同济大学学报(自然科学版),
2019,
47(S1): 213-216., articleTitle=基于道路消失点的远距离路面微小障碍物检测, refAbstract=null), Reference(id=1251249365155790882, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2019, volume=47, issue=S1, pageStart=213, pageEnd=216, url=null, language=null, rfNumber=[4], rfOrder=5, authorNames=Yu Junwei, Zhang Liming, Chen Kai, journalName=Journal of Tongji University(Natural Science), refType=null, unstructuredReference=
Yu Junwei,
Zhang Liming,
Chen Kai,
et al. Long-distance small road obstacles detection based on road vanishing point[J].
Journal of Tongji University(Natural Science),
2019,
47(S1): 213-216., articleTitle=Long-distance small road obstacles detection based on road vanishing point, refAbstract=null), Reference(id=1251249365277425712, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=23, issue=9, pageStart=16318, pageEnd=16329, url=null, language=null, rfNumber=[5], rfOrder=6, authorNames=Song T J, Jeong J, Kim J H, journalName=IEEE Transactions on Intelligent Transportation Systems, refType=null, unstructuredReference=
Song T J,
Jeong J,
Kim J H. End-to-end real-time obstacle detection network for safe self-driving via multi-task learning[J].
IEEE Transactions on Intelligent Transportation Systems,
2022,
23(9): 16318-16329., articleTitle=End-to-end real-time obstacle detection network for safe self-driving via multi-task learning, refAbstract=null), Reference(id=1251249365436809277, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=5, pageStart=2051, pageEnd=2058, url=null, language=null, rfNumber=[6], rfOrder=7, authorNames=吴晨曦, 应保胜, 许小伟, journalName=科学技术与工程, refType=null, unstructuredReference=吴晨曦, 应保胜, 许小伟,
等. 基于改进单步多框目标检测的道路小目标检测算法[J].
科学技术与工程,
2023,
23(5): 2051-2058., articleTitle=基于改进单步多框目标检测的道路小目标检测算法, refAbstract=null), Reference(id=1251249365571027016, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=5, pageStart=2051, pageEnd=2058, url=null, language=null, rfNumber=[6], rfOrder=8, authorNames=Wu Chenxi, Ying Baosheng, Xu Xiaowei, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Wu Chenxi,
Ying Baosheng,
Xu Xiaowei,
et al. Road small target detection algorithm based on improved single shot multibox detector[J].
Science Technology and Engineering,
2023,
23(5): 2051-2058., articleTitle=Road small target detection algorithm based on improved single shot multibox detector, refAbstract=null), Reference(id=1251249365742993498, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2024, volume=60, issue=5, pageStart=336, pageEnd=346, url=null, language=null, rfNumber=[7], rfOrder=9, authorNames=李旭, 宋焕生, 史勤, journalName=计算机工程与应用, refType=null, unstructuredReference=李旭, 宋焕生, 史勤,
等. CIEFRNet: 面向高速公路的抛洒物检测算法[J].
计算机工程与应用,
2024,
60(5): 336-346., articleTitle=CIEFRNet: 面向高速公路的抛洒物检测算法, refAbstract=null), Reference(id=1251249365881405540, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2024, volume=60, issue=5, pageStart=336, pageEnd=346, url=null, language=null, rfNumber=[7], rfOrder=10, authorNames=Li Xu, Song Huansheng, Shi Qin, journalName=Computer Engineering and Applications, refType=null, unstructuredReference=
Li Xu,
Song Huansheng,
Shi Qin,
et al. CIEFRNet: abandoned objects detection algorithm for highway[J].
Computer Engineering and Applications,
2024,
60(5): 336-346., articleTitle=CIEFRNet: abandoned objects detection algorithm for highway, refAbstract=null), Reference(id=1251249365990457452, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=5148, pageEnd=5157, url=null, language=null, rfNumber=[8], rfOrder=11, authorNames=Nascimento M G, Fawcett R, Prisacariu V A, journalName=Proceedings of the IEEE/CVF International Conference on Computer Vision, refType=null, unstructuredReference=
Nascimento M G,
Fawcett R,
Prisacariu V A. DSConv: efficient convolution operator[C]//
Proceedings of the IEEE/CVF International Conference on Computer Vision. Seoul: IEEE,
2019: 5148-5157., articleTitle=DSConv: efficient convolution operator, refAbstract=null), Reference(id=1251249366116286583, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=11863, pageEnd=11874, url=null, language=null, rfNumber=[9], rfOrder=12, authorNames=Yang L, Zhang R Y, Li L, journalName=International Conference on Machine Learning, refType=null, unstructuredReference=
Yang L,
Zhang R Y,
Li L,
et al. SimAM:a simple, parameter-free attention module for convolutional neural networks[C]//
International Conference on Machine Learning. Online: PMLR,
2021: 11863-11874., articleTitle=SimAM:a simple, parameter-free attention module for convolutional neural networks, refAbstract=null), Reference(id=1251249366237921409, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[10], rfOrder=13, authorNames=Li H, Li J, Wei H, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Li H,
Li J,
Wei H,
et al. Slim-neck by GSConv: a better design paradigm of detector architectures for autonomous vehicles[J].
ArXiv Preprint,
2022: 2206.02424., articleTitle=Slim-neck by GSConv: a better design paradigm of detector architectures for autonomous vehicles, refAbstract=null), Reference(id=1251249366401499275, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=1099, pageEnd=1106, url=null, language=null, rfNumber=[11], rfOrder=14, authorNames=Pinggera P, Ramos S, Gehrig S, journalName=null, refType=null, unstructuredReference=
Pinggera P,
Ramos S,
Gehrig S,
et al. Lost and found:detecting small road hazards for self-driving vehicles[C]//2016 IEEE/RSJ International Conference on Intelligent Robots and Systems(IROS). Daejeon: IEEE,
2016: 1099-1106., articleTitle=Lost and found:detecting small road hazards for self-driving vehicles, refAbstract=null), Reference(id=1251249366510551187, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=8513, pageEnd=8520, url=null, language=null, rfNumber=[12], rfOrder=15, authorNames=Singh A, Kamireddypalli A, Gandhi V, journalName=null, refType=null, unstructuredReference=
Singh A,
Kamireddypalli A,
Gandhi V,
et al. Lidar guided small obstacle segmentation[C]//2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS). Las Vegas: IEEE,
2020: 8513-8520., articleTitle=Lidar guided small obstacle segmentation, refAbstract=null), Reference(id=1251249366636380325, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=3776, pageEnd=3794, url=null, language=null, rfNumber=[13], rfOrder=16, authorNames=Maag K, Chan R, Uhlemeyer S, journalName=Proceedings of the Asian Conference on Computer Vision, refType=null, unstructuredReference=
Maag K,
Chan R,
Uhlemeyer S,
et al. Two video data sets for tracking and retrieval of out of distribution objects[C]//
Proceedings of the Asian Conference on Computer Vision. Macau: Springer,
2022: 3776-3794., articleTitle=Two video data sets for tracking and retrieval of out of distribution objects, refAbstract=null), Reference(id=1251249366762209458, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=406, pageEnd=423, url=null, language=null, rfNumber=[14], rfOrder=17, authorNames=Li K, Chen K, Wang H, journalName=European Conference on Computer Vision, refType=null, unstructuredReference=
Li K,
Chen K,
Wang H,
et al. Coda: a real-world road corner case dataset for object detection in autonomous driving[C]//
European Conference on Computer Vision. Tel Aviv: Springer,
2022: 406-423., articleTitle=Coda: a real-world road corner case dataset for object detection in autonomous driving, refAbstract=null), Reference(id=1251249366984507590, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=2209, pageEnd=null, url=null, language=null, rfNumber=[15], rfOrder=18, authorNames=Li C, Zhou A, Yao A, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Li C,
Zhou A,
Yao A. Omni-dimensional dynamic convolution[J].
ArXiv Preprint,
2022: 2209.07947., articleTitle=Omni-dimensional dynamic convolution, refAbstract=null), Reference(id=1251249367118725330, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1251, pageEnd=1258, url=null, language=null, rfNumber=[16], rfOrder=19, authorNames=Chollet F, journalName=Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Chollet F. Xception: deep learning with depthwise separable convolutions[C]//
Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition. Honolulu: IEEE,
2017: 1251-1258., articleTitle=Xception: deep learning with depthwise separable convolutions, refAbstract=null), Reference(id=1251249367261331677, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=1580, pageEnd=1589, url=null, language=null, rfNumber=[17], rfOrder=20, authorNames=Han K, Wang Y, Tian Q, journalName=Proceedings of the IEEE/CVF conference on computer vision and pattern recognition, refType=null, unstructuredReference=
Han K,
Wang Y,
Tian Q,
et al. Ghostnet: more features from cheap operations[C]//
Proceedings of the IEEE/CVF conference on computer vision and pattern recognition. Seattle: IEEE,
2020: 1580-1589., articleTitle=Ghostnet: more features from cheap operations, refAbstract=null), Reference(id=1251249367412326635, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=3139, pageEnd=3148, url=null, language=null, rfNumber=[18], rfOrder=21, authorNames=Misra D, Nalamada T, Arasanipalai A, journalName=IEEE/CVF Winter Conference on Applications of Computer Vision, refType=null, unstructuredReference=
Misra D,
Nalamada T,
Arasanipalai A,
et al. Rotate to attend: convolutional triplet attention module[C]//
IEEE/CVF Winter Conference on Applications of Computer Vision. Waikoloa: IEEE,
2021: 3139-3148., articleTitle=Rotate to attend: convolutional triplet attention module, refAbstract=null), Reference(id=1251249367609458940, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=2235, pageEnd=9, url=null, language=null, rfNumber=[19], rfOrder=22, authorNames=Zhang Q L, Yang Y B, journalName=ICASSP-IEEE International Conference on Acoustics, refType=null, unstructuredReference=
Zhang Q L,
Yang Y B. SA-Net: shuffle attention for deep convolutional neural networks[C]//
ICASSP-IEEE International Conference on Acoustics. Toronto: IEEE,
2021: 2235-9., articleTitle=SA-Net: shuffle attention for deep convolutional neural networks, refAbstract=null), Reference(id=1251249369215877382, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2024, volume=236, issue=null, pageStart=121352, pageEnd=null, url=null, language=null, rfNumber=[20], rfOrder=23, authorNames=Lau K W, Po L M, Rehman Y A U, journalName=Expert Systems with Applications, refType=null, unstructuredReference=
Lau K W,
Po L M,
Rehman Y A U. Large separable kernel attention: rethinking the large kernel attention design in CNN[J].
Expert Systems with Applications,
2024,
236: 121352., articleTitle=Large separable kernel attention: rethinking the large kernel attention design in CNN, refAbstract=null), Reference(id=1251249369371066638, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2023, volume=45, issue=2, pageStart=1489, pageEnd=1500, url=null, language=null, rfNumber=[21], rfOrder=24, authorNames=Li Y H, Yao T, Pan Y W, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Li Y H,
Yao T,
Pan Y W,
et al. Contextual transformer networks for visual recognition[J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2023,
45(2): 1489-1500., articleTitle=Contextual transformer networks for visual recognition, refAbstract=null), Reference(id=1251249369555616027, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=21, pageEnd=37, url=null, language=null, rfNumber=[22], rfOrder=25, authorNames=Liu W, Anguelov D, Erhan D, journalName=European Conference on Computer Vision, refType=null, unstructuredReference=
Liu W,
Anguelov D,
Erhan D,
et al. SSD: single shot multibox detector[C]//
European Conference on Computer Vision. Amsterdam: Springer,
2016: 21-37., articleTitle=SSD: single shot multibox detector, refAbstract=null), Reference(id=1251249369689833765, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[23], rfOrder=26, authorNames=Zhou X, Wang D, Krähenbühl P, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Zhou X,
Wang D,
Krähenbühl P. Objects as points[J].
ArXiv Preprint,
2019: 1904.07850., articleTitle=Objects as points, refAbstract=null), Reference(id=1251249369811468586, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[24], rfOrder=27, authorNames=Redmon J, Farhadi A, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Redmon J,
Farhadi A. YOLOv3: an incremental improvement[J].
ArXiv Preprint,
2018: 1804.02767., articleTitle=YOLOv3: an incremental improvement, refAbstract=null), Reference(id=1251249369949880628, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=7464, pageEnd=7475, url=null, language=null, rfNumber=[25], rfOrder=28, authorNames=Wang C Y, Bochkovskiy A, Liao H Y M, journalName=Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition, refType=null, unstructuredReference=
Wang C Y,
Bochkovskiy A,
Liao H Y M. YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors[C]//
Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition. Vancouver: IEEE,
2023: 7464-7475., articleTitle=YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors, refAbstract=null), Reference(id=1251249370067321144, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[26], rfOrder=29, authorNames=Ge Z, Liu S, Wang F, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Ge Z,
Liu S,
Wang F,
et al. YOLOX: exceeding YOLO series in 2021[J].
ArXiv Preprint,
2021: 2107.08430., articleTitle=YOLOX: exceeding YOLO series in 2021, refAbstract=null), Reference(id=1251249370188955970, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[27], rfOrder=30, authorNames=Wang C Y, Yeh I H, Liao H Y M, journalName=ArXiv Preprint, refType=null, unstructuredReference=
Wang C Y,
Yeh I H,
Liao H Y M. YOLOv9: learning what you want to learn using programmable gradient information[J].
ArXiv Preprint,
2024: 2402.13616., articleTitle=YOLOv9: learning what you want to learn using programmable gradient information, refAbstract=null), Reference(id=1251249370348339533, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2015, volume=111, issue=null, pageStart=98, pageEnd=136, url=null, language=null, rfNumber=[28], rfOrder=31, authorNames=Everingham M, Eslami S A, Van Gool L, journalName=International Journal of Computer Vision, refType=null, unstructuredReference=
Everingham M,
Eslami S A,
Van Gool L,
et al. The pascal visual object classes challenge: a retrospective[J].
International Journal of Computer Vision,
2015,
111: 98-136., articleTitle=The pascal visual object classes challenge: a retrospective, refAbstract=null), Reference(id=1251249370465780059, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, doi=null, pmid=null, pmcid=null, year=2013, volume=32, issue=11, pageStart=1231, pageEnd=1237, url=null, language=null, rfNumber=[29], rfOrder=32, authorNames=Geiger A, Lenz P, Stiller C, journalName=The International Journal of Robotics Research, refType=null, unstructuredReference=
Geiger A,
Lenz P,
Stiller C,
et al. Vision meets robotics: the KITTI dataset[J].
The International Journal of Robotics Research,
2013,
32(11): 1231-1237., articleTitle=Vision meets robotics: the KITTI dataset, refAbstract=null)], funds=[Fund(id=1251249362622432186, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, awardId=62303394, language=CN, fundingSource=国家自然科学基金(62303394), fundOrder=null, country=null), Fund(id=1251249362748261318, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, awardId=2022D01C694, language=CN, fundingSource=新疆维吾尔自治区自然科学基金(2022D01C694), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1251249353264939303, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, xref=null, ext=[AuthorCompanyExt(id=1251249353269133608, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, companyId=1251249353264939303, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Electrical Engineering, Xinjiang University, Urumqi 830017, China), AuthorCompanyExt(id=1251249353277522217, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, companyId=1251249353264939303, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=新疆大学电气工程学院, 乌鲁木齐 830017)])], figs=[ArticleFig(id=1251249357153059295, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.1, caption=
Improvement of YOLOv8n network structure, figureFileSmall=MziJWHR5uuEwXUxa/enH9w==, figureFileBig=bVlF1Y6dWBcB9UWCVCmGPA==, tableContent=null), ArticleFig(id=1251249357337608680, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图1, caption=
改进的YOLOv8n网络结构, figureFileSmall=MziJWHR5uuEwXUxa/enH9w==, figureFileBig=bVlF1Y6dWBcB9UWCVCmGPA==, tableContent=null), ArticleFig(id=1251249357505380858, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.2, caption=
DSConv module structure, figureFileSmall=FcOB10GMAAPeWF3G4Hsw2w==, figureFileBig=/96cffKEgrVUg9y3afd94w==, tableContent=null), ArticleFig(id=1251249357627015686, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图2, caption=
DSConv模块结构, figureFileSmall=FcOB10GMAAPeWF3G4Hsw2w==, figureFileBig=/96cffKEgrVUg9y3afd94w==, tableContent=null), ArticleFig(id=1251249357727678997, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.3, caption=
SimAM module structure, figureFileSmall=Bpoc90CLTkyyzWILQdUY+w==, figureFileBig=IIPRnq1lmrcfudqaJeBg4w==, tableContent=null), ArticleFig(id=1251249357912228389, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图3, caption=
SimAM模块结构 X为特征图;C、H、W分别为特征图的通道数、高、宽
, figureFileSmall=Bpoc90CLTkyyzWILQdUY+w==, figureFileBig=IIPRnq1lmrcfudqaJeBg4w==, tableContent=null), ArticleFig(id=1251249358025474609, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.4, caption=
SPPF-SimAM module structure, figureFileSmall=+NCWMW1b68SB5voyJh8GwA==, figureFileBig=nEvffrjS+3WdsxYGjOpLyg==, tableContent=null), ArticleFig(id=1251249358109360699, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图4, caption=
SPPF-SimAM模块结构, figureFileSmall=+NCWMW1b68SB5voyJh8GwA==, figureFileBig=nEvffrjS+3WdsxYGjOpLyg==, tableContent=null), ArticleFig(id=1251249358226801224, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.5, caption=
GSConv module structure, figureFileSmall=dWQzYMTmNG7WLP/yW7sLDg==, figureFileBig=1cyJ0HNt9KCFAyyRVhpobQ==, tableContent=null), ArticleFig(id=1251249358323270230, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图5, caption=
GSConv模块结构 c1、c2分别为输入和输出通道数
, figureFileSmall=dWQzYMTmNG7WLP/yW7sLDg==, figureFileBig=1cyJ0HNt9KCFAyyRVhpobQ==, tableContent=null), ArticleFig(id=1251249358432322150, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.6, caption=
GS bottleneck and VoV-GSCSP module structure, figureFileSmall=+SA/GEQ+meYXsUUfh9scVw==, figureFileBig=JiCxaJOilLyzYpSVVVcPhQ==, tableContent=null), ArticleFig(id=1251249358524596849, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图6, caption=
GS bottleneck和VoV-GSCSP模块结构, figureFileSmall=+SA/GEQ+meYXsUUfh9scVw==, figureFileBig=JiCxaJOilLyzYpSVVVcPhQ==, tableContent=null), ArticleFig(id=1251249358616871550, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.7, caption=
Comparison plot of the detection results, figureFileSmall=71Neu8k6I5B3ld83BVl+LQ==, figureFileBig=N5UNEo6NcaW1Y2+BEhGVkQ==, tableContent=null), ArticleFig(id=1251249360227484303, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图7, caption=
检测结果对比图, figureFileSmall=71Neu8k6I5B3ld83BVl+LQ==, figureFileBig=N5UNEo6NcaW1Y2+BEhGVkQ==, tableContent=null), ArticleFig(id=1251249360332341914, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Fig.8, caption=
Mean average precision curve before and after improvement, figureFileSmall=vC2sVlIblmojdwe5JnGO9A==, figureFileBig=uoILOC9yLKQ//xHcDQ1HkA==, tableContent=null), ArticleFig(id=1251249360466559655, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=图8, caption=
改进前后平均精度均值曲线图, figureFileSmall=vC2sVlIblmojdwe5JnGO9A==, figureFileBig=uoILOC9yLKQ//xHcDQ1HkA==, tableContent=null), ArticleFig(id=1251249360600777398, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 1, caption=
Statistics on dataset labels
, figureFileSmall=null, figureFileBig=null, tableContent=
| 障碍物类别 | 标签数量 |
| 训练集 | 验证集 | 测试集 | 合计 |
| 路锥 | 2 311 | 279 | 350 | 2 940 |
| 石墩 | 1 788 | 186 | 182 | 2 156 |
| 废弃轮胎 | 835 | 82 | 95 | 1 012 |
| 小动物 | 1 160 | 129 | 151 | 1 440 |
| 球类 | 489 | 57 | 54 | 600 |
| 箱式货物 | 2 173 | 277 | 292 | 2 742 |
| 水瓶 | 692 | 100 | 130 | 922 |
| 水马 | 1 157 | 112 | 105 | 1 374 |
| 施工标志牌 | 579 | 58 | 81 | 718 |
| 防撞桶 | 983 | 136 | 117 | 1 236 |
| 路桩 | 1 548 | 148 | 228 | 1 924 |
| 石块 | 1 483 | 169 | 160 | 1 812 |
| 塑料袋 | 565 | 48 | 63 | 676 |
| 三角警示牌 | 270 | 30 | 26 | 326 |
| 合计 | 16 033 | 1 811 | 2 034 | 19 878 |
), ArticleFig(id=1251249360701440707, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表1, caption=
数据集标签统计
, figureFileSmall=null, figureFileBig=null, tableContent=
| 障碍物类别 | 标签数量 |
| 训练集 | 验证集 | 测试集 | 合计 |
| 路锥 | 2 311 | 279 | 350 | 2 940 |
| 石墩 | 1 788 | 186 | 182 | 2 156 |
| 废弃轮胎 | 835 | 82 | 95 | 1 012 |
| 小动物 | 1 160 | 129 | 151 | 1 440 |
| 球类 | 489 | 57 | 54 | 600 |
| 箱式货物 | 2 173 | 277 | 292 | 2 742 |
| 水瓶 | 692 | 100 | 130 | 922 |
| 水马 | 1 157 | 112 | 105 | 1 374 |
| 施工标志牌 | 579 | 58 | 81 | 718 |
| 防撞桶 | 983 | 136 | 117 | 1 236 |
| 路桩 | 1 548 | 148 | 228 | 1 924 |
| 石块 | 1 483 | 169 | 160 | 1 812 |
| 塑料袋 | 565 | 48 | 63 | 676 |
| 三角警示牌 | 270 | 30 | 26 | 326 |
| 合计 | 16 033 | 1 811 | 2 034 | 19 878 |
), ArticleFig(id=1251249360831464151, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 2, caption=
Comparison result of introducing different convolutions
, figureFileSmall=null, figureFileBig=null, tableContent=
| 卷积 | mAP/% | Parameters/106 | GFLOPs | FPS/(帧·s-1) |
| Conv | 84.6 | 3.0 | 8.1 | 60 |
| ODConv | 83.7 | 3.0 | 7.1 | 60 |
| DWConv | 84.5 | 2.6 | 7.2 | 67 |
| GhostConv | 84.3 | 2.8 | 7.7 | 52 |
| DSConv | 84.8 | 3.0 | 7.1 | 73 |
), ArticleFig(id=1251249360948904680, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表2, caption=
引入不同卷积的对比结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 卷积 | mAP/% | Parameters/106 | GFLOPs | FPS/(帧·s-1) |
| Conv | 84.6 | 3.0 | 8.1 | 60 |
| ODConv | 83.7 | 3.0 | 7.1 | 60 |
| DWConv | 84.5 | 2.6 | 7.2 | 67 |
| GhostConv | 84.3 | 2.8 | 7.7 | 52 |
| DSConv | 84.8 | 3.0 | 7.1 | 73 |
), ArticleFig(id=1251249361062150902, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 3, caption=
Comparison result of SPPF combined with different attentional mechanisms
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| SPPF | 84.6 | 3.0 | 8.1 | 60 |
SPPF-Triplet Attention | 85.1 | 3.0 | 8.1 | 64 |
SPPF-Shuffle Attention | 84.6 | 3.0 | 8.1 | 67 |
| SPPF-LSKA | 84.6 | 3.3 | 8.3 | 67 |
SPPF-CoT Attention | 84.9 | 5.3 | 9.9 | 55 |
| SPPF-SimAM | 85.3 | 3.0 | 8.1 | 66 |
), ArticleFig(id=1251249361183785739, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表3, caption=
SPPF与不同注意力机制结合的对比结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| SPPF | 84.6 | 3.0 | 8.1 | 60 |
SPPF-Triplet Attention | 85.1 | 3.0 | 8.1 | 64 |
SPPF-Shuffle Attention | 84.6 | 3.0 | 8.1 | 67 |
| SPPF-LSKA | 84.6 | 3.3 | 8.3 | 67 |
SPPF-CoT Attention | 84.9 | 5.3 | 9.9 | 55 |
| SPPF-SimAM | 85.3 | 3.0 | 8.1 | 66 |
), ArticleFig(id=1251249361292837663, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 4, caption=
Comparison result of mAP of different obstacle classes
, figureFileSmall=null, figureFileBig=null, tableContent=
| 障碍物类别 | 准确率/% | | 召回率/% | | mAP/% |
| YOLOv8n | 本文算法 | YOLOv8n | 本文算法 | YOLOv8n | 本文算法 |
| 路锥 | 88.4 | 92.5 | | 74.0 | 77.4 | | 81.0 | 87.0 |
| 石墩 | 82.5 | 92.8 | | 70.9 | 78.2 | | 79.1 | 88.1 |
| 废弃轮胎 | 88.2 | 95.0 | | 88.4 | 99.2 | | 94.8 | 98.2 |
| 小动物 | 95.7 | 79.8 | | 90.7 | 84.6 | | 94.7 | 84.3 |
| 球类 | 97.1 | 98.1 | | 72.2 | 92.6 | | 91.8 | 97.7 |
| 箱式货物 | 97.8 | 98.2 | | 92.4 | 95.4 | | 96.9 | 98.6 |
| 水瓶 | 79.9 | 77.8 | | 63.1 | 75.4 | | 74.0 | 83.9 |
| 水马 | 81.1 | 81.4 | | 75.2 | 74.3 | | 80.5 | 85.9 |
| 施工标志牌 | 90.6 | 88.7 | | 77.8 | 82.7 | | 82.7 | 88.1 |
| 防撞桶 | 86.8 | 91.0 | | 72.8 | 77.9 | | 82.9 | 89.1 |
| 路桩 | 83.1 | 89.2 | | 55.3 | 69.3 | | 71.8 | 84.9 |
| 石块 | 88.1 | 93.0 | | 70.0 | 94.4 | | 79.2 | 97.7 |
| 塑料袋 | 88.8 | 91.7 | | 77.8 | 81.0 | | 85.3 | 90.4 |
| 三角警示牌 | 95.6 | 79.8 | | 84.0 | 84.6 | | 89.0 | 84.3 |
| 平均值 | 88.8 | 90.4 | | 76.0 | 84.0 | | 84.6 | 90.8 |
), ArticleFig(id=1251249361439638321, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表4, caption=
不同障碍物类别平均精度均值对比结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 障碍物类别 | 准确率/% | | 召回率/% | | mAP/% |
| YOLOv8n | 本文算法 | YOLOv8n | 本文算法 | YOLOv8n | 本文算法 |
| 路锥 | 88.4 | 92.5 | | 74.0 | 77.4 | | 81.0 | 87.0 |
| 石墩 | 82.5 | 92.8 | | 70.9 | 78.2 | | 79.1 | 88.1 |
| 废弃轮胎 | 88.2 | 95.0 | | 88.4 | 99.2 | | 94.8 | 98.2 |
| 小动物 | 95.7 | 79.8 | | 90.7 | 84.6 | | 94.7 | 84.3 |
| 球类 | 97.1 | 98.1 | | 72.2 | 92.6 | | 91.8 | 97.7 |
| 箱式货物 | 97.8 | 98.2 | | 92.4 | 95.4 | | 96.9 | 98.6 |
| 水瓶 | 79.9 | 77.8 | | 63.1 | 75.4 | | 74.0 | 83.9 |
| 水马 | 81.1 | 81.4 | | 75.2 | 74.3 | | 80.5 | 85.9 |
| 施工标志牌 | 90.6 | 88.7 | | 77.8 | 82.7 | | 82.7 | 88.1 |
| 防撞桶 | 86.8 | 91.0 | | 72.8 | 77.9 | | 82.9 | 89.1 |
| 路桩 | 83.1 | 89.2 | | 55.3 | 69.3 | | 71.8 | 84.9 |
| 石块 | 88.1 | 93.0 | | 70.0 | 94.4 | | 79.2 | 97.7 |
| 塑料袋 | 88.8 | 91.7 | | 77.8 | 81.0 | | 85.3 | 90.4 |
| 三角警示牌 | 95.6 | 79.8 | | 84.0 | 84.6 | | 89.0 | 84.3 |
| 平均值 | 88.8 | 90.4 | | 76.0 | 84.0 | | 84.6 | 90.8 |
), ArticleFig(id=1251249361552884546, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 5, caption=
Results of ablation experiments
, figureFileSmall=null, figureFileBig=null, tableContent=
| 编号 | DSConv | 小目标 检测层 | SPPF-SimAM | GSConv+VoV- GSCSP | 准确率/% | 召回率/% | mAP/% | Parameters/106 | GFLOPs | FPS/(帧·s-1) |
| A | × | × | × | × | 88.8 | 76.0 | 84.6 | 3.0 | 8.1 | 60 |
| B | √ | × | × | × | 89.3 | 75.0 | 84.8 | 3.0 | 7.1 | 73 |
| C | × | √ | × | × | 90.2 | 84.7 | 90.1 | 3.0 | 12.5 | 68 |
| D | × | × | √ | × | 91.6 | 75.1 | 85.3 | 3.0 | 8.1 | 66 |
| E | × | × | × | √ | 88.9 | 74.3 | 84.7 | 2.8 | 7.5 | 62 |
| F | √ | √ | × | × | 91.7 | 82.8 | 90.7 | 3.0 | 11.5 | 68 |
| G | √ | √ | √ | × | 92.7 | 84.2 | 90.9 | 3.0 | 11.5 | 51 |
| H | √ | √ | √ | √ | 90.4 | 84.0 | 90.8 | 2.8 | 10.5 | 53 |
), ArticleFig(id=1251249361666130762, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表5, caption=
消融实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 编号 | DSConv | 小目标 检测层 | SPPF-SimAM | GSConv+VoV- GSCSP | 准确率/% | 召回率/% | mAP/% | Parameters/106 | GFLOPs | FPS/(帧·s-1) |
| A | × | × | × | × | 88.8 | 76.0 | 84.6 | 3.0 | 8.1 | 60 |
| B | √ | × | × | × | 89.3 | 75.0 | 84.8 | 3.0 | 7.1 | 73 |
| C | × | √ | × | × | 90.2 | 84.7 | 90.1 | 3.0 | 12.5 | 68 |
| D | × | × | √ | × | 91.6 | 75.1 | 85.3 | 3.0 | 8.1 | 66 |
| E | × | × | × | √ | 88.9 | 74.3 | 84.7 | 2.8 | 7.5 | 62 |
| F | √ | √ | × | × | 91.7 | 82.8 | 90.7 | 3.0 | 11.5 | 68 |
| G | √ | √ | √ | × | 92.7 | 84.2 | 90.9 | 3.0 | 11.5 | 51 |
| H | √ | √ | √ | √ | 90.4 | 84.0 | 90.8 | 2.8 | 10.5 | 53 |
), ArticleFig(id=1251249361745822552, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 6, caption=
Results of the mainstream model comparison experiments
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| SSD | 59.4 | 25.3 | 62.1 | 15 |
| CenterNet | 55.8 | 32.7 | 109.7 | 33 |
| YOLOv3-tiny | 66.6 | 8.7 | 12.9 | 63 |
| YOLOv5s | 74.2 | 7.1 | 16.0 | 56 |
| YOLOv7 | 80.2 | 36.5 | 103.4 | 46 |
| YOLOv7-tiny | 70.6 | 6.0 | 13.1 | 64 |
| YOLOX-s | 68.9 | 8.9 | 26.8 | 69 |
| YOLOX-tiny | 63.3 | 5.0 | 15.3 | 70 |
| YOLOv8s | 89.5 | 11.1 | 28.5 | 55 |
| YOLOv9s | 89.3 | 9.6 | 38.8 | 19 |
| 本文算法 | 90.8 | 2.8 | 10.5 | 53 |
), ArticleFig(id=1251249361880040295, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表6, caption=
主流模型对比实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| SSD | 59.4 | 25.3 | 62.1 | 15 |
| CenterNet | 55.8 | 32.7 | 109.7 | 33 |
| YOLOv3-tiny | 66.6 | 8.7 | 12.9 | 63 |
| YOLOv5s | 74.2 | 7.1 | 16.0 | 56 |
| YOLOv7 | 80.2 | 36.5 | 103.4 | 46 |
| YOLOv7-tiny | 70.6 | 6.0 | 13.1 | 64 |
| YOLOX-s | 68.9 | 8.9 | 26.8 | 69 |
| YOLOX-tiny | 63.3 | 5.0 | 15.3 | 70 |
| YOLOv8s | 89.5 | 11.1 | 28.5 | 55 |
| YOLOv9s | 89.3 | 9.6 | 38.8 | 19 |
| 本文算法 | 90.8 | 2.8 | 10.5 | 53 |
), ArticleFig(id=1251249361951343474, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 7, caption=
Comparison result of the model before and after improvement on PASCAL VOC 2012
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| YOLOv8n | 56.4 | 3.0 | 8.1 | 88 |
| 本文算法 | 57.0 | 2.8 | 10.5 | 61 |
), ArticleFig(id=1251249362052006786, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表7, caption=
改进前后模型在PASCAL VOC 2012的对比实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| YOLOv8n | 56.4 | 3.0 | 8.1 | 88 |
| 本文算法 | 57.0 | 2.8 | 10.5 | 61 |
), ArticleFig(id=1251249362152670091, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=EN, label=Table 8, caption=
Comparison result of the model before and after improvement on KITTI
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| YOLOv8n | 76.9 | 3.0 | 8.1 | 75 |
| 本文算法 | 78.2 | 2.8 | 10.5 | 53 |
), ArticleFig(id=1251249362240750488, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1149781961000051646, language=CN, label=表8, caption=
改进前后模型在KITTI的对比实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 算法 | mAP/% | Parameters/ 106 | GFLOPs | FPS/ (帧·s-1) |
| YOLOv8n | 76.9 | 3.0 | 8.1 | 75 |
| 本文算法 | 78.2 | 2.8 | 10.5 | 53 |
)], attaches=null, journal=Journal(id=1146119176004939786, delFlag=0, nameCn=科学技术与工程, nameEn=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, issn=1671-1815, eissn=, cn=11-4688/T, coden=null, periodic=4, language=CN, oaType=是, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=UKU/O7GSka5polgCTkbIIw==, journalPrice=null, startedYear=null, abbrevIsoEn=Sci Technol Eng, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1754445529766, createdBy=null, updatedBy=13701087609, firstLetterCn=S, firstLetterEn=S, subjectCode=Natural Sciences, subjectName=自然科学, subjectCodeEn=Natural Sciences, subjectNameEn=null, picCn=UKU/O7GSka5polgCTkbIIw==, picEn=5hwlULoNwcbj3xUmVi9MAQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1159791870395564357, language=CN, name=科学技术与工程, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529793, updatedTime=1754445529793, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=http://www.stae.com.cn/jsygc/site/menus/20090429150146001, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1159791870441701702, language=EN, name=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529804, updatedTime=1754445529804, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1146123166801305609, websiteList=[Website(id=1148243202391400884, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/CN, language=CN, createTime=1751692112777, createBy=18614031015, updateTime=1753520965431, updateBy=18614031015, name=科学技术与工程-中文站点, tplId=1146099689490845704, title=科学技术与工程, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148622798802673703, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=articleTextType, value=kx, createTime=1751782615614, updateTime=1751782615614, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798781702180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=banner, value=null, createTime=1751782615609, updateTime=1751782615609, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798769119267, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1751782615606, updateTime=1751782615606, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798794285094, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782615612, updateTime=1751782615612, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798790090789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782615611, updateTime=1751782615611, creator=18614031015, updator=18614031015)]), Website(id=1155914124811976731, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/EN, language=EN, createTime=1753521003206, createBy=18614031015, updateTime=1753521003206, updateBy=18614031015, name=科学技术与工程-英文站点, tplId=1146101810881728533, title=Science Technology and Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155914371227308235, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=articleTextType, value=kx, createTime=1753521061952, updateTime=1753521061952, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371210531016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=banner, value=null, createTime=1753521061947, updateTime=1753521061947, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371202142407, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1753521061945, updateTime=1753521061945, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371223113930, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753521061950, updateTime=1753521061950, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371218919625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753521061949, updateTime=1753521061949, creator=18614031015, updator=18614031015)])], journalTitle=科学技术与工程, weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Science Technology and Engineering, journalPhotoCn=UKU/O7GSka5polgCTkbIIw==, journalPhotoEn=5hwlULoNwcbj3xUmVi9MAQ==, journalFirstLetter=S, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/10.12404/j.issn.1671-1815.2402441, detailUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/10.12404/j.issn.1671-1815.2402441, pdfUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/PDF/10.12404/j.issn.1671-1815.2402441, pdfUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/PDF/10.12404/j.issn.1671-1815.2402441, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)