Article(id=1209816724317278467, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1209811339510411616, articleNumber=null, orderNo=null, doi=10.12404/j.issn.1671-1815.2405983, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=research-article, receivedDate=1723132800000, receivedDateStr=2024-08-09, revisedDate=1734883200000, revisedDateStr=2024-12-23, acceptedDate=null, acceptedDateStr=null, onlineDate=1766372384385, onlineDateStr=2025-12-22, pubDate=1751904000000, pubDateStr=2025-07-08, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1766372384385, onlineIssueDateStr=2025-12-22, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1766372384385, creator=13701087609, updateTime=1766372384385, updator=13701087609, issue=Issue{id=1209811339510411616, tenantId=1146029695717560320, journalId=1146123166801305609, year='2025', volume='25', issue='19', pageStart='7885', pageEnd='8315', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=null, createTime=1766371100547, creator=13701087609, updateTime=1766373228996, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1209820266960654935, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1209811339510411616, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1209820266960654936, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1209811339510411616, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=8151, endPage=8157, ext={EN=ArticleExt(id=1209816724766069031, articleId=1209816724317278467, tenantId=1146029695717560320, 
journalId=1146123166801305609, language=EN, title=Improved YOLOv8 Bird Recognition Algorithm Integrates ViT and Multi-scale Attention, columnId=1209816719539966141, journalTitle=Science Technology and Engineering, columnName=Papers∙Automation and Computational Technology, runingTitle=null, highlight=null, articleAbstract=
In order to solve the problems of inaccurate dense target recognition and difficult detection of small targets in bird recognition, a bird recognition algorithm based on improved YOLOv8 was proposed. Firstly, in order to solve the problem of difficult dense object recognition, the multi-scale linear attention mechanism EfficientViT was used to replace the backbone network to realize the global receptive field and multi-scale learning, improve the performance and efficiency of the model, and improve the dense object recognition effect. Then, in order to solve the problem that it is difficult to detect small target birds and is prone to missed detection, an efficient multi-scale attention EMA (efficient multi-scale attention) mechanism was introduced to realize cross-dimensional aggregation features through channel recombination, so as to better capture global information, realize multi-scale feature fusion, and reduce the probability of missed detection. The experimental results show that the mAP50 of the improved model on the benchmark dataset CUB-200-2011 and birds28 reaches 77.1% and 88.4%, respectively, which is 4.5 and 5.4 percentage points higher than the original YOLOv8 model, respectively, which verifies the effectiveness of the improved model.
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Qiang ZHANG, Can-zhi ZHANG, Heng CAO, Teng-jiao YUAN), CN=ArticleExt(id=1209816727483978139, articleId=1209816724317278467, tenantId=1146029695717560320, journalId=1146123166801305609, language=CN, title=融合ViT与多尺度注意力的改进YOLOv8飞鸟识别算法, columnId=1209816721498706113, journalTitle=科学技术与工程, columnName=论文∙自动化技术、计算机技术, runingTitle=null, highlight=null, articleAbstract=
针对飞鸟识别中存在密集目标识别不准确、小目标检测困难等问题,提出一种基于改进YOLOv8的飞鸟识别算法。首先,针对密集目标识别难度大的问题,采用多尺度线性注意力机制EfficientViT替换骨干网络,实现全局感受野和多尺度学习,提升模型性能和效率的同时提高密集目标识别效果。然后,针对小目标飞鸟检测困难、容易出现漏检的问题,引入高效多尺度注意力 (efficient multi-scale attention, EMA)机制,通过通道重组实现跨维度聚合特征,从而更好地捕捉全局信息,实现多尺度特征融合,减少漏检概率。实验结果表明,改进模型在鸟类识别基准数据集CUB-200-2011和自制数据集birds28上的mAP50分别达到77.1%和88.4%,较原始YOLOv8模型分别提高了4.5和5.4个百分点,验证了改进模型的有效性。
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=Gph4PJGXgmIyT8InqDoFfg==, magXml=zqD8l59mdxtJJxb0ZrVoDg==, pdfUrl=null, pdf=LtQw/UmYW4JN2vJ/L/ZSSA==, pdfFileSize=10107090, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=OFsI+vJhwMzIv6EQ1qyNuw==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=8RZyDPDTPeEfgMLsx/gD7A==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=张强, 张灿智, 曹恒, 员腾蛟)}, authors=[Author(id=1209929297222038490, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=271198043@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1209929297322701791, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929297222038490, language=EN, stringName=Qiang ZHANG, firstName=Qiang, middleName=null, lastName=ZHANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1209929297419170788, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929297222038490, language=CN, stringName=张强, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=中国民用航空飞行学院空中交通管理学院, 德阳 618300, bio={"content":"
张强(1986—),男,汉族,四川广安人,博士,教授。研究方向:民航通信导航监视、低空监视。E-mail:271198043@qq.com。
"}, bioImg=null, bioContent=
张强(1986—),男,汉族,四川广安人,博士,教授。研究方向:民航通信导航监视、低空监视。E-mail:271198043@qq.com。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1209929297108792275, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, xref=null, ext=[AuthorCompanyExt(id=1209929297117180884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China), AuthorCompanyExt(id=1209929297125569493, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国民用航空飞行学院空中交通管理学院, 德阳 618300)])]), Author(id=1209929297498862569, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1209929297591137261, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929297498862569, language=EN, stringName=Can-zhi ZHANG, firstName=Can-zhi, middleName=null, lastName=ZHANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1209929297675023343, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929297498862569, language=CN, stringName=张灿智, firstName=null, middleName=null, lastName=null, 
prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=中国民用航空飞行学院空中交通管理学院, 德阳 618300, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1209929297108792275, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, xref=null, ext=[AuthorCompanyExt(id=1209929297117180884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China), AuthorCompanyExt(id=1209929297125569493, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国民用航空飞行学院空中交通管理学院, 德阳 618300)])]), Author(id=1209929297767298037, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1209929297918292989, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929297767298037, language=EN, stringName=Heng CAO, firstName=Heng, middleName=null, lastName=CAO, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1209929297997984768, 
tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929297767298037, language=CN, stringName=曹恒, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=中国民用航空飞行学院空中交通管理学院, 德阳 618300, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1209929297108792275, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, xref=null, ext=[AuthorCompanyExt(id=1209929297117180884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China), AuthorCompanyExt(id=1209929297125569493, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国民用航空飞行学院空中交通管理学院, 德阳 618300)])]), Author(id=1209929298111229957, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1209929298199310345, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929298111229957, language=EN, stringName=Teng-jiao YUAN, firstName=Teng-jiao, middleName=null, lastName=YUAN, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Air 
Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1209929298283196429, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, authorId=1209929298111229957, language=CN, stringName=员腾蛟, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=中国民用航空飞行学院空中交通管理学院, 德阳 618300, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1209929297108792275, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, xref=null, ext=[AuthorCompanyExt(id=1209929297117180884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China), AuthorCompanyExt(id=1209929297125569493, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国民用航空飞行学院空中交通管理学院, 德阳 618300)])])], keywords=[Keyword(id=1209929298450968592, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, orderNo=1, keyword=bird recognition), Keyword(id=1209929298547437588, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, orderNo=2, keyword=multi-scale attention), Keyword(id=1209929298635517976, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, orderNo=3, keyword=dense target 
recognition), Keyword(id=1209929299835088919, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, orderNo=4, keyword=YOLOv8), Keyword(id=1209929299935752221, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, orderNo=5, keyword=EfficientViT), Keyword(id=1209929300011249694, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, orderNo=6, keyword=EMA), Keyword(id=1209929300124495906, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, orderNo=1, keyword=飞鸟识别), Keyword(id=1209929300225159204, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, orderNo=2, keyword=多尺度注意力), Keyword(id=1209929300304850985, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, orderNo=3, keyword=密集目标识别), Keyword(id=1209929300413902894, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, orderNo=4, keyword=YOLOv8), Keyword(id=1209929300518760500, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, orderNo=5, keyword=EfficientViT), Keyword(id=1209929300627812407, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, orderNo=6, keyword=EMA)], refs=[Reference(id=1209929304536903846, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=19, pageStart=22867, pageEnd=22879, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=Zhang C, Shi F, Zhang X, journalName=IEEE Sensors Journal, refType=null, unstructuredReference=
Zhang C,
Shi F,
Zhang X, et al. Airport near-altitude flying birds detection based on information compensation multi-scale feature fusion[J].
IEEE Sensors Journal,
2023,
23(19): 22867-22879., articleTitle=Airport near-altitude flying birds detection based on information compensation multi-scale feature fusion, refAbstract=null), Reference(id=1209929304650150056, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2020, volume=7, issue=3, pageStart=26, pageEnd=null, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=Metz I C, Ellerbroek J, Mühlhausen T, journalName=Aerospace, refType=null, unstructuredReference=
Metz I C,
Ellerbroek J,
Mühlhausen T, et al. The bird strike challenge[J].
Aerospace,
2020,
7(3): 26., articleTitle=The bird strike challenge, refAbstract=null), Reference(id=1209929304734036136, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2020, volume=11, issue=9, pageStart=1072, pageEnd=1085, url=null, language=null, rfNumber=[3], rfOrder=2, authorNames=Ferreira A C, Silva L R, Renna F, journalName=Methods in Ecology and Evolution, refType=null, unstructuredReference=
Ferreira A C,
Silva L R,
Renna F, et al. Deep learning-based methods for individual recognition in small birds[J].
Methods in Ecology and Evolution,
2020,
11(9): 1072-1085., articleTitle=Deep learning-based methods for individual recognition in small birds, refAbstract=null), Reference(id=1209929304822116523, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=27, issue=null, pageStart=1677, pageEnd=1690, url=null, language=null, rfNumber=[4], rfOrder=3, authorNames=Liu H, Zhang C, Deng Y, journalName=IEEE Transactions on Multimedia, refType=null, unstructuredReference=
Liu H,
Zhang C,
Deng Y, et al. TransIFC: invariant cues-aware feature concentration learning for efficient fine-grained bird image classification[J].
IEEE Transactions on Multimedia,
2023,
27: 1677-1690., articleTitle=TransIFC: invariant cues-aware feature concentration learning for efficient fine-grained bird image classification, refAbstract=null), Reference(id=1209929304893419695, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=13, issue=2, pageStart=264, pageEnd=null, url=null, language=null, rfNumber=[5], rfOrder=4, authorNames=Wang K, Yang F, Chen Z, journalName=Animals, refType=null, unstructuredReference=
Wang K,
Yang F,
Chen Z, et al. A fine-grained bird classification method based on attention and decoupled knowledge distillation[J].
Animals,
2023,
13(2): 264., articleTitle=A fine-grained bird classification method based on attention and decoupled knowledge distillation, refAbstract=null), Reference(id=1209929304952139955, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=1, pageEnd=6, url=null, language=null, rfNumber=[6], rfOrder=5, authorNames=Chakraborti T, McCane B, Mills S, journalName=null, refType=null, unstructuredReference=
Chakraborti T,
McCane B,
Mills S, et al. CoCoNet:a collaborative convolutional network applied to fine-grained bird species classification[C]// 2020 35th International Conference on Image and Vision Computing New Zealand (IVCNZ). New York: IEEE,
2020: 1-6., articleTitle=CoCoNet:a collaborative convolutional network applied to fine-grained bird species classification, refAbstract=null), Reference(id=1209929305019248823, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=9, pageStart=3727, pageEnd=3736, url=null, language=null, rfNumber=[7], rfOrder=6, authorNames=任书杰, 胡勇, 何文祥, journalName=科学技术与工程, refType=null, unstructuredReference=任书杰, 胡勇, 何文祥, 等. 基于深度学习的砂岩组分显微图像识别[J].
科学技术与工程,
2024,
24(9): 3727-3736., articleTitle=基于深度学习的砂岩组分显微图像识别, refAbstract=null), Reference(id=1209929305086357687, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=9, pageStart=3727, pageEnd=3736, url=null, language=null, rfNumber=[7], rfOrder=7, authorNames=Ren Shujie, Hu Yong, He Wenxiang, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Ren Shujie,
Hu Yong,
He Wenxiang, et al. Microscopic image recognition of sandstone components based on deep learning[J].
Science Technology and Engineering,
2024,
24(9): 3727-3736., articleTitle=Microscopic image recognition of sandstone components based on deep learning, refAbstract=null), Reference(id=1209929305153466552, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=17, pageStart=7059, pageEnd=7065, url=null, language=null, rfNumber=[8], rfOrder=8, authorNames=林开颜, 牛程远, 张浩平, journalName=科学技术与工程, refType=null, unstructuredReference=林开颜, 牛程远, 张浩平, 等. 基于深度学习的景观植物颜色特征提取方法[J].
科学技术与工程,
2024,
24(17): 7059-7065., articleTitle=基于深度学习的景观植物颜色特征提取方法, refAbstract=null), Reference(id=1209929305266712764, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=17, pageStart=7059, pageEnd=7065, url=null, language=null, rfNumber=[8], rfOrder=9, authorNames=Lin Kaiyan, Niu Chengyuan, Zhang Haoping, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Lin Kaiyan,
Niu Chengyuan,
Zhang Haoping, et al. A method for extracting color characteristics of landscape plants based on deep learning[J].
Science Technology and Engineering,
2024,
24(17): 7059-7065., articleTitle=A method for extracting color characteristics of landscape plants based on deep learning, refAbstract=null), Reference(id=1209929305367376064, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=60, issue=8, pageStart=46, pageEnd=55, url=null, language=null, rfNumber=[9], rfOrder=10, authorNames=谢威宇, 张强, journalName=计算机工程与应用, refType=null, unstructuredReference=谢威宇, 张强. 基于深度学习的图像中无人机与飞鸟检测研究综述[J].
计算机工程与应用,
2024,
60(8): 46-55., articleTitle=基于深度学习的图像中无人机与飞鸟检测研究综述, refAbstract=null), Reference(id=1209929305438679235, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=60, issue=8, pageStart=46, pageEnd=55, url=null, language=null, rfNumber=[9], rfOrder=11, authorNames=Xie Weiyu, Zhang Qiang, journalName=Computer Engineering and Applications, refType=null, unstructuredReference=
Xie Weiyu,
Zhang Qiang. Review on detection of drones and birds in photoelectric images based on deep learning convolutional neural network[J].
Computer Engineering and Applications,
2024,
60(8): 46-55., articleTitle=Review on detection of drones and birds in photoelectric images based on deep learning convolutional neural network, refAbstract=null), Reference(id=1209929305518371015, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2020, volume=8, issue=null, pageStart=116663, pageEnd=116674, url=null, language=null, rfNumber=[10], rfOrder=12, authorNames=Won C S, journalName=IEEE Access, refType=null, unstructuredReference=
Won C S. Multi-scale CNN for fine-grained image recognition[J].
IEEE Access,
2020,
8: 116663-116674., articleTitle=Multi-scale CNN for fine-grained image recognition, refAbstract=null), Reference(id=1209929305585479883, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2020, volume=57, issue=3, pageStart=102186, pageEnd=null, url=null, language=null, rfNumber=[11], rfOrder=13, authorNames=Tan M, Zhou J, Peng Z, journalName=Information Processing & Management, refType=null, unstructuredReference=
Tan M,
Zhou J,
Peng Z, et al. Fine-grained image classification with factorized deep user click feature[J].
Information Processing & Management,
2020,
57(3): 102186., articleTitle=Fine-grained image classification with factorized deep user click feature, refAbstract=null), Reference(id=1209929305652588749, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=17, pageEnd=34, url=null, language=null, rfNumber=[12], rfOrder=14, authorNames=Bellafkir H, Vogelbacher M, Schneider D, journalName=International Conference on Networked Systems, refType=null, unstructuredReference=
Bellafkir H,
Vogelbacher M,
Schneider D, et al. Edge-based bird species recognition
via active learning[C]//
International Conference on Networked Systems. Cham: Springer Nature Switzerland,
2023: 17-34., articleTitle=Edge-based bird species recognition
via active learning, refAbstract=null), Reference(id=1209929305728086224, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=17, pageStart=7205, pageEnd=7213, url=null, language=null, rfNumber=[13], rfOrder=15, authorNames=宣以国, 余成波, 蒋启超, journalName=科学技术与工程, refType=null, unstructuredReference=宣以国, 余成波, 蒋启超, 等. 基于改进 YOLOv7 的道路裂缝和坑洞检测算法[J].
科学技术与工程,
2024,
24(17): 7205-7213., articleTitle=基于改进 YOLOv7 的道路裂缝和坑洞检测算法, refAbstract=null), Reference(id=1209929305807778003, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=17, pageStart=7205, pageEnd=7213, url=null, language=null, rfNumber=[13], rfOrder=16, authorNames=Xuan Yiguo, Yu Chengbo, Jiang Qichao, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Xuan Yiguo,
Yu Chengbo,
Jiang Qichao, et al. Improved YOLOv7 road crack and pothole detection algorithm[J].
Science Technology and Engineering,
2024,
24(17): 7205-7213., articleTitle=Improved YOLOv7 road crack and pothole detection algorithm, refAbstract=null), Reference(id=1209929305883275478, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=28, pageEnd=38, url=null, language=null, rfNumber=[14], rfOrder=17, authorNames=Kumar A, Das S D, journalName=Computer Vision Applications, refType=null, unstructuredReference=
Kumar A,
Das S D. Bird species classification using transfer learning with multistage training[C]//
Computer Vision Applications: Third Workshop, WCVA 2018. Singapore: Springer,
2019: 28-38., articleTitle=Bird species classification using transfer learning with multistage training, refAbstract=null), Reference(id=1209929305962967256, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=44, issue=4, pageStart=1114, pageEnd=1120, url=null, language=null, rfNumber=[15], rfOrder=18, authorNames=陈天华, 朱家煊, 印杰, journalName=计算机应用, refType=null, unstructuredReference=陈天华, 朱家煊, 印杰. 基于注意力机制的鸟类识别算法[J].
计算机应用,
2024,
44(4): 1114-1120., articleTitle=基于注意力机制的鸟类识别算法, refAbstract=null), Reference(id=1209929306051047641, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2024, volume=44, issue=4, pageStart=1114, pageEnd=1120, url=null, language=null, rfNumber=[15], rfOrder=19, authorNames=Chen Tianhua, Zhu Jiaxuan, Yin Jie, journalName=Journal of Computer Applications, refType=null, unstructuredReference=
Chen Tianhua,
Zhu Jiaxuan,
Yin Jie. Bird recognition algorithm based on attention mechanism[J].
Journal of Computer Applications,
2024,
44(4): 1114-1120., articleTitle=Bird recognition algorithm based on attention mechanism, refAbstract=null), Reference(id=1209929306126545118, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=2039, pageEnd=2048, url=null, language=null, rfNumber=[16], rfOrder=20, authorNames=Cohen A S, Cont R, Rossier A, journalName=International Conference on Machine Learning, refType=null, unstructuredReference=
Cohen A S,
Cont R,
Rossier A, et al. Scaling properties of deep residual networks[C]//
International Conference on Machine Learning. New York: PMLR,
2021: 2039-2048., articleTitle=Scaling properties of deep residual networks, refAbstract=null), Reference(id=1209929306210431198, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=7, issue=5, pageStart=304, pageEnd=null, url=null, language=null, rfNumber=[17], rfOrder=21, authorNames=Li Y, Fan Q, Huang H, journalName=Drones, refType=null, unstructuredReference=
Li Y,
Fan Q,
Huang H, et al. A modified YOLOv8 detection network for UAV aerial image recognition[J].
Drones,
2023,
7(5): 304., articleTitle=A modified YOLOv8 detection network for UAV aerial image recognition, refAbstract=null), Reference(id=1209929306290122977, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=13, issue=24, pageStart=12977, pageEnd=null, url=null, language=null, rfNumber=[18], rfOrder=22, authorNames=Wu T, Dong Y, journalName=Applied Sciences, refType=null, unstructuredReference=
Wu T,
Dong Y. YOLO-SE: improved YOLOv8 for remote sensing object detection and recognition[J].
Applied Sciences,
2023,
13(24): 12977., articleTitle=YOLO-SE: improved YOLOv8 for remote sensing object detection and recognition, refAbstract=null), Reference(id=1209929306394980580, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2020, volume=11929, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[19], rfOrder=23, authorNames=Dosovitskiy A, Beyer L, Kolesnikov A, journalName=arXiv preprint arXiv: 2010, refType=null, unstructuredReference=
Dosovitskiy A,
Beyer L,
Kolesnikov A, et al. An image is worth 16×16 words: Transformers for image recognition at scale[J].
arXiv preprint arXiv: 2010.
11929,
2020., articleTitle=An image is worth 16×16 words: Transformers for image recognition at scale, refAbstract=null), Reference(id=1209929306478866661, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2021, volume=34, issue=null, pageStart=12077, pageEnd=12090, url=null, language=null, rfNumber=[20], rfOrder=24, authorNames=Xie E, Wang W, Yu Z, journalName=Advances in Neural Information Processing Systems, refType=null, unstructuredReference=
Xie E,
Wang W,
Yu Z, et al. SegFormer: simple and efficient design for semantic segmentation with transformers[J].
Advances in Neural Information Processing Systems,
2021,
34: 12077-12090., articleTitle=SegFormer: simple and efficient design for semantic segmentation with transformers, refAbstract=null), Reference(id=1209929306562752742, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2022, volume=35, issue=null, pageStart=1140, pageEnd=1156, url=null, language=null, rfNumber=[21], rfOrder=25, authorNames=Guo M H, Lu C Z, Hou Q, journalName=Advances in Neural Information Processing Systems, refType=null, unstructuredReference=
Guo M H,
Lu C Z,
Hou Q, et al. Segnext: rethinking convolutional attention design for semantic segmentation[J].
Advances in Neural Information Processing Systems,
2022,
35: 1140-1156., articleTitle=Segnext: rethinking convolutional attention design for semantic segmentation, refAbstract=null), Reference(id=1209929306650833130, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=17302, pageEnd=17313, url=null, language=null, rfNumber=[22], rfOrder=26, authorNames=Cai H, Li J, Hu M, journalName=Proceedings of the IEEE/CVF International Conference on Computer Vision, refType=null, unstructuredReference=
Cai H,
Li J,
Hu M, et al. Efficientvit: lightweight multi-scale attention for high-resolution dense prediction[C]//
Proceedings of the IEEE/CVF International Conference on Computer Vision. New York: IEEE,
2023: 17302-17313., articleTitle=Efficientvit: lightweight multi-scale attention for high-resolution dense prediction, refAbstract=null), Reference(id=1209929306764079342, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=1, pageEnd=5, url=null, language=null, rfNumber=[23], rfOrder=27, authorNames=Ouyang D, He S, Zhang G, journalName=2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), refType=null, unstructuredReference=
Ouyang D,
He S,
Zhang G, et al. Efficient multi-scale attention module with cross-spatial learning[C]//
2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP). New York: IEEE,
2023: 1-5., articleTitle=Efficient multi-scale attention module with cross-spatial learning, refAbstract=null)], funds=[Fund(id=1209929303102451874, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, awardId=ZJ2023-007, language=CN, fundingSource=中央高校基本科研业务费专项(ZJ2023-007), fundOrder=null, country=null), Fund(id=1209929303182143650, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, awardId=202101199029, language=CN, fundingSource=教育部产学合作协同育人项目(202101199029), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1209929297108792275, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, xref=null, ext=[AuthorCompanyExt(id=1209929297117180884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Air Traffic Management, Civil Aviation Flight University of China, Deyang 618300, China), AuthorCompanyExt(id=1209929297125569493, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, companyId=1209929297108792275, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国民用航空飞行学院空中交通管理学院, 德阳 618300)])], figs=[ArticleFig(id=1209929300783001663, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.1, caption=
Inter-class and intra-class differences, figureFileSmall=K6qOmRwcoKjaoHiUkE2FyA==, figureFileBig=UJthX/BY72wJePbpm3iVvw==, tableContent=null), ArticleFig(id=1209929300904636484, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图1, caption=
类间差异与类内差异, figureFileSmall=K6qOmRwcoKjaoHiUkE2FyA==, figureFileBig=UJthX/BY72wJePbpm3iVvw==, tableContent=null), ArticleFig(id=1209929301038854218, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.2, caption=
Schematic diagram of a multiscale linear attention model, figureFileSmall=mI5hpiiRAq+fn1NV/uN7ZQ==, figureFileBig=AnLQYnlYuAM4DnMo1iJeIA==, tableContent=null), ArticleFig(id=1209929301139517518, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图2, caption=
多尺度线性注意力模型示意图, figureFileSmall=mI5hpiiRAq+fn1NV/uN7ZQ==, figureFileBig=AnLQYnlYuAM4DnMo1iJeIA==, tableContent=null), ArticleFig(id=1209929301256958036, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.3, caption=
Schematic diagram of the EMA structure, figureFileSmall=RqiWyy3luJ2dqN2CQ+yQZg==, figureFileBig=o6NXPDCBFWYe0tga9wBZ8A==, tableContent=null), ArticleFig(id=1209929301340844119, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图3, caption=
EMA结构示意图 C表示输入通道的数量;H和W分别表示输入特征的空间维度
, figureFileSmall=RqiWyy3luJ2dqN2CQ+yQZg==, figureFileBig=o6NXPDCBFWYe0tga9wBZ8A==, tableContent=null), ArticleFig(id=1209929301424730204, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.4, caption=
Data set situation of CUB-200-2011, figureFileSmall=Nt1IBWZXT7Ax7VoeJsujmA==, figureFileBig=070+253JMDM+LMXKREVLfw==, tableContent=null), ArticleFig(id=1209929301512810595, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图4, caption=
CUB-200-2011数据集情况, figureFileSmall=Nt1IBWZXT7Ax7VoeJsujmA==, figureFileBig=070+253JMDM+LMXKREVLfw==, tableContent=null), ArticleFig(id=1209929301592502373, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.5, caption=
Data set situation of birds28, figureFileSmall=1XWTxDx4Cyi/qOqsJs6Vvw==, figureFileBig=LX1GKSvjY68oL5KA27G0Cw==, tableContent=null), ArticleFig(id=1209929301659611242, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图5, caption=
birds28数据集情况, figureFileSmall=1XWTxDx4Cyi/qOqsJs6Vvw==, figureFileBig=LX1GKSvjY68oL5KA27G0Cw==, tableContent=null), ArticleFig(id=1209929301735108717, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.6, caption=
Original YOLOv8 model recognition effect, figureFileSmall=TTC9iVNPU+H3Cgse3t1Lew==, figureFileBig=FklzDwP5+OBf/z/fH68Y9g==, tableContent=null), ArticleFig(id=1209929301827383408, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图6, caption=
原始YOLOv8模型识别效果, figureFileSmall=TTC9iVNPU+H3Cgse3t1Lew==, figureFileBig=FklzDwP5+OBf/z/fH68Y9g==, tableContent=null), ArticleFig(id=1209929301907075190, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Fig.7, caption=
The improved YOLOv8 model recognition effect, figureFileSmall=xfVQdPTiBkjn2CH3l74r5g==, figureFileBig=36jo1e8ZEGWucOr3ow3HzQ==, tableContent=null), ArticleFig(id=1209929302032904315, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=图7, caption=
改进后的YOLOv8模型识别效果, figureFileSmall=xfVQdPTiBkjn2CH3l74r5g==, figureFileBig=36jo1e8ZEGWucOr3ow3HzQ==, tableContent=null), ArticleFig(id=1209929302112596096, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Table 1, caption=
Experimental environmental parameter
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 设置 |
| epoch | 300 |
| batch | 16 |
| Imgsz | 640 |
| workers | 4 |
| lr0 | 0.01 |
| momentum | 0.937 |
| weight_decay | 0.000 5 |
), ArticleFig(id=1209929302192287875, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=表1, caption=
实验环境参数
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 设置 |
| epoch | 300 |
| batch | 16 |
| Imgsz | 640 |
| workers | 4 |
| lr0 | 0.01 |
| momentum | 0.937 |
| weight_decay | 0.000 5 |
), ArticleFig(id=1209929302276173957, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Table 2, caption=
CUB-200-2011 data set ablation experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv8 | 0.726 | 0.62 | 3.37 | 9.9 |
| YOLOv8-EMA | 0.742 | 0.64 | 3.38 | 10 |
| YOLOv8-EfficientViT | 0.756 | 0.642 | 4.37 | 11.2 |
| YOLOv8-EfficientViT-EMA | 0.771 | 0.654 | 4.39 | 11.3 |
), ArticleFig(id=1209929302330699911, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=表2, caption=
CUB-200-2011数据集消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv8 | 0.726 | 0.62 | 3.37 | 9.9 |
| YOLOv8-EMA | 0.742 | 0.64 | 3.38 | 10 |
| YOLOv8-EfficientViT | 0.756 | 0.642 | 4.37 | 11.2 |
| YOLOv8-EfficientViT-EMA | 0.771 | 0.654 | 4.39 | 11.3 |
), ArticleFig(id=1209929302393614474, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Table 3, caption=
birds28 data set ablation experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv8 | 0.830 | 0.592 | 3.01 | 8.2 |
| YOLOv8-EMA | 0.827 | 0.586 | 3.02 | 8.4 |
| YOLOv8-EfficientViT | 0.882 | 0.646 | 4.01 | 9.5 |
| YOLOv8-EfficientViT-EMA | 0.884 | 0.655 | 4.02 | 9.6 |
), ArticleFig(id=1209929302494277773, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=表3, caption=
birds28数据集消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv8 | 0.830 | 0.592 | 3.01 | 8.2 |
| YOLOv8-EMA | 0.827 | 0.586 | 3.02 | 8.4 |
| YOLOv8-EfficientViT | 0.882 | 0.646 | 4.01 | 9.5 |
| YOLOv8-EfficientViT-EMA | 0.884 | 0.655 | 4.02 | 9.6 |
), ArticleFig(id=1209929302594941073, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Table 4, caption=
CUB-200-2011 data set model comparison experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv5 | 0.687 | 0.580 | 2.87 | 8.9 |
| YOLOv6 | 0.666 | 0.572 | 4.68 | 14.0 |
| YOLOv8-ghost | 0.716 | 0.615 | 2.08 | 6.8 |
| YOLOv8-ghost-EMA | 0.718 | 0.611 | 2.68 | 8.2 |
| YOLOv8-BiFPN | 0.749 | 0.639 | 3.15 | 9.9 |
| Resnet18 | 0.770 | 0.642 | 13.69 | 36.9 |
| YOLOv8-EfficientViT-EMA | 0.771 | 0.654 | 4.39 | 11.3 |
), ArticleFig(id=1209929302703992980, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=表4, caption=
CUB-200-2011数据集模型对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv5 | 0.687 | 0.580 | 2.87 | 8.9 |
| YOLOv6 | 0.666 | 0.572 | 4.68 | 14.0 |
| YOLOv8-ghost | 0.716 | 0.615 | 2.08 | 6.8 |
| YOLOv8-ghost-EMA | 0.718 | 0.611 | 2.68 | 8.2 |
| YOLOv8-BiFPN | 0.749 | 0.639 | 3.15 | 9.9 |
| Resnet18 | 0.770 | 0.642 | 13.69 | 36.9 |
| YOLOv8-EfficientViT-EMA | 0.771 | 0.654 | 4.39 | 11.3 |
), ArticleFig(id=1209929302834016411, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=EN, label=Table 5, caption=
birds28 dataset model comparison experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv5 | 0.827 | 0.577 | 2.51 | 7.2 |
| YOLOv6 | 0.751 | 0.523 | 4.24 | 11.9 |
| YOLOv8-ghost | 0.804 | 0.574 | 1.72 | 5.2 |
| YOLOv8-ghost-EMA | 0.808 | 0.569 | 1.73 | 5.2 |
| YOLOv8-BiFPN | 0.836 | 0.598 | 2.79 | 8.3 |
| Resnet18 | 0.795 | 0.539 | 13.33 | 35.1 |
| YOLOv8-EfficientViT-EMA | 0.884 | 0.655 | 4.02 | 9.6 |
), ArticleFig(id=1209929302917902492, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1209816724317278467, language=CN, label=表5, caption=
birds28数据集模型对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | mAP50 | mAP50-95 | 参数量/10^6 | GFLOPs |
| YOLOv5 | 0.827 | 0.577 | 2.51 | 7.2 |
| YOLOv6 | 0.751 | 0.523 | 4.24 | 11.9 |
| YOLOv8-ghost | 0.804 | 0.574 | 1.72 | 5.2 |
| YOLOv8-ghost-EMA | 0.808 | 0.569 | 1.73 | 5.2 |
| YOLOv8-BiFPN | 0.836 | 0.598 | 2.79 | 8.3 |
| Resnet18 | 0.795 | 0.539 | 13.33 | 35.1 |
| YOLOv8-EfficientViT-EMA | 0.884 | 0.655 | 4.02 | 9.6 |
)], attaches=null, journal=Journal(id=1146119176004939786, delFlag=0, nameCn=科学技术与工程, nameEn=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, issn=1671-1815, eissn=, cn=11-4688/T, coden=null, periodic=4, language=CN, oaType=是, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=UKU/O7GSka5polgCTkbIIw==, journalPrice=null, startedYear=null, abbrevIsoEn=Sci Technol Eng, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1754445529766, createdBy=null, updatedBy=13701087609, firstLetterCn=S, firstLetterEn=S, subjectCode=Natural Sciences, subjectName=自然科学, subjectCodeEn=Natural Sciences, subjectNameEn=null, picCn=UKU/O7GSka5polgCTkbIIw==, picEn=5hwlULoNwcbj3xUmVi9MAQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1159791870395564357, language=CN, name=科学技术与工程, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529793, updatedTime=1754445529793, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=http://www.stae.com.cn/jsygc/site/menus/20090429150146001, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1159791870441701702, language=EN, name=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, 
managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529804, updatedTime=1754445529804, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1146123166801305609, websiteList=[Website(id=1148243202391400884, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/CN, language=CN, createTime=1751692112777, createBy=18614031015, updateTime=1753520965431, updateBy=18614031015, name=科学技术与工程-中文站点, tplId=1146099689490845704, title=科学技术与工程, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148622798802673703, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=articleTextType, value=kx, createTime=1751782615614, updateTime=1751782615614, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798781702180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=banner, value=null, createTime=1751782615609, updateTime=1751782615609, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798769119267, tenantId=1146029695717560320, journalId=null, 
journalGroupId=null, siteId=1148243202391400884, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1751782615606, updateTime=1751782615606, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798794285094, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782615612, updateTime=1751782615612, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798790090789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782615611, updateTime=1751782615611, creator=18614031015, updator=18614031015)]), Website(id=1155914124811976731, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/EN, language=EN, createTime=1753521003206, createBy=18614031015, updateTime=1753521003206, updateBy=18614031015, name=科学技术与工程-英文站点, tplId=1146101810881728533, title=Science Technology and Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155914371227308235, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=articleTextType, value=kx, createTime=1753521061952, updateTime=1753521061952, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371210531016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=banner, value=null, 
createTime=1753521061947, updateTime=1753521061947, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371202142407, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1753521061945, updateTime=1753521061945, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371223113930, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753521061950, updateTime=1753521061950, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371218919625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753521061949, updateTime=1753521061949, creator=18614031015, updator=18614031015)])], journalTitle=科学技术与工程, weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Science Technology and Engineering, journalPhotoCn=UKU/O7GSka5polgCTkbIIw==, journalPhotoEn=5hwlULoNwcbj3xUmVi9MAQ==, journalFirstLetter=S, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/10.12404/j.issn.1671-1815.2405983, detailUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/10.12404/j.issn.1671-1815.2405983, 
pdfUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/PDF/10.12404/j.issn.1671-1815.2405983, pdfUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/PDF/10.12404/j.issn.1671-1815.2405983, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)