Article(id=1251226683488022656, tenantId=1146029695717560320, journalId=1251194772300279900, issueId=1251226682309423223, articleNumber=null, orderNo=null, doi=10.20079/j.issn.1001-893x.240812001, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1723392000000, receivedDateStr=2024-08-12, revisedDate=1728748800000, revisedDateStr=2024-10-13, acceptedDate=null, acceptedDateStr=null, onlineDate=1776245288011, onlineDateStr=2026-04-15, pubDate=1764259200000, pubDateStr=2025-11-28, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1776245288011, onlineIssueDateStr=2026-04-15, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1776245288011, creator=13041195026, updateTime=1776245288011, updator=13041195026, issue=Issue{id=1251226682309423223, tenantId=1146029695717560320, journalId=1251194772300279900, year='2025', volume='65', issue='11', pageStart='1729', pageEnd='1954', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1776245287729, creator=13041195026, updateTime=1776246742124, updator=13041195026, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1251232782568080068, tenantId=1146029695717560320, journalId=1251194772300279900, issueId=1251226682309423223, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1251232782568080069, tenantId=1146029695717560320, journalId=1251194772300279900, issueId=1251226682309423223, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=1798, endPage=1805, ext={EN=ArticleExt(id=1251226683756458113, articleId=1251226683488022656, tenantId=1146029695717560320, 
journalId=1251194772300279900, language=EN, title=Pyramid-enhanced and Cross-semantic Interaction Network for Lightweight Real-time Image Object Detection, columnId=1251226683223781499, journalTitle=Telecommunication Engineering, columnName=Application Fundamental Research and Advanced Technology, runingTitle=null, highlight=null, articleAbstract=
Recently, with the development of deep learning, the field of lightweight object detection has witnessed significant progress. However, mainstream lightweight detectors ignore the extraction of multi-scale semantic information. In addition, these approaches ignore the relationship between deep semantic features and shallow detail features. To address the above shortcomings, a Pyramid Pooling Enhanced Multi-scale Network (PPMENet) is proposed, and an Efficient Pyramid Pooling Block (EPPB) is designed to extract multi-scale deep semantic information, strengthening the feature expression ability of the model. Furthermore, a Cross Semantic Level Interaction Attention Module (CSIAM) is designed to enhance information interaction between features at different semantic levels. Experimental results on the MS COCO 2017 test set show that PPMENet achieves 28.0% average precision with a model size of only 2.16×10⁶ and 0.97 GFLOPs, and reaches an inference speed of 218 frame/s. Compared with other methods, PPMENet achieves a good balance between detection accuracy and model execution efficiency.
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Wei LU), CN=ArticleExt(id=1251226695362097668, articleId=1251226683488022656, tenantId=1146029695717560320, journalId=1251194772300279900, language=CN, title=基于金字塔增强与跨语义交互的轻量图像目标检测网络, columnId=1251226683383165054, journalTitle=电讯技术, columnName=应用基础与前沿技术, runingTitle=null, highlight=null, articleAbstract=
近年来,轻量化目标检测领域取得了显著进展。然而,现有主流方法缺乏多尺度语义信息的提取,且忽略了深层语义特征与浅层细节特征之间的关系。针对上述缺陷,提出了金字塔池化多尺度增强网络(Pyramid Pooling Enhanced Multi-scale Network,PPMENet),通过设计一个高效金字塔池化模块(Efficient Pyramid Pooling Block,EPPB)来提取多尺度深层语义信息,以加强模型的特征表达能力。另一方面,设计了跨语义交互注意力模块(Cross Semantic Level Interaction Attention Module,CSIAM)以增强不同语义特征之间的联系。MS COCO 2017测试集的实验结果表明,PPMENet取得了28.0%平均精度,模型大小仅有2.16×10⁶,GFLOPs为0.97,并获得了218 frame/s的推理速度。与其他方法相比,PPMENet在精度和执行效率间取得了较好的平衡。
, correspAuthors=null, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=MfOayf/yLXsTIPeVDc1reg==, magXml=eyKmdO8PBokg8JelsWFdJg==, pdfUrl=null, pdf=1FlcDU42yvIzSKEbrpZdXg==, pdfFileSize=5408002, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=5EYox508DG1bzawYCU4+VA==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=CPv1I460TkK2r8pfemLY8Q==, mapNumber=null, authorCompany=null, fund=null, authors=
陆蔚 女,1977年生于江苏无锡,2010年获工程硕士学位,现为副教授、高级工程师,主要研究方向为计算机视觉、图像处理。
, authorsList=陆蔚)}, authors=[Author(id=1251226695815082545, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=4137701@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1251226695919940153, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, authorId=1251226695815082545, language=EN, stringName=Wei LU, firstName=Wei, middleName=null, lastName=LU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=School of Internet of Things Engineering,Jiangsu Vocational College of Information Technology,Wuxi 214153,China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1251226696041574981, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, authorId=1251226695815082545, language=CN, stringName=陆蔚, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=江苏信息职业技术学院 物联网工程学院,江苏 无锡 214153, bio={"content":"
陆蔚 女,1977年生于江苏无锡,2010年获工程硕士学位,现为副教授、高级工程师,主要研究方向为计算机视觉、图像处理。
"}, bioImg=null, bioContent=
陆蔚 女,1977年生于江苏无锡,2010年获工程硕士学位,现为副教授、高级工程师,主要研究方向为计算机视觉、图像处理。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1251226695689253408, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, xref=null, ext=[AuthorCompanyExt(id=1251226695697642017, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, companyId=1251226695689253408, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Internet of Things Engineering,Jiangsu Vocational College of Information Technology,Wuxi 214153,China), AuthorCompanyExt(id=1251226695710224932, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, companyId=1251226695689253408, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=江苏信息职业技术学院 物联网工程学院,江苏 无锡 214153)])])], keywords=[Keyword(id=1251226696175792725, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, orderNo=1, keyword=real-time image object detection), Keyword(id=1251226696310010464, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, orderNo=2, keyword=lightweight network), Keyword(id=1251226696435839599, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, orderNo=3, keyword=multi-scale feature extraction), Keyword(id=1251226696603611770, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, orderNo=4, keyword=attention mechanism), Keyword(id=1251226696712663686, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, orderNo=5, keyword=feature fusion), Keyword(id=1251226696851075730, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, orderNo=1, keyword=实时图像目标检测), 
Keyword(id=1251226696943350424, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, orderNo=2, keyword=轻量级网络), Keyword(id=1251226697077568165, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, orderNo=3, keyword=多尺度特征提取), Keyword(id=1251226697174037168, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, orderNo=4, keyword=注意力机制), Keyword(id=1251226697287283384, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, orderNo=5, keyword=特征融合)], refs=[Reference(id=1251226700806304621, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2023, volume=63, issue=9, pageStart=1291, pageEnd=1299, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=李翠锦, 瞿中, journalName=电讯技术, refType=null, unstructuredReference=李翠锦, 瞿中.复杂交通环境下多层交叉融合多目标检测[J].
电讯技术,
2023,
63(9):1291-1299., articleTitle=复杂交通环境下多层交叉融合多目标检测, refAbstract=null), Reference(id=1251226700940522355, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2022, volume=62, issue=2, pageStart=259, pageEnd=265, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=杨艳红, 钟宝江, 徐云龙, journalName=电讯技术, refType=null, unstructuredReference=杨艳红, 钟宝江, 徐云龙,
等.改进的SSD算法在智慧交通中的应用[J].
电讯技术,
2022,
62(2):259-265., articleTitle=改进的SSD算法在智慧交通中的应用, refAbstract=null), Reference(id=1251226701057962874, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=1314, pageEnd=1324, url=null, language=null, rfNumber=[3], rfOrder=2, authorNames=HOWARD A, SANDLER M, CHEN B, journalName=null, refType=null, unstructuredReference=
HOWARD A,
SANDLER M,
CHEN B,
et al. Searching for MobileNetV3[C]//2019 IEEE/CVF International Conference on Computer Vision. Seoul: IEEE,
2019:1314-1324., articleTitle=Searching for MobileNetV3, refAbstract=null), Reference(id=1251226701158626178, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=6717, pageEnd=6726, url=null, language=null, rfNumber=[4], rfOrder=3, authorNames=QIN Z, LI Z M, ZHANG Z N, journalName=null, refType=null, unstructuredReference=
QIN Z,
LI Z M,
ZHANG Z N,
et al. ThunderNet:towards real-time generic object detection on mobile devices[C]//2019 IEEE/CVF International Conference on Computer Vision. Seoul:IEEE,
2019:6717-6726., articleTitle=ThunderNet:towards real-time generic object detection on mobile devices, refAbstract=null), Reference(id=1251226701267678087, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=122, pageEnd=138, url=null, language=null, rfNumber=[5], rfOrder=4, authorNames=MA N N, ZHANG X Y, ZHENG H T, journalName=null, refType=null, unstructuredReference=
MA N N,
ZHANG X Y,
ZHENG H T,
et al. ShuffleNet V2: practical guidelines for efficient CNN architecture design[C]//2018 European Conference on Computer Vision. Cham:Springer,
2018:122-138., articleTitle=ShuffleNet V2: practical guidelines for efficient CNN architecture design, refAbstract=null), Reference(id=1251226701372535695, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=13024, pageEnd=13033, url=null, language=null, rfNumber=[6], rfOrder=5, authorNames=WANG C Y, BOCHKOVSKIY A, LIAO H M, journalName=null, refType=null, unstructuredReference=
WANG C Y,
BOCHKOVSKIY A,
LIAO H M. Scaled-YOLOv4:scaling cross stage partial network[C]//2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Nashville:IEEE,
2021:13024-13033., articleTitle=Scaled-YOLOv4:scaling cross stage partial network, refAbstract=null), Reference(id=1251226701473198999, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=59, pageEnd=70, url=null, language=null, rfNumber=[7], rfOrder=6, authorNames=LI Y, LI J, LIN W, journalName=null, refType=null, unstructuredReference=
LI Y,
LI J,
LIN W,
et al. Tiny-DSOD:lightweight object detection for resource-restricted usages[C]//The 29th British Machine Vision Conference. Newcastle: ACM,
2018:59-70., articleTitle=Tiny-DSOD:lightweight object detection for resource-restricted usages, refAbstract=null), Reference(id=1251226701569667998, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=936, pageEnd=944, url=null, language=null, rfNumber=[8], rfOrder=7, authorNames=LIN T Y, DOLLÁR P, GIRSHICK R, journalName=null, refType=null, unstructuredReference=
LIN T Y,
DOLLÁR P,
GIRSHICK R,
et al. Feature pyramid networks for object detection[C]//2017 IEEE Conference on Computer Vision and Pattern Recognition. Honolulu:IEEE,
2017:936-944., articleTitle=Feature pyramid networks for object detection, refAbstract=null), Reference(id=1251226701779383209, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=2243, pageEnd=2247, url=null, language=null, rfNumber=[9], rfOrder=8, authorNames=TANG Q K, LI J, SHI Z P, journalName=null, refType=null, unstructuredReference=
TANG Q K,
LI J,
SHI Z P,
et al. LightDet:a lightweight and accurate object detection network[C]//2020 IEEE International Conference on Acoustics,Speech and Signal Processing. Barcelona:IEEE,
2020:2243-2247., articleTitle=LightDet:a lightweight and accurate object detection network, refAbstract=null), Reference(id=1251226701896823729, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=10778, pageEnd=10787, url=null, language=null, rfNumber=[10], rfOrder=9, authorNames=TAN M X, PANG R M, LE Q V, journalName=null, refType=null, unstructuredReference=
TAN M X,
PANG R M,
LE Q V. EfficientDet:scalable and efficient object detection[C]//2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle:IEEE,
2020:10778-10787., articleTitle=EfficientDet:scalable and efficient object detection, refAbstract=null), Reference(id=1251226701989098429, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=2730, pageEnd=2734, url=null, language=null, rfNumber=[11], rfOrder=10, authorNames=ZHANG Y M, LEE C C, HSIEH J W, journalName=null, refType=null, unstructuredReference=
ZHANG Y M,
LEE C C,
HSIEH J W,
et al. CSL-YOLO:a cross-stage lightweight object detector with low FLOPs[C]//2022 IEEE International Symposium on Circuits and Systems. Austin:IEEE,
2022:2730-2734., articleTitle=CSL-YOLO:a cross-stage lightweight object detector with low FLOPs, refAbstract=null), Reference(id=1251226702098150346, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2006, volume=null, issue=null, pageStart=850, pageEnd=855, url=null, language=null, rfNumber=[12], rfOrder=11, authorNames=NEUBECK A, VAN G, journalName=null, refType=null, unstructuredReference=
NEUBECK A,
VAN G. Efficient non-maximum suppression[C]//The 18th International Conference on Pattern Recognition. Hong Kong,China:IEEE,
2006:850-855., articleTitle=Efficient non-maximum suppression, refAbstract=null), Reference(id=1251226702186230743, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=7132, pageEnd=7141, url=null, language=null, rfNumber=[13], rfOrder=12, authorNames=HU J, SHEN L, SUN G, journalName=null, refType=null, unstructuredReference=
HU J,
SHEN L,
SUN G. Squeeze-and-excitation networks[C]//2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Salt Lake City: IEEE,
2018:7132-7141., articleTitle=Squeeze-and-excitation networks, refAbstract=null), Reference(id=1251226703784260575, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=740, pageEnd=755, url=null, language=null, rfNumber=[14], rfOrder=13, authorNames=LIN T Y, MAIRE M, BELONGIE S, journalName=null, refType=null, unstructuredReference=
LIN T Y,
MAIRE M,
BELONGIE S,
et al. Microsoft COCO:common objects in context[C]//2014 European Conference on Computer Vision. Cham: Springer,
2014:740-755., articleTitle=Microsoft COCO:common objects in context, refAbstract=null), Reference(id=1251226703880729578, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2010, volume=88, issue=2, pageStart=303, pageEnd=338, url=null, language=null, rfNumber=[15], rfOrder=14, authorNames=EVERINGHAM M, VAN GOOL L, WILLIAMS C K I, journalName=International Journal of Computer Vision, refType=null, unstructuredReference=
EVERINGHAM M,
VAN GOOL L,
WILLIAMS C K I,
et al. The pascal visual object classes(VOC) challenge[J].
International Journal of Computer Vision,
2010,
88(2):303-338., articleTitle=The pascal visual object classes(VOC) challenge, refAbstract=null), Reference(id=1251226703989781492, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=1086, pageEnd=1097, url=null, language=null, rfNumber=[16], rfOrder=15, authorNames=MICIKEVICIUS P, NARANH S, ALBEN J, journalName=null, refType=null, unstructuredReference=
MICIKEVICIUS P,
NARANH S,
ALBEN J,
et al. Mixed Precision Training[C]//The 6th International Conference on Learning Representations. Vancouver:IEEE,
2018:1086-1097., articleTitle=Mixed Precision Training, refAbstract=null), Reference(id=1251226704086250494, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2024-08-20, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[17], rfOrder=16, authorNames=GE Z, LIU S, WANG F, journalName=null, refType=null, unstructuredReference=
GE Z,
LIU S,
WANG F,
et al. YOLOx:exceeding YOLO series in 2021[EB/OL]. (2021-08-06)[
2024-08-20].
https://arxiv.org/abs/2107.08430., articleTitle=YOLOx:exceeding YOLO series in 2021, refAbstract=null), Reference(id=1251226704191107076, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=21, pageEnd=37, url=null, language=null, rfNumber=[18], rfOrder=17, authorNames=LIU W, ANGUELOV D, ERHAN D, journalName=null, refType=null, unstructuredReference=
LIU W,
ANGUELOV D,
ERHAN D,
et al. SSD:single shot MultiBox detector[C]//The 14th European Conference on Computer Vision. Cham:Springer,
2016:21-37., articleTitle=SSD:single shot MultiBox detector, refAbstract=null), Reference(id=1251226704279187467, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=7464, pageEnd=7475, url=null, language=null, rfNumber=[19], rfOrder=18, authorNames=WANG C Y, BOCHKOVSKIY A, LIAO H M, journalName=null, refType=null, unstructuredReference=
WANG C Y,
BOCHKOVSKIY A,
LIAO H M. YOLOv7:trainable bag-of-freebies sets new state-of-the-art for real-time object detectors[C]//2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Vancouver:IEEE,
2023:7464-7475., articleTitle=YOLOv7:trainable bag-of-freebies sets new state-of-the-art for real-time object detectors, refAbstract=null), Reference(id=1251226704379850774, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2024-08-20, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[20], rfOrder=19, authorNames=WANG C Y, YEH I H, LIAO H Y M, journalName=null, refType=null, unstructuredReference=
WANG C Y,
YEH I H,
LIAO H Y M. YOLOv9:learning what you want to learn using programmable gradient information[EB/OL]. (2024-02-21)[
2024-08-20].
https://arxiv.org/abs/2402.13616., articleTitle=YOLOv9:learning what you want to learn using programmable gradient information, refAbstract=null), Reference(id=1251226704484708381, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=3421, pageEnd=3446, url=null, language=null, rfNumber=[21], rfOrder=20, authorNames=MEHTA S, RASTEGARI M, journalName=null, refType=null, unstructuredReference=
MEHTA S,
RASTEGARI M. MobileViT: light-weight, general-purpose, and mobile-friendly vision transformer[C]//The 10th International Conference on Learning Representations. Washington DC:IEEE,
2022:3421-3446., articleTitle=MobileViT: light-weight, general-purpose, and mobile-friendly vision transformer, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1251226695689253408, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, xref=null, ext=[AuthorCompanyExt(id=1251226695697642017, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, companyId=1251226695689253408, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Internet of Things Engineering,Jiangsu Vocational College of Information Technology,Wuxi 214153,China), AuthorCompanyExt(id=1251226695710224932, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, companyId=1251226695689253408, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=江苏信息职业技术学院 物联网工程学院,江苏 无锡 214153)])], figs=[ArticleFig(id=1251226697505387210, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=t8yqRP/QD4H4PzpRqOV1sw==, figureFileBig=5EYox508DG1bzawYCU4+VA==, tableContent=null), ArticleFig(id=1251226697647993558, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=图1, caption=
PPMENet的整体结构, figureFileSmall=t8yqRP/QD4H4PzpRqOV1sw==, figureFileBig=5EYox508DG1bzawYCU4+VA==, tableContent=null), ArticleFig(id=1251226699346686701, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=MqX//0cQCirm2Cpan6JUig==, figureFileBig=nV/dIUVLX8zs1fDWeWYMcQ==, tableContent=null), ArticleFig(id=1251226699451544308, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=图2, caption=
PPSU两个版本的详细结构, figureFileSmall=MqX//0cQCirm2Cpan6JUig==, figureFileBig=nV/dIUVLX8zs1fDWeWYMcQ==, tableContent=null), ArticleFig(id=1251226699556401916, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=GSLaRPf57wuC4meMpZEQWw==, figureFileBig=J/YpGNtO/1DRRtfuhI6qPw==, tableContent=null), ArticleFig(id=1251226699648676618, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=图3, caption=
EPPB详细结构, figureFileSmall=GSLaRPf57wuC4meMpZEQWw==, figureFileBig=J/YpGNtO/1DRRtfuhI6qPw==, tableContent=null), ArticleFig(id=1251226699736757012, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=6vyxvkWpIvcTbIgZeGMzpQ==, figureFileBig=qUUFtE4PfJRHP3ZFwIYQYg==, tableContent=null), ArticleFig(id=1251226699850003227, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=图4, caption=
CSIAM的详细结构, figureFileSmall=6vyxvkWpIvcTbIgZeGMzpQ==, figureFileBig=qUUFtE4PfJRHP3ZFwIYQYg==, tableContent=null), ArticleFig(id=1251226699933889315, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=iThV06BaQZN3b4HX2dHLTQ==, figureFileBig=VAd7/IzLpmbZg79JNz4Vgg==, tableContent=null), ArticleFig(id=1251226700021969709, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=图5, caption=
PPMENet在MS COCO测试集中和其他方法的检测结果对比, figureFileSmall=iThV06BaQZN3b4HX2dHLTQ==, figureFileBig=VAd7/IzLpmbZg79JNz4Vgg==, tableContent=null), ArticleFig(id=1251226700101661494, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | FLOPs/10⁹ | 参数量/10⁶ | AP/% | AP50/% | AP75/% | 推理速度/(frame/s) |
|---|---|---|---|---|---|---|
| MobileNetV3-SSDLite [3] | 0.8 | 4.3 | 22.1 | — | — | — |
| MobileViT-XS-SSDLite [21] | — | 2.7 | 24.8 | — | — | 76 |
| SSD[18] | 38.6 | 34.3 | 25.5 | 43.6 | 36.2 | — |
| Tiny-DSOD[7] | 1.12 | 1.15 | 23.2 | 40.4 | 22.8 | 105 |
| Tiny-YOLOV4[6] | 3.45 | 6.1 | 21.7 | 40.2 | — | 371 |
| Nano YOLOX[17] | 1.08 | 0.91 | 25.3 | — | — | — |
| Tiny-YOLOX[17] | 6.45 | 5.06 | 31.8 | 49.0 | 33.8 | — |
| CSL-YOLO[11] | 1.4 | 3.2 | 24.5 | 44.0 | 24.2 | — |
| Tiny-YOLOV7[19] | 13.8 | 6.3 | 38.7 | 56.7 | 41.7 | 273 |
| PPMENet | 0.97 | 2.16 | 28.0 | 44.4 | 29.4 | 218 |
), ArticleFig(id=1251226700210713408, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=表1, caption=
PPMENet在MS COCO 2017测试集上与其他轻量级检测器的性能对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | FLOPs/10⁹ | 参数量/10⁶ | AP/% | AP50/% | AP75/% | 推理速度/(frame/s) |
|---|---|---|---|---|---|---|
| MobileNetV3-SSDLite [3] | 0.8 | 4.3 | 22.1 | — | — | — |
| MobileViT-XS-SSDLite [21] | — | 2.7 | 24.8 | — | — | 76 |
| SSD[18] | 38.6 | 34.3 | 25.5 | 43.6 | 36.2 | — |
| Tiny-DSOD[7] | 1.12 | 1.15 | 23.2 | 40.4 | 22.8 | 105 |
| Tiny-YOLOV4[6] | 3.45 | 6.1 | 21.7 | 40.2 | — | 371 |
| Nano YOLOX[17] | 1.08 | 0.91 | 25.3 | — | — | — |
| Tiny-YOLOX[17] | 6.45 | 5.06 | 31.8 | 49.0 | 33.8 | — |
| CSL-YOLO[11] | 1.4 | 3.2 | 24.5 | 44.0 | 24.2 | — |
| Tiny-YOLOV7[19] | 13.8 | 6.3 | 38.7 | 56.7 | 41.7 | 273 |
| PPMENet | 0.97 | 2.16 | 28.0 | 44.4 | 29.4 | 218 |
), ArticleFig(id=1251226700332348233, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | GFLOPs | 参数量/10⁶ | mAP/% | 速度/(frame/s) |
|---|---|---|---|---|
| SSD[18] | 35.3 | 26.29 | 76.5 | 46 |
| Tiny-DSOD[7] | 1.10 | — | 72.1 | 105 |
| ThunderNet[4] | 1.30 | — | 78.6 | 214 |
| PPMENet | 0.95 | 2.14 | 78.2 | 252 |
), ArticleFig(id=1251226700412040014, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=表2, caption=
PPMENet在Pascal VOC 2007测试集上与其他检测器的性能对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | GFLOPs | 参数量/10⁶ | mAP/% | 速度/(frame/s) |
|---|---|---|---|---|
| SSD[18] | 35.3 | 26.29 | 76.5 | 46 |
| Tiny-DSOD[7] | 1.10 | — | 72.1 | 105 |
| ThunderNet[4] | 1.30 | — | 78.6 | 214 |
| PPMENet | 0.95 | 2.14 | 78.2 | 252 |
), ArticleFig(id=1251226700542063448, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | EPPB | CSIAM-CA | CSIAM-SA | 参数量/10⁶ | GFLOPs | AP/% |
|---|---|---|---|---|---|---|
| PPMENet | × | × | × | 1.78 | 0.85 | 25.2 |
|  | √ | × | × | 2.01 | 0.91 | 26.8 |
|  | √ | √ | × | 2.07 | 0.94 | 27.3 |
|  | √ | × | √ | 2.10 | 0.95 | 27.2 |
|  | √ | √ | √ | 2.16 | 0.97 | 27.7 |
), ArticleFig(id=1251226700655309664, tenantId=1146029695717560320, journalId=1251194772300279900, articleId=1251226683488022656, language=CN, label=表3, caption=
本文所提出的模块消融实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | EPPB | CSIAM-CA | CSIAM-SA | 参数量/10⁶ | GFLOPs | AP/% |
|---|---|---|---|---|---|---|
| PPMENet | × | × | × | 1.78 | 0.85 | 25.2 |
|  | √ | × | × | 2.01 | 0.91 | 26.8 |
|  | √ | √ | × | 2.07 | 0.94 | 27.3 |
|  | √ | × | √ | 2.10 | 0.95 | 27.2 |
|  | √ | √ | √ | 2.16 | 0.97 | 27.7 |
)], attaches=null, journal=Journal(id=1251193998841266264, delFlag=0, nameCn=电讯技术, nameEn=Telecommunication Engineering, nameHistory1=null, nameHistory2=null, issn=1001-893X, eissn=null, cn=51-1267/TN, coden=null, periodic=0, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=CpBmHoMzpESavU+iEMTBmw==, journalPrice=null, startedYear=null, abbrevIsoEn=Telecommunication Engineering, journalRemark=null, publicationField=null, createdTime=1776237495387, updatedTime=1776238086301, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=T, firstLetterEn=T, subjectCode=Engineering, subjectName=null, subjectCodeEn=Engineering, subjectNameEn=null, picCn=CpBmHoMzpESavU+iEMTBmw==, picEn=jCOIy2zOaGJZ/y3z2gPZzg==, jcr=null, cjcr=null, exts=[JournalExt(id=1251196477385687352, language=CN, name=电讯技术, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1776238086315, updatedTime=1776238086315, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://www.teleonline.cn/dxjs/ch/author/login.aspx, submissionEditorUrl=https://www.teleonline.cn/dxjs/ch/login.aspx, submissionReviewUrl=https://www.teleonline.cn/dxjs/ch/auditor/login.aspx, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1251196477469573433, language=EN, name=Telecommunication Engineering, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, 
officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1776238086335, updatedTime=1776238086335, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://www.teleonline.cn/dxjs/ch/author/login.aspx, submissionEditorUrl=https://www.teleonline.cn/dxjs/ch/login.aspx, submissionReviewUrl=https://www.teleonline.cn/dxjs/ch/auditor/login.aspx, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1251194772300279900, websiteList=[Website(id=1251197148327522670, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1251194772300279900, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/dxjs/CN, language=CN, createTime=1776238246280, createBy=18614031015, updateTime=1776238378770, updateBy=18614031015, name=电讯技术-中文, tplId=1146099689490845704, title=电讯技术, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1251197904854135502, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=articleTextType, value=kx, createTime=1776238426650, updateTime=1776238426650, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904833163979, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=banner, value=null, createTime=1776238426645, updateTime=1776238426645, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904870912721, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=grayFlag, value=0, 
createTime=1776238426654, updateTime=1776238426654, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904824775370, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=logo, value=https://castjournals.cast.org.cn/joweb/dxjs/CN/file/pic?fileId=BBd4SC9puESjyaw04bneig==, createTime=1776238426643, updateTime=1776238426643, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904883495635, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=minRunFlag, value=0, createTime=1776238426657, updateTime=1776238426657, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904845746893, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/dxjs/CN/file/pic, createTime=1776238426648, updateTime=1776238426648, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904875107026, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=silenceFlag, value=0, createTime=1776238426655, updateTime=1776238426655, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904841552588, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1776238426647, updateTime=1776238426647, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904858329807, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=themeColor, value=null, createTime=1776238426651, updateTime=1776238426651, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197904866718416, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148327522670, code=themeStyle, value=null, 
createTime=1776238426653, updateTime=1776238426653, creator=18614031015, updator=18614031015)]), Website(id=1251197148512072052, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1251194772300279900, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/dxjs/EN, language=EN, createTime=1776238246324, createBy=18614031015, updateTime=1776238398944, updateBy=18614031015, name=电讯技术-英文, tplId=1146101810881728533, title=Telecommunication Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1251197930175152619, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=articleTextType, value=kx, createTime=1776238432687, updateTime=1776238432687, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930154181096, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=banner, value=null, createTime=1776238432682, updateTime=1776238432682, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930200318446, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=grayFlag, value=0, createTime=1776238432693, updateTime=1776238432693, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930141598183, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=logo, value=https://castjournals.cast.org.cn/joweb/dxjs/EN/file/pic?fileId=BBd4SC9puESjyaw04bneig==, createTime=1776238432679, updateTime=1776238432679, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930212901360, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, 
code=minRunFlag, value=0, createTime=1776238432696, updateTime=1776238432696, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930170958314, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/dxjs/EN/file/pic, createTime=1776238432686, updateTime=1776238432686, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930204512751, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=silenceFlag, value=0, createTime=1776238432694, updateTime=1776238432694, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930162569705, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1776238432684, updateTime=1776238432684, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930183541228, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=themeColor, value=null, createTime=1776238432689, updateTime=1776238432689, creator=18614031015, updator=18614031015), WebsiteProps(id=1251197930191929837, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1251197148512072052, code=themeStyle, value=null, createTime=1776238432691, updateTime=1776238432691, creator=18614031015, updator=18614031015)])], journalTitle=电讯技术, weixinUrl=null, journalUrl=https://www.teleonline.cn/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Telecommunication Engineering, journalPhotoCn=CpBmHoMzpESavU+iEMTBmw==, journalPhotoEn=jCOIy2zOaGJZ/y3z2gPZzg==, journalFirstLetter=T, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, 
citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/dxjs/CN/10.20079/j.issn.1001-893x.240812001, detailUrlEn=https://castjournals.cast.org.cn/joweb/dxjs/EN/10.20079/j.issn.1001-893x.240812001, pdfUrlCn=https://castjournals.cast.org.cn/joweb/dxjs/CN/PDF/10.20079/j.issn.1001-893x.240812001, pdfUrlEn=https://castjournals.cast.org.cn/joweb/dxjs/EN/PDF/10.20079/j.issn.1001-893x.240812001, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)