Article(id=1244336192716652605, tenantId=1146029695717560320, journalId=1244323073571209252, issueId=1244336186114819067, articleNumber=null, orderNo=null, doi=10.13695/j.cnki.12-1222/o3.2025.10.002, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1728921600000, receivedDateStr=2024-10-15, revisedDate=null, revisedDateStr=null, acceptedDate=1753804800000, acceptedDateStr=2025-07-30, onlineDate=1774602466991, onlineDateStr=2026-03-27, pubDate=1761753600000, pubDateStr=2025-10-30, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1774602466991, onlineIssueDateStr=2026-03-27, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1774602466991, creator=13701087609, updateTime=1774602466991, updator=13701087609, issue=Issue{id=1244336186114819067, tenantId=1146029695717560320, journalId=1244323073571209252, year='2025', volume='33', issue='10', pageStart='955', pageEnd='1060', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=null, createTime=1774602465418, creator=13701087609, updateTime=1774604459075, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1244344548185452773, tenantId=1146029695717560320, journalId=1244323073571209252, issueId=1244336186114819067, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1244344548185452774, tenantId=1146029695717560320, journalId=1244323073571209252, issueId=1244336186114819067, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=963, endPage=971, ext={EN=ArticleExt(id=1244336193010253898, articleId=1244336192716652605, tenantId=1146029695717560320, 
journalId=1244323073571209252, language=EN, title=A fast heterogeneous image retrieval method for UAV scene matching and positioning, columnId=1244336188069364733, journalTitle=Journal of Chinese Inertial Technology, columnName=Integrated Navigation Technology, runingTitle=null, highlight=null, articleAbstract=
The scene matching and positioning of unmanned aerial vehicles (UAVs) are prone to mismatching or even retrieval failure due to differences in domain, observation angle and other factors between UAV images and satellite reference images. To address this issue, a rapid cross-source image retrieval method based on salient position features is proposed. Firstly, to solve the matching failure caused by scene and time differences between UAV images and reference images, a salient position feature extraction module is designed, which can extract more effective context information while reducing the computational complexity. Secondly, a label smoothing loss function is introduced to enhance the generalization ability of the model. Finally, a block-wise fine-tuning strategy is proposed to alleviate the overfitting problem of large models such as the vision transformer (ViT) under limited training data conditions. The experimental results show that the proposed method achieves 86.01% and 96.52% in R@1 and R@5, respectively, and 76.04% in mAP on the DenseUAV dataset, which are improvements of 5.83%, 3.53% and 9.49%, respectively, over ViT-S. The retrieval time for a single image is 9.55 ms on the DenseUAV dataset, indicating the effectiveness of the proposed method in UAV cross-source scene matching.
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Xiaoguo ZHANG, Tianyu LI, Zhihao SHI, Yujin KUANG), CN=ArticleExt(id=1244336202929783145, articleId=1244336192716652605, tenantId=1146029695717560320, journalId=1244323073571209252, language=CN, title=一种用于无人机景象匹配定位的异源图像快速检索方法, columnId=1244336188241331200, journalTitle=中国惯性技术学报, columnName=组合导航技术, runingTitle=null, highlight=null, articleAbstract=
无人机景象匹配定位时,由于无人机图像和卫星基准图像之间域、观察角度等因素不同,容易出现误匹配甚至检索失败。针对上述问题,提出了一种基于显著位置特征的异源图像快速检索方法。首先,针对无人机图像与基准图像因获取场景和时间差异导致匹配失败的问题,设计了显著位置特征提取模块,在降低计算复杂度的同时能够提取更有效的上下文信息。其次,引入标签平滑损失函数,提升了模型的泛化能力。最后,提出分块微调策略以缓解大模型视觉Transformer在有限训练数据条件下的过拟合问题。实验结果表明,所提方法在DenseUAV数据集上R@1和R@5分别达到了86.01%和96.52%,mAP达到了76.04%,较现有主流方法ViT-S分别提升5.83%、3.53%和9.49%,单张图像检索时间为9.55 ms,表明所提方法在无人机异源景象匹配中的有效性。
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=MYqBOseRIGtk12XSFRqjsA==, magXml=F+EclVMCNWkXrQ3IGAnToQ==, pdfUrl=null, pdf=etgd/2BTrydlfM2EK3OOWg==, pdfFileSize=2753591, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=jk93qXjtRSKIJFmqRU7qJA==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=ZAHZUW63kYwDhr0g1EXnCQ==, mapNumber=null, authorCompany=null, fund=null, authors=
张小国(1973—),男,教授,从事视觉导航定位。
, authorsList=张小国, 李天宇, 史志豪, 况余进)}, authors=[Author(id=1244336203693146502, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1244336203869307276, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336203693146502, language=EN, stringName=Xiaoguo ZHANG, firstName=Xiaoguo, middleName=null, lastName=ZHANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1244336204066439572, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336203693146502, language=CN, stringName=张小国, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=东南大学 仪器科学与工程学院,南京 210096, bio={"content":"
张小国(1973—),男,教授,从事视觉导航定位。
"}, bioImg=null, bioContent=
张小国(1973—),男,教授,从事视觉导航定位。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1244336203479236986, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, xref=null, ext=[AuthorCompanyExt(id=1244336203508597115, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China), AuthorCompanyExt(id=1244336203537957245, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=东南大学 仪器科学与工程学院,南京 210096)])]), Author(id=1244336204217434525, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1244336204381012389, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336204217434525, language=EN, stringName=Tianyu LI, firstName=Tianyu, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1244336204548784557, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336204217434525, language=CN, stringName=李天宇, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, 
authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=东南大学 仪器科学与工程学院,南京 210096, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1244336203479236986, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, xref=null, ext=[AuthorCompanyExt(id=1244336203508597115, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China), AuthorCompanyExt(id=1244336203537957245, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=东南大学 仪器科学与工程学院,南京 210096)])]), Author(id=1244336204666225073, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1244336206138425781, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336204666225073, language=EN, stringName=Zhihao SHI, firstName=Zhihao, middleName=null, lastName=SHI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1244336206255866299, tenantId=1146029695717560320, journalId=1244323073571209252, 
articleId=1244336192716652605, authorId=1244336204666225073, language=CN, stringName=史志豪, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=东南大学 仪器科学与工程学院,南京 210096, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1244336203479236986, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, xref=null, ext=[AuthorCompanyExt(id=1244336203508597115, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China), AuthorCompanyExt(id=1244336203537957245, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=东南大学 仪器科学与工程学院,南京 210096)])]), Author(id=1244336206356529605, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1244336206490747339, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336206356529605, language=EN, stringName=Yujin KUANG, firstName=Yujin, middleName=null, lastName=KUANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China, bio=null, 
bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1244336206603993552, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, authorId=1244336206356529605, language=CN, stringName=况余进, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=东南大学 仪器科学与工程学院,南京 210096, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1244336203479236986, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, xref=null, ext=[AuthorCompanyExt(id=1244336203508597115, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China), AuthorCompanyExt(id=1244336203537957245, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=东南大学 仪器科学与工程学院,南京 210096)])])], keywords=[Keyword(id=1244336206780154330, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, orderNo=1, keyword=GNSS-denied), Keyword(id=1244336206876623327, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, orderNo=2, keyword=UAV visual positioning), Keyword(id=1244336206964703716, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, orderNo=3, keyword=remote sensing imagery), Keyword(id=1244336207052784106, tenantId=1146029695717560320, journalId=1244323073571209252, 
articleId=1244336192716652605, language=EN, orderNo=4, keyword=heterogeneous image retrieval), Keyword(id=1244336207145058799, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, orderNo=1, keyword=GNSS拒止), Keyword(id=1244336207258305012, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, orderNo=2, keyword=无人机视觉定位), Keyword(id=1244336207379939834, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, orderNo=3, keyword=遥感影像), Keyword(id=1244336207606432258, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, orderNo=4, keyword=异源图像检索)], refs=[Reference(id=1244336213075804832, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2024, volume=32, issue=01, pageStart=052, pageEnd=057, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=尚克军, 赵亮, 张伟建, journalName=中国惯性技术学报, refType=null, unstructuredReference=尚克军, 赵亮, 张伟建,
等. 基于深度特征正射匹配的无人机视觉定位方法[J].
中国惯性技术学报,
2024,
32(01): 052-057., articleTitle=基于深度特征正射匹配的无人机视觉定位方法, refAbstract=null), Reference(id=1244336213180662437, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2024, volume=32, issue=01, pageStart=052, pageEnd=057, url=null, language=null, rfNumber=[1], rfOrder=1, authorNames=Shang K, Zhao L, Zhang W, journalName=Journal of Chinese Inertial Technology, refType=null, unstructuredReference=
Shang K,
Zhao L,
Zhang W,
et al. Unmanned aerial vehicle visual localization method based on deep feature orthorectification matching[J].
Journal of Chinese Inertial Technology,
2024,
32(01): 052-057., articleTitle=Unmanned aerial vehicle visual localization method based on deep feature orthorectification matching, refAbstract=null), Reference(id=1244336213390377644, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2022, volume=30, issue=05, pageStart=582, pageEnd=588, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=韩勇强, 于潇颖, 纪泽源, journalName=中国惯性技术学报, refType=null, unstructuredReference=韩勇强, 于潇颖, 纪泽源,
等. 面向城市复杂环境的GNSS/INS高精度图优化算法[J].
中国惯性技术学报,
2022,
30(05): 582-588., articleTitle=面向城市复杂环境的GNSS/INS高精度图优化算法, refAbstract=null), Reference(id=1244336213545566897, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2022, volume=30, issue=05, pageStart=582, pageEnd=588, url=null, language=null, rfNumber=[2], rfOrder=3, authorNames=Han Y, Yu X, Ji Z, journalName=Journal of Chinese Inertial Technology, refType=null, unstructuredReference=
Han Y,
Yu X,
Ji Z,
et al. The high-precision factor graph optimization algorithm of GNSS/INS for urban complex environment[J].
Journal of Chinese Inertial Technology,
2022,
30(05): 582-588., articleTitle=The high-precision factor graph optimization algorithm of GNSS/INS for urban complex environment, refAbstract=null), Reference(id=1244336215076487862, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2004, volume=60, issue=2, pageStart=91, pageEnd=110, url=null, language=null, rfNumber=[3], rfOrder=4, authorNames=Lowe D G, journalName=International Journal of Computer Vision, refType=null, unstructuredReference=
Lowe D G. Distinctive image features from scale-invariant keypoints[J].
International Journal of Computer Vision,
2004,
60(2): 91-110., articleTitle=Distinctive image features from scale-invariant keypoints, refAbstract=null), Reference(id=1244336215219094203, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1998, pageEnd=2006, url=null, language=null, rfNumber=[4], rfOrder=5, authorNames=Tian Y, Chen C, Shah M, journalName=null, refType=null, unstructuredReference=
Tian Y,
Chen C,
Shah M. Cross-view image matching for geo-localization in urban environments[C]//2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR).
2017: 1998-2006., articleTitle=Cross-view image matching for geo-localization in urban environments, refAbstract=null), Reference(id=1244336215323951806, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2024, volume=32, issue=04, pageStart=363, pageEnd=370+378, url=null, language=null, rfNumber=[5], rfOrder=6, authorNames=王小攀, 李建胜, 王安成, journalName=中国惯性技术学报, refType=null, unstructuredReference=王小攀, 李建胜, 王安成,
等. 面向无人机绝对定位的遥感影像快速检索方法[J].
中国惯性技术学报,
2024,
32(04): 363-370+378., articleTitle=面向无人机绝对定位的遥感影像快速检索方法, refAbstract=null), Reference(id=1244336215449780930, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2024, volume=32, issue=04, pageStart=363, pageEnd=370+378, url=null, language=null, rfNumber=[5], rfOrder=7, authorNames=Wang X, Li J, Wang A, journalName=Journal of Chinese Inertial Technology, refType=null, unstructuredReference=
Wang X,
Li J,
Wang A,
et al. Fast retrieval method of remote sensing image for UAV absolute location[J].
Journal of Chinese Inertial Technology,
2024,
32(04): 363-370+378., articleTitle=Fast retrieval method of remote sensing image for UAV absolute location, refAbstract=null), Reference(id=1244336215521084102, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[6], rfOrder=8, authorNames=Dosovitskiy A, Beyer L, Kolesnikov A, journalName=arxiv preprint arxiv: 2010.11929, refType=null, unstructuredReference=
Dosovitskiy A,
Beyer L,
Kolesnikov A,
et al. An image is worth 16x16 words: transformers for image recognition at scale[J].
arxiv preprint arxiv: 2010.11929,
2020., articleTitle=An image is worth 16x16 words: transformers for image recognition at scale, refAbstract=null), Reference(id=1244336215592387275, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2022, volume=32, issue=7, pageStart=4376, pageEnd=4389, url=null, language=null, rfNumber=[7], rfOrder=9, authorNames=Dai M, Hu J H, Zhuang J D, journalName=IEEE Transactions on Circuits and Systems for Video Technology, refType=null, unstructuredReference=
Dai M,
Hu J H,
Zhuang J D,
et al. A transformer-based feature segmentation and region alignment method for UAV-view geo-localization[J].
IEEE Transactions on Circuits and Systems for Video Technology,
2022,
32(7): 4376-4389., articleTitle=A transformer-based feature segmentation and region alignment method for UAV-view geo-localization, refAbstract=null), Reference(id=1244336215676273357, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[8], rfOrder=10, authorNames=Yang H, Lu X, Zhu Y, journalName=arxiv preprint arxiv: 2107.00842, refType=null, unstructuredReference=
Yang H,
Lu X,
Zhu Y. Cross-view geo-localization with evolving transformer[J].
arxiv preprint arxiv: 2107.00842,
2021., articleTitle=Cross-view geo-localization with evolving transformer, refAbstract=null), Reference(id=1244336215797908181, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2023, volume=33, issue=null, pageStart=493, pageEnd=508, url=null, language=null, rfNumber=[9], rfOrder=11, authorNames=Dai M, Zheng E, Feng Z, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Dai M,
Zheng E,
Feng Z,
et al. Vision-based UAV self-positioning in low-altitude urban environments[J].
IEEE Transactions on Image Processing,
2023,
33: 493-508., articleTitle=Vision-based UAV self-positioning in low-altitude urban environments, refAbstract=null), Reference(id=1244336215923737309, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2022, volume=140, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[10], rfOrder=12, authorNames=Zhang K, Qi S, Cai J, journalName=Computers in biology and medicine, refType=null, unstructuredReference=
Zhang K,
Qi S,
Cai J,
et al. Content-based image retrieval with a convolutional siamese neural network: Distinguishing lung cancer and tuberculosis in CT images[J].
Computers in biology and medicine,
2022,
140: 105096., articleTitle=Content-based image retrieval with a convolutional siamese neural network: Distinguishing lung cancer and tuberculosis in CT images, refAbstract=null), Reference(id=1244336216024400609, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[11], rfOrder=13, authorNames=Yuan Z, Zhang H, Lu P, journalName=arXiv preprint arXiv: 2406.08552, refType=null, unstructuredReference=
Yuan Z,
Zhang H,
Lu P,
et al. Ditfastattn: Attention compression for diffusion transformer models[J].
arXiv preprint arXiv: 2406.08552,
2024., articleTitle=Ditfastattn: Attention compression for diffusion transformer models, refAbstract=null), Reference(id=1244336216120869605, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=285, pageEnd=302, url=null, language=null, rfNumber=[12], rfOrder=14, authorNames=Wang P, Wang X, Wang F, journalName=null, refType=null, unstructuredReference=
Wang P,
Wang X,
Wang F,
et al. Kvt: k-nn attention for boosting vision transformers[C]//European conference on computer vision. Cham: Springer Nature Switzerland,
2022: 285-302., articleTitle=Kvt: k-nn attention for boosting vision transformers, refAbstract=null), Reference(id=1244336216221532903, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[13], rfOrder=15, authorNames=Fang S, Li K, Li Z, journalName=arxiv preprint arxiv: 2106.04996, refType=null, unstructuredReference=
Fang S,
Li K,
Li Z. Salient positions based attention network for image classification[J].
arxiv preprint arxiv: 2106.04996,
2021., articleTitle=Salient positions based attention network for image classification, refAbstract=null), Reference(id=1244336216313807594, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2023, volume=62, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[14], rfOrder=16, authorNames=Gao T, Li Z, Wen Y, journalName=IEEE Transactions on Geoscience and Remote Sensing, refType=null, unstructuredReference=
Gao T,
Li Z,
Wen Y,
et al. Attention-free global multiscale fusion network for remote sensing object detection[J].
IEEE Transactions on Geoscience and Remote Sensing,
2023,
62: 5603214., articleTitle=Attention-free global multiscale fusion network for remote sensing object detection, refAbstract=null), Reference(id=1244336216443831022, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=1, pageEnd=8, url=null, language=null, rfNumber=[15], rfOrder=17, authorNames=Huo J, journalName=Security and Communication Networks, refType=null, unstructuredReference=
Huo J. A study of spatial attention and squeeze excitation block fusion improved resnet for identifying bank notes[J].
Security and Communication Networks,
2021: 1-8., articleTitle=A study of spatial attention and squeeze excitation block fusion improved resnet for identifying bank notes, refAbstract=null), Reference(id=1244336216557077231, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=10347, pageEnd=10357, url=null, language=null, rfNumber=[16], rfOrder=18, authorNames=Touvron H, Cord M, Douze M, journalName=null, refType=null, unstructuredReference=
Touvron H,
Cord M,
Douze M,
et al. Training data-efficient image transformers & distillation through attention[C]//International conference on machine learning. PMLR,
2021: 10347-10357., articleTitle=Training data-efficient image transformers & distillation through attention, refAbstract=null), Reference(id=1244336216695489268, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[17], rfOrder=19, authorNames=Howard J, Ruder S, journalName=arxiv preprint arxiv: 1801.06146, refType=null, unstructuredReference=
Howard J,
Ruder S. Fine-tuned language models for text classification[J].
arxiv preprint arxiv: 1801.06146,
2018., articleTitle=Fine-tuned language models for text classification, refAbstract=null), Reference(id=1244336216859067127, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2021, volume=13, issue=19, pageStart=3979, pageEnd=null, url=null, language=null, rfNumber=[18], rfOrder=20, authorNames=Zhuang J, Dai M, Chen X, journalName=Remote Sensing, refType=null, unstructuredReference=
Zhuang J,
Dai M,
Chen X,
et al. A faster and more effective cross-view matching method of UAV and satellite images for UAV geolocalization[J].
Remote Sensing,
2021,
13(19): 3979., articleTitle=A faster and more effective cross-view matching method of UAV and satellite images for UAV geolocalization, refAbstract=null), Reference(id=1244336216955536120, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2021, volume=32, issue=2, pageStart=867, pageEnd=879, url=null, language=null, rfNumber=[19], rfOrder=21, authorNames=Wang T, Zheng Z, Yan C, journalName=IEEE Transactions on Circuits and Systems for Video Technology, refType=null, unstructuredReference=
Wang T,
Zheng Z,
Yan C,
et al. Each part matters: Local patterns facilitate cross-view geo-localization[J].
IEEE Transactions on Circuits and Systems for Video Technology,
2021,
32(2): 867-879., articleTitle=Each part matters: Local patterns facilitate cross-view geo-localization, refAbstract=null), Reference(id=1244336217081365244, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[20], rfOrder=22, authorNames=Chen Q, Wang T, Yang Z, journalName=arXiv preprint arXiv: 2403.04172, refType=null, unstructuredReference=
Chen Q,
Wang T,
Yang Z,
et al. SDPL: Shifting-dense partition learning for UAV-view geo-localization[J].
arXiv preprint arXiv: 2403.04172,
2024., articleTitle=SDPL: Shifting-dense partition learning for UAV-view geo-localization, refAbstract=null)], funds=[Fund(id=1244336212908032664, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, awardId=62073078, language=CN, fundingSource=国家自然科学基金(62073078), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1244336203479236986, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, xref=null, ext=[AuthorCompanyExt(id=1244336203508597115, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=School of Instrument Science and Engineering, Southeast University, Nanjing 210096, China), AuthorCompanyExt(id=1244336203537957245, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, companyId=1244336203479236986, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=东南大学 仪器科学与工程学院,南京 210096)])], figs=[ArticleFig(id=1244336207891644944, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.1, caption=
Fast algorithm for heterogeneous image retrieval, figureFileSmall=bM2sXWw9UcPIENLJV7V0lg==, figureFileBig=jk93qXjtRSKIJFmqRU7qJA==, tableContent=null), ArticleFig(id=1244336208030056979, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图1, caption=
异源图像快速检索算法, figureFileSmall=bM2sXWw9UcPIENLJV7V0lg==, figureFileBig=jk93qXjtRSKIJFmqRU7qJA==, tableContent=null), ArticleFig(id=1244336208311075355, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.2, caption=
SPNet model structure diagram, figureFileSmall=OUtM3pu0bbREbrOgdQCI8Q==, figureFileBig=pVwP09uvAqEGTQCugJoNgw==, tableContent=null), ArticleFig(id=1244336208428515872, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图2, caption=
SPNet模型结构图, figureFileSmall=OUtM3pu0bbREbrOgdQCI8Q==, figureFileBig=pVwP09uvAqEGTQCugJoNgw==, tableContent=null), ArticleFig(id=1244336208499819044, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.3, caption=
SPKA module diagram, figureFileSmall=qPpGWWNFZHFQJvEV0B+x3g==, figureFileBig=ME0/81tneDpZg3j4939nHg==, tableContent=null), ArticleFig(id=1244336208587899432, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图3, caption=
SPKA模块图, figureFileSmall=qPpGWWNFZHFQJvEV0B+x3g==, figureFileBig=ME0/81tneDpZg3j4939nHg==, tableContent=null), ArticleFig(id=1244336208671785518, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.4, caption=
UAV view of the dataset, figureFileSmall=fXI0sys6S//4Sf/FooqYPg==, figureFileBig=ubc6EajEluAn6xTuHx/DiA==, tableContent=null), ArticleFig(id=1244336208772448817, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图4, caption=
数据集无人机视角, figureFileSmall=fXI0sys6S//4Sf/FooqYPg==, figureFileBig=ubc6EajEluAn6xTuHx/DiA==, tableContent=null), ArticleFig(id=1244336208889889330, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.5, caption=
Satellite view of the dataset, figureFileSmall=dYJ+fcql0oAwUsKiHbJrgQ==, figureFileBig=Dz2SDL4eV8VtLOqqGhQSQQ==, tableContent=null), ArticleFig(id=1244336208998941240, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图5, caption=
数据集卫星视角, figureFileSmall=dYJ+fcql0oAwUsKiHbJrgQ==, figureFileBig=Dz2SDL4eV8VtLOqqGhQSQQ==, tableContent=null), ArticleFig(id=1244336210563416637, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.6, caption=
Comparison of R@K indicators of different methods, figureFileSmall=aOaMHrxGz3dVVbHpwxDyXA==, figureFileBig=RwzwymGCTz8RROplHu2CQA==, tableContent=null), ArticleFig(id=1244336210664079937, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图6, caption=
不同方法R@K指标对比, figureFileSmall=aOaMHrxGz3dVVbHpwxDyXA==, figureFileBig=RwzwymGCTz8RROplHu2CQA==, tableContent=null), ArticleFig(id=1244336210777326151, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.7, caption=
SPNet Retrieval results, figureFileSmall=aQzTzBT5KZbXo2VsQkVibQ==, figureFileBig=LPviqAmy63yPOXOF/7RCug==, tableContent=null), ArticleFig(id=1244336210873795143, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图7, caption=
SPNet检索结果, figureFileSmall=aQzTzBT5KZbXo2VsQkVibQ==, figureFileBig=LPviqAmy63yPOXOF/7RCug==, tableContent=null), ArticleFig(id=1244336210961875532, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Fig.8, caption=
Comparison of retrival results between SPNet and baseline, figureFileSmall=xjousl/Rb2nhwgtAZ83ZJw==, figureFileBig=ujc6QATCD/MhMv1ConMhyA==, tableContent=null), ArticleFig(id=1244336211070927440, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=图8, caption=
SPNet与基准模型检索结果对比, figureFileSmall=xjousl/Rb2nhwgtAZ83ZJw==, figureFileBig=ujc6QATCD/MhMv1ConMhyA==, tableContent=null), ArticleFig(id=1244336211179979349, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| Input: - 大小为[c, h*w]的矩阵Q |
|---|
| - 超参数k |
| Output: - 大小为[c, k]的矩阵K |
| 1.计算QT在通道维度上的平方 |
| 2.按照通道维度对QT求和,得到Qpow |
| 3.选择Qpow中最大的k个位置,记为indexk |
| 4.返回矩阵K=Q(c, indexk) |
), ArticleFig(id=1244336211280642650, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=算法1, caption=
SPS算法
, figureFileSmall=null, figureFileBig=null, tableContent=
| Input: - 大小为[c, h*w]的矩阵Q |
|---|
| - 超参数k |
| Output: - 大小为[c, k]的矩阵K |
| 1.计算QT在通道维度上的平方 |
| 2.按照通道维度对QT求和,得到Qpow |
| 3.选择Qpow中最大的k个位置,记为indexk |
| 4.返回矩阵K=Q(c, indexk) |
), ArticleFig(id=1244336211377111646, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 1. | 冻结所有的Transformer块B |
| 2. | 初始化参数: |
| t=2, b=12, lr=3e-4, lrdecay=0.85 |
| 3. | while 0 <=i<epochs do |
| | if i%t==0 and b > 0 then |
| | | unfreeze B[b] |
| | | b←b-1 |
| | | lr←lr*lrdecay |
), ArticleFig(id=1244336211486163554, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=算法2, caption=
分块微调
, figureFileSmall=null, figureFileBig=null, tableContent=
| 1. | 冻结所有的Transformer块B |
| 2. | 初始化参数: |
| t=2, b=12, lr=3e-4, lrdecay=0.85 |
| 3. | while 0 <=i<epochs do |
| | if i%t==0 and b > 0 then |
| | | unfreeze B[b] |
| | | b←b-1 |
| | | lr←lr*lrdecay |
), ArticleFig(id=1244336211700073065, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Tab.1, caption=
Experimental environment configuration
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验环境 | 配置 |
|---|
| CPU | Intel(R) Xeon(R) Gold 6330CPU @ 2.00GHz |
| GPU | NVIDIA GeForce RTX 3090 |
| 深度学习框架 | Pytorch 1.10.0 |
| 编程语言 | Python 3.8 |
| 操作系统 | Ubuntu 18.04 |
), ArticleFig(id=1244336211796542062, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=表1, caption=
实验环境配置
, figureFileSmall=null, figureFileBig=null, tableContent=
| 实验环境 | 配置 |
|---|
| CPU | Intel(R) Xeon(R) Gold 6330CPU @ 2.00GHz |
| GPU | NVIDIA GeForce RTX 3090 |
| 深度学习框架 | Pytorch 1.10.0 |
| 编程语言 | Python 3.8 |
| 操作系统 | Ubuntu 18.04 |
), ArticleFig(id=1244336211934954096, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Tab.2, caption=
Dense UAV dataset composition
, figureFileSmall=null, figureFileBig=null, tableContent=
| Subset | UAV | Satellite | Classes | Universities |
|---|
| Training | 6768 | 13536 | 2256 | 10 |
| Query | 2331 | 4662 | 777 | 4 |
| Gallery | 9099 | 18198 | 3033 | 14 |
), ArticleFig(id=1244336212035617396, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=表2, caption=
DenseUAV数据集构成
, figureFileSmall=null, figureFileBig=null, tableContent=
| Subset | UAV | Satellite | Classes | Universities |
|---|
| Training | 6768 | 13536 | 2256 | 10 |
| Query | 2331 | 4662 | 777 | 4 |
| Gallery | 9099 | 18198 | 3033 | 14 |
), ArticleFig(id=1244336212144669303, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Tab.3, caption=
The impact of different improvement methods on model performance
, figureFileSmall=null, figureFileBig=null, tableContent=
| Method | R@1 | R@5 |
|---|
| Baseline | 80.18% | 93.99% |
| Baseline+LSCE | 81.77% | 94.55% |
| Baseline+SPKA | 84.98% | 95.71% |
| Baseline+BW-FT | 80.49% | 94.15% |
| Baseline+LSCE+SPKA+BW-FT | 86.01% | 96.52% |
), ArticleFig(id=1244336212253721215, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=表3, caption=
不同改进方法对模型性能的影响
, figureFileSmall=null, figureFileBig=null, tableContent=
| Method | R@1 | R@5 |
|---|
| Baseline | 80.18% | 93.99% |
| Baseline+LSCE | 81.77% | 94.55% |
| Baseline+SPKA | 84.98% | 95.71% |
| Baseline+BW-FT | 80.49% | 94.15% |
| Baseline+LSCE+SPKA+BW-FT | 86.01% | 96.52% |
), ArticleFig(id=1244336212337607295, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Tab.4, caption=
Performance comparison of different methods on DenseUAV dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| Method | Params | InferTime | R@1 | R@5 | mAP |
|---|
| ResNet50 | 27.8 M | 10.20 ms | 16.52% | 39.30% | 23.14% |
| EfficientNet-B3 | 14.1 M | 23.40 ms | 42.81% | 64.52% | 39.7% |
| EfficientNet-B5 | 32.3 M | 33.85 ms | 44.96% | 67.78% | 47.25% |
| ConvNext-T | 30.1 M | 8.45 ms | 60.23% | 81.94% | 46.27% |
| DeiT-S | 23.7 M | 9.60 ms | 71.77% | 89.70% | 59.35% |
| PvTv2-B2 | 26.8 M | 20.45 ms | 77.99% | 92.79% | 67.76% |
| Swinv2-T | 29.9 M | 19.25 ms | 77.99% | 92.49% | 69.05% |
| ViT-S(Baseline)[9] | 23.3 M | 9.45 ms | 80.18% | 93.99% | 69.45% |
| FSRA | 26.0 M | 10.55 ms | 82.58% | 94.94% | 69.80% |
| LPN | 26.0 M | 10.60 ms | 83.05% | 94.89% | 73.12% |
| SPNet(ours) | 23.6 M | 9.55 ms | 86.01% | 96.52% | 76.04% |
), ArticleFig(id=1244336212480213641, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=表4, caption=
DenseUAV数据集上不同方法性能对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| Method | Params | InferTime | R@1 | R@5 | mAP |
|---|
| ResNet50 | 27.8 M | 10.20 ms | 16.52% | 39.30% | 23.14% |
| EfficientNet-B3 | 14.1 M | 23.40 ms | 42.81% | 64.52% | 39.7% |
| EfficientNet-B5 | 32.3 M | 33.85 ms | 44.96% | 67.78% | 47.25% |
| ConvNext-T | 30.1 M | 8.45 ms | 60.23% | 81.94% | 46.27% |
| DeiT-S | 23.7 M | 9.60 ms | 71.77% | 89.70% | 59.35% |
| PvTv2-B2 | 26.8 M | 20.45 ms | 77.99% | 92.79% | 67.76% |
| Swinv2-T | 29.9 M | 19.25 ms | 77.99% | 92.49% | 69.05% |
| ViT-S(Baseline)[9] | 23.3 M | 9.45 ms | 80.18% | 93.99% | 69.45% |
| FSRA | 26.0 M | 10.55 ms | 82.58% | 94.94% | 69.80% |
| LPN | 26.0 M | 10.60 ms | 83.05% | 94.89% | 73.12% |
| SPNet(ours) | 23.6 M | 9.55 ms | 86.01% | 96.52% | 76.04% |
), ArticleFig(id=1244336212668957327, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=EN, label=Tab.5, caption=
Comparison of performance with different SOTA methods
, figureFileSmall=null, figureFileBig=null, tableContent=
| Method | BackBone | R@1 | R@5 |
|---|
| MSBA | ResNet50 | 46.13% | 64.22% |
| LPN | ResNet50 | 32.43% | 56.80% |
| SDPL | ResNet50 | 7.08% | 14.07% |
| LPN | ViT-S | 83.05% | 94.89% |
| Baseline | ViT-S | 80.18% | 93.99% |
| SPNet(Ours) | ViT-S | 86.01% | 96.52% |
), ArticleFig(id=1244336212765426322, tenantId=1146029695717560320, journalId=1244323073571209252, articleId=1244336192716652605, language=CN, label=表5, caption=
不同SOTA方法性能对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| Method | BackBone | R@1 | R@5 |
|---|
| MSBA | ResNet50 | 46.13% | 64.22% |
| LPN | ResNet50 | 32.43% | 56.80% |
| SDPL | ResNet50 | 7.08% | 14.07% |
| LPN | ViT-S | 83.05% | 94.89% |
| Baseline | ViT-S | 80.18% | 93.99% |
| SPNet(Ours) | ViT-S | 86.01% | 96.52% |
)], attaches=null, journal=Journal(id=1244322988720439331, delFlag=0, nameCn=中国惯性技术学报, nameEn=Journal of Chinese Inertial Technology, nameHistory1=null, nameHistory2=null, issn=1005-6734, eissn=null, cn=12-1222/O3, coden=null, periodic=0, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=7nvD63MqplRkIkJ92cFBSg==, journalPrice=null, startedYear=null, abbrevIsoEn=Journal of Chinese Inertial Technology, journalRemark=null, publicationField=null, createdTime=1774599318917, updatedTime=1774599470892, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=J, firstLetterEn=J, subjectCode=Engineering, subjectName=null, subjectCodeEn=Engineering, subjectNameEn=null, picCn=7nvD63MqplRkIkJ92cFBSg==, picEn=Hm2jABG2m8rYJTbG/YkinA==, jcr=null, cjcr=null, exts=[JournalExt(id=1244323626233741507, language=CN, name=中国惯性技术学报, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1774599470909, updatedTime=1774599470909, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.zggxjsxb.com/journalx_zggxjs/authorLogOn.action, submissionEditorUrl=http://www.zggxjsxb.com/journalx_zggxjs/editorLogOn.action, submissionReviewUrl=http://www.zggxjsxb.com/journalx_zggxjs/expertLogOn.action, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1244323626288267460, language=EN, name=Journal of Chinese Inertial Technology, nameHistory1=null, nameHistory2=null, 
managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1774599470922, updatedTime=1774599470922, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.zggxjsxb.com/journalx_zggxjs/authorLogOn.action, submissionEditorUrl=http://www.zggxjsxb.com/journalx_zggxjs/editorLogOn.action, submissionReviewUrl=http://www.zggxjsxb.com/journalx_zggxjs/expertLogOn.action, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1244323073571209252, websiteList=[Website(id=1244323687596409029, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1244323073571209252, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zggxjsxb/CN, language=CN, createTime=1774599485546, createBy=18614031015, updateTime=1774599505954, updateBy=18614031015, name=中国惯性技术学报-中文, tplId=1146099689490845704, title=中国惯性技术学报, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1244325136388698877, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=articleTextType, value=kx, createTime=1774599830958, updateTime=1774599830958, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136342561530, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=banner, value=null, createTime=1774599830947, updateTime=1774599830947, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136443224832, tenantId=1146029695717560320, 
journalId=null, journalGroupId=null, siteId=1244323687596409029, code=grayFlag, value=0, createTime=1774599830971, updateTime=1774599830971, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136313201401, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=logo, value=https://castjournals.cast.org.cn/joweb/zggxjsxb/CN/file/pic?fileId=ouj3QpSM21aiIQie73dEiw==, createTime=1774599830940, updateTime=1774599830940, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136468390658, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=minRunFlag, value=0, createTime=1774599830977, updateTime=1774599830977, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136371921660, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zggxjsxb/CN/file/pic, createTime=1774599830954, updateTime=1774599830954, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136460002049, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=silenceFlag, value=0, createTime=1774599830975, updateTime=1774599830975, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136355144443, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1774599830950, updateTime=1774599830950, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136401281790, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687596409029, code=themeColor, value=null, createTime=1774599830961, updateTime=1774599830961, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325136409670399, tenantId=1146029695717560320, journalId=null, 
journalGroupId=null, siteId=1244323687596409029, code=themeStyle, value=null, createTime=1774599830964, updateTime=1774599830964, creator=18614031015, updator=18614031015)]), Website(id=1244323687697072327, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1244323073571209252, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zggxjsxb/EN, language=EN, createTime=1774599485564, createBy=18614031015, updateTime=1774599521174, updateBy=18614031015, name=中国惯性技术学报-英文, tplId=1146101810881728533, title=Journal of Chinese Inertial Technology, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1244325165878850311, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=articleTextType, value=kx, createTime=1774599837989, updateTime=1774599837989, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165849490180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=banner, value=null, createTime=1774599837982, updateTime=1774599837982, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165899821834, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=grayFlag, value=0, createTime=1774599837994, updateTime=1774599837994, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165841101571, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=logo, value=https://castjournals.cast.org.cn/joweb/zggxjsxb/EN/file/pic?fileId=ouj3QpSM21aiIQie73dEiw==, createTime=1774599837980, updateTime=1774599837980, creator=18614031015, updator=18614031015), 
WebsiteProps(id=1244325165916599052, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=minRunFlag, value=0, createTime=1774599837998, updateTime=1774599837998, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165870461702, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zggxjsxb/EN/file/pic, createTime=1774599837987, updateTime=1774599837987, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165908210443, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=silenceFlag, value=0, createTime=1774599837996, updateTime=1774599837996, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165862073093, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1774599837985, updateTime=1774599837985, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165887238920, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=themeColor, value=null, createTime=1774599837991, updateTime=1774599837991, creator=18614031015, updator=18614031015), WebsiteProps(id=1244325165895627529, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1244323687697072327, code=themeStyle, value=null, createTime=1774599837993, updateTime=1774599837993, creator=18614031015, updator=18614031015)])], journalTitle=中国惯性技术学报, weixinUrl=null, journalUrl=http://www.zggxjsxb.com/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Journal of Chinese Inertial Technology, journalPhotoCn=7nvD63MqplRkIkJ92cFBSg==, journalPhotoEn=Hm2jABG2m8rYJTbG/YkinA==, journalFirstLetter=J, journalRecommend=null, journalNew=null, journalCollection=null, 
jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/zggxjsxb/CN/10.13695/j.cnki.12-1222/o3.2025.10.002, detailUrlEn=https://castjournals.cast.org.cn/joweb/zggxjsxb/EN/10.13695/j.cnki.12-1222/o3.2025.10.002, pdfUrlCn=https://castjournals.cast.org.cn/joweb/zggxjsxb/CN/PDF/10.13695/j.cnki.12-1222/o3.2025.10.002, pdfUrlEn=https://castjournals.cast.org.cn/joweb/zggxjsxb/EN/PDF/10.13695/j.cnki.12-1222/o3.2025.10.002, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)