Article(id=1249044011915350829, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, articleNumber=null, orderNo=null, doi=10.11834/jig.240615, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1729440000000, receivedDateStr=2024-10-21, revisedDate=1747843200000, revisedDateStr=2025-05-22, acceptedDate=null, acceptedDateStr=null, onlineDate=1775724898555, onlineDateStr=2026-04-09, pubDate=1765814400000, pubDateStr=2025-12-16, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1775724898555, onlineIssueDateStr=2026-04-09, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1775724898555, creator=13041195026, updateTime=1775724898555, updator=13041195026, issue=Issue{id=1249044006114628363, tenantId=1146029695717560320, journalId=1249024232475115590, year='2025', volume='30', issue='12', pageStart='3707', pageEnd='3968', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1775724897161, creator=13041195026, updateTime=1775726353303, updator=13041195026, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1249050113662984471, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1249050113667178776, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=3870, endPage=3883, ext={EN=ArticleExt(id=1249044013215585084, articleId=1249044011915350829, tenantId=1146029695717560320, journalId=1249024232475115590, language=EN, title=Adaptive ground-truth heatmap generation for bottom-up human pose estimation, columnId=1249044008786400014, journalTitle=Journal of Image and Graphics, columnName=Image Understanding and Computer Vision, runingTitle=null, highlight=null, articleAbstract=
Objective Human pose estimation aims to locate skeletal keypoints of individuals in a given image. As a fundamental task in computer vision, human pose estimation has wide applications in human activity recognition, person re-identification, pose tracking, and related fields. Two main approaches for human pose estimation are available: top-down and bottom-up. Top-down methods first detect human bodies in the image, crop out each person, and then estimate the keypoint coordinates. While effective, these methods perform poorly in cases of occlusion, and their computation cost increases with the number of people in the image. In contrast, bottom-up methods detect all identity-independent keypoints simultaneously and then group them into individual poses. These methods are typically lightweight and fast but must handle varying human scales. Bottom-up human pose estimation methods commonly use 2D Gaussian kernels to generate keypoint heatmaps as regression targets because they provide rich spatial information. However, conventional approaches apply Gaussian kernels with a fixed variance across all keypoints, resulting in uniform heatmap structures. This uniformity is problematic given the existing scale variability in bottom-up methods. On the one hand, different keypoints cover different pixel areas in images, and using large Gaussian kernels may introduce semantic ambiguity, particularly for small joints. On the other hand, differences in keypoint scale imply different levels of annotation uncertainty, which the heatmap variance should ideally reflect. The variance of the Gaussian kernel represents uncertainty; thus, it should be proportional to the scale and ambiguity associated with each keypoint. Aiming to address these issues, an adaptive heatmap generation network (AHGNet) for bottom-up human pose estimation is proposed. AHGNet estimates the appropriate radius of the Gaussian kernel for each keypoint by integrating inherent scale information and geometric relationships. Through formula derivation, the relationship between the radius and the Gaussian kernel variance is established, enabling the creation of customized, scale-adaptive ground-truth heatmaps. This approach improves localization accuracy by effectively aligning the heatmap structure with the spatial characteristics of each keypoint.
Method First, an adaptive heatmap generation module is introduced. This module combines the inherent scale information from image features and the geometric relationship between adjacent keypoints to constrain the coverage areas of kernels. Keypoint scale is defined by semantic coverage areas in images. However, in the actual scene, accurately allowing pixel areas to occupy keypoints is almost impossible, and determining the potential relationship between Gaussian kernels and coverage areas is difficult. Interestingly, the areas occupied by keypoints are found to be related to geometric distance from adjacent keypoints. Therefore, an adaptive heatmap generation module is introduced to generate kernel scale maps of keypoints. This module combine the geometric relationship between adjacent keypoints and inherent scale information from image features. Second, local probabilistic consistency loss is presented to define the distance between the predicted and ground truth heatmaps globally and locally. Most methods based on heatmap regression use L2 loss for supervised learning. However, as the loss function for heatmap regression, L2 loss assumes that each pixel point is independent and overlooks the local structural correlation, making it difficult to describe the probability distribution of heatmaps. A keypoint heatmap is a probability distribution that describes pixels belonging to a certain joint. Thus, KL Divergence must be added to describe local probability consistency. Moreover, samples with large prediction errors are difficult to predict; thus, the weight of difficult samples should be increased. Similarly, the weight of easily detected samples should be reduced. Therefore, the dynamic weight is added to balance the contribution of different samples. Inspired by focal loss, which allows the model to actively focus on hard-to-detect samples, this paper utilizes dynamic weights to reduce the contribution of easily detected samples while enhancing the contribution of hard-to-detect samples.
Result HrHRNet is used as the baseline to establish AHGNet for bottom-up human pose estimation. The model is tested on two public datasets: MS COCO and CrowdPose. Experimental results reveal that AHGNet surpasses HrHRNet in terms of average precision (AP), achieving 72.1% AP and 74.1% AP on COCO test-dev and CrowdPose dataset, providing improvements of +1.6% AP and +6.5% AP, respectively. In addition, the substantial improvement on the CrowdPose dataset with crowded scenes indicates that AHGNet helps alleviate the problem of human scale changes in complex crowded scenes. Simultaneously, the ablation experiments verified the effectiveness of the proposed method.
Conclusion AHGNet leverages geometric features between adjacent keypoints and inherent scale information within the image to generate adaptive heatmaps as groundtruth. This network further employs a local probability consistency loss function to address the challenges posed by various human scales, effectively improving the accuracy of bottom-up human pose estimation. AHGNet provides a new paradigm for optimizing supervision signals in bottom-up pose estimation. By dynamically adjusting the Gaussian kernel scale and enforcing local probability constraints, it effectively reduces multiscale ambiguity in complex scenarios.
, correspAuthors=Kaige Li, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Ling Jiang, Zhuocheng Liu, Yuan Xiong, Wei Wu, Kaige Li), CN=ArticleExt(id=1249044019725145058, articleId=1249044011915350829, tenantId=1146029695717560320, journalId=1249024232475115590, language=CN, title=面向自下而上人体姿态估计的自适应真值热力图生成方法, columnId=1249044009054835474, journalTitle=中国图象图形学报, columnName=图像理解和计算机视觉, runingTitle=null, highlight=null, articleAbstract=
目的 热力图回归方法因能够提供丰富的空间信息,在人体姿态估计领域受到广泛关注。然而,由于传统真值热力图通常由固定标准差的2D高斯核覆盖标注点位置生成,当人体尺度变化较大时,固定的高斯核覆盖范围可能与关键点的实际语义区域不匹配,导致模型对关键点定位的模糊性和语义不确定性。对此,提出面向自下而上人体姿态估计的自适应真值热力图生成方法。
方法 首先设计一种自适应真值热力图生成模块,通过学习图像中关键点的固有尺度信息以及近邻关键点之间的几何关系生成自适应尺度因子,为图像定制尺度自适应的真值热力图。另外,由于现有方法使用的热力图损失函数未能有效捕捉局部结构的相关性,导致其对关键点位置偏差不敏感。为此,提出局部概率一致性损失函数,通过在热力图的局部区域上计算结构相似性,提升模型对局部结构的学习和理解,同时引入动态权重来平衡样本的贡献,进一步引导模型优化方向,提高模型鲁棒性。
结果 在两个公开数据集MS COCO(Microsoft common objects in context)和CrowdPose上进行实验评估,实验结果表明所提方法相较对比工作,关键点检测平均准确率分别提高1.6%与6.5%,达到72.1%和74.1%,验证了所提方法的有效性。此外,所提方法在拥挤场景的CrowPose数据集上也能带来显著的性能提升,这进一步表明其能够有效缓解复杂场景中的人体尺度变化带来的问题。同时消融实验验证了所提方法的有效性。
结论 提出的面向自下而上人体姿态估计的自适应真值热力图生成方法,通过学习图像中关键点的固有尺度信息以及近邻关键点之间的几何关系生成自适应热力图作为真值,结合局部概率一致性损失函数来处理图像中尺度变化问题,有效提高了人体姿态估计准确率。
, correspAuthors=李凯歌, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=vvWAzAf4sK6I3pa9umrEjg==, magXml=hIuejL3tSYYZqcwpB1ZPKA==, pdfUrl=null, pdf=mZ4RlQgioHwNQik9ygY9BA==, pdfFileSize=12377567, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=slEhsZ689y+AYOvUldC8lg==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=tef0UkK/DVpz+SYhLINj/g==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=江玲, 刘卓程, 熊源, 吴威, 李凯歌)}, authors=[Author(id=1249044020270403593, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=jiangjiang@aust.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044020484313104, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044020270403593, language=EN, stringName=Ling Jiang, firstName=Ling, middleName=null, lastName=Jiang, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer Science and Engineering, Anhui University of Science & Technology, Huainan232001, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044022069760025, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044020270403593, language=CN, stringName=江玲, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1安徽理工大学计算机科学与工程学院,淮南232001, bio={"content":"
江玲,女,讲师,主要研究方向为计算机视觉和图像分析与理解。E-mail: jiangjiang@aust.edu.cn
"}, bioImg=null, bioContent=
江玲,女,讲师,主要研究方向为计算机视觉和图像分析与理解。E-mail: jiangjiang@aust.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044020022940660, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=1, ext=[AuthorCompanyExt(id=1249044020031329269, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020022940660, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Anhui University of Science & Technology, Huainan232001, China), AuthorCompanyExt(id=1249044020048106486, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020022940660, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1安徽理工大学计算机科学与工程学院,淮南232001)])]), Author(id=1249044022250115111, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=likg@mail.sysu.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044022405304372, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044022250115111, language=EN, stringName=Zhuocheng Liu, firstName=Zhuocheng, middleName=null, lastName=Liu, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044022522744890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044022250115111, language=CN, stringName=刘卓程, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191, bio={"content":"
李凯歌,通信作者,男,博士后,主要研究方向为计算机视觉、图像分析与理解和虚拟现实。E-mail: likg@mail.sysu.edu.cn
"}, bioImg=null, bioContent=
李凯歌,通信作者,男,博士后,主要研究方向为计算机视觉、图像分析与理解和虚拟现实。E-mail: likg@mail.sysu.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044020173934592, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=2, ext=[AuthorCompanyExt(id=1249044020182323202, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China), AuthorCompanyExt(id=1249044020194906116, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191)])]), Author(id=1249044022627602501, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=zcliu@buaa.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044022698905675, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044022627602501, language=EN, stringName=Yuan Xiong, firstName=Yuan, middleName=null, lastName=Xiong, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044024653451345, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044022627602501, language=CN, stringName=熊源, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191, bio={"content":"
刘卓程,男,硕士研究生,主要研究方向为计算机视觉和图像分析与理解。E-mail: zcliu@buaa.edu.cn
"}, bioImg=null, bioContent=
刘卓程,男,硕士研究生,主要研究方向为计算机视觉和图像分析与理解。E-mail: zcliu@buaa.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044020173934592, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=2, ext=[AuthorCompanyExt(id=1249044020182323202, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China), AuthorCompanyExt(id=1249044020194906116, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191)])]), Author(id=1249044024833806427, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=xiongyuanxy@buaa.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044025035133033, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044024833806427, language=EN, stringName=Wei Wu, firstName=Wei, middleName=null, lastName=Wu, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044026616385647, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044024833806427, language=CN, stringName=吴威, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191, bio={"content":"
熊源,男,博士研究生,主要研究方向为计算机视觉和三维重建。E-mail: xiongyuanxy@buaa.edu.cn
"}, bioImg=null, bioContent=
熊源,男,博士研究生,主要研究方向为计算机视觉和三维重建。E-mail: xiongyuanxy@buaa.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044020173934592, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=2, ext=[AuthorCompanyExt(id=1249044020182323202, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China), AuthorCompanyExt(id=1249044020194906116, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191)])]), Author(id=1249044026725437558, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, orderNo=4, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=wuwei@buaa.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1249044026821906555, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044026725437558, language=EN, stringName=Kaige Li, firstName=Kaige, middleName=null, lastName=Li, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, *, address=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044026909986946, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, authorId=1249044026725437558, language=CN, stringName=李凯歌, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, *, address=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191, bio={"content":"
吴威,男,教授,博士生导师,主要研究方向为计算机视觉、图像分析与理解和虚拟现实。E-mail: wuwei@buaa.edu.cn
"}, bioImg=null, bioContent=
吴威,男,教授,博士生导师,主要研究方向为计算机视觉、图像分析与理解和虚拟现实。E-mail: wuwei@buaa.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044020173934592, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=2, ext=[AuthorCompanyExt(id=1249044020182323202, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China), AuthorCompanyExt(id=1249044020194906116, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191)])])], keywords=[Keyword(id=1249044027031621767, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, orderNo=1, keyword=human pose estimation), Keyword(id=1249044027115507853, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, orderNo=2, keyword=adaptive scale), Keyword(id=1249044027191005329, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, orderNo=3, keyword=bottom-up), Keyword(id=1249044027274891415, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, orderNo=4, keyword=heatmap regression), Keyword(id=1249044027362971805, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, orderNo=5, keyword=dynamic weight), Keyword(id=1249044027480412325, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, orderNo=1, keyword=人体姿态估计), Keyword(id=1249044027555909803, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, orderNo=2, keyword=自适应尺度), Keyword(id=1249044027677544623, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, orderNo=3, keyword=自下而上), Keyword(id=1249044027736264884, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, orderNo=4, keyword=热力图回归), Keyword(id=1249044027820150971, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, orderNo=5, keyword=动态权重)], refs=[Reference(id=1249044031959929146, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=11833, pageEnd=11843, url=null, language=null, rfNumber=null, rfOrder=0, authorNames=Brasó G, Kister N and Leal-Taixé L, journalName=null, refType=null, unstructuredReference=
Brasó G,
Kister N and Leal-Taixé L.
2021. The center of attention: center-keypoint grouping via attention for multi-person pose estimation//Proceedings of 2021 IEEE/CVF International Conference on Computer Vision. Montreal, Canada: IEEE:11833-11843 [DOI:
10.1109/ICCV48922.2021.01164], articleTitle=The center of attention: center-keypoint grouping via attention for multi-person pose estimation, refAbstract=null), Reference(id=1249044032043815230, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=455, pageEnd=472, url=null, language=null, rfNumber=null, rfOrder=1, authorNames=Cai Y H, Wang Z C, Luo Z X, Yin B Y, Du A G, Wang H Q, Zhang X Y, Zhou X Y, Zhou E J, Sun J, journalName=null, refType=null, unstructuredReference=
Cai Y H,
Wang Z C,
Luo Z X,
Yin B Y,
Du A G,
Wang H Q,
Zhang X Y,
Zhou X Y,
Zhou E J and
Sun J.
2020. Learning delicate local representations for multi-person pose estimation//Proceedings of the 16th European Conference on Computer Vision. Glasgow, UK: Springer:455-472 [DOI:
10.1007/978-3-030-58580-8_27], articleTitle=Learning delicate local representations for multi-person pose estimation, refAbstract=null), Reference(id=1249044032136089922, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1302, pageEnd=1310, url=null, language=null, rfNumber=null, rfOrder=2, authorNames=Cao Z, Simon T, Wei S E, Sheikh Y, journalName=null, refType=null, unstructuredReference=
Cao Z,
Simon T,
Wei S E and
Sheikh Y.
2017. Realtime multi-person 2D pose estimation using part affinity fields//Proceedings of 2017 IEEE Conference on Computer Vision and Pattern Recognition. Honolulu, USA: IEEE:1302-1310 [DOI:
10.1109/CVPR.2017.143], articleTitle=Realtime multi-person 2D pose estimation using part affinity fields, refAbstract=null), Reference(id=1249044032236753221, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=7103, pageEnd=7112, url=null, language=null, rfNumber=null, rfOrder=3, authorNames=Chen Y L, Wang Z C, Peng Y X, Zhang Z Q, Yu G, Sun J, journalName=null, refType=null, unstructuredReference=
Chen Y L,
Wang Z C,
Peng Y X,
Zhang Z Q,
Yu G and
Sun J.
2018. Cascaded pyramid network for multi-person pose estimation//Proceedings of 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Salt Lake City, USA: IEEE:7103-7112 [DOI:
10.1109/CVPR.2018.00742], articleTitle=Cascaded pyramid network for multi-person pose estimation, refAbstract=null), Reference(id=1249044032345805129, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=5385, pageEnd=5394, url=null, language=null, rfNumber=null, rfOrder=4, authorNames=Cheng B W, Xiao B, Wang J D, Shi H H, Huang T S, Zhang L, journalName=null, refType=null, unstructuredReference=
Cheng B W,
Xiao B,
Wang J D,
Shi H H,
Huang T S and
Zhang L.
2020. HigheRHRnet: scale-aware representation learning for bottom-up human pose estimation//Proceedings of 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle, USA: IEEE:5385-5394 [DOI:
10.1109/CVPR42600.2020.00543], articleTitle=HigheRHRnet: scale-aware representation learning for bottom-up human pose estimation, refAbstract=null), Reference(id=1249044032433885516, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2022, volume=501, issue=null, pageStart=246, pageEnd=257, url=null, language=null, rfNumber=null, rfOrder=5, authorNames=Ding Y, Zhang Z L, Zhao X F, Hong D F, Cai W, Yu C G, Yang N J, Cai W W, journalName=Neurocomputing, refType=null, unstructuredReference=
Ding Y,
Zhang Z L,
Zhao X F,
Hong D F,
Cai W,
Yu C G,
Yang N J and
Cai W W.
2022. Multi-feature fusion: graph neural network and CNN combining for hyperspectral image classification.
Neurocomputing,
501: 246-257 [DOI:
10.1016/j.neucom.2022.06.031], articleTitle=Multi-feature fusion: graph neural network and CNN combining for hyperspectral image classification, refAbstract=null), Reference(id=1249044032517771602, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2024, volume=29, issue=12, pageStart=3712, pageEnd=3726, url=null, language=null, rfNumber=null, rfOrder=6, authorNames=Jia W, Li J, Li S J, Zhao Y, Min H, journalName=Journal of Image and Graphics, refType=null, unstructuredReference=
Jia W,
Li J,
Li S J,
Zhao Y and
Min H.
2024. A high-order graph convolutional network for homomorphic and heterogeneous skeletal motion retargeting.
Journal of Image and Graphics,
29(12): 3712-3726, articleTitle=A high-order graph convolutional network for homomorphic and heterogeneous skeletal motion retargeting, refAbstract=null), Reference(id=1249044032610046292, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2024, volume=29, issue=12, pageStart=3712, pageEnd=3726, url=null, language=null, rfNumber=null, rfOrder=7, authorNames=贾伟, 李骏, 李书杰, 赵洋, 闵海, journalName=中国图象图形学报, refType=null, unstructuredReference=贾伟, 李骏, 李书杰, 赵洋, 闵海.
2024. 面向同胚异构骨骼运动重定向的高阶图卷积网络.
中国图象图形学报,
29(12): 3712-3726 [DOI:
10.11834/jig.230909], articleTitle=面向同胚异构骨骼运动重定向的高阶图卷积网络, refAbstract=null), Reference(id=1249044032723292505, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2022a, volume=504, issue=null, pageStart=16, pageEnd=29, url=null, language=null, rfNumber=null, rfOrder=8, authorNames=Jiang J J, He Z X, Zhao X Y, Zhang S Y, Wu C R, Wang Y, journalName=Neurocomputing, refType=null, unstructuredReference=
Jiang J J,
He Z X,
Zhao X Y,
Zhang S Y,
Wu C R and
Wang Y.
2022a. MLFNet: monocular lifting fusion network for 6DoF texture-less object pose estimation.
Neurocomputing,
504: 16-29 [DOI:
10.1016/j.neucom.2022.06.096], articleTitle=MLFNet: monocular lifting fusion network for 6DoF texture-less object pose estimation, refAbstract=null), Reference(id=1249044032815567194, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2022b, volume=null, issue=null, pageStart=643, pageEnd=659, url=null, language=null, rfNumber=null, rfOrder=9, authorNames=Jiang W T, Jin S, Liu W T, Qian C, Luo P, Liu S, journalName=null, refType=null, unstructuredReference=
Jiang W T,
Jin S,
Liu W T,
Qian C,
Luo P and
Liu S.
2022b. PoseTrans: a simple yet effective pose transformation augmentation for human pose estimation//Proceedings of the 17th European Conference on Computer Vision. Tel Aviv, Israel: Springer:643-659 [DOI:
10.1007/978-3-031-20065-6_37], articleTitle=PoseTrans: a simple yet effective pose transformation augmentation for human pose estimation, refAbstract=null), Reference(id=1249044032903647580, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=731, pageEnd=746, url=null, language=null, rfNumber=null, rfOrder=10, authorNames=Ke L P, Chang M C, Qi H G, Lyu S W, journalName=null, refType=null, unstructuredReference=
Ke L P,
Chang M C,
Qi H G and
Lyu S W.
2018. Multi-scale structure-aware network for human pose estimation//Proceedings of the 15th European Conference on Computer Vision (ECCV). Munich, Germany: Springer:731-746 [DOI:
10.1007/978-3-030-01216-8_44], articleTitle=Multi-scale structure-aware network for human pose estimation, refAbstract=null), Reference(id=1249044033000116576, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=11969, pageEnd=11978, url=null, language=null, rfNumber=null, rfOrder=11, authorNames=Kreiss S, Bertoni L, Alahi A, journalName=null, refType=null, unstructuredReference=
Kreiss S,
Bertoni L and
Alahi A.
2019. PifPaf: composite fields for human pose estimation//Proceedings of 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Long Beach, USA: IEEE:11969-11978 [DOI:
10.1109/CVPR.2019.01225], articleTitle=PifPaf: composite fields for human pose estimation, refAbstract=null), Reference(id=1249044033075614051, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=11354, pageEnd=11361, url=null, language=null, rfNumber=null, rfOrder=12, authorNames=Li J, Su W, Wang Z F, journalName=null, refType=null, unstructuredReference=
Li J,
Su W and
Wang Z F.
2020. Simple pose: rethinking and improving a bottom-up approach for multi-person pose estimation//Proceedings of the 34th AAAI Conference on Artificial Intelligence. New York, USA: AAAI:11354-11361 [DOI:
10.1609/aaai.v34i07.6797], articleTitle=Simple pose: rethinking and improving a bottom-up approach for multi-person pose estimation, refAbstract=null), Reference(id=1249044033176277351, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2019a, volume=null, issue=null, pageStart=10855, pageEnd=10864, url=null, language=null, rfNumber=null, rfOrder=13, authorNames=Li J F, Wang C, Zhu H, Mao Y H, Fang H S, Lu C W, journalName=null, refType=null, unstructuredReference=
Li J F,
Wang C,
Zhu H,
Mao Y H,
Fang H S and
Lu C W.
2019a. CrowdPose: efficient crowded scenes pose estimation and a new benchmark//Proceedings of 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Long Beach, USA: IEEE:10855-10864 [DOI:
10.1109/CVPR.2019.01112], articleTitle=CrowdPose: efficient crowded scenes pose estimation and a new benchmark, refAbstract=null), Reference(id=1249044033239191914, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=1944, pageEnd=1953, url=null, language=null, rfNumber=null, rfOrder=14, authorNames=Li K, Wang S J, Zhang X, Xu Y F, Xu W J, Tu Z W, journalName=null, refType=null, unstructuredReference=
Li K,
Wang S J,
Zhang X,
Xu Y F,
Xu W J and
Tu Z W.
2021. Pose recognition with cascade transformers//Proceedings of 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Nashville, USA: IEEE:1944-1953 [DOI:
10.1109/CVPR46437.2021.00198], articleTitle=Pose recognition with cascade transformers, refAbstract=null), Reference(id=1249044033352438128, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2019b, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=15, authorNames=Li W B, Wang Z C, Yin B Y, Peng Q X, Du Y M, Xiao T Z, Yu G, Lu H T, Wei Y C, Sun J, journalName=null, refType=null, unstructuredReference=
Li W B,
Wang Z C,
Yin B Y,
Peng Q X,
Du Y M,
Xiao T Z,
Yu G,
Lu H T,
Wei Y C and
Sun J.
2019b. Rethinking on multi-stage networks for human pose estimation [EB/OL]. [2024-10-21].
https://arxiv.org/pdf/1901.00148.pdf, articleTitle=Rethinking on multi-stage networks for human pose estimation, refAbstract=null), Reference(id=1249044033436324211, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2020, volume=42, issue=2, pageStart=318, pageEnd=327, url=null, language=null, rfNumber=null, rfOrder=16, authorNames=Lin T Y, Goyal P, Girshick R, He K M and Dollár P, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Lin T Y,
Goyal P,
Girshick R,
He K M and Dollár P.
2020. Focal loss for dense object detection.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
42(2): 318-327 [DOI:
10.1109/TPAMI.2018.2858826], articleTitle=Focal loss for dense object detection, refAbstract=null), Reference(id=1249044033511821686, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=740, pageEnd=755, url=null, language=null, rfNumber=null, rfOrder=17, authorNames=Lin T Y, Maire M, Belongie S, Hays J, Perona P, Ramanan D, Dollár P and Zitnick C L, journalName=null, refType=null, unstructuredReference=
Lin T Y,
Maire M,
Belongie S,
Hays J,
Perona P,
Ramanan D,
Dollár P and Zitnick C L.
2014. Microsoft COCO: common objects in context//Proceedings of the 13th European Conference on Computer Vision (ECCV). Zurich, Switzerland: Springer:740-755 [DOI:
10.1007/978-3-319-10602-1_48], articleTitle=Microsoft COCO: common objects in context, refAbstract=null), Reference(id=1249044033599902074, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=14983, pageEnd=14992, url=null, language=null, rfNumber=null, rfOrder=18, authorNames=Liu H, Chen Q, Tan Z C, Liu J J, Wan, J, Su X B, Li X L, Yao K, Han J Y, Ding E R, Zhao Y, Wang J D, journalName=null, refType=null, unstructuredReference=
Liu H,
Chen Q,
Tan Z C,
Liu J J, Wan, J,
Su X B,
Li X L,
Yao K,
Han J Y,
Ding E R,
Zhao Y and
Wang J D.
2023. Group pose: a simple baseline for end-to-end multi-person pose estimation//Proceedings of 2023 IEEE/CVF International Conference on Computer Vision. Paris, France: IEEE:14983-14992 [DOI:
10.1109/ICCV51070.2023.01380], articleTitle=Group pose: a simple baseline for end-to-end multi-person pose estimation, refAbstract=null), Reference(id=1249044033671205247, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=13259, pageEnd=13268, url=null, language=null, rfNumber=null, rfOrder=19, authorNames=Luo Z X, Wang Z C, Huang Y, Wang L, Tan T N, Zhou E J, journalName=null, refType=null, unstructuredReference=
Luo Z X,
Wang Z C,
Huang Y,
Wang L,
Tan T N and
Zhou E J.
2021. Rethinking the heatmap regression for bottom-up human pose estimation//Proceedings of 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Nashville, USA: IEEE:13259-13268 [DOI:
10.1109/CVPR46437.2021.01306], articleTitle=Rethinking the heatmap regression for bottom-up human pose estimation, refAbstract=null), Reference(id=1249044033763479935, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=20, authorNames=Mao W A, Ge Y T, Shen C H, Tian Z, Wang X L, Wang Z B, journalName=null, refType=null, unstructuredReference=
Mao W A,
Ge Y T,
Shen C H,
Tian Z,
Wang X L and
Wang Z B.
2021. TFPose: direct human pose estimation with transformers [EB/OL]. [2024-10-21].
https://arxiv.org/pdf/2103.15320.pdf, articleTitle=TFPose: direct human pose estimation with transformers, refAbstract=null), Reference(id=1249044033826394497, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=37, pageEnd=54, url=null, language=null, rfNumber=null, rfOrder=21, authorNames=McNally W, Vats K, Wong A, McPhee J, journalName=null, refType=null, unstructuredReference=
McNally W,
Vats K,
Wong A and
McPhee J.
2022. Rethinking keypoint representations: modeling keypoints and poses as objects for multi-person human pose estimation//Proceedings of the 17th European Conference on Computer Vision. Tel Aviv, Israel: Springer:37-54 [DOI:
10.1007/978-3-031-20068-7_3], articleTitle=Rethinking keypoint representations: modeling keypoints and poses as objects for multi-person human pose estimation, refAbstract=null), Reference(id=1249044033910280580, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=483, pageEnd=499, url=null, language=null, rfNumber=null, rfOrder=22, authorNames=Newell A, Yang K Y, Deng J, journalName=null, refType=null, unstructuredReference=
Newell A,
Yang K Y and
Deng J.
2016. Stacked hourglass networks for human pose estimation//Proceedings of the 14th European Conference on Computer Vision. Amsterdam, the Netherlands: Springer:483-499 [DOI:
10.1007/978-3-319-46484-8_29], articleTitle=Stacked hourglass networks for human pose estimation, refAbstract=null), Reference(id=1249044034002555271, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=282, pageEnd=299, url=null, language=null, rfNumber=null, rfOrder=23, authorNames=Papandreou G, Zhu T, Chen L C, Gidaris S, Tompson J, Murphy K, journalName=null, refType=null, unstructuredReference=
Papandreou G,
Zhu T,
Chen L C,
Gidaris S,
Tompson J and
Murphy K.
2018. PersonLab: person pose estimation and instance segmentation with a bottom-up, part-based, geometric embedding model//Proceedings of the 15th European Conference on Computer Vision (ECCV). Munich, Germany: Springer:282-299 [DOI:
10.1007/978-3-030-01264-9_17], articleTitle=PersonLab: person pose estimation and instance segmentation with a bottom-up, part-based, geometric embedding model, refAbstract=null), Reference(id=1249044035546059146, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=24, authorNames=Qi T, Bayramli B, Ali U, Zhang Q C, Lu H T, journalName=null, refType=null, unstructuredReference=
Qi T,
Bayramli B,
Ali U,
Zhang Q C and
Lu H T.
2019. Spatial shortcut network for human pose estimation [EB/OL]. [2024-10-21].
https://arxiv.org/pdf/1904.03141.pdf, articleTitle=Spatial shortcut network for human pose estimation, refAbstract=null), Reference(id=1249044035759968657, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=350, pageEnd=366, url=null, language=null, rfNumber=null, rfOrder=25, authorNames=Sekii T, journalName=null, refType=null, unstructuredReference=
Sekii T.
2018. Pose proposal networks//Proceedings of the 15th European Conference on Computer Vision (ECCV). Munich, Germany: Springer:350-366 [DOI:
10.1007/978-3-030-01261-8_21], articleTitle=Pose proposal networks, refAbstract=null), Reference(id=1249044035852243347, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=11059, pageEnd=11068, url=null, language=null, rfNumber=null, rfOrder=26, authorNames=Shi D H, Wei X, Li L Q, Ren Y, Tan W M, journalName=null, refType=null, unstructuredReference=
Shi D H,
Wei X,
Li L Q,
Ren Y and
Tan W M.
2022. End-to-end multi-person pose estimation with transformers//Proceedings of 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition. New Orleans, USA: IEEE:11059-11068 [DOI:
10.1109/CVPR52688.2022.01079], articleTitle=End-to-end multi-person pose estimation with transformers, refAbstract=null), Reference(id=1249044035965489557, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=5686, pageEnd=5696, url=null, language=null, rfNumber=null, rfOrder=27, authorNames=Sun K, Xiao B, Liu D, Wang J D, journalName=null, refType=null, unstructuredReference=
Sun K,
Xiao B,
Liu D and
Wang J D.
2019. Deep high-resolution representation learning for human pose estimation//Proceedings of 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Long Beach, USA: IEEE:5686-5696 [DOI:
10.1109/CVPR.2019.00584], articleTitle=Deep high-resolution representation learning for human pose estimation, refAbstract=null), Reference(id=1249044036074541462, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=536, pageEnd=553, url=null, language=null, rfNumber=null, rfOrder=28, authorNames=Sun X, Xiao B, Wei F Y, Liang S, Wei Y C, journalName=null, refType=null, unstructuredReference=
Sun X,
Xiao B,
Wei F Y,
Liang S and
Wei Y C.
2018. Integral human pose regression//Proceedings of the 15th European Conference on Computer Vision (ECCV). Munich, Germany: Springer:536-553 [DOI:
10.1007/978-3-030-01231-1_33], articleTitle=Integral human pose regression, refAbstract=null), Reference(id=1249044036158427546, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=1653, pageEnd=1660, url=null, language=null, rfNumber=null, rfOrder=29, authorNames=Toshev A, Szegedy C, journalName=null, refType=null, unstructuredReference=
Toshev A and
Szegedy C.
2014. DeepPose: human pose estimation via deep neural networks//Proceedings of 2014 IEEE Conference on Computer Vision and Pattern Recognition. Columbus, USA: IEEE:1653-1660 [DOI:
10.1109/CVPR.2014.214], articleTitle=DeepPose: human pose estimation via deep neural networks, refAbstract=null), Reference(id=1249044036233925019, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=30, authorNames=Yang J, Zeng A L, Liu S L, Li F, Zhang R M, Zhang L, journalName=null, refType=null, unstructuredReference=
Yang J,
Zeng A L,
Liu S L,
Li F,
Zhang R M and
Zhang L.
2023. Explicit box detection unifies end-to-end multi-person pose estimation//Proceedings of the 11th International Conference on Learning Representations. Kigali, Rwanda: ICLR, articleTitle=Explicit box detection unifies end-to-end multi-person pose estimation, refAbstract=null), Reference(id=1249044036334588317, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1290, pageEnd=1299, url=null, language=null, rfNumber=null, rfOrder=31, authorNames=Yang W, Li S, Ouyang W L, Li H S, Wang X G, journalName=null, refType=null, unstructuredReference=
Yang W,
Li S,
Ouyang W L,
Li H S and
Wang X G.
2017. Learning feature pyramids for human pose estimation//Proceedings of 2017 IEEE International Conference on Computer Vision. Venice, Italy: IEEE:1290-1299 [DOI:
10.1109/ICCV.2017.144], articleTitle=Learning feature pyramids for human pose estimation, refAbstract=null), Reference(id=1249044036431057311, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2024, volume=29, issue=11, pageStart=3319, pageEnd=3344, url=null, language=null, rfNumber=null, rfOrder=32, authorNames=Yu L, Du C J, Yan Z Q, Zhao H J, He S J, journalName=Journal of Image and Graphics, refType=null, unstructuredReference=
Yu L,
Du C J,
Yan Z Q,
Zhao H J and
He S J.
2024. Review of 2D human pose encoding and decoding methods: from the perspective of ambiguity mitigation.
Journal of Image and Graphics,
29(11): 3319-3344, articleTitle=Review of 2D human pose encoding and decoding methods: from the perspective of ambiguity mitigation, refAbstract=null), Reference(id=1249044036523332001, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2024, volume=29, issue=11, pageStart=3319, pageEnd=3344, url=null, language=null, rfNumber=null, rfOrder=33, authorNames=喻莉, 杜聪炬, 闫增强, 赵慧娟, 何双江, journalName=中国图象图形学报, refType=null, unstructuredReference=喻莉, 杜聪炬, 闫增强, 赵慧娟, 何双江.
2024. 二维人体姿态编解码方法综述: 从解决歧义性问题的角度出发.
中国图象图形学报,
29(11): 3319-3344 [DOI:
10.11834/jig.230648], articleTitle=二维人体姿态编解码方法综述: 从解决歧义性问题的角度出发, refAbstract=null), Reference(id=1249044036611412386, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=589, pageEnd=597, url=null, language=null, rfNumber=null, rfOrder=34, authorNames=Zhang Y Y, Zhou D S, Chen S Q, Gao S H, Ma Y, journalName=null, refType=null, unstructuredReference=
Zhang Y Y,
Zhou D S,
Chen S Q,
Gao S H and
Ma Y.
2016. Single-image crowd counting via multi-column convolutional neural network//Proceedings of 2016 IEEE Conference on Computer Vision and Pattern Recognition. Las Vegas, USA: IEEE:589-597 [DOI:
10.1109/CVPR.2016.70], articleTitle=Single-image crowd counting via multi-column convolutional neural network, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1249044020022940660, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=1, ext=[AuthorCompanyExt(id=1249044020031329269, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020022940660, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Anhui University of Science & Technology, Huainan232001, China), AuthorCompanyExt(id=1249044020048106486, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020022940660, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1安徽理工大学计算机科学与工程学院,淮南232001)]), AuthorCompany(id=1249044020173934592, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, xref=2, ext=[AuthorCompanyExt(id=1249044020182323202, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing100191, China), AuthorCompanyExt(id=1249044020194906116, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, companyId=1249044020173934592, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2北京航空航天大学虚拟现实技术与系统全国重点实验室,北京100191)])], figs=[ArticleFig(id=1249044027954368706, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Fig.1, caption=
Comparisons of Gaussian kernel coverage area for keypoints at different scales, figureFileSmall=oIPQvM93+Z9HcvzIlMXyrA==, figureFileBig=slEhsZ689y+AYOvUldC8lg==, tableContent=null), ArticleFig(id=1249044028038254792, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=图1, caption=
不同尺度关键点的高斯核覆盖面积对比, figureFileSmall=oIPQvM93+Z9HcvzIlMXyrA==, figureFileBig=slEhsZ689y+AYOvUldC8lg==, tableContent=null), ArticleFig(id=1249044028231192784, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Fig.2, caption=
AHGNet framework, figureFileSmall=5Cc2Mf9ajGI2Q0mpb6gBqw==, figureFileBig=OeqCD+RkwNVnRQl/NN2UCA==, tableContent=null), ArticleFig(id=1249044028319273174, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=图2, caption=
AHGNet框架图, figureFileSmall=5Cc2Mf9ajGI2Q0mpb6gBqw==, figureFileBig=OeqCD+RkwNVnRQl/NN2UCA==, tableContent=null), ArticleFig(id=1249044028432519385, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Fig.3, caption=
The relationship between the standard deviation and truncation area of Gaussian kernel, figureFileSmall=T8aVncoCCoqRoHkTZ3060A==, figureFileBig=/tyd6PUAtsC53If+1GsxkA==, tableContent=null), ArticleFig(id=1249044028537376988, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=图3, caption=
高斯核的标准差与截断面积的关系图, figureFileSmall=T8aVncoCCoqRoHkTZ3060A==, figureFileBig=/tyd6PUAtsC53If+1GsxkA==, tableContent=null), ArticleFig(id=1249044028629651680, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Fig.4, caption=
Adjust the truncation radius of the Gaussian kernel using the geometric relationship between adjacent keypoints to obtain an adaptive ground-truth heatmap ((a) geometric vectors; (b) adaptive ground-truth heatmaps;(c) standard ground-truth heatmaps), figureFileSmall=IPdZxYN/CCipNlwaKnIdyQ==, figureFileBig=51JPeo79KvTtQKLHZjATxg==, tableContent=null), ArticleFig(id=1249044028738703589, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=图4, caption=
利用相邻关键点之间的几何关系调整高斯核截断半径获取自适应真值热力图, figureFileSmall=IPdZxYN/CCipNlwaKnIdyQ==, figureFileBig=51JPeo79KvTtQKLHZjATxg==, tableContent=null), ArticleFig(id=1249044028814201064, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Fig.5, caption=
An example of L2 loss reduction but center unchanged, figureFileSmall=2tn+evovmfyx8f+2xY0EhA==, figureFileBig=b2Y31A1BN6HeywViU9ysOw==, tableContent=null), ArticleFig(id=1249044028944224497, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=图5, caption=
L2损失减小但中心点不变的示例, figureFileSmall=2tn+evovmfyx8f+2xY0EhA==, figureFileBig=b2Y31A1BN6HeywViU9ysOw==, tableContent=null), ArticleFig(id=1249044029044887797, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Fig.6, caption=
Visualization results on COCO dataset, figureFileSmall=73gfUv/l8L7P13ergbiPCw==, figureFileBig=eREoZwW3kDp1qGA+k5INzA==, tableContent=null), ArticleFig(id=1249044029116190969, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=图6, caption=
COCO数据集上的可视化结果, figureFileSmall=73gfUv/l8L7P13ergbiPCw==, figureFileBig=eREoZwW3kDp1qGA+k5INzA==, tableContent=null), ArticleFig(id=1249044029225242881, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Tab.1, caption=
Comparisons with other methods on COCO test set
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 输入/像素 | AP | AP50 | AP75 | APM | APL |
|---|
| 非多尺度实验 | CenterNet-DLA(Zhang等,2016) | 512 | 57.9 | 84.7 | 63.1 | 52.5 | 67.4 |
| CenterNet-HG(Zhang等,2016) | 512 | 63.0 | 86.8 | 69.6 | 58.9 | 70.4 |
| OpenPose(Cao等,2017) | 368 | 61.8 | 84.9 | 67.5 | 57.1 | 68.2 |
| PersonLab(Papandreou等,2018) | 1 401 | 66.5 | 88.0 | 72.6 | 62.4 | 72.3 |
| PifPaf(Kreiss等,2019) | 641 | 66.7 | - | - | 62.4 | 72.9 |
| HrHRNet-W32(Cheng等,2020) | 512 | 66.4 | 87.5 | 72.8 | 61.2 | 74.2 |
| AHGNet-W32(本文) | 512 | 68.7 | 89.2 | 75.4 | 63.1 | 76.5 |
| SWAHR-W32(Luo等,2021) | 512 | 67.9 | 88.9 | 74.5 | 62.4 | 75.5 |
| SWAHR-W48(Luo等,2021) | 640 | 70.2 | 89.9 | 76.9 | 65.2 | 77.0 |
| ED-Pose(Yang等,2023) | - | 69.8 | 90.2 | 77.2 | 64.3 | 77.4 |
| GroupPose(Liu等,2023) | - | 70.2 | 90.5 | 77.8 | 64.7 | 78.0 |
| HrHRNet-W48(Cheng等,2020) | 640 | 68.4 | 88.2 | 75.1 | 64.4 | 74.2 |
| AHGNet-W48(本文) | 640 | 70.9 | 89.9 | 77.0 | 65.9 | 76.6 |
| 多尺度实验 | PersonLab(Papandreou等,2018) | 1 401 | 68.7 | 89.0 | 75.4 | 64.1 | 75.5 |
| HrHRNet-W32(Cheng等,2020) | 512 | 69.0 | 89.0 | 75.8 | 64.4 | 75.2 |
| CKG(Brasó等,2021) | 640 | 71.1 | 90.5 | 77.5 | 66.9 | 76.7 |
| PETR(Shi等,2022) | - | 71.2 | 91.4 | 77.6 | 66.9 | 78.0 |
| PoseTrans(Jiang等,2022b) | 512 | 69.9 | 89.3 | 77.0 | 65.2 | 76.2 |
| KAPAO-M(McNally等,2022) | 1 024 | 70.3 | 91.2 | 77.8 | 66.3 | 76.8 |
| HrHRNet-W48(Cheng等,2020) | 640 | 70.5 | 89.3 | 77.2 | 66.6 | 75.8 |
| AHGNet-W48(本文) | 640 | 72.1 | 90.6 | 78.9 | 68.1 | 77.3 |
), ArticleFig(id=1249044029300740357, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表1, caption=
不同方法在COCO测试集实验结果对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 输入/像素 | AP | AP50 | AP75 | APM | APL |
|---|
| 非多尺度实验 | CenterNet-DLA(Zhang等,2016) | 512 | 57.9 | 84.7 | 63.1 | 52.5 | 67.4 |
| CenterNet-HG(Zhang等,2016) | 512 | 63.0 | 86.8 | 69.6 | 58.9 | 70.4 |
| OpenPose(Cao等,2017) | 368 | 61.8 | 84.9 | 67.5 | 57.1 | 68.2 |
| PersonLab(Papandreou等,2018) | 1 401 | 66.5 | 88.0 | 72.6 | 62.4 | 72.3 |
| PifPaf(Kreiss等,2019) | 641 | 66.7 | - | - | 62.4 | 72.9 |
| HrHRNet-W32(Cheng等,2020) | 512 | 66.4 | 87.5 | 72.8 | 61.2 | 74.2 |
| AHGNet-W32(本文) | 512 | 68.7 | 89.2 | 75.4 | 63.1 | 76.5 |
| SWAHR-W32(Luo等,2021) | 512 | 67.9 | 88.9 | 74.5 | 62.4 | 75.5 |
| SWAHR-W48(Luo等,2021) | 640 | 70.2 | 89.9 | 76.9 | 65.2 | 77.0 |
| ED-Pose(Yang等,2023) | - | 69.8 | 90.2 | 77.2 | 64.3 | 77.4 |
| GroupPose(Liu等,2023) | - | 70.2 | 90.5 | 77.8 | 64.7 | 78.0 |
| HrHRNet-W48(Cheng等,2020) | 640 | 68.4 | 88.2 | 75.1 | 64.4 | 74.2 |
| AHGNet-W48(本文) | 640 | 70.9 | 89.9 | 77.0 | 65.9 | 76.6 |
| 多尺度实验 | PersonLab(Papandreou等,2018) | 1 401 | 68.7 | 89.0 | 75.4 | 64.1 | 75.5 |
| HrHRNet-W32(Cheng等,2020) | 512 | 69.0 | 89.0 | 75.8 | 64.4 | 75.2 |
| CKG(Brasó等,2021) | 640 | 71.1 | 90.5 | 77.5 | 66.9 | 76.7 |
| PETR(Shi等,2022) | - | 71.2 | 91.4 | 77.6 | 66.9 | 78.0 |
| PoseTrans(Jiang等,2022b) | 512 | 69.9 | 89.3 | 77.0 | 65.2 | 76.2 |
| KAPAO-M(McNally等,2022) | 1 024 | 70.3 | 91.2 | 77.8 | 66.3 | 76.8 |
| HrHRNet-W48(Cheng等,2020) | 640 | 70.5 | 89.3 | 77.2 | 66.6 | 75.8 |
| AHGNet-W48(本文) | 640 | 72.1 | 90.6 | 78.9 | 68.1 | 77.3 |
), ArticleFig(id=1249044029401403659, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Tab.2, caption=
Comparisons with other methods on CrowdPose test set
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | AP | AP50 | AP75 | APE | APM | APH |
|---|
| 非多尺度实验 | HrHRNet-W48(Cheng等,2020) | 65.9 | 86.4 | 706 | 73.3 | 66.5 | 57.9 |
| SWAHR-W48(Luo等,2021) | 71.6 | 88.5 | 77.6 | 78.9 | 72.4 | 63.0 |
| AHGNet-W48(本文) | 72.6 | 90.6 | 78.5 | 79.6 | 73.3 | 64.0 |
| | | | | | | |
| 多尺度实验 | HrHRNet-W48(Cheng等,2020) | 67.6 | 87.4 | 72.6 | 75.8 | 68.1 | 58.9 |
| SWAHR-W48(Luo等,2021) | 73.8 | 90.5 | 79.9 | 81.2 | 74.7 | 64.7 |
| AHGNet-W48(本文) | 74.1 | 91.2 | 79.8 | 81.3 | 74.8 | 65.3 |
), ArticleFig(id=1249044029476901134, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表2, caption=
不同方法在CrowdPose测试集实验结果对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | AP | AP50 | AP75 | APE | APM | APH |
|---|
| 非多尺度实验 | HrHRNet-W48(Cheng等,2020) | 65.9 | 86.4 | 706 | 73.3 | 66.5 | 57.9 |
| SWAHR-W48(Luo等,2021) | 71.6 | 88.5 | 77.6 | 78.9 | 72.4 | 63.0 |
| AHGNet-W48(本文) | 72.6 | 90.6 | 78.5 | 79.6 | 73.3 | 64.0 |
| | | | | | | |
| 多尺度实验 | HrHRNet-W48(Cheng等,2020) | 67.6 | 87.4 | 72.6 | 75.8 | 68.1 | 58.9 |
| SWAHR-W48(Luo等,2021) | 73.8 | 90.5 | 79.9 | 81.2 | 74.7 | 64.7 |
| AHGNet-W48(本文) | 74.1 | 91.2 | 79.8 | 81.3 | 74.8 | 65.3 |
), ArticleFig(id=1249044031024599315, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Table 3, caption=
The impact of Gaussian kernel standard deviation σ on model accuracy
, figureFileSmall=null, figureFileBig=null, tableContent=
 | AP | APM | APL |
|---|
| 1.0 | 64.9 | 61.2 | 71.0 |
| 1.5 | 65.1 | 61.2 | 72.3 |
| 2.0 | 66.6 | 61.3 | 75.0 |
| 2.5 | 66.1 | 60.1 | 75.2 |
| 3.0 | 65.4 | 58.3 | 75.4 |
), ArticleFig(id=1249044031116874007, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表3, caption=
高斯核标准差σ对模型精度的影响
, figureFileSmall=null, figureFileBig=null, tableContent=
 | AP | APM | APL |
|---|
| 1.0 | 64.9 | 61.2 | 71.0 |
| 1.5 | 65.1 | 61.2 | 72.3 |
| 2.0 | 66.6 | 61.3 | 75.0 |
| 2.5 | 66.1 | 60.1 | 75.2 |
| 3.0 | 65.4 | 58.3 | 75.4 |
), ArticleFig(id=1249044031196565784, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Table 4, caption=
Experimental results on the effectiveness of different modules
, figureFileSmall=null, figureFileBig=null, tableContent=
| AHGM | KL 散度 | 动态权重 | AP | AP50 | AP75 | APM | APL |
|---|
| - | - | - | 67.1 | 86.2 | 73.0 | 61.5 | 76.1 |
| √ | - | - | 68.4 | 76.4 | 74.3 | 61.5 | 77.7 |
| - | √ | - | 68.3 | 87.3 | 74.1 | 62.0 | 77.2 |
| - | - | √ | 68.0 | 87.5 | 74.1 | 62.3 | 76.8 |
| √ | √ | - | 69.2 | 88.2 | 74.6 | 63.1 | 77.9 |
| √ | - | √ | 68.8 | 87.7 | 74.8 | 62.6 | 77.7 |
| √ | √ | √ | 69.7 | 88.1 | 75.0 | 63.3 | 78.6 |
), ArticleFig(id=1249044031309811995, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表4, caption=
不同模块的有效性实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| AHGM | KL 散度 | 动态权重 | AP | AP50 | AP75 | APM | APL |
|---|
| - | - | - | 67.1 | 86.2 | 73.0 | 61.5 | 76.1 |
| √ | - | - | 68.4 | 76.4 | 74.3 | 61.5 | 77.7 |
| - | √ | - | 68.3 | 87.3 | 74.1 | 62.0 | 77.2 |
| - | - | √ | 68.0 | 87.5 | 74.1 | 62.3 | 76.8 |
| √ | √ | - | 69.2 | 88.2 | 74.6 | 63.1 | 77.9 |
| √ | - | √ | 68.8 | 87.7 | 74.8 | 62.6 | 77.7 |
| √ | √ | √ | 69.7 | 88.1 | 75.0 | 63.3 | 78.6 |
), ArticleFig(id=1249044031418863904, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Tab.5, caption=
Experimental results of different KL divergence calculation box sizes
, figureFileSmall=null, figureFileBig=null, tableContent=
| KL散度计算框大小 | AP/% |
|---|
| 3 × 3 | 68.7 |
| 5 × 5 | 69.1 |
| 7 × 7 | 69.1 |
| 9 × 9 | 69.7 |
| 11 × 11 | 69.2 |
| 13 × 13 | 69.1 |
), ArticleFig(id=1249044031502749988, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表5, caption=
不同KL散度计算框大小的实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| KL散度计算框大小 | AP/% |
|---|
| 3 × 3 | 68.7 |
| 5 × 5 | 69.1 |
| 7 × 7 | 69.1 |
| 9 × 9 | 69.7 |
| 11 × 11 | 69.2 |
| 13 × 13 | 69.1 |
), ArticleFig(id=1249044031599218985, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Tab.6, caption=
Experimental results of different dynamic weight indices
, figureFileSmall=null, figureFileBig=null, tableContent=
| γ | AP/% |
|---|
| 0.5 | 68.8 |
| 1 | 69.7 |
| 2 | 65.8 |
| 3 | 58.6 |
), ArticleFig(id=1249044031678910765, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表6, caption=
不同动态权重指数的实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| γ | AP/% |
|---|
| 0.5 | 68.8 |
| 1 | 69.7 |
| 2 | 65.8 |
| 3 | 58.6 |
), ArticleFig(id=1249044031766991152, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=EN, label=Tab.7, caption=
Experimental results on the effectiveness of the multi-scale fusion module
, figureFileSmall=null, figureFileBig=null, tableContent=
| 多尺度融合模块 | AP | AP50 | AP75 | APM | APL |
|---|
| 未采用 | 69.7 | 88.1 | 75.0 | 63.3 | 78.6 |
| 采用 | 70.1 | 88.0 | 76.2 | 66.9 | 78.7 |
), ArticleFig(id=1249044031842488628, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044011915350829, language=CN, label=表7, caption=
多尺度融合模块有效性实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 多尺度融合模块 | AP | AP50 | AP75 | APM | APL |
|---|
| 未采用 | 69.7 | 88.1 | 75.0 | 63.3 | 78.6 |
| 采用 | 70.1 | 88.0 | 76.2 | 66.9 | 78.7 |
)], attaches=null, journal=Journal(id=1249023527618129992, delFlag=0, nameCn=中国图象图形学报, nameEn=Journal of Image and Graphics, nameHistory1=null, nameHistory2=null, issn=1006-8961, eissn=null, cn=11-3758, coden=CODEN ZTTXFZ, periodic=0, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=uirXtX858YS3zEpFXZttJA==, journalPrice=null, startedYear=null, abbrevIsoEn=Journal of Image and Graphics, journalRemark=null, publicationField=null, createdTime=1775720014721, updatedTime=1775720337198, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=J, firstLetterEn=J, subjectCode=Engineering, subjectName=null, subjectCodeEn=Engineering, subjectNameEn=null, picCn=uirXtX858YS3zEpFXZttJA==, picEn=bud7qaxfvWHeFsbyBTAiKQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1249024880377786590, language=CN, name=中国图象图形学报, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1775720337242, updatedTime=1775720337242, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=e6369def-2842-41d8, submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-editor&redirect_uri=https%3A%2F%2Fcjigeditor.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=9ccec05b-6bd, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=1e8a31c8-5434-4f78, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1249024880449089759, language=EN, name=Journal of Image and Graphics, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1775720337259, updatedTime=1775720337259, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=e6369def-2842-41d8, submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-editor&redirect_uri=https%3A%2F%2Fcjigeditor.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=9ccec05b-6bd, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=1e8a31c8-5434-4f78, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1249024232475115590, websiteList=[Website(id=1249025782459334881, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1249024232475115590, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN, language=CN, createTime=1775720552315, createBy=18614031015, updateTime=1775720586268, updateBy=18614031015, name=中国图象图形学报-中文, tplId=1146099689490845704, title=中国图象图形学报, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1249026166254928133, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=articleTextType, value=kx, createTime=1775720643819, updateTime=1775720643819, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166221373698, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=banner, value=null, createTime=1775720643811, updateTime=1775720643811, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166271705352, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=grayFlag, value=0, createTime=1775720643823, updateTime=1775720643823, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166212985089, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/file/pic?fileId=TDRjKTHfgAnvFKZaDA70wA==, createTime=1775720643809, updateTime=1775720643809, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166288482570, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=minRunFlag, value=0, createTime=1775720643827, updateTime=1775720643827, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166246539524, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/file/pic, createTime=1775720643817, updateTime=1775720643817, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166280093961, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=silenceFlag, value=0, createTime=1775720643825, updateTime=1775720643825, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166233956611, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1775720643814, updateTime=1775720643814, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166259122438, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=themeColor, value=null, createTime=1775720643820, updateTime=1775720643820, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166267511047, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=themeStyle, value=null, createTime=1775720643822, updateTime=1775720643822, creator=18614031015, updator=18614031015)]), Website(id=1249025782681633001, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1249024232475115590, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN, language=EN, createTime=1775720552368, createBy=18614031015, updateTime=1775720607118, updateBy=18614031015, name=中国图象图形学报-英文, tplId=1146101810881728533, title=Journal of Image and Graphics, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1249026195371786511, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=articleTextType, value=kx, createTime=1775720650761, updateTime=1775720650761, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195355009292, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=banner, value=null, createTime=1775720650757, updateTime=1775720650757, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195392758034, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=grayFlag, value=0, createTime=1775720650766, updateTime=1775720650766, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195342426379, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/file/pic?fileId=TDRjKTHfgAnvFKZaDA70wA==, createTime=1775720650754, updateTime=1775720650754, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195409535252, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=minRunFlag, value=0, createTime=1775720650770, updateTime=1775720650770, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195367592206, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/file/pic, createTime=1775720650760, updateTime=1775720650760, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195401146643, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=silenceFlag, value=0, createTime=1775720650768, updateTime=1775720650768, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195359203597, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1775720650758, updateTime=1775720650758, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195380175120, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=themeColor, value=null, createTime=1775720650763, updateTime=1775720650763, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195388563729, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=themeStyle, value=null, createTime=1775720650765, updateTime=1775720650765, creator=18614031015, updator=18614031015)])], journalTitle=中国图象图形学报, weixinUrl=null, journalUrl=https://www.cjig.cn/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Journal of Image and Graphics, journalPhotoCn=uirXtX858YS3zEpFXZttJA==, journalPhotoEn=bud7qaxfvWHeFsbyBTAiKQ==, journalFirstLetter=J, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/10.11834/jig.240615, detailUrlEn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/10.11834/jig.240615, pdfUrlCn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/PDF/10.11834/jig.240615, pdfUrlEn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/PDF/10.11834/jig.240615, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)