Article(id=1249044017384726928, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, articleNumber=null, orderNo=null, doi=10.11834/jig.250040, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1739721600000, receivedDateStr=2025-02-17, revisedDate=1748275200000, revisedDateStr=2025-05-27, acceptedDate=null, acceptedDateStr=null, onlineDate=1775724899850, onlineDateStr=2026-04-09, pubDate=1765814400000, pubDateStr=2025-12-16, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1775724899850, onlineIssueDateStr=2026-04-09, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1775724899850, creator=13041195026, updateTime=1775724899850, updator=13041195026, issue=Issue{id=1249044006114628363, tenantId=1146029695717560320, journalId=1249024232475115590, year='2025', volume='30', issue='12', pageStart='3707', pageEnd='3968', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1775724897161, creator=13041195026, updateTime=1775726353303, updator=13041195026, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1249050113662984471, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1249050113667178776, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=3855, endPage=3869, ext={EN=ArticleExt(id=1249044021193154979, articleId=1249044017384726928, tenantId=1146029695717560320, journalId=1249024232475115590, language=EN, title=Dual-stage guided weakly supervised semantic segmentation with Gaussian correction, columnId=1249044008786400014, journalTitle=Journal of Image and Graphics, columnName=Image Understanding and Computer Vision, runingTitle=null, highlight=null, articleAbstract=
Objective Weakly supervised semantic segmentation (WSSS) aims to reduce the cost associated with annotating “strong” pixel-level labels by using “weak” labels, such as points, bounding boxes, image-level class labels, and scribbles. Among these, image-level class labels are the most cost-effective and readily available; however, leveraging them for precise segmentation remains a considerable challenge. A widely used WSSS approach based on image-level class labels generally comprises the following steps: 1) training a neural network for image classification using the class labels; 2) using the trained network to generate class activation maps (CAMs), which serve as seed regions for the segmentation task; and 3) refining these CAMs into pseudo-labels, which are then used as the ground truth to supervise a segmentation network. These steps can be integrated into a single collaborative stage; typically, single-stage frameworks are highly efficient due to their simplified training pipeline. However, the quality of pseudo-labels is crucial to the overall performance of semantic segmentation. High-quality pseudo-labels result in superior segmentation outcomes, whereas noisy or inaccurate pseudo-labels hinder the capability of the model to learn meaningful features. WSSS based on image-level labels faces considerable challenges due to the absence of precise positional and shape-related information, making it difficult to generate accurate segmentation maps. These challenges have led to the development of various approaches, which can be broadly categorized into two types: single-stage methods and multistage methods. Although single-stage methods offer greater efficiency and simplify the overall training process, they often produce less accurate pseudo-labels. This condition is due to the limited refinement of CAMs, resulting in imprecise supervision signals that ultimately degrade segmentation performance. Aiming to alleviate these limitations, a simple yet novel single-stage WSSS framework that incorporates knowledge distillation is introduced to enhance pseudo-label quality without relying on any additional external supervision. The framework enhances the feature learning process within the teacher-student network using a dual-stage knowledge distillation module. This module allows the student network to acquire more dynamic and informative knowledge from the teacher network while preserving key features, thereby enhancing the overall robustness of the student model. Moreover, to further improve segmentation accuracy, a pseudo-label correction module based on a Gaussian mixture model (GMM) is introduced. This module refines the pseudo-labels by modeling the distribution of the CAMs, resulting in highly accurate and reliable supervision signals. The combination of dual-stage knowledge distillation and the Gaussian correction module ensures accurate learning and improved segmentation results, even under weak supervision signals such as image-level labels. Ultimately, the proposed method effectively mitigates the impact of noise during training and enhances the accuracy of the generated pseudo-labels, resulting in superior semantic segmentation outcomes in WSSS tasks.
Method A novel weakly-supervised semantic segmentation method, aimed at addressing the challenges posed by noisy data points and weak supervision, is proposed. First, a dual-stage knowledge interaction module is introduced to enhance the feature learning process of the teacher and student networks. By enabling highly effective knowledge exchange between the two networks, the proposed approach notably reduces the impact of noise during training, leading to robust feature extraction. Additionally, a Gaussian correction module is proposed to enhance the quality of pseudo-labels. This module refines the pseudo-labels by modeling the distribution of class activation maps. By fitting the distribution more accurately, the module corrects potential errors in the pseudo-labels, ensuring that the model learns from high-quality, refined labels. Therefore, the method boosts the overall performance of weakly-supervised semantic segmentation, making it more robust to noise and improving segmentation accuracy. This method provides a promising solution for weakly-supervised segmentation tasks.
Result The mIoU values of this method on the PASCAL VOC 2012 and MS COCO 2014 datasets were 74.8% and 42.3%, respectively, surpassing other comparative methods. Specifically, on the PASCAL VOC 2012 dataset, the proposed method achieved a 3.7% improvement over ToCo, an 8.8% enhancement compared to AFA, a 7.5% increase relative to TSCD, and 1.1% compared to BECO. On the MS COCO 2014 dataset, the method improved performance by 2.2% compared to TSCD, 3.4% compared to AFA, and 5.3% compared to AuxSegNet+. Additionally, the mIoU values of different categories are compared on the PASCAL VOC 2012 validation set. The experimental results showed that the method outperformed the competing methods in 16 categories. Notably, for the background class, the method achieved an mIoU of 92.4%, the highest among all methods evaluated. This result indicates that the method effectively leverages the Gaussian correction module to reduce misclassification of background regions, thereby improving segmentation performance. Furthermore, the method achieved notable improvements in categories such as bird, bottle, car, chair, and cow, further demonstrating its effectiveness.
Conclusion The proposed method effectively mitigates the impact of noise during training and address the issue of incomplete pseudo-label generation through the integration of a dual-stage knowledge distillation module and a Gaussian correction module. This approach achieves remarkable performance improvements compared to existing methods. Overall, the results demonstrate notable advantages in end-to-end weakly supervised semantic segmentation and holds considerable research value.
, correspAuthors=Wenjian Wang, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Xuefei Bai, Yuanhui Wang, Wenjie Xu, Gaoxia Jiang, Wenjian Wang), CN=ArticleExt(id=1249044032186425864, articleId=1249044017384726928, tenantId=1146029695717560320, journalId=1249024232475115590, language=CN, title=融合高斯修正的双阶段指导弱监督语义分割, columnId=1249044009054835474, journalTitle=中国图象图形学报, columnName=图像理解和计算机视觉, runingTitle=null, highlight=null, articleAbstract=
目的 端到端的弱监督语义分割模型因其高效的训练效率备受关注,然而现有研究还存在语义信息提取不充分、生成的伪标签质量较低等不足。针对上述问题,本文提出一种基于知识蒸馏的端到端弱监督语义分割框架,通过双阶段知识交互模块增强学生网络和教师网络之间的知识传递,同时借助高斯修正模块对伪标签进行修正。
方法 首先,设计双阶段知识交互模块强化教师网络和学生网络的特征学习过程,有效降低训练过程中的噪声干扰。其次,为了生成高质量的伪标签,设计了高斯修正模块,通过拟合类激活图的分布,利用EM(expectation maximization)算法估算每个像素点的噪声概率,并依据与邻域像素的相似度关系修正伪标签,进而提升弱监督语义分割网络的性能。
结果 本文方法在PASCAL VOC 2012(pattern analysis, statical modeling and computational learning visual object classes 2012)和MS COCO 2014(Microsoft common objects in context 2014)数据集上的mIoU(mean intersection over union)值分别达到74.8%和42.3%,优于其他对比方法。
结论 通过双阶段知识交互模块以及高斯修正模块,有效降低了图像内部噪声以及潜在的标签噪声对训练过程的影响,并且改善了伪标签生成不完整的问题,与现有方法相比取得了显著的性能提升,在端到端的弱监督语义分割方法中展现出明显的优越性,具有一定的研究价值。
, correspAuthors=王文剑, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=hHLGsfp8aJbQXFGGk9MMXw==, magXml=2//JxrjC9G/WmHcgbWMQDA==, pdfUrl=null, pdf=88CWczOu1w50OMePOizlpQ==, pdfFileSize=4140637, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=bmTo3WOx444WpPC2RxZ+mw==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=4SjfczZIvIbO4qfMRSIGFA==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=白雪飞, 王渊辉, 许文杰, 姜高霞, 王文剑)}, authors=[Author(id=1249044033423745590, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=baixuefei@sxu.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044033536991802, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044033423745590, language=EN, stringName=Xuefei Bai, firstName=Xuefei, middleName=null, lastName=Bai, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044033692181055, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044033423745590, language=CN, stringName=白雪飞, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1山西大学计算机与信息技术学院,太原030006, bio={"content":"
白雪飞,女,副教授,主要研究方向为图像处理和机器学习。E-mail:baixuefei@sxu.edu.cn
"}, bioImg=null, bioContent=
白雪飞,女,副教授,主要研究方向为图像处理和机器学习。E-mail:baixuefei@sxu.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044032991732257, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=1, ext=[AuthorCompanyExt(id=1249044033021092387, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China), AuthorCompanyExt(id=1249044033104978470, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1山西大学计算机与信息技术学院,太原030006)])]), Author(id=1249044033834787402, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=wjwang@sxu.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044033985782354, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044033834787402, language=EN, stringName=Yuanhui Wang, firstName=Yuanhui, middleName=null, lastName=Wang, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044035600589406, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044033834787402, language=CN, stringName=王渊辉, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1山西大学计算机与信息技术学院,太原030006, bio={"content":"
王文剑,通信作者,女,教授,主要研究方向为机器学习、计算智能和图像处理。E-mail: wjwang@sxu.edu.cn
"}, bioImg=null, bioContent=
王文剑,通信作者,女,教授,主要研究方向为机器学习、计算智能和图像处理。E-mail: wjwang@sxu.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044032991732257, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=1, ext=[AuthorCompanyExt(id=1249044033021092387, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China), AuthorCompanyExt(id=1249044033104978470, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1山西大学计算机与信息技术学院,太原030006)])]), Author(id=1249044035797721702, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=wangyuanhui2@sxu.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044035910967922, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044035797721702, language=EN, stringName=Wenjie Xu, firstName=Wenjie, middleName=null, lastName=Xu, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044036070351486, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044035797721702, language=CN, stringName=许文杰, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1山西大学计算机与信息技术学院,太原030006, bio={"content":"
王渊辉,男,硕士研究生,主要研究方向为图像处理和机器学习。E-mail: wangyuanhui2@sxu.edu.cn
"}, bioImg=null, bioContent=
王渊辉,男,硕士研究生,主要研究方向为图像处理和机器学习。E-mail: wangyuanhui2@sxu.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044032991732257, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=1, ext=[AuthorCompanyExt(id=1249044033021092387, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China), AuthorCompanyExt(id=1249044033104978470, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1山西大学计算机与信息技术学院,太原030006)])]), Author(id=1249044036187792007, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=202322409023@email.sxu.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044036322009748, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044036187792007, language=EN, stringName=Gaoxia Jiang, firstName=Gaoxia, middleName=null, lastName=Jiang, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044036594639516, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044036187792007, language=CN, stringName=姜高霞, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1山西大学计算机与信息技术学院,太原030006, bio={"content":"
许文杰,男,硕士研究生,主要研究方向为图像处理和机器学习。E-mail: 202322409023@email.sxu.edu.cn
"}, bioImg=null, bioContent=
许文杰,男,硕士研究生,主要研究方向为图像处理和机器学习。E-mail: 202322409023@email.sxu.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044032991732257, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=1, ext=[AuthorCompanyExt(id=1249044033021092387, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China), AuthorCompanyExt(id=1249044033104978470, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1山西大学计算机与信息技术学院,太原030006)])]), Author(id=1249044036770800289, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, orderNo=4, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=jianggaoxia@sxu.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1249044037060207280, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044036770800289, language=EN, stringName=Wenjian Wang, firstName=Wenjian, middleName=null, lastName=Wang, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, *, address=
2Key Laboratory of Computational Intelligence and Chinese Information Processing (Shanxi University), Ministry of Education, Taiyuan030006, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044037232173754, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, authorId=1249044036770800289, language=CN, stringName=王文剑, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, *, address=
2计算智能与中文信息处理教育部重点实验室(山西大学),太原030006, bio={"content":"
姜高霞,男,副教授,主要研究方向为机器学习和数据挖掘。E-mail: jianggaoxia@sxu.edu.cn
"}, bioImg=null, bioContent=
姜高霞,男,副教授,主要研究方向为机器学习和数据挖掘。E-mail: jianggaoxia@sxu.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044033226613290, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=2, ext=[AuthorCompanyExt(id=1249044033264362028, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044033226613290, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2Key Laboratory of Computational Intelligence and Chinese Information Processing (Shanxi University), Ministry of Education, Taiyuan030006, China), AuthorCompanyExt(id=1249044033293722157, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044033226613290, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2计算智能与中文信息处理教育部重点实验室(山西大学),太原030006)])])], keywords=[Keyword(id=1249044037609661129, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, orderNo=1, keyword=deep learning), Keyword(id=1249044037869707987, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, orderNo=2, keyword=end-to-end weakly supervised semantic segmentation), Keyword(id=1249044038041674458, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, orderNo=3, keyword=Gaussian mixture model (GMM)), Keyword(id=1249044038234612451, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, orderNo=4, keyword=knowledge distillation), Keyword(id=1249044038368830185, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, orderNo=5, keyword=class activation map (CAM)), Keyword(id=1249044038540796654, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, orderNo=1, keyword=深度学习), Keyword(id=1249044040088494838, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, orderNo=2, keyword=端到端弱监督语义分割), Keyword(id=1249044040356930304, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, orderNo=3, keyword=高斯混合模型(GMM)), Keyword(id=1249044040637948687, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, orderNo=4, keyword=知识蒸馏), Keyword(id=1249044040860246813, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, orderNo=5, keyword=类激活图(CAM))], refs=[Reference(id=1249044046434477011, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=4253, pageEnd=4262, url=null, language=null, rfNumber=null, rfOrder=0, authorNames=Araslanov N, Roth S, journalName=null, refType=null, unstructuredReference=
Araslanov N and
Roth S.
2020. Single-stage semantic segmentation from image labels//Proceedings of 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle, USA: IEEE:4253-4262 [DOI:
10.1109/cvpr42600.2020.00431], articleTitle=Single-stage semantic segmentation from image labels, refAbstract=null), Reference(id=1249044046593860573, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=549, pageEnd=565, url=null, language=null, rfNumber=null, rfOrder=1, authorNames=Bearman A, Russakovsky O, Ferrari V, Li F F, journalName=null, refType=null, unstructuredReference=
Bearman A,
Russakovsky O,
Ferrari V and
Li F F.
2016. What’s the point: semantic segmentation with point supervision//Proceedings of the 14th European Conference on Computer Vision. Amsterdam, the Netherlands: Springer:549-565 [DOI:
10.1007/978-3-319-46478-7_34], articleTitle=What’s the point: semantic segmentation with point supervision, refAbstract=null), Reference(id=1249044046853907428, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=9650, pageEnd=9660, url=null, language=null, rfNumber=null, rfOrder=2, authorNames=Caron M, Touvron H, Misra I, Jegou H, Mairal J, Bojanowski P, Joulin A, journalName=null, refType=null, unstructuredReference=
Caron M,
Touvron H,
Misra I,
Jegou H,
Mairal J,
Bojanowski P and
Joulin A.
2021. Emerging properties in self-supervised vision transformers//Proceedings of 2021 IEEE/CVF International Conference on Computer Vision. Montreal, Canada: IEEE:9650-9660 [DOI:
10.1109/iccv48922.2021.00951], articleTitle=Emerging properties in self-supervised vision transformers, refAbstract=null), Reference(id=1249044047134925805, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=8991, pageEnd=9000, url=null, language=null, rfNumber=null, rfOrder=3, authorNames=Chang Y T, Wang Q S, Hung W C, Piramuthu R, Tsai Y H, Yang M H, journalName=null, refType=null, unstructuredReference=
Chang Y T,
Wang Q S,
Hung W C,
Piramuthu R,
Tsai Y H and
Yang M H.
2020. Weakly supervised semantic segmentation via sub-category exploration//Proceedings of 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle, USA: IEEE:8991-9000 [DOI:
10.1109/cvpr42600.2020.00901], articleTitle=Weakly supervised semantic segmentation via sub-category exploration, refAbstract=null), Reference(id=1249044047311086581, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2018, volume=40, issue=4, pageStart=834, pageEnd=848, url=null, language=null, rfNumber=null, rfOrder=4, authorNames=Chen L C, Papandreou G, Kokkinos I, Murphy K, Yuille A L, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Chen L C,
Papandreou G,
Kokkinos I,
Murphy K and
Yuille A L.
2018. DeepLab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected CRFs.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
40(4): 834-848 [DOI:
10.1109/tpami.2017.2699184], articleTitle=DeepLab: semantic image segmentation with deep convolutional nets, atrous convolution, and fully connected CRFs, refAbstract=null), Reference(id=1249044047483053050, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022a, volume=null, issue=null, pageStart=4278, pageEnd=4288, url=null, language=null, rfNumber=null, rfOrder=5, authorNames=Chen Q, Yang L X, Lai J H, Xie X H, journalName=null, refType=null, unstructuredReference=
Chen Q,
Yang L X,
Lai J H and
Xie X H.
2022a. Self-supervised image-specific prototype exploration for weakly supervised semantic segmentation//Proceedings of 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition. New Orleans, USA: IEEE:4278-4288 [DOI:
10.1109/cvpr52688.2022.00425], articleTitle=Self-supervised image-specific prototype exploration for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044049089470468, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022b, volume=null, issue=null, pageStart=969, pageEnd=978, url=null, language=null, rfNumber=null, rfOrder=6, authorNames=Chen Z Z, Wang T, Wu X W, Hua X S, Zhang H W, Sun Q R, journalName=null, refType=null, unstructuredReference=
Chen Z Z,
Wang T,
Wu X W,
Hua X S,
Zhang H W and
Sun Q R.
2022b. Class re-activation maps for weakly-supervised semantic segmentation//Proceedings of 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition. New Orleans, USA: IEEE:969-978 [DOI:
10.1109/cvpr52688.2022.00104], articleTitle=Class re-activation maps for weakly-supervised semantic segmentation, refAbstract=null), Reference(id=1249044049211105292, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=1422, pageEnd=1430, url=null, language=null, rfNumber=null, rfOrder=7, authorNames=Doersch C, Gupta A, Efros A A, journalName=null, refType=null, unstructuredReference=
Doersch C,
Gupta A and
Efros A A.
2015. Unsupervised visual representation learning by context prediction//Proceedings of 2015 IEEE International Conference on Computer Vision. Santiago, Chile: IEEE:1422-1430 [DOI:
10.1109/iccv.2015.167], articleTitle=Unsupervised visual representation learning by context prediction, refAbstract=null), Reference(id=1249044049307574291, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=16, pageEnd=16, url=null, language=null, rfNumber=null, rfOrder=8, authorNames=Dosovitskiy A, Beyer L, Kolesnikov A, Weissenborn D, Zhai X H, journalName=null, refType=null, unstructuredReference=
Dosovitskiy A,
Beyer L,
Kolesnikov A,
Weissenborn D and
Zhai X H.
2021. An image is worth16 × 16 words: transformers for image recognition at scale [EB/OL]. [2025-02-17].
https://arxiv.org/pdf/2010.11929.pdf, articleTitle=An image is worth, refAbstract=null), Reference(id=1249044049441792030, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2011, volume=41, issue=1, pageStart=64, pageEnd=74, url=null, language=null, rfNumber=null, rfOrder=9, authorNames=Du Y Z, Arslanturk E, Zhou Z, Belcher C, journalName=Video based noncooperative iris image segmentation, refType=null, unstructuredReference=
Du Y Z,
Arslanturk E,
Zhou Z and
Belcher C.
2011.
Video based noncooperative iris image segmentation. IEEE Transactions on Systems, Man, and Cybernetics, Part B: Cybernetics,
41(1): 64-74 [DOI:
10.1109/tsmcb.2010.2045371], articleTitle=null, refAbstract=null), Reference(id=1249044049576009765, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2015, volume=111, issue=1, pageStart=98, pageEnd=136, url=null, language=null, rfNumber=null, rfOrder=10, authorNames=Everingham M, Eslami S M A, Van Gool L, Williams C K I, Winn J and Zisserman A, journalName=International Journal of Computer Vision, refType=null, unstructuredReference=
Everingham M,
Eslami S M A,
Van Gool L,
Williams C K I,
Winn J and Zisserman A.
2015. The Pascal visual object classes challenge: a retrospective.
International Journal of Computer Vision,
111(1): 98-136 [DOI:
10.1007/s11263-014-0733-5], articleTitle=The Pascal visual object classes challenge: a retrospective, refAbstract=null), Reference(id=1249044049655701548, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=2886, pageEnd=2895, url=null, language=null, rfNumber=null, rfOrder=11, authorNames=Gao W, Wan F, Pan X J, Peng Z L, Tian Q, Han Z J, Zhou B L, Ye Q X, journalName=null, refType=null, unstructuredReference=
Gao W,
Wan F,
Pan X J,
Peng Z L,
Tian Q,
Han Z J,
Zhou B L and
Ye Q X.
2021. TS-CAM: token semantic coupled attention map for weakly supervised object localization//Proceedings of 2021 IEEE/CVF International Conference on Computer Vision. Montreal, Canada: IEEE:2886-2895 [DOI:
10.1109/iccv48922.2021.00288], articleTitle=TS-CAM: token semantic coupled attention map for weakly supervised object localization, refAbstract=null), Reference(id=1249044049773142068, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=129, issue=6, pageStart=1789, pageEnd=1819, url=null, language=null, rfNumber=null, rfOrder=12, authorNames=Gou J P, Yu B S, Maybank S J, Tao D C, journalName=International Journal of Computer Vision, refType=null, unstructuredReference=
Gou J P,
Yu B S,
Maybank S J and
Tao D C.
2021. Knowledge distillation: a survey.
International Journal of Computer Vision,
129(6): 1789-1819 [DOI:
10.1007/s11263-021-01453-z], articleTitle=Knowledge distillation: a survey, refAbstract=null), Reference(id=1249044049873805371, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=13, authorNames=Hinton G, Vinyals O, Dean J, journalName=null, refType=null, unstructuredReference=
Hinton G,
Vinyals O and
Dean J.
2015. Distilling the knowledge in a neural network [EB/OL]. [2025-02-17].
https://arxiv.org/pdf/1503.02531.pdf, articleTitle=Distilling the knowledge in a neural network, refAbstract=null), Reference(id=1249044049966080066, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=7014, pageEnd=7023, url=null, language=null, rfNumber=null, rfOrder=14, authorNames=Huang Z L, Wang X G, Wang J S, Liu W Y, Wang J D, journalName=null, refType=null, unstructuredReference=
Huang Z L,
Wang X G,
Wang J S,
Liu W Y and
Wang J D.
2018. Weakly-supervised semantic segmentation network with deep seeded region growing//Proceedings of 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Salt Lake City, USA: IEEE:7014-7023 [DOI:
10.1109/cvpr.2018.00733], articleTitle=Weakly-supervised semantic segmentation network with deep seeded region growing, refAbstract=null), Reference(id=1249044050062549065, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=12866, pageEnd=12873, url=null, language=null, rfNumber=null, rfOrder=15, authorNames=Jiang G X, Zhang J, Bai X F, Wang W J, Meng D Y, journalName=null, refType=null, unstructuredReference=
Jiang G X,
Zhang J,
Bai X F,
Wang W J and
Meng D Y.
2024. Which is more effective in label noise cleaning, correction or filtering?//Proceedings of the 38th AAAI Conference on Artificial Intelligence. Vancouver, Canada: AAAI:12866-12873 [DOI:
10.1609/aaai.v38i11.29183], articleTitle=Which is more effective in label noise cleaning, correction or filtering?, refAbstract=null), Reference(id=1249044050163212370, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=695, pageEnd=711, url=null, language=null, rfNumber=null, rfOrder=16, authorNames=Kolesnikov A, Lampert C H, journalName=null, refType=null, unstructuredReference=
Kolesnikov A and
Lampert C H.
2016. Seed, expand and constrain: three principles for weakly-supervised image segmentation//Proceedings of the 14th European Conference on Computer Vision. Amsterdam, the Netherlands: Springer:695-711 [DOI:
10.1007/978-3-319-46493-0_42], articleTitle=Seed, expand and constrain: three principles for weakly-supervised image segmentation, refAbstract=null), Reference(id=1249044050272264281, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021b, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=17, authorNames=Lee J, Choi J, Mork J C, Yoon S, journalName=null, refType=null, unstructuredReference=
Lee J,
Choi J,
Mork J C and
Yoon S.
2021b. Reducing information bottleneck for weakly supervised semantic segmentation [EB/OL]. [2025-02-17].
https://arxiv.org/pdf/2110.06530.pdf, articleTitle=Reducing information bottleneck for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044050377121886, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=5267, pageEnd=5276, url=null, language=null, rfNumber=null, rfOrder=18, authorNames=Lee J, Kim E, Lee S, Lee J, Yoon S, journalName=null, refType=null, unstructuredReference=
Lee J,
Kim E,
Lee S,
Lee J and
Yoon S.
2019. FickleNet: weakly and semi-supervised semantic image segmentation using stochastic inference//Proceedings of 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Long Beach, USA: IEEE:5267-5276 [DOI:
10.1109/cvpr.2019.00541], articleTitle=FickleNet: weakly and semi-supervised semantic image segmentation using stochastic inference, refAbstract=null), Reference(id=1249044050507145320, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021a, volume=null, issue=null, pageStart=4071, pageEnd=4080, url=null, language=null, rfNumber=null, rfOrder=19, authorNames=Lee J, Kim E, Yoon S, journalName=null, refType=null, unstructuredReference=
Lee J,
Kim E and
Yoon S.
2021a. Anti-adversarially manipulated attributions for weakly and semi-supervised semantic segmentation//Proceedings of 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Nashville, USA: IEEE:4071-4080 [DOI:
10.1109/cvpr46437.2021.00406], articleTitle=Anti-adversarially manipulated attributions for weakly and semi-supervised semantic segmentation, refAbstract=null), Reference(id=1249044050591031406, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=1447, pageEnd=1455, url=null, language=null, rfNumber=null, rfOrder=20, authorNames=Li Y, Duan Y Q, Kuang Z H, Chen Y M, Zhang W, Li X M, journalName=null, refType=null, unstructuredReference=
Li Y,
Duan Y Q,
Kuang Z H,
Chen Y M,
Zhang W and
Li X M.
2022. Uncertainty estimation via response scaling for pseudo-mask noise mitigation in weakly-supervised semantic segmentation//Proceedings of the 36th AAAI Conference on Artificial Intelligence. Virtually: AAAI:1447-1455 [DOI:
10.1609/aaai.v36i2.20034], articleTitle=Uncertainty estimation via response scaling for pseudo-mask noise mitigation in weakly-supervised semantic segmentation, refAbstract=null), Reference(id=1249044050683306104, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=3159, pageEnd=3167, url=null, language=null, rfNumber=null, rfOrder=21, authorNames=Lin D, Dai J F, Jia J Y, He K M, Sun J, journalName=null, refType=null, unstructuredReference=
Lin D,
Dai J F,
Jia J Y,
He K M and
Sun J.
2016. ScribbleSup: scribble-supervised convolutional networks for semantic segmentation//Proceedings of 2016 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Las Vegas, USA: IEEE:3159-3167 [DOI:
10.1109/cvpr.2016.344], articleTitle=ScribbleSup: scribble-supervised convolutional networks for semantic segmentation, refAbstract=null), Reference(id=1249044050758803582, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=740, pageEnd=755, url=null, language=null, rfNumber=null, rfOrder=22, authorNames=Lin T Y, Maire M, Belongie S, Hays J, Perona P, Ramanan D, Dollár P, Zitnick C L, journalName=null, refType=null, unstructuredReference=
Lin T Y,
Maire M,
Belongie S,
Hays J,
Perona P,
Ramanan D,
Dollár P and
Zitnick C L.
2014. Microsoft COCO: common objects in context//Proceedings of the 13th European Conference on Computer Vision. Zurich, Switzerland: Springer:740-755 [DOI:
10.1007/978-3-319-10602-1_48], articleTitle=Microsoft COCO: common objects in context, refAbstract=null), Reference(id=1249044050846883973, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=19574, pageEnd=19584, url=null, language=null, rfNumber=null, rfOrder=23, authorNames=Rong S H, Tu B H, Wang Z L, Li J J, journalName=null, refType=null, unstructuredReference=
Rong S H,
Tu B H,
Wang Z L and
Li J J.
2023. Boundary-enhanced co-training for weakly supervised semantic segmentation//Proceedings of 2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Vancouver, Canada: IEEE:19574-19584 [DOI:
10.1109/cvpr52729.2023.01875], articleTitle=Boundary-enhanced co-training for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044050951741581, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=16846, pageEnd=16855, url=null, language=null, rfNumber=null, rfOrder=24, authorNames=Ru L X, Zhan Y B, Yu B S, Du B, journalName=null, refType=null, unstructuredReference=
Ru L X,
Zhan Y B,
Yu B S and
Du B.
2022. Learning affinity from attention: end-to-end weakly-supervised semantic segmentation with transformers//Proceedings of 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition. New Orleans, USA: IEEE:16846-16855 [DOI:
10.1109/cvpr52688.2022.01634], articleTitle=Learning affinity from attention: end-to-end weakly-supervised semantic segmentation with transformers, refAbstract=null), Reference(id=1249044051064987795, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=3093, pageEnd=3102, url=null, language=null, rfNumber=null, rfOrder=25, authorNames=Ru L X, Zheng H L, Zhan Y B, Du B, journalName=null, refType=null, unstructuredReference=
Ru L X,
Zheng H L,
Zhan Y B and
Du B.
2023. Token contrast for weakly-supervised semantic segmentation//Proceedings of 2023 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Vancouver, Canada: IEEE:3093-3102 [DOI:
10.1109/cvpr52729.2023.00302], articleTitle=Token contrast for weakly-supervised semantic segmentation, refAbstract=null), Reference(id=1249044051169845401, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=3544, pageEnd=3553, url=null, language=null, rfNumber=null, rfOrder=26, authorNames=Singh K K, Lee Y J, journalName=null, refType=null, unstructuredReference=
Singh K K and
Lee Y J.
2017. Hide-and-Seek: forcing a network to be meticulous for weakly-supervised object and action localization//Proceedings of 2017 IEEE International Conference on Computer Vision. Venice, Italy: IEEE:3544-3553 [DOI:
10.1109/iccv.2017.381], articleTitle=Hide-and-Seek: forcing a network to be meticulous for weakly-supervised object and action localization, refAbstract=null), Reference(id=1249044051262120095, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=7004, pageEnd=7014, url=null, language=null, rfNumber=null, rfOrder=27, authorNames=Su Y K, Sun R Z, Lin G S, Wu Q Y, journalName=null, refType=null, unstructuredReference=
Su Y K,
Sun R Z,
Lin G S and
Wu Q Y.
2021. Context decoupling augmentation for weakly supervised semantic segmentation//Proceedings of 2021 IEEE/CVF International Conference on Computer Vision. Montreal, Canada: IEEE:7004-7014 [DOI:
10.1109/iccv48922.2021.00692], articleTitle=Context decoupling augmentation for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044051341811881, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=1354, pageEnd=1362, url=null, language=null, rfNumber=null, rfOrder=28, authorNames=Wang X, You S D, Li X, Ma H M, journalName=null, refType=null, unstructuredReference=
Wang X,
You S D,
Li X and
Ma H M.
2018. Weakly-supervised semantic segmentation by iteratively mining common object features//Proceedings of 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Salt Lake City, USA: IEEE:1354-1362 [DOI:
10.1109/cvpr.2018.00147], articleTitle=Weakly-supervised semantic segmentation by iteratively mining common object features, refAbstract=null), Reference(id=1249044051434086572, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=12275, pageEnd=12284, url=null, language=null, rfNumber=null, rfOrder=29, authorNames=Wang Y D, Zhang J, Kan M N, Shan S G, Chen X L, journalName=null, refType=null, unstructuredReference=
Wang Y D,
Zhang J,
Kan M N,
Shan S G and
Chen X L.
2020. Self-supervised equivariant attention mechanism for weakly supervised semantic segmentation//Proceedings of 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle, USA: IEEE:12275-12284 [DOI:
10.1109/cvpr42600.2020.01229], articleTitle=Self-supervised equivariant attention mechanism for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044051555721398, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1568, pageEnd=1576, url=null, language=null, rfNumber=null, rfOrder=30, authorNames=Wei Y C, Feng J S, Liang X D, Cheng M M, Zhao Y, Yan S C, journalName=null, refType=null, unstructuredReference=
Wei Y C,
Feng J S,
Liang X D,
Cheng M M,
Zhao Y and
Yan S C.
2017. Object region mining with adversarial erasing: a simple classification to semantic segmentation approach//Proceedings of 2017 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Honolulu, USA: IEEE:1568-1576 [DOI:
10.1109/cvpr.2017.687], articleTitle=Object region mining with adversarial erasing: a simple classification to semantic segmentation approach, refAbstract=null), Reference(id=1249044051677356224, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=16765, pageEnd=16774, url=null, language=null, rfNumber=null, rfOrder=31, authorNames=Wu T, Huang J S, Gao G Y, Wei X M, Wei X L, Luo X, Liu C H, journalName=null, refType=null, unstructuredReference=
Wu T,
Huang J S,
Gao G Y,
Wei X M,
Wei X L,
Luo X and
Liu C H.
2021. Embedded discriminative attention mechanism for weakly supervised semantic segmentation//Proceedings of 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Nashville, USA: IEEE:16765-16774 [DOI:
10.1109/cvpr46437.2021.01649], articleTitle=Embedded discriminative attention mechanism for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044051786408135, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=null, pageStart=3534, pageEnd=3543, url=null, language=null, rfNumber=null, rfOrder=32, authorNames=Wu Y C, Ye X C, Yang K Q, Li J D, Li X Q, journalName=null, refType=null, unstructuredReference=
Wu Y C,
Ye X C,
Yang K Q,
Li J D and
Li X Q.
2024. DuPL: dual student with trustworthy progressive learning for robust weakly supervised semantic segmentation//Proceedings of 2024 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Seattle, USA: IEEE:3534-3543 [DOI:
10.1109/cvpr52733.2024.00339], articleTitle=DuPL: dual student with trustworthy progressive learning for robust weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044051937403087, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2025, volume=36, issue=3, pageStart=5082, pageEnd=5096, url=null, language=null, rfNumber=null, rfOrder=33, authorNames=Xu L, Bennamoun M, Boussaid F, Ouyang W L, Sohel F, Xu D, journalName=IEEE Transactions on Neural Networks and Learning Systems, refType=null, unstructuredReference=
Xu L,
Bennamoun M,
Boussaid F,
Ouyang W L,
Sohel F and
Xu D.
2025. Auxiliary tasks enhanced dual-affinity learning for weakly supervised semantic segmentation.
IEEE Transactions on Neural Networks and Learning Systems,
36(3): 5082-5096 [DOI:
10.1109/tnnls.2024.3373566], articleTitle=Auxiliary tasks enhanced dual-affinity learning for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044053518655704, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=4310, pageEnd=4319, url=null, language=null, rfNumber=null, rfOrder=34, authorNames=Xu L, Ouyang W L, Bennamoun M, Boussaid F, Xu D, journalName=null, refType=null, unstructuredReference=
Xu L,
Ouyang W L,
Bennamoun M,
Boussaid F and
Xu D.
2022. Multi-class token transformer for weakly supervised semantic segmentation//Proceedings of 2022 IEEE/CVF Conference on Computer Vision and Pattern Recognition. New Orleans, USA: IEEE:4310-4319 [DOI:
10.1109/cvpr52688.2022.00427], articleTitle=Multi-class token transformer for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044053631901919, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=3045, pageEnd=3053, url=null, language=null, rfNumber=null, rfOrder=35, authorNames=Xu R T, Wang C W, Sun J X, Xu S B, Meng W L, Zhang X P, journalName=null, refType=null, unstructuredReference=
Xu R T,
Wang C W,
Sun J X,
Xu S B,
Meng W L and
Zhang X P.
2023. Self correspondence distillation for end-to-end weakly-supervised semantic segmentation//Proceedings of the 37th AAAI Conference on Artificial Intelligence. Washington, USA: AAAI:3045-3053 [DOI:
10.1609/aaai.v37i3.25408], articleTitle=Self correspondence distillation for end-to-end weakly-supervised semantic segmentation, refAbstract=null), Reference(id=1249044053715788005, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2001, volume=null, issue=null, pageStart=145, pageEnd=148, url=null, language=null, rfNumber=null, rfOrder=36, authorNames=Xuan G R, Zhang W, Chai P Q, journalName=null, refType=null, unstructuredReference=
Xuan G R,
Zhang W and
Chai P Q.
2001. EM algorithms of Gaussian mixture model and hidden Markov model//Proceedings of 2001 International Conference on Image Processing. Thessaloniki, Greece: IEEE:145-148 [DOI:
10.1109/icip.2001.958974], articleTitle=EM algorithms of Gaussian mixture model and hidden Markov model, refAbstract=null), Reference(id=1249044053829034220, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=2623, pageEnd=2632, url=null, language=null, rfNumber=null, rfOrder=37, authorNames=Yao Y Z, Chen T, Xie G S, Zhang C Y, Shen F M, Wu Q, Tang Z M, Zhang J, journalName=null, refType=null, unstructuredReference=
Yao Y Z,
Chen T,
Xie G S,
Zhang C Y,
Shen F M,
Wu Q,
Tang Z M and
Zhang J.
2021. Non-salient region object mining for weakly supervised semantic segmentation//Proceedings of 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Nashville, USA: IEEE:2623-2632 [DOI:
10.1109/cvpr46437.2021.00265], articleTitle=Non-salient region object mining for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044053929697525, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=12765, pageEnd=12772, url=null, language=null, rfNumber=null, rfOrder=38, authorNames=Zhang B F, Xiao J M, Wei Y C, Sun M J, Huang K Z, journalName=null, refType=null, unstructuredReference=
Zhang B F,
Xiao J M,
Wei Y C,
Sun M J and
Huang K Z.
2020. Reliability does matter: an end-to-end weakly supervised semantic segmentation approach//Proceedings of the 34th AAAI Conference on Artificial Intelligence. New York, USA: AAAI:12765-12772 [DOI:
10.1609/aaai.v34i07.6971], articleTitle=Reliability does matter: an end-to-end weakly supervised semantic segmentation approach, refAbstract=null), Reference(id=1249044054021972219, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=7242, pageEnd=7251, url=null, language=null, rfNumber=null, rfOrder=39, authorNames=Zhang F, Gu C C, Zhang C Y, Dai Y C, journalName=null, refType=null, unstructuredReference=
Zhang F,
Gu C C,
Zhang C Y and
Dai Y C.
2021. Complementary patch for weakly supervised semantic segmentation//Proceedings of 2021 IEEE/CVF International Conference on Computer Vision. Montreal, Canada: IEEE:7242-7251 [DOI:
10.1109/iccv48922.2021.00715], articleTitle=Complementary patch for weakly supervised semantic segmentation, refAbstract=null), Reference(id=1249044054114246912, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022, volume=27, issue=8, pageStart=2516, pageEnd=2526, url=null, language=null, rfNumber=null, rfOrder=40, authorNames=Zhang W K, Liu W J, Sun X, Xu G L, Fu K, journalName=Journal of Image and Graphics, refType=null, unstructuredReference=
Zhang W K,
Liu W J,
Sun X,
Xu G L and
Fu K.
2022. Multi-source features adaptation fusion network for semantic segmentation in high-resolution remote sensing images.
Journal of Image and Graphics,
27(8): 2516-2526, articleTitle=Multi-source features adaptation fusion network for semantic segmentation in high-resolution remote sensing images, refAbstract=null), Reference(id=1249044054202327301, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022, volume=27, issue=8, pageStart=2516, pageEnd=2526, url=null, language=null, rfNumber=null, rfOrder=41, authorNames=张文凯, 刘文杰, 孙显, 许光銮, 付琨, journalName=中国图象图形学报, refType=null, unstructuredReference=张文凯, 刘文杰, 孙显, 许光銮, 付琨.
2022. 多源特征自适应融合网络的高分遥感影像语义分割.
中国图象图形学报,
27(8): 2516-2526 [DOI:
10.11834/jig.210054], articleTitle=多源特征自适应融合网络的高分遥感影像语义分割, refAbstract=null), Reference(id=1249044054277824778, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=2921, pageEnd=2929, url=null, language=null, rfNumber=null, rfOrder=42, authorNames=Zhou B L, Khosla A, Lapedriza A, Oliva A, Torralba A, journalName=null, refType=null, unstructuredReference=
Zhou B L,
Khosla A,
Lapedriza A,
Oliva A and
Torralba A.
2016. Learning deep features for discriminative localization//Proceedings of 2016 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Las Vegas, USA: IEEE:2921-2929 [DOI:
10.1109/cvpr.2016.319], articleTitle=Learning deep features for discriminative localization, refAbstract=null), Reference(id=1249044054508511504, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022a, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=43, authorNames=Zhou J H, Wei C, Wang H Y, Shen W, Xie C H, Yuille A, Kong T, journalName=null, refType=null, unstructuredReference=
Zhou J H,
Wei C,
Wang H Y,
Shen W,
Xie C H,
Yuille A and
Kong T.
2022a. iBOT: image BERT pre-training with online tokenizer [EB/OL]. [2025-02-17].
https://arxiv.org/pdf/2111.07832.pdf, articleTitle=iBOT: image BERT pre-training with online tokenizer, refAbstract=null), Reference(id=1249044054588203283, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, doi=null, pmid=null, pmcid=null, year=2022b, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=44, authorNames=Zhou Y Y, Yun X Y, Chai C, Liu Z Y, Fan W X, Luo X, journalName=null, refType=null, unstructuredReference=
Zhou Y Y,
Yun X Y,
Chai C,
Liu Z Y,
Fan W X and
Luo X.
2022b. Efficient textual explanations for complex road and traffic scenarios based on semantic segmentation [EB/OL]. [2025-02-17].
https://arxiv.org/pdf/2205.14118.pdf, articleTitle=Efficient textual explanations for complex road and traffic scenarios based on semantic segmentation, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1249044032991732257, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=1, ext=[AuthorCompanyExt(id=1249044033021092387, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer and Information Technology, Shanxi University, Taiyuan030006, China), AuthorCompanyExt(id=1249044033104978470, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044032991732257, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1山西大学计算机与信息技术学院,太原030006)]), AuthorCompany(id=1249044033226613290, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, xref=2, ext=[AuthorCompanyExt(id=1249044033264362028, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044033226613290, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2Key Laboratory of Computational Intelligence and Chinese Information Processing (Shanxi University), Ministry of Education, Taiyuan030006, China), AuthorCompanyExt(id=1249044033293722157, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, companyId=1249044033226613290, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2计算智能与中文信息处理教育部重点实验室(山西大学),太原030006)])], figs=[ArticleFig(id=1249044041103516457, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Fig.1, caption=
Overall framework, figureFileSmall=EPtvV5HxcQQOk4Vhe/49Ow==, figureFileBig=bmTo3WOx444WpPC2RxZ+mw==, tableContent=null), ArticleFig(id=1249044041195791152, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=图1, caption=
整体框架, figureFileSmall=EPtvV5HxcQQOk4Vhe/49Ow==, figureFileBig=bmTo3WOx444WpPC2RxZ+mw==, tableContent=null), ArticleFig(id=1249044041791382342, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Fig.2, caption=
Visualization of pseudo labels in ablation experiments, figureFileSmall=lS5xTHuT2LSbD8RYBF6ZoA==, figureFileBig=3AEBkSCtfQT71hjVNj1LjA==, tableContent=null), ArticleFig(id=1249044042013680459, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=图2, caption=
消融实验伪标签可视化, figureFileSmall=lS5xTHuT2LSbD8RYBF6ZoA==, figureFileBig=3AEBkSCtfQT71hjVNj1LjA==, tableContent=null), ArticleFig(id=1249044042215007061, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Fig.3, caption=
CAM visualization, figureFileSmall=L1EqErUxqkDn6cNdjeBb/Q==, figureFileBig=bdyOIyqPEYBDsEaL3bYLGw==, tableContent=null), ArticleFig(id=1249044042370196314, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=图3, caption=
CAM可视化((a) baseline; (b) + DSKD; (c) + GC + DSKD)
, figureFileSmall=L1EqErUxqkDn6cNdjeBb/Q==, figureFileBig=bdyOIyqPEYBDsEaL3bYLGw==, tableContent=null), ArticleFig(id=1249044042462471007, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Fig.4, caption=
Comparison of segmentation results of different methods on PASCAL VOC 2012 val set, figureFileSmall=rcEQ4jYTV1t8gQYhQ/ohoA==, figureFileBig=PolzxMj4PSbkP/St58fRkg==, tableContent=null), ArticleFig(id=1249044042600883046, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=图4, caption=
各方法在 PASCAL VOC 2012 验证集的分割结果对比((a) original images; (b) ground truth; (c) AFA; (d) TSCD; (e) ToCo; (f) ours)
, figureFileSmall=rcEQ4jYTV1t8gQYhQ/ohoA==, figureFileBig=PolzxMj4PSbkP/St58fRkg==, tableContent=null), ArticleFig(id=1249044042785432429, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Tab.1, caption=
Ablation experiment of pseudo label generation
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模块 | mIoU/% |
|---|
| Baseline | DSKD | GC |
|---|
| √ | - | - | 68.57 |
| √ | √ | - | 68.53 |
| √ | √ | √ | 69.67 |
), ArticleFig(id=1249044042957398901, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=表1, caption=
伪标签生成消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模块 | mIoU/% |
|---|
| Baseline | DSKD | GC |
|---|
| √ | - | - | 68.57 |
| √ | √ | - | 68.53 |
| √ | √ | √ | 69.67 |
), ArticleFig(id=1249044044597371774, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Tab.2, caption=
Comparison of CAM image generation and segmentation accuracy using different thresholds
, figureFileSmall=null, figureFileBig=null, tableContent=
| θh | θl | mIoU/% |
|---|
| 分割结果 | CAM |
|---|
| 0.75 | 0.35 | 69.012 | 70.966 |
| 0.85 | 0.25 | 69.670 | 71.429 |
| 0.90 | 0.20 | 69.390 | 70.892 |
), ArticleFig(id=1249044044911944587, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=表2, caption=
不同阈值生成CAM以及分割结果精度对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| θh | θl | mIoU/% |
|---|
| 分割结果 | CAM |
|---|
| 0.75 | 0.35 | 69.012 | 70.966 |
| 0.85 | 0.25 | 69.670 | 71.429 |
| 0.90 | 0.20 | 69.390 | 70.892 |
), ArticleFig(id=1249044045058745235, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Tab.3, caption=
Comparison of segmentation accuracy using different loss function weight settings
, figureFileSmall=null, figureFileBig=null, tableContent=
 |  |  | mIoU/% |
|---|
| 0.1 | 0.4 | 0.1 | 67.19 |
| 0.1 | 0.5 | 0.1 | 67.18 |
| 0.1 | 0.6 | 0.1 | 68.04 |
| 0.2 | 0.4 | 0.1 | 68.82 |
| 0.2 | 0.5 | 0.1 | 69.67 |
| 0.2 | 0.5 | 0.2 | 68.95 |
| 0.2 | 0.6 | 0.1 | 68.56 |
), ArticleFig(id=1249044045226517400, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=表3, caption=
不同损失函数权重生成分割结果精度对比
, figureFileSmall=null, figureFileBig=null, tableContent=
 |  |  | mIoU/% |
|---|
| 0.1 | 0.4 | 0.1 | 67.19 |
| 0.1 | 0.5 | 0.1 | 67.18 |
| 0.1 | 0.6 | 0.1 | 68.04 |
| 0.2 | 0.4 | 0.1 | 68.82 |
| 0.2 | 0.5 | 0.1 | 69.67 |
| 0.2 | 0.5 | 0.2 | 68.95 |
| 0.2 | 0.6 | 0.1 | 68.56 |
), ArticleFig(id=1249044045327180705, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Tab.4, caption=
Comparison of pseudo-label accuracy of different methods on PASCAL VOC 2012 dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 类别 | 方法 | 基干网络 | mIoU/% |
|---|
| 验证集 | 测试集 |
|---|
两阶段弱监督 语义分割方法 | SEAM | R38 | 64.5 | 65.7 |
| SC-CAM | R101 | 66.1 | 65.9 |
| AdvCAM | R101 | 68.1 | 68.0 |
| ReCAM | R101 | 68.5 | 68.4 |
| RIB | R101 | 68.3 | 68.6 |
| AuxSegNet+ | R38 | 70.7 | 70.9 |
| URN | R101 | 69.5 | 69.7 |
| BECO | MiT-B2 | 73.7 | 73.5 |
端到端弱监督 语义分割方法 | 1Stage | R38 | 62.7 | 62.9 |
| RPM | R38 | 62.7 | 64.3 |
| TSCD | MIT-B1 | 67.3 | 67.5 |
| AFA | MIT-B1 | 66.0 | 66.3 |
| DuPL | ViT-B | 73.3 | 72.8 |
| ToCo | ViT-B | 71.1 | 72.2 |
| 本文 | ViT-B | 74.8 | 73.9 |
), ArticleFig(id=1249044045457204133, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=表4, caption=
各方法在PASCAL VOC 2012数据集上生成伪标签精度对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 类别 | 方法 | 基干网络 | mIoU/% |
|---|
| 验证集 | 测试集 |
|---|
两阶段弱监督 语义分割方法 | SEAM | R38 | 64.5 | 65.7 |
| SC-CAM | R101 | 66.1 | 65.9 |
| AdvCAM | R101 | 68.1 | 68.0 |
| ReCAM | R101 | 68.5 | 68.4 |
| RIB | R101 | 68.3 | 68.6 |
| AuxSegNet+ | R38 | 70.7 | 70.9 |
| URN | R101 | 69.5 | 69.7 |
| BECO | MiT-B2 | 73.7 | 73.5 |
端到端弱监督 语义分割方法 | 1Stage | R38 | 62.7 | 62.9 |
| RPM | R38 | 62.7 | 64.3 |
| TSCD | MIT-B1 | 67.3 | 67.5 |
| AFA | MIT-B1 | 66.0 | 66.3 |
| DuPL | ViT-B | 73.3 | 72.8 |
| ToCo | ViT-B | 71.1 | 72.2 |
| 本文 | ViT-B | 74.8 | 73.9 |
), ArticleFig(id=1249044045612393390, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Tab.5, caption=
Comparison of pseudo-label generation accuracy of different methods on MS COCO 2014 dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 类别 | 方法 | 基干网络 | mIoU/% |
|---|
两阶段弱监督 语义分割方法 | SEAM | R38 | 31.9 |
| MCTformer | R38 | 42.0 |
| AuxSegNet+ | R38 | 37.0 |
| CDA | R38 | 33.2 |
| URN | R101 | 40.7 |
| SIPE | R101 | 40.6 |
端到端弱监督 语义分割方法 | TSCD | MIT-B1 | 39.2 |
| TSCD+CRF | MIT-B1 | 40.1 |
| AFA | MIT-B1 | 38.0 |
| AFA+CRF | MIT-B1 | 38.9 |
| 本文 | ViT-B | 42.3 |
), ArticleFig(id=1249044045717250995, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=表5, caption=
各方法在MS COCO 2014数据集上伪标签精度对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 类别 | 方法 | 基干网络 | mIoU/% |
|---|
两阶段弱监督 语义分割方法 | SEAM | R38 | 31.9 |
| MCTformer | R38 | 42.0 |
| AuxSegNet+ | R38 | 37.0 |
| CDA | R38 | 33.2 |
| URN | R101 | 40.7 |
| SIPE | R101 | 40.6 |
端到端弱监督 语义分割方法 | TSCD | MIT-B1 | 39.2 |
| TSCD+CRF | MIT-B1 | 40.1 |
| AFA | MIT-B1 | 38.0 |
| AFA+CRF | MIT-B1 | 38.9 |
| 本文 | ViT-B | 42.3 |
), ArticleFig(id=1249044045880828861, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=EN, label=Tab.6, caption=
mIoU comparison of different classes and methods on PASCAL VOC 2012 val set
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 点mIoU | bkg | aero | bike | bird | boat | bottle | bus | car | cat | chair | cow |
|---|
| TSCD | 67.3 | 87.4 | 70.6 | 61.6 | 75.2 | 55.4 | 62.8 | 75.1 | 57.7 | 77.4 | 39.4 | 77.4 |
| AFA | 66.0 | 85.8 | 71.4 | 58.8 | 73.8 | 57.7 | 57.8 | 77.8 | 66.7 | 77.7 | 27.7 | 79.5 |
| ToCo | 71.1 | 89.9 | 81.7 | 35.3 | 68.2 | 62.1 | 76.3 | 83.7 | 80.4 | 87.7 | 24.6 | 88.1 |
| 本文 | 74.8 | 92.4 | 86.5 | 47.6 | 80.5 | 65.8 | 80.3 | 85.1 | 82.1 | 90.6 | 42.1 | 91.1 |
| 方法 | table | dog | horse | mbk | person | plant | sheep | sofa | train | tv |
|---|
| TSCD | 71.7 | 66.6 | 69.1 | 49.7 | 76.8 | 42.9 | 60.1 | 42.9 | 60.5 | 53.3 |
| AFA | 43.6 | 74.1 | 68.7 | 64.2 | 62.7 | 51.3 | 75.6 | 39.2 | 59.2 | 43.9 |
| ToCo | 54.8 | 87.0 | 84.1 | 76.0 | 68.1 | 65.8 | 85.7 | 42.6 | 57.8 | 65.6 |
| 本文 | 65.1 | 86.9 | 88.2 | 77.8 | 82.7 | 66.7 | 88.7 | 51.7 | 61.3 | 57.1 |
), ArticleFig(id=1249044046069572552, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017384726928, language=CN, label=表6, caption=
各方法在PASCAL VOC 2012验证集上不同类别的mIoU对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 点mIoU | bkg | aero | bike | bird | boat | bottle | bus | car | cat | chair | cow |
|---|
| TSCD | 67.3 | 87.4 | 70.6 | 61.6 | 75.2 | 55.4 | 62.8 | 75.1 | 57.7 | 77.4 | 39.4 | 77.4 |
| AFA | 66.0 | 85.8 | 71.4 | 58.8 | 73.8 | 57.7 | 57.8 | 77.8 | 66.7 | 77.7 | 27.7 | 79.5 |
| ToCo | 71.1 | 89.9 | 81.7 | 35.3 | 68.2 | 62.1 | 76.3 | 83.7 | 80.4 | 87.7 | 24.6 | 88.1 |
| 本文 | 74.8 | 92.4 | 86.5 | 47.6 | 80.5 | 65.8 | 80.3 | 85.1 | 82.1 | 90.6 | 42.1 | 91.1 |
| 方法 | table | dog | horse | mbk | person | plant | sheep | sofa | train | tv |
|---|
| TSCD | 71.7 | 66.6 | 69.1 | 49.7 | 76.8 | 42.9 | 60.1 | 42.9 | 60.5 | 53.3 |
| AFA | 43.6 | 74.1 | 68.7 | 64.2 | 62.7 | 51.3 | 75.6 | 39.2 | 59.2 | 43.9 |
| ToCo | 54.8 | 87.0 | 84.1 | 76.0 | 68.1 | 65.8 | 85.7 | 42.6 | 57.8 | 65.6 |
| 本文 | 65.1 | 86.9 | 88.2 | 77.8 | 82.7 | 66.7 | 88.7 | 51.7 | 61.3 | 57.1 |
)], attaches=null, journal=Journal(id=1249023527618129992, delFlag=0, nameCn=中国图象图形学报, nameEn=Journal of Image and Graphics, nameHistory1=null, nameHistory2=null, issn=1006-8961, eissn=null, cn=11-3758, coden=CODEN ZTTXFZ, periodic=0, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=uirXtX858YS3zEpFXZttJA==, journalPrice=null, startedYear=null, abbrevIsoEn=Journal of Image and Graphics, journalRemark=null, publicationField=null, createdTime=1775720014721, updatedTime=1775720337198, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=J, firstLetterEn=J, subjectCode=Engineering, subjectName=null, subjectCodeEn=Engineering, subjectNameEn=null, picCn=uirXtX858YS3zEpFXZttJA==, picEn=bud7qaxfvWHeFsbyBTAiKQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1249024880377786590, language=CN, name=中国图象图形学报, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1775720337242, updatedTime=1775720337242, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=e6369def-2842-41d8, submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-editor&redirect_uri=https%3A%2F%2Fcjigeditor.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=9ccec05b-6bd, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=1e8a31c8-5434-4f78, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1249024880449089759, language=EN, name=Journal of Image and Graphics, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1775720337259, updatedTime=1775720337259, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=e6369def-2842-41d8, submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-editor&redirect_uri=https%3A%2F%2Fcjigeditor.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=9ccec05b-6bd, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=1e8a31c8-5434-4f78, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1249024232475115590, websiteList=[Website(id=1249025782459334881, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1249024232475115590, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN, language=CN, createTime=1775720552315, createBy=18614031015, updateTime=1775720586268, updateBy=18614031015, name=中国图象图形学报-中文, tplId=1146099689490845704, title=中国图象图形学报, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1249026166254928133, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=articleTextType, value=kx, createTime=1775720643819, updateTime=1775720643819, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166221373698, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=banner, value=null, createTime=1775720643811, updateTime=1775720643811, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166271705352, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=grayFlag, value=0, createTime=1775720643823, updateTime=1775720643823, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166212985089, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/file/pic?fileId=TDRjKTHfgAnvFKZaDA70wA==, createTime=1775720643809, updateTime=1775720643809, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166288482570, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=minRunFlag, value=0, createTime=1775720643827, updateTime=1775720643827, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166246539524, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/file/pic, createTime=1775720643817, updateTime=1775720643817, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166280093961, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=silenceFlag, value=0, createTime=1775720643825, updateTime=1775720643825, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166233956611, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1775720643814, updateTime=1775720643814, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166259122438, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=themeColor, value=null, createTime=1775720643820, updateTime=1775720643820, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166267511047, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=themeStyle, value=null, createTime=1775720643822, updateTime=1775720643822, creator=18614031015, updator=18614031015)]), Website(id=1249025782681633001, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1249024232475115590, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN, language=EN, createTime=1775720552368, createBy=18614031015, updateTime=1775720607118, updateBy=18614031015, name=中国图象图形学报-英文, tplId=1146101810881728533, title=Journal of Image and Graphics, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1249026195371786511, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=articleTextType, value=kx, createTime=1775720650761, updateTime=1775720650761, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195355009292, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=banner, value=null, createTime=1775720650757, updateTime=1775720650757, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195392758034, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=grayFlag, value=0, createTime=1775720650766, updateTime=1775720650766, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195342426379, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/file/pic?fileId=TDRjKTHfgAnvFKZaDA70wA==, createTime=1775720650754, updateTime=1775720650754, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195409535252, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=minRunFlag, value=0, createTime=1775720650770, updateTime=1775720650770, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195367592206, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/file/pic, createTime=1775720650760, updateTime=1775720650760, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195401146643, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=silenceFlag, value=0, createTime=1775720650768, updateTime=1775720650768, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195359203597, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1775720650758, updateTime=1775720650758, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195380175120, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=themeColor, value=null, createTime=1775720650763, updateTime=1775720650763, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195388563729, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=themeStyle, value=null, createTime=1775720650765, updateTime=1775720650765, creator=18614031015, updator=18614031015)])], journalTitle=中国图象图形学报, weixinUrl=null, journalUrl=https://www.cjig.cn/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Journal of Image and Graphics, journalPhotoCn=uirXtX858YS3zEpFXZttJA==, journalPhotoEn=bud7qaxfvWHeFsbyBTAiKQ==, journalFirstLetter=J, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/10.11834/jig.250040, detailUrlEn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/10.11834/jig.250040, pdfUrlCn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/PDF/10.11834/jig.250040, pdfUrlEn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/PDF/10.11834/jig.250040, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)