Article(id=1249044017850294679, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, articleNumber=null, orderNo=null, doi=10.11834/jig.240653, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1730908800000, receivedDateStr=2024-11-07, revisedDate=1745164800000, revisedDateStr=2025-04-21, acceptedDate=null, acceptedDateStr=null, onlineDate=1775724899970, onlineDateStr=2026-04-09, pubDate=1765814400000, pubDateStr=2025-12-16, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1775724899970, onlineIssueDateStr=2026-04-09, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1775724899970, creator=13041195026, updateTime=1775724899970, updator=13041195026, issue=Issue{id=1249044006114628363, tenantId=1146029695717560320, journalId=1249024232475115590, year='2025', volume='30', issue='12', pageStart='3707', pageEnd='3968', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1775724897161, creator=13041195026, updateTime=1775726353303, updator=13041195026, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1249050113662984471, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1249050113667178776, tenantId=1146029695717560320, journalId=1249024232475115590, issueId=1249044006114628363, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=3838, endPage=3854, ext={EN=ArticleExt(id=1249044022086541735, articleId=1249044017850294679, tenantId=1146029695717560320, journalId=1249024232475115590, language=EN, title=Cross-modal feature fusion and detail-enhanced RGB-D salient object detection, columnId=1249044008786400014, journalTitle=Journal of Image and Graphics, columnName=Image Understanding and Computer Vision, runingTitle=null, highlight=null, articleAbstract=
Objective RGB-D salient object detection (SOD) combines complementary information from RGB and depth images, offering substantially enhanced performance in complex and challenging scenes compared to RGB-only models. This technique has gained considerable attention in the academic community due to its capability to effectively capture salient objects by leveraging visual and spatial information. However, existing RGB-D detection models face several key challenges. First, efficiently utilizing and fusing multi-modal information from RGB and depth inputs remains a difficult task due to the inherent differences between the two modalities. RGB images provide rich color and texture details but lack depth information, whereas depth maps offer spatial cues but are often noisy or of low quality. Second, achieving accurate boundary detection is particularly challenging in cluttered or noisy environments. Noisy depth maps and cluttered backgrounds can obscure object contours, making it difficult to predict sharp and precise boundaries. These challenges highlight the urgent need for a robust model that can effectively integrate RGB and depth information while simultaneously addressing noise and enhancing boundary precision.
Method Aiming to address these challenges, a novel method, the cross-modal feature fusion and detail-enhanced RGB-D salient object detection network (CFADNet), is introduced. The proposed network incorporates two innovative modules: the cross-modal attention fusion enhancement module (CAFEM) and the boundary feature extraction module (BFEM). The CAFEM is designed to enhance the integration of RGB and depth features by leveraging attention mechanisms that emphasize the most informative aspects of each modality. Specifically, channel attention is applied to the RGB features to suppress noise and enhance critical color and texture details. Similarly, spatial attention is applied to the depth features to emphasize spatial regions that are relevant for salient object detection. This attention-based fusion mechanism ensures that the model effectively retains global semantic information from the depth map while preserving fine-grained details from the RGB image. The fusion process is structured in multiple layers, progressively integrating features at different scales to fully utilize the complementary strengths of RGB and depth modalities. In contrast, the BFEM is specifically designed to improve the accuracy of salient object boundaries. Accurate contour detection is crucial for generating high-quality saliency maps; thus, BFEM leverages low-level CNN features, which are rich in edge and texture information. These features are refined through channel attention, which filters out noise and irrelevant details, enhancing the clarity of boundary-related cues. The refined features are then used to guide cross-modal feature decoding, ensuring that the final saliency maps exhibit sharp and accurate boundaries. By combining the edge-extraction capabilities of low-level CNN features with the semantic richness of cross-modal features, BFEM notably improves boundary precision in RGB-D salient object detection.
Result Aiming to evaluate the performance of CFADNet, extensive experiments are conducted on four widely used RGB-D salient object detection datasets: NJU2K, NLPR, STERE, and SIP. These datasets encompass a wide range of diverse and challenging scenes, making them ideal for evaluating the generalization capability of the proposed model. CFADNet is compared against 16 state-of-the-art RGB-D salient object detection methods, including DCF, CIRNet, and CAVER, using standard quantitative metrics such as mean absolute error (MAE), F-measure(Fβ), and structural similarity (Sα). CFADNet demonstrated superior performance across all datasets, particularly excelling in the MAE metric. Specifically, this network outperformed the second-best method by 6.9%, 10.5%, 9.7%, and 2.4% on the NJU2K, NLPR, STERE, and SIP datasets, respectively. These substantial improvements highlight the effectiveness of the attention-based fusion strategy and edge refinement mechanisms. Furthermore, CFADNet consistently achieved higher F-measure and Sα scores, indicating that the model not only reduces pixel-level errors but also more accurately preserves the overall structure and shape of salient objects compared to competing methods. In addition to quantitative evaluations, qualitative comparisons are conducted to visually assess the performance of CFADNet in various challenging scenarios. Results show that the proposed method generates saliency maps with sharp and accurate boundaries, even in cases where salient objects exhibit complex edges or are embedded in cluttered and noisy backgrounds. This finding demonstrates the robustness of CFADNet in handling difficult scenes by effectively separating salient objects from their background while preserving fine boundary details. The visual results further confirm that CFADNet successfully captures global semantic information and local detail, ensuring accurate identification and clear isolation of salient objects from the background.
Conclusion This paper presents CFADNet, a cross-modal feature fusion and detail-enhancement network for RGB-D SOD, designed to address the two major challenges: effective multimodal feature fusion and accurate boundary detection. CFADNet introduces two novel modules, the CAFEM and the BFEM. CFADNet effectively integrates RGB and depth information while notably enhancing the precision of salient object boundaries. The attention mechanisms used in the CAF0EM enable the network to fully leverage the complementary information from RGB and depth modalities. Simultaneously, the BFEM module focuses on refining edge details, resulting in sharper and more accurate saliency predictions. Extensive experiments conducted on four benchmark datasets demonstrate that CFADNet consistently outperforms existing state-of-the-art methods, achieving superior performance across key evaluation metric, including MAE, F-measure, and structural similarity index. These findings highlight the robustness and strong generalization capability of CFADNet in diverse and challenging environments. By combining attention-based feature fusion with effective edge refinement, CFADNet emerges as a powerful and reliable solution for RGB-D salient object detection into complex scenarios. Future research could explore extending this approach to other multi-modal tasks, such as RGB-Thermal or multi-spectral image processing, where challenges related to multi-modal fusion and boundary detection are also prevalent. Additionally, optimizing the computational efficiency of CFADNet for real-time deployment represents a potential research direction, enabling its application in time-sensitive applications such as autonomous driving and robotics.
, correspAuthors=Xiaogang Song, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Xiaogang Song, Yuping Tan, Fuqiang Guo, Xiaofeng Lu, Xinhong Hei), CN=ArticleExt(id=1249044036313621140, articleId=1249044017850294679, tenantId=1146029695717560320, journalId=1249024232475115590, language=CN, title=跨模态特征融合与细节信息增强的RGB-D显著目标检测, columnId=1249044009054835474, journalTitle=中国图象图形学报, columnName=图像理解和计算机视觉, runingTitle=null, highlight=null, articleAbstract=
目的 RGB-D显著目标检测通过整合RGB图像和深度图像的互补信息,可以提高应对复杂和具有挑战性场景的显著目标检测(salient object detection,SOD)能力,取得了比RGB显著性检测模型更好的性能,受到高度关注。然而,现有RGB-D 检测模型面临如何高效利用输入的多模态信息进行融合以及如何提高显著目标边缘检测精度等问题。为此,提出一种跨模态特征融合与边缘细节增强的RGB-D显著目标检测方法。
方法 通过跨模态注意力融合增强模块(cross-modal attention fusion enhancement module,CAFEM)对不同模态特征进行注意力整合,使RGB图像和深度图像的互补信息充分融合,使模型充分利用多模态特征,从而提高模型的性能。但是两种模态的输入容易出现背景信息混淆、噪声增多、深度图质量低和目标轮廓提取困难的情况。为应对上述问题,提出一种卷积神经网络(convolutional neural network,CNN)低层特征引导的边缘特征提取模块(boundary feature extraction module,BFEM),通过通道注意力对低层特征携带的噪声进行过滤,然后使用低层细节特征引导跨模态融合特征进行聚焦解码以得到更加准确的显著图像。
结果 在4个RGB-D显著目标检测数据集进行实验,与16种代表性方法进行定量和定性实验对比。在平均绝对误差(mean absolute error, MAE)指标上,本文方法相较于排名第2的方法,在4个数据集上分别提升6.9%、10.5%、9.7%和2.4%。结果表明,本文方法在各场景均有优异表现。
结论 提出一种用于RGB-D显著目标检测的跨模态特征融合与细节信息增强网络(cross-modal feature fusion and detail-enhanced network,CFADNet),通过跨模态注意力融合增强模块(CAFEM),较好地实现了RGB特征与深度特征的融合。此外,构建了边缘特征提取模块(BFEM)提取低层细节特征,最终较为准确地定位显著物体并增强了边缘细节的清晰度。
, correspAuthors=宋霄罡, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=XG0DEImlKXWEZ9Bt3+9MOQ==, magXml=HsYVbuZLWxCfbj4tJpsveA==, pdfUrl=null, pdf=pBhJba9G/MB8ojWaMmeZWw==, pdfFileSize=4906729, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=5b9ITVT5R5PSNWyvQVLaeQ==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=b5hV4OpwcWM9+/2E8lmeFg==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=宋霄罡, 谭裕平, 郭富强, 鲁晓锋, 黑新宏)}, authors=[Author(id=1249044037634826956, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=songxg@xaut.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1249044037949399766, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044037634826956, language=EN, stringName=Xiaogang Song, firstName=Xiaogang, middleName=null, lastName=Song, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, *, address=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044038159114974, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044037634826956, language=CN, stringName=宋霄罡, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, *, address=
1西安理工大学计算机科学与工程学院,西安710048
2人机共融智能机器人陕西省高校工程研究中心,西安710048, bio={"content":"
宋霄罡,男,副教授,主要研究方向为计算机视觉和无人自主导航系统。E-mail: songxg@xaut.edu.cn
"}, bioImg=null, bioContent=
宋霄罡,男,副教授,主要研究方向为计算机视觉和无人自主导航系统。E-mail: songxg@xaut.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044037068595890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=1, ext=[AuthorCompanyExt(id=1249044037085373108, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China), AuthorCompanyExt(id=1249044037118927541, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1西安理工大学计算机科学与工程学院,西安710048)]), AuthorCompany(id=1249044037441888960, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=2, ext=[AuthorCompanyExt(id=1249044037467054785, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China), AuthorCompanyExt(id=1249044037488026307, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2人机共融智能机器人陕西省高校工程研究中心,西安710048)])]), Author(id=1249044038356247271, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=1179961190@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044038540796653, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044038356247271, language=EN, stringName=Yuping Tan, firstName=Yuping, middleName=null, lastName=Tan, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044040063329012, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044038356247271, language=CN, stringName=谭裕平, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1西安理工大学计算机科学与工程学院,西安710048, bio={"content":"
谭裕平,男,博士研究生,主要研究方向为显著目标检测和多模态融合。E-mail: 1179961190@qq.com
"}, bioImg=null, bioContent=
谭裕平,男,博士研究生,主要研究方向为显著目标检测和多模态融合。E-mail: 1179961190@qq.com
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044037068595890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=1, ext=[AuthorCompanyExt(id=1249044037085373108, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China), AuthorCompanyExt(id=1249044037118927541, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1西安理工大学计算机科学与工程学院,西安710048)])]), Author(id=1249044040344347391, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=3200441274@stu.xaut.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044040503730951, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044040344347391, language=EN, stringName=Fuqiang Guo, firstName=Fuqiang, middleName=null, lastName=Guo, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044040608588557, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044040344347391, language=CN, stringName=郭富强, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1西安理工大学计算机科学与工程学院,西安710048, bio={"content":"
郭富强,男,硕士研究生,主要研究方向为人工智能和目标检测。E-mail: 3200441274@stu.xaut.edu.cn
"}, bioImg=null, bioContent=
郭富强,男,硕士研究生,主要研究方向为人工智能和目标检测。E-mail: 3200441274@stu.xaut.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044037068595890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=1, ext=[AuthorCompanyExt(id=1249044037085373108, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China), AuthorCompanyExt(id=1249044037118927541, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1西安理工大学计算机科学与工程学院,西安710048)])]), Author(id=1249044040742806294, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=luxiaofeng@xaut.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044040897995550, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044040742806294, language=EN, stringName=Xiaofeng Lu, firstName=Xiaofeng, middleName=null, lastName=Lu, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044041028018981, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044040742806294, language=CN, stringName=鲁晓锋, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1西安理工大学计算机科学与工程学院,西安710048
2人机共融智能机器人陕西省高校工程研究中心,西安710048, bio={"content":"
鲁晓锋,男,教授,主要研究方向为模式识别和图像处理。E-mail: luxiaofeng@xaut.edu.cn
"}, bioImg=null, bioContent=
鲁晓锋,男,教授,主要研究方向为模式识别和图像处理。E-mail: luxiaofeng@xaut.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044037068595890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=1, ext=[AuthorCompanyExt(id=1249044037085373108, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China), AuthorCompanyExt(id=1249044037118927541, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1西安理工大学计算机科学与工程学院,西安710048)]), AuthorCompany(id=1249044037441888960, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=2, ext=[AuthorCompanyExt(id=1249044037467054785, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China), AuthorCompanyExt(id=1249044037488026307, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2人机共融智能机器人陕西省高校工程研究中心,西安710048)])]), Author(id=1249044041145459500, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, orderNo=4, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=heixinhong@xaut.edu.cn, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1249044041300648757, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044041145459500, language=EN, stringName=Xinhong Hei, firstName=Xinhong, middleName=null, lastName=Hei, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1249044041460032316, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, authorId=1249044041145459500, language=CN, stringName=黑新宏, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1西安理工大学计算机科学与工程学院,西安710048
2人机共融智能机器人陕西省高校工程研究中心,西安710048, bio={"content":"
黑新宏,男,教授,主要研究方向为计算机视觉和人工智能。E-mail: heixinhong@xaut.edu.cn
"}, bioImg=null, bioContent=
黑新宏,男,教授,主要研究方向为计算机视觉和人工智能。E-mail: heixinhong@xaut.edu.cn
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1249044037068595890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=1, ext=[AuthorCompanyExt(id=1249044037085373108, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China), AuthorCompanyExt(id=1249044037118927541, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1西安理工大学计算机科学与工程学院,西安710048)]), AuthorCompany(id=1249044037441888960, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=2, ext=[AuthorCompanyExt(id=1249044037467054785, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China), AuthorCompanyExt(id=1249044037488026307, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2人机共融智能机器人陕西省高校工程研究中心,西安710048)])])], keywords=[Keyword(id=1249044041690719041, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, orderNo=1, keyword=salient object detection(SOD)), Keyword(id=1249044042026263372, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, orderNo=2, keyword=attention mechanism), Keyword(id=1249044042126926671, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, orderNo=3, keyword=cross-modal), Keyword(id=1249044042307281752, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, orderNo=4, keyword=feature fusion), Keyword(id=1249044042395362141, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, orderNo=5, keyword=edge detail-enhancement), Keyword(id=1249044042470859617, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, orderNo=1, keyword=显著性目标检测(SOD)), Keyword(id=1249044042554745699, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, orderNo=2, keyword=注意力机制), Keyword(id=1249044042676380521, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, orderNo=3, keyword=跨模态), Keyword(id=1249044042869318512, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, orderNo=4, keyword=特征融合), Keyword(id=1249044043032896377, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, orderNo=5, keyword=边缘细节增强)], refs=[Reference(id=1249044050641363060, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=136, issue=null, pageStart=null, pageEnd=109194, url=null, language=null, rfNumber=null, rfOrder=0, authorNames=Bi H B, Wu R W, Liu Z Q, Zhu H H, Zhang C, Xiang T Z, journalName=Pattern Recognition, refType=null, unstructuredReference=
Bi H B,
Wu R W,
Liu Z Q,
Zhu H H,
Zhang C and
Xiang T Z.
2023. Cross-modal hierarchical interaction network for RGB-D salient object detection.
Pattern Recognition,
136: #109194 [DOI:
10.1016/j.patcog.2022.109194], articleTitle=Cross-modal hierarchical interaction network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044050737832060, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2018a, volume=null, issue=null, pageStart=3051, pageEnd=3060, url=null, language=null, rfNumber=null, rfOrder=1, authorNames=Chen H, Li Y F, journalName=null, refType=null, unstructuredReference=
Chen H and
Li Y F.
2018a. Progressively complementarity-aware fusion network for RGB-D salient object detection//Proceedings of 2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition. Salt Lake City, USA: IEEE:3051-3060 [DOI:
10.1109/CVPR.2018.00322], articleTitle=Progressively complementarity-aware fusion network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044050838495364, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=2, authorNames=Chen J N, Lu Y Y, Yu Q H, Luo X D, Adeli E, Wang Y, Lu L, Yuille A L, Zhou Y Y, journalName=null, refType=null, unstructuredReference=
Chen J N,
Lu Y Y,
Yu Q H,
Luo X D,
Adeli E,
Wang Y,
Lu L,
Yuille A L and
Zhou Y Y.
2021. TransUNet: transformers make strong encoders for medical image segmentation [EB/OL]. [2024-11-07].
https://arxiv.org/pdf/2102.04306.pdf, articleTitle=TransUNet: transformers make strong encoders for medical image segmentation, refAbstract=null), Reference(id=1249044050943352972, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=35, issue=3, pageStart=4309, pageEnd=4323, url=null, language=null, rfNumber=null, rfOrder=3, authorNames=Chen Q, Zhang Z X, Lu Y Y, Fu K R, Zhao Q J, journalName=IEEE Transactions on Neural Networks and Learning Systems, refType=null, unstructuredReference=
Chen Q,
Zhang Z X,
Lu Y Y,
Fu K R and
Zhao Q J.
2024. 3-D convolutional neural networks for RGB-D salient object detection and beyond.
IEEE Transactions on Neural Networks and Learning Systems,
35(3): 4309-4323 [DOI:
10.1109/TNNLS.2022.3202241], articleTitle=3-D convolutional neural networks for RGB-D salient object detection and beyond, refAbstract=null), Reference(id=1249044051027239058, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2018b, volume=null, issue=null, pageStart=236, pageEnd=252, url=null, language=null, rfNumber=null, rfOrder=4, authorNames=Chen S H, Tan X L, Wang B, Hu X L, journalName=null, refType=null, unstructuredReference=
Chen S H,
Tan X L,
Wang B and
Hu X L.
2018b. Reverse attention for salient object detection//Proceedings of the 15th European Conference on Computer Vision (ECCV). Munich, Germany: Springer:236-252 [DOI:
10.1007/978-3-030-01240-3_15], articleTitle=Reverse attention for salient object detection, refAbstract=null), Reference(id=1249044051102736534, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=522, issue=null, pageStart=152, pageEnd=164, url=null, language=null, rfNumber=null, rfOrder=5, authorNames=Chen T Y, Xiao J, Hu X G, Zhang G F, Wang S J, journalName=Neurocomputing, refType=null, unstructuredReference=
Chen T Y,
Xiao J,
Hu X G,
Zhang G F and
Wang S J.
2023. Adaptive fusion network for RGB-D salient object detection.
Neurocomputing,
522: 152-164 [DOI:
10.1016/j.neucom.2022.12.004], articleTitle=Adaptive fusion network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044051211788445, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=25, issue=null, pageStart=4253, pageEnd=4266, url=null, language=null, rfNumber=null, rfOrder=6, authorNames=Cheng X L, Zheng X, Pei J L, Tang H, Lyu Z, Chen C B, journalName=IEEE Transactions on Multimedia, refType=null, unstructuredReference=
Cheng X L,
Zheng X,
Pei J L,
Tang H,
Lyu Z and
Chen C B.
2023. Depth-induced gap-reducing network for RGB-D salient object detection: an interaction, guidance and refinement approach.
IEEE Transactions on Multimedia,
25: 4253-4266 [DOI:
10.1109/TMM.2022.3172852], articleTitle=Depth-induced gap-reducing network for RGB-D salient object detection: an interaction, guidance and refinement approach, refAbstract=null), Reference(id=1249044051320840358, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2013, volume=null, issue=null, pageStart=#112, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=7, authorNames=Ciptadi A, Hermans T, Rehg J M, journalName=null, refType=null, unstructuredReference=
Ciptadi A,
Hermans T and
Rehg J M.
2013. An in depth view of saliency//Proceedings of 2013 British Machine Vision Conference (BMVC). Bristol, UK: BMVC:#112 [DOI:
10.5244/C.27.112], articleTitle=An in depth view of saliency, refAbstract=null), Reference(id=1249044051442475182, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022, volume=31, issue=null, pageStart=6800, pageEnd=6815, url=null, language=null, rfNumber=null, rfOrder=8, authorNames=Cong R M, Lin Q W, Zhang C, Li C Y, Cao X C, Huang Q M, Zhao Y, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Cong R M,
Lin Q W,
Zhang C,
Li C Y,
Cao X C,
Huang Q M and
Zhao Y.
2022. CIR-Net: cross-modality interaction and refinement for RGB-D salient object detection.
IEEE Transactions on Image Processing,
31: 6800-6815 [DOI:
10.1109/TIP.2022.3216198], articleTitle=CIR-Net: cross-modality interaction and refinement for RGB-D salient object detection, refAbstract=null), Reference(id=1249044051513778354, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=406, pageEnd=416, url=null, language=null, rfNumber=null, rfOrder=9, authorNames=Cong R M, Liu H Y, Zhang C, Zhang W, Zheng F, Song R, Kwong S, journalName=null, refType=null, unstructuredReference=
Cong R M,
Liu H Y,
Zhang C,
Zhang W,
Zheng F,
Song R and
Kwong S.
2023. Point-aware interaction and CNN-induced refinement network for RGB-D salient object detection//Proceedings of the 31st ACM International Conference on Multimedia. Ottawa, Canada: ACM:406-416 [DOI:
10.1145/3581783.3611982], articleTitle=Point-aware interaction and CNN-induced refinement network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044051589275834, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=9, issue=1, pageStart=2624, pageEnd=2635, url=null, language=null, rfNumber=null, rfOrder=10, authorNames=Ding N, Zhang C, Eskandarian A, journalName=IEEE Transactions on Intelligent Vehicles, refType=null, unstructuredReference=
Ding N,
Zhang C and
Eskandarian A.
2024. SalienDet: a saliency-based feature enhancement algorithm for object detection for autonomous driving.
IEEE Transactions on Intelligent Vehicles,
9(1): 2624-2635 [DOI:
10.1109/TIV.2023.3287359], articleTitle=SalienDet: a saliency-based feature enhancement algorithm for object detection for autonomous driving, refAbstract=null), Reference(id=1249044051673161919, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=61, issue=null, pageStart=1, pageEnd=9, url=null, language=null, rfNumber=null, rfOrder=11, authorNames=Ding Y, Liu Z, Huang M K, Shi R, Wang X Y, journalName=Journal of Visual Communication and Image Representation, refType=null, unstructuredReference=
Ding Y,
Liu Z,
Huang M K,
Shi R and
Wang X Y.
2019. Depth-aware saliency detection using convolutional neural networks.
Journal of Visual Communication and Image Representation,
61: 1-9 [DOI:
10.1016/j.jvcir.2019.03.019], articleTitle=Depth-aware saliency detection using convolutional neural networks, refAbstract=null), Reference(id=1249044051786408134, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=32, issue=5, pageStart=2075, pageEnd=2089, url=null, language=null, rfNumber=null, rfOrder=12, authorNames=Fan D P, Lin Z, Zhang Z, Zhu M L, Cheng M M, journalName=IEEE Transactions on Neural Networks and Learning Systems, refType=null, unstructuredReference=
Fan D P,
Lin Z,
Zhang Z,
Zhu M L and
Cheng M M.
2021. Rethinking RGB-D salient object detection: models, data sets, and large-scale benchmarks.
IEEE Transactions on Neural Networks and Learning Systems,
32(5): 2075-2089 [DOI:
10.1109/TNNLS.2020.2996406], articleTitle=Rethinking RGB-D salient object detection: models, data sets, and large-scale benchmarks, refAbstract=null), Reference(id=1249044051929014477, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=594, issue=null, pageStart=null, pageEnd=127865, url=null, language=null, rfNumber=null, rfOrder=13, authorNames=Fang X, Jiang M F, Zhu J C, Shao X L, Wang H P, journalName=Neurocomputing, refType=null, unstructuredReference=
Fang X,
Jiang M F,
Zhu J C,
Shao X L and
Wang H P.
2024. GroupTransNet: group transformer network for RGB-D salient object detection.
Neurocomputing,
594: #127865 [DOI:
10.1016/j.neucom.2024.127865], articleTitle=GroupTransNet: group transformer network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044053476712660, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022, volume=44, issue=9, pageStart=5541, pageEnd=5559, url=null, language=null, rfNumber=null, rfOrder=14, authorNames=Fu K P, Fan D P, Ji G P, Zhao Q J, Shen J B, Zhu C, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Fu K P,
Fan D P,
Ji G P,
Zhao Q J,
Shen J B and
Zhu C.
2022. Siamese network for RGB-D salient object detection and beyond.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
44(9): 5541-5559 [DOI:
10.1109/TPAMI.2021.3073689], articleTitle=Siamese network for RGB-D salient object detection and beyond, refAbstract=null), Reference(id=1249044053552210138, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2012, volume=21, issue=9, pageStart=4290, pageEnd=4303, url=null, language=null, rfNumber=null, rfOrder=15, authorNames=Gao Y, Wang M, Tao D C, Ji R R, Dai Q H, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Gao Y,
Wang M,
Tao D C,
Ji R R and
Dai Q H.
2012. 3-D object retrieval and recognition with hypergraph analysis.
IEEE Transactions on Image Processing,
21(9): 4290-4303 [DOI:
10.1109/TIP.2012.2199502], articleTitle=3-D object retrieval and recognition with hypergraph analysis, refAbstract=null), Reference(id=1249044053640290530, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2018, volume=48, issue=11, pageStart=3171, pageEnd=3183, url=null, language=null, rfNumber=null, rfOrder=16, authorNames=Han J W, Chen H, Liu N, Yan C G, Li X L, journalName=IEEE Transactions on Cybernetics, refType=null, unstructuredReference=
Han J W,
Chen H,
Liu N,
Yan C G and
Li X L.
2018. CNNs-based RGB-D saliency detection via cross-view transfer and multiview fusion.
IEEE Transactions on Cybernetics,
48(11): 3171-3183 [DOI:
10.1109/TCYB.2017.2761775], articleTitle=CNNs-based RGB-D saliency detection via cross-view transfer and multiview fusion, refAbstract=null), Reference(id=1249044053711593701, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=41, issue=4, pageStart=815, pageEnd=828, url=null, language=null, rfNumber=null, rfOrder=17, authorNames=Hou Q B, Cheng M M, Hu X W, Borji A, Tu Z W, Torr P H S, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Hou Q B,
Cheng M M,
Hu X W,
Borji A,
Tu Z W and
Torr P H S.
2019. Deeply supervised salient object detection with short connections.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
41(4): 815-828 [DOI:
10.1109/TPAMI.2018.2815688], articleTitle=Deeply supervised salient object detection with short connections, refAbstract=null), Reference(id=1249044053782896873, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022, volume=24, issue=null, pageStart=1651, pageEnd=1664, url=null, language=null, rfNumber=null, rfOrder=18, authorNames=Huang N C, Yang Y, Zhang D W, Zhang Q, Han J G, journalName=IEEE Transactions on Multimedia, refType=null, unstructuredReference=
Huang N C,
Yang Y,
Zhang D W,
Zhang Q and
Han J G.
2022. Employing bilinear fusion and saliency prior information for RGB-D salient object detection.
IEEE Transactions on Multimedia,
24: 1651-1664 [DOI:
10.1109/TMM.2021.3069297], articleTitle=Employing bilinear fusion and saliency prior information for RGB-D salient object detection, refAbstract=null), Reference(id=1249044053850005742, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=23, issue=2, pageStart=509, pageEnd=518, url=null, language=null, rfNumber=null, rfOrder=19, authorNames=Jahanifar M, Tajeddin N Z, Asl B M, Gooya A, journalName=IEEE Journal of Biomedical and Health Informatics, refType=null, unstructuredReference=
Jahanifar M,
Tajeddin N Z,
Asl B M and
Gooya A.
2019. Supervised saliency map driven segmentation of lesions in dermoscopic images.
IEEE Journal of Biomedical and Health Informatics,
23(2): 509-518 [DOI:
10.1109/JBHI.2018.2839647], articleTitle=Supervised saliency map driven segmentation of lesions in dermoscopic images, refAbstract=null), Reference(id=1249044053942280438, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=9466, pageEnd=9476, url=null, language=null, rfNumber=null, rfOrder=20, authorNames=Ji W, Li J J, Yu S, Zhang M, Piao Y, Yao S Y, Bi Q, Ma K, Zheng Y F, Lu H C, Cheng L, journalName=null, refType=null, unstructuredReference=
Ji W,
Li J J,
Yu S,
Zhang M,
Piao Y,
Yao S Y,
Bi Q,
Ma K,
Zheng Y F,
Lu H C and
Cheng L.
2021. Calibrated RGB-D salient object detection//Proceedings of 2021 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). Nashville, USA: IEEE:9466-9476 [DOI:
10.1109/CVPR46437.2021.00935], articleTitle=Calibrated RGB-D salient object detection, refAbstract=null), Reference(id=1249044054034555132, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=1115, pageEnd=1119, url=null, language=null, rfNumber=null, rfOrder=21, authorNames=Ju R, Ge L, Geng W J, Ren T W, Wu G S, journalName=null, refType=null, unstructuredReference=
Ju R,
Ge L,
Geng W J,
Ren T W and
Wu G S.
2014. Depth saliency based on anisotropic center-surround difference//Proceedings of 2014 IEEE International Conference on Image Processing (ICIP). Paris, France: IEEE:1115-1119 [DOI:
10.1109/ICIP.2014.7025222], articleTitle=Depth saliency based on anisotropic center-surround difference, refAbstract=null), Reference(id=1249044054135218433, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=1, pageEnd=15, url=null, language=null, rfNumber=null, rfOrder=22, authorNames=Kingma D P, Ba J, journalName=null, refType=null, unstructuredReference=
Kingma D P and
Ba J.
2015. Adam: a method for stochastic optimization//Proceedings of the 3rd International Conference on Learning Representations. San Diego, USA: ICLR:1-15, articleTitle=Adam: a method for stochastic optimization, refAbstract=null), Reference(id=1249044054214910215, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=630, pageEnd=647, url=null, language=null, rfNumber=null, rfOrder=23, authorNames=Lee M, Park C, Cho S, Lee S, journalName=null, refType=null, unstructuredReference=
Lee M,
Park C,
Cho S and
Lee S.
2022. SPSN: superpixel prototype sampling network for RGB-D salient object detection//Proceedings of the 17th European Conference on Computer Vision (ECCV). Tel Aviv, Israel: Springer:630-647 [DOI:
10.1007/978-3-031-19818-2_36], articleTitle=SPSN: superpixel prototype sampling network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044054483345677, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=30, issue=null, pageStart=6855, pageEnd=6868, url=null, language=null, rfNumber=null, rfOrder=24, authorNames=Li J, Su J M, Xia C Q, Ma M C, Tian Y H, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Li J,
Su J M,
Xia C Q,
Ma M C and
Tian Y H.
2021. Salient object detection with purificatory mechanism and structural similarity loss.
IEEE Transactions on Image Processing,
30: 6855-6868 [DOI:
10.1109/TIP.2021.3099405], articleTitle=Salient object detection with purificatory mechanism and structural similarity loss, refAbstract=null), Reference(id=1249044054596591893, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=238, issue=null, pageStart=null, pageEnd=121778, url=null, language=null, rfNumber=null, rfOrder=25, authorNames=Liang B C, Luo H L, journalName=Expert Systems with Applications, refType=null, unstructuredReference=
Liang B C and
Luo H L.
2024. MEANet: an effective and lightweight solution for salient object detection in optical remote sensing images.
Expert Systems with Applications,
238: #121778 [DOI:
10.1016/j.eswa.2023.121778], articleTitle=MEANet: an effective and lightweight solution for salient object detection in optical remote sensing images, refAbstract=null), Reference(id=1249044054755975451, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2018, volume=275, issue=null, pageStart=2227, pageEnd=2238, url=null, language=null, rfNumber=null, rfOrder=26, authorNames=Liang F F, Duan L J, Ma W, Qiao Y H, Cai Z, Qing L, journalName=Neurocomputing, refType=null, unstructuredReference=
Liang F F,
Duan L J,
Ma W,
Qiao Y H,
Cai Z and
Qing L.
2018. Stereoscopic saliency model using contrast and depth-guided-background prior.
Neurocomputing,
275: 2227-2238 [DOI:
10.1016/j.neucom.2017.10.052], articleTitle=Stereoscopic saliency model using contrast and depth-guided-background prior, refAbstract=null), Reference(id=1249044054852444450, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022, volume=32, issue=3, pageStart=1378, pageEnd=1389, url=null, language=null, rfNumber=null, rfOrder=27, authorNames=Mei H Y, Liu Y Y, Wei Z Q, Zhou D S, Wei X P, Zhang Q, Yang X, journalName=IEEE Transactions on Circuits and Systems for Video Technology, refType=null, unstructuredReference=
Mei H Y,
Liu Y Y,
Wei Z Q,
Zhou D S,
Wei X P,
Zhang Q and
Yang X.
2022. Exploring dense context for salient object detection.
IEEE Transactions on Circuits and Systems for Video Technology,
32(3): 1378-1389 [DOI:
10.1109/TCSVT.2021.3069848], articleTitle=Exploring dense context for salient object detection, refAbstract=null), Reference(id=1249044054927941928, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2012, volume=null, issue=null, pageStart=454, pageEnd=461, url=null, language=null, rfNumber=null, rfOrder=28, authorNames=Niu Y Z, Geng Y J, Li X Q, Liu F, journalName=null, refType=null, unstructuredReference=
Niu Y Z,
Geng Y J,
Li X Q and
Liu F.
2012. Leveraging stereopsis for saliency analysis//Proceedings of 2012 IEEE Conference on Computer Vision and Pattern Recognition (CVPR). Providence, USA: IEEE:454-461 [DOI:
10.1109/CVPR.2012.6247708], articleTitle=Leveraging stereopsis for saliency analysis, refAbstract=null), Reference(id=1249044055020216621, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=32, issue=null, pageStart=892, pageEnd=904, url=null, language=null, rfNumber=null, rfOrder=29, authorNames=Pang Y W, Zhao X Q, Zhang L H, Lu H C, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Pang Y W,
Zhao X Q,
Zhang L H and
Lu H C.
2023. CAVER: cross-modal view-mixed transformer for bi-modal salient object detection.
IEEE Transactions on Image Processing,
32: 892-904 [DOI:
10.1109/TIP.2023.3234702], articleTitle=CAVER: cross-modal view-mixed transformer for bi-modal salient object detection, refAbstract=null), Reference(id=1249044055083131184, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=#721, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=30, authorNames=Paszke A, Gross S, Massa F, Lerer A, Bradbury J, Chanan G, Killeen T, Lin Z M, Gimelshein N, Antiga L, Desmaison A, Köpf A, Yang E, DeVito Z, Raison M, Tejani A, Chilamkurthy S, Steiner B, Fang L, Bai J J, Chintala S, journalName=null, refType=null, unstructuredReference=
Paszke A,
Gross S,
Massa F,
Lerer A,
Bradbury J,
Chanan G,
Killeen T,
Lin Z M,
Gimelshein N,
Antiga L,
Desmaison A,
Köpf A,
Yang E,
DeVito Z,
Raison M,
Tejani A,
Chilamkurthy S,
Steiner B,
Fang L,
Bai J J and
Chintala S.
2019. PyTorch: an imperative style, high-performance deep learning library//Proceedings of the 33rd International Conference on Neural Information Processing Systems. Vancouver, Canada: Curran Associates Inc.:#721, articleTitle=PyTorch, refAbstract=null), Reference(id=1249044055183794487, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=92, pageEnd=109, url=null, language=null, rfNumber=null, rfOrder=31, authorNames=Peng H W, Li B, Xiong W H, Hu W M, Ji R R, journalName=null, refType=null, unstructuredReference=
Peng H W,
Li B,
Xiong W H,
Hu W M and
Ji R R.
2014. RGBD salient object detection: a benchmark and algorithms//Proceedings of the 13th European Conference on Computer Vision (ECCV). Zurich, Switzerland: Springer:92-109 [DOI:
10.1007/978-3-319-10578-9_7], articleTitle=RGBD salient object detection: a benchmark and algorithms, refAbstract=null), Reference(id=1249044055267680573, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=25, pageEnd=32, url=null, language=null, rfNumber=null, rfOrder=32, authorNames=Ren J Q, Xiaojin Gong N, Yu L, Wenhui Zhou N, Yang M Y, journalName=null, refType=null, unstructuredReference=
Ren J Q,
Xiaojin Gong N,
Yu L,
Wenhui Zhou N and
Yang M Y.
2015. Exploiting global priors for RGB-D saliency detection//Proceedings of 2015 IEEE Conference on Computer Vision and Pattern Recognition Workshops (CVPRW). Boston, USA: IEEE:25-32 [DOI:
10.1109/CVPRW.2015.7301391], articleTitle=Exploiting global priors for RGB-D saliency detection, refAbstract=null), Reference(id=1249044055364149569, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2014, volume=24, issue=5, pageStart=769, pageEnd=779, url=null, language=null, rfNumber=null, rfOrder=33, authorNames=Ren Z X, Gao S H, Chia L T, Tsang I W H, journalName=IEEE Transactions on Circuits and Systems for Video Technology, refType=null, unstructuredReference=
Ren Z X,
Gao S H,
Chia L T and
Tsang I W H.
2014. Region-based saliency detection and its application in object recognition.
IEEE Transactions on Circuits and Systems for Video Technology,
24(5): 769-779 [DOI:
10.1109/TCSVT.2013.2280096], articleTitle=Region-based saliency detection and its application in object recognition, refAbstract=null), Reference(id=1249044055448035653, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=null, rfOrder=34, authorNames=Simonyan K, Zisserman A, journalName=null, refType=null, unstructuredReference=
Simonyan K and
Zisserman A.
2015. Very deep convolutional networks for large-scale image recognition//Proceedings of the 3rd International Conference on Learning Representations. San Diego, USA: ICLR, articleTitle=Very deep convolutional networks for large-scale image recognition, refAbstract=null), Reference(id=1249044055519338823, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=35, issue=4, pageStart=1899, pageEnd=1913, url=null, language=null, rfNumber=null, rfOrder=35, authorNames=Sun F M, Hu X H, Wu J Y, Sun J, Wang F S, journalName=Journal of Software, refType=null, unstructuredReference=
Sun F M,
Hu X H,
Wu J Y,
Sun J and
Wang F S.
2024. RGB-D salient object detection based on cross-modal interactive fusion and global awareness.
Journal of Software,
35(4): 1899-1913, articleTitle=RGB-D salient object detection based on cross-modal interactive fusion and global awareness, refAbstract=null), Reference(id=1249044055582253387, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=35, issue=4, pageStart=1899, pageEnd=1913, url=null, language=null, rfNumber=null, rfOrder=36, authorNames=孙福明, 胡锡航, 武景宇, 孙静, 王法胜, journalName=软件学报, refType=null, unstructuredReference=孙福明, 胡锡航, 武景宇, 孙静, 王法胜.
2024. 跨模态交互融合与全局感知的RGB-D显著性目标检测.
软件学报,
35(4): 1899-1913 [DOI:
10.13328/j.cnki.jos.006833], articleTitle=跨模态交互融合与全局感知的RGB-D显著性目标检测, refAbstract=null), Reference(id=1249044055653556559, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022a, volume=31, issue=null, pageStart=1285, pageEnd=1297, url=null, language=null, rfNumber=null, rfOrder=37, authorNames=Wang F Y, Pan J S, Xu S K, Tang J H, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Wang F Y,
Pan J S,
Xu S K and
Tang J H.
2022a. Learning discriminative cross-modality features for RGB-D saliency detection.
IEEE Transactions on Image Processing,
31: 1285-1297 [DOI:
10.1109/TIP.2022.3140606], articleTitle=Learning discriminative cross-modality features for RGB-D saliency detection, refAbstract=null), Reference(id=1249044055733248339, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022b, volume=44, issue=6, pageStart=3239, pageEnd=3259, url=null, language=null, rfNumber=null, rfOrder=38, authorNames=Wang W G, Lai Q X, Fu H Z, Shen J B, Ling H B, Yang R G, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Wang W G,
Lai Q X,
Fu H Z,
Shen J B,
Ling H B and
Yang R G.
2022b. Salient object detection in the deep learning era: an in-depth survey.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
44(6): 3239-3259 [DOI:
10.1109/TPAMI.2021.3051099], articleTitle=Salient object detection in the deep learning era: an in-depth survey, refAbstract=null), Reference(id=1249044055808745814, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=41, issue=7, pageStart=1531, pageEnd=1544, url=null, language=null, rfNumber=null, rfOrder=39, authorNames=Wang W G, Shen J B, Ling H B, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Wang W G,
Shen J B and
Ling H B.
2019. A deep network solution for attention and aesthetics aware photo cropping.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
41(7): 1531-1544 [DOI:
10.1109/TPAMI.2018.2840724], articleTitle=A deep network solution for attention and aesthetics aware photo cropping, refAbstract=null), Reference(id=1249044055884243290, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=43, issue=7, pageStart=2413, pageEnd=2428, url=null, language=null, rfNumber=null, rfOrder=40, authorNames=Wang W G, Shen J B, Lu X K, Hoi S C H, Ling H B, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Wang W G,
Shen J B,
Lu X K,
Hoi S C H and
Ling H B.
2021. Paying attention to video object pattern understanding.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
43(7): 2413-2428 [DOI:
10.1109/TPAMI.2020.2966453], articleTitle=Paying attention to video object pattern understanding, refAbstract=null), Reference(id=1249044055959740766, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=46, issue=3, pageStart=1635, pageEnd=1649, url=null, language=null, rfNumber=null, rfOrder=41, authorNames=Wang W G, Sun G L, Van Gool L, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Wang W G,
Sun G L and
Van Gool L.
2024. Looking beyond single images for weakly supervised semantic segmentation learning.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
46(3): 1635-1649 [DOI:
10.1109/TPAMI.2022.3168530], articleTitle=Looking beyond single images for weakly supervised semantic segmentation learning, refAbstract=null), Reference(id=1249044056064598370, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022a, volume=195, issue=null, pageStart=null, pageEnd=116614, url=null, language=null, rfNumber=null, rfOrder=42, authorNames=Wu J Y, Sun F M, Xu R, Meng J, Wang F S, journalName=Expert Systems with Applications, refType=null, unstructuredReference=
Wu J Y,
Sun F M,
Xu R,
Meng J and
Wang F S.
2022a. Aggregate interactive learning for RGB-D salient object detection.
Expert Systems with Applications,
195: #116614 [DOI:
10.1016/j.eswa.2022.116614], articleTitle=Aggregate interactive learning for RGB-D salient object detection, refAbstract=null), Reference(id=1249044056144290150, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=45, issue=11, pageStart=12760, pageEnd=12771, url=null, language=null, rfNumber=null, rfOrder=43, authorNames=Wu Y H, Liu Y, Zhan X, Cheng M M, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
Wu Y H,
Liu Y,
Zhan X and
Cheng M M.
2023. P2T: pyramid pooling transformer for scene understanding.
IEEE Transactions on Pattern Analysis and Machine Intelligence,
45(11): 12760-12771 [DOI:
10.1109/TPAMI.2022.3202765], articleTitle=P2T: pyramid pooling transformer for scene understanding, refAbstract=null), Reference(id=1249044056240759147, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022b, volume=31, issue=null, pageStart=3125, pageEnd=3136, url=null, language=null, rfNumber=null, rfOrder=44, authorNames=Wu Y H, Liu Y, Zhang L, Cheng M M, Ren B, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Wu Y H,
Liu Y,
Zhang L,
Cheng M M and
Ren B.
2022b. EDN: salient object detection via extremely-downsampled network.
IEEE Transactions on Image Processing,
31: 3125-3136 [DOI:
10.1109/TIP.2022.3164550], articleTitle=EDN: salient object detection via extremely-downsampled network, refAbstract=null), Reference(id=1249044056316256622, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=26, issue=null, pageStart=2648, pageEnd=2658, url=null, language=null, rfNumber=null, rfOrder=45, authorNames=Xiao F, Pu Z D, Chen J Q, Gao X P, journalName=IEEE Transactions on Multimedia, refType=null, unstructuredReference=
Xiao F,
Pu Z D,
Chen J Q and
Gao X P.
2024. DGFNet: depth-guided cross-modality fusion network for RGB-D salient object detection.
IEEE Transactions on Multimedia,
26: 2648-2658 [DOI:
10.1109/TMM.2023.3301280], articleTitle=DGFNet: depth-guided cross-modality fusion network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044056391754097, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=29, issue=5, pageStart=1252, pageEnd=1264, url=null, language=null, rfNumber=null, rfOrder=46, authorNames=Ye X Y, Zhu L, Wang W W, Fu Y, journalName=Journal of Image and Graphics, refType=null, unstructuredReference=
Ye X Y,
Zhu L,
Wang W W and
Fu Y.
2024. RGB_D salient object detection algorithm based on complementary information interaction.
Journal of Image and Graphics,
29(5): 1252-1264, articleTitle=RGB_D salient object detection algorithm based on complementary information interaction, refAbstract=null), Reference(id=1249044057973006708, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=29, issue=5, pageStart=1252, pageEnd=1264, url=null, language=null, rfNumber=null, rfOrder=47, authorNames=叶欣悦, 朱磊, 王文武, 付云, journalName=中国图象图形学报, refType=null, unstructuredReference=叶欣悦, 朱磊, 王文武, 付云.
2024. 互补特征交互融合的RGB_D实时显著目标检测.
中国图象图形学报,
29(5): 1252-1264 [DOI:
10.11834/jig.230583], articleTitle=互补特征交互融合的RGB_D实时显著目标检测, refAbstract=null), Reference(id=1249044058044309879, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=49, issue=3, pageStart=1259, pageEnd=1290, url=null, language=null, rfNumber=null, rfOrder=48, authorNames=Zhang R, Lyu Y, Zhang Z T, Ren L, Xie J, Zhang A L, Yan Z W, Mi O, journalName=Journal of China Coal Society, refType=null, unstructuredReference=
Zhang R,
Lyu Y,
Zhang Z T,
Ren L,
Xie J,
Zhang A L,
Yan Z W and
Mi O.
2024. Development and prospect of multidimensional information perception and intelligent construction in deep earth engineering.
Journal of China Coal Society,
49(3): 1259-1290, articleTitle=Development and prospect of multidimensional information perception and intelligent construction in deep earth engineering, refAbstract=null), Reference(id=1249044058128195963, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=49, issue=3, pageStart=1259, pageEnd=1290, url=null, language=null, rfNumber=null, rfOrder=49, authorNames=张茹, 吕游, 张泽天, 任利, 谢晶, 张安林, 严志伟, 米欧, journalName=煤炭学报, refType=null, unstructuredReference=张茹, 吕游, 张泽天, 任利, 谢晶, 张安林, 严志伟, 米欧.
2024. 深地工程多维信息感知与智能建造的发展与展望.
煤炭学报,
49(3): 1259-1290 [DOI:
10.13225/j.cnki.jccs.2023.1439], articleTitle=深地工程多维信息感知与智能建造的发展与展望, refAbstract=null), Reference(id=1249044058224664958, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=3469, pageEnd=3478, url=null, language=null, rfNumber=null, rfOrder=50, authorNames=Zhang M, Ren W S, Piao Y, Rong Z K, Lu H C, journalName=null, refType=null, unstructuredReference=
Zhang M,
Ren W S,
Piao Y,
Rong Z K and
Lu H C.
2020. Select, supplement and focus for RGB-D saliency detection//Proceedings of 2020 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). Seattle, USA: IEEE:3469-3478 [DOI:
10.1109/CVPR42600.2020.00353], articleTitle=Select, supplement and focus for RGB-D saliency detection, refAbstract=null), Reference(id=1249044058346299777, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2023, volume=25, issue=null, pageStart=5142, pageEnd=5154, url=null, language=null, rfNumber=null, rfOrder=51, authorNames=Zhang M, Yao S Y, Hu B Q, Piao Y, Ji W, journalName=IEEE Transactions on Multimedia, refType=null, unstructuredReference=
Zhang M,
Yao S Y,
Hu B Q,
Piao Y and
Ji W.
2023. C
2DFNet: criss-cross dynamic filter network for RGB-D salient object detection.
IEEE Transactions on Multimedia,
25: 5142-5154 [DOI:
10.1109/TMM.2022.3187856], articleTitle=C
2DFNet: criss-cross dynamic filter network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044058413408643, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=24, issue=7, pageStart=1096, pageEnd=1105, url=null, language=null, rfNumber=null, rfOrder=52, authorNames=Zhang Q, Li Y, Li W J, Lin J J, Xiao M, Chen F Y, journalName=Journal of Image and Graphics, refType=null, unstructuredReference=
Zhang Q,
Li Y,
Li W J,
Lin J J,
Xiao M and
Chen F Y.
2019. Salient object detection via deep features and multiple kernel boosting learning.
Journal of Image and Graphics,
24(7): 1096-1105, articleTitle=Salient object detection via deep features and multiple kernel boosting learning, refAbstract=null), Reference(id=1249044058472128902, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=24, issue=7, pageStart=1096, pageEnd=1105, url=null, language=null, rfNumber=null, rfOrder=53, authorNames=张晴, 李云, 李文举, 林家骏, 肖莽, 陈飞云, journalName=中国图象图形学报, refType=null, unstructuredReference=张晴, 李云, 李文举, 林家骏, 肖莽, 陈飞云.
2019. 融合深度特征和多核增强学习的显著目标检测.
中国图象图形学报,
24(7): 1096-1105 [DOI:
10.11834/jig.180224], articleTitle=融合深度特征和多核增强学习的显著目标检测, refAbstract=null), Reference(id=1249044058535043465, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2024, volume=34, issue=3, pageStart=1493, pageEnd=1507, url=null, language=null, rfNumber=null, rfOrder=54, authorNames=Zhang Q, Qin Q, Yang Y, Jiao Q, Han J G, journalName=IEEE Transactions on Circuits and Systems for Video Technology, refType=null, unstructuredReference=
Zhang Q,
Qin Q,
Yang Y,
Jiao Q and
Han J G.
2024. Feature calibrating and fusing network for RGB-D salient object detection.
IEEE Transactions on Circuits and Systems for Video Technology,
34(3): 1493-1507 [DOI:
10.1109/TCSVT.2023.3296581], articleTitle=Feature calibrating and fusing network for RGB-D salient object detection, refAbstract=null), Reference(id=1249044058614735245, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2019, volume=null, issue=null, pageStart=8778, pageEnd=8787, url=null, language=null, rfNumber=null, rfOrder=55, authorNames=Zhao J X, Liu J J, Fan D P, Cao Y, Yang J F, Cheng M M, journalName=null, refType=null, unstructuredReference=
Zhao J X,
Liu J J,
Fan D P,
Cao Y,
Yang J F and
Cheng M M.
2019. EGNet: edge guidance network for salient object detection//Proceedings of 2019 IEEE/CVF International Conference on Computer Vision (ICCV). Seoul, Korea (South): IEEE:8778-8787 [DOI:
10.1109/ICCV.2019.00887], articleTitle=EGNet: edge guidance network for salient object detection, refAbstract=null), Reference(id=1249044058686038416, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=47, issue=9, pageStart=2120, pageEnd=2131, url=null, language=null, rfNumber=null, rfOrder=56, authorNames=Zhao X K, Li M L, Zhang G, Li N, Li J S, journalName=Acta Automatica Sinica, refType=null, unstructuredReference=
Zhao X K,
Li M L,
Zhang G,
Li N and
Li J S.
2021. Object detection method based on saliency map fusion for UAV-borne thermal images.
Acta Automatica Sinica,
47(9): 2120-2131, articleTitle=Object detection method based on saliency map fusion for UAV-borne thermal images, refAbstract=null), Reference(id=1249044058765730195, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=47, issue=9, pageStart=2120, pageEnd=2131, url=null, language=null, rfNumber=null, rfOrder=57, authorNames=赵兴科, 李明磊, 张弓, 黎宁, 李家松, journalName=自动化学报, refType=null, unstructuredReference=赵兴科, 李明磊, 张弓, 黎宁, 李家松.
2021. 基于显著图融合的无人机载热红外图像目标检测方法.
自动化学报,
47(9): 2120-2131 [DOI:
10.16383/j.aas.c200021], articleTitle=基于显著图融合的无人机载热红外图像目标检测方法, refAbstract=null), Reference(id=1249044058878976407, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2022, volume=6, issue=3, pageStart=593, pageEnd=601, url=null, language=null, rfNumber=null, rfOrder=58, authorNames=Zhou W J, Pan S J, Lei J S, Yu L, journalName=IEEE Transactions on Emerging Topics in Computational Intelligence, refType=null, unstructuredReference=
Zhou W J,
Pan S J,
Lei J S and
Yu L.
2022. TMFNet: three-input multilevel fusion network for detecting salient objects in RGB-D images.
IEEE Transactions on Emerging Topics in Computational Intelligence,
6(3): 593-601 [DOI:
10.1109/TETCI.2021.3097393], articleTitle=TMFNet: three-input multilevel fusion network for detecting salient objects in RGB-D images, refAbstract=null), Reference(id=1249044058946085274, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=894, pageEnd=910, url=null, language=null, rfNumber=null, rfOrder=59, authorNames=Zhu X Z, Su W J, Lu L W, Li B, Wang X G, Dai J F, journalName=null, refType=null, unstructuredReference=
Zhu X Z,
Su W J,
Lu L W,
Li B,
Wang X G and
Dai J F.
2021. Deformable DETR: deformable transformers for end-to-end object detection//Proceedings of the 9th International Conference on Learning Representations. [s.l.]: ICLR:894-910, articleTitle=Deformable DETR: deformable transformers for end-to-end object detection, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1249044037068595890, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=1, ext=[AuthorCompanyExt(id=1249044037085373108, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1School of Computer Science and Engineering, Xi’an University of Technology, Xi’an710048, China), AuthorCompanyExt(id=1249044037118927541, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037068595890, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1西安理工大学计算机科学与工程学院,西安710048)]), AuthorCompany(id=1249044037441888960, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, xref=2, ext=[AuthorCompanyExt(id=1249044037467054785, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2Human Machine Integration Intelligent Robot Shaanxi Provincial University Engineering Research Center, Xi’an710048, China), AuthorCompanyExt(id=1249044037488026307, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, companyId=1249044037441888960, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2人机共融智能机器人陕西省高校工程研究中心,西安710048)])], figs=[ArticleFig(id=1249044044853224328, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.1, caption=
Cross-modal feature fusion and detail-enhanced network (CFADNet) architecture, figureFileSmall=b9xoypNJvQAZ/f1KIYZ5Rw==, figureFileBig=5b9ITVT5R5PSNWyvQVLaeQ==, tableContent=null), ArticleFig(id=1249044045054550930, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图1, caption=
跨模态特征融合与细节信息增强网络架构, figureFileSmall=b9xoypNJvQAZ/f1KIYZ5Rw==, figureFileBig=5b9ITVT5R5PSNWyvQVLaeQ==, tableContent=null), ArticleFig(id=1249044045482369958, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.2, caption=
Cross-modal attention fusion enhancement module (CAFEM) structure, figureFileSmall=2uhsbBWaG/bxmMtUcqM6Tw==, figureFileBig=z0xKJgosBNVy2igEVr9oYA==, tableContent=null), ArticleFig(id=1249044045608199085, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图2, caption=
跨模态注意力融合增强模块, figureFileSmall=2uhsbBWaG/bxmMtUcqM6Tw==, figureFileBig=z0xKJgosBNVy2igEVr9oYA==, tableContent=null), ArticleFig(id=1249044045742416822, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.3, caption=
Boundary feature extraction module (BFEM) structure, figureFileSmall=Jw3UhX9+iJ5m08zlf0QYlw==, figureFileBig=NC8dF7yhbgQw5vHFzvhwiQ==, tableContent=null), ArticleFig(id=1249044045876634556, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图3, caption=
边缘特征提取模块, figureFileSmall=Jw3UhX9+iJ5m08zlf0QYlw==, figureFileBig=NC8dF7yhbgQw5vHFzvhwiQ==, tableContent=null), ArticleFig(id=1249044046065378247, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.4, caption=
Intermediate feature visualization of BFEM, figureFileSmall=CbyjmQjrRgXz7Y0XCBb5Yw==, figureFileBig=iXODMvZOrlrtfr61nyfFyA==, tableContent=null), ArticleFig(id=1249044046300259280, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图4, caption=
边缘特征提取模块中间特征可视化, figureFileSmall=CbyjmQjrRgXz7Y0XCBb5Yw==, figureFileBig=iXODMvZOrlrtfr61nyfFyA==, tableContent=null), ArticleFig(id=1249044046493197272, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.5, caption=
Fβ curves, figureFileSmall=5un3Fwp3R4Q7kgl6tmJN6g==, figureFileBig=wIXYZKjSCZVLoZthmSx/Mg==, tableContent=null), ArticleFig(id=1249044046648386526, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图5, caption=
Fβ曲线, figureFileSmall=5un3Fwp3R4Q7kgl6tmJN6g==, figureFileBig=wIXYZKjSCZVLoZthmSx/Mg==, tableContent=null), ArticleFig(id=1249044046883267559, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.6, caption=
Precision-recall curves, figureFileSmall=6lD61WN/Udf/MR+Vx+sGrg==, figureFileBig=UtvkU0ax5LOMFVooO3v56A==, tableContent=null), ArticleFig(id=1249044047118148586, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图6, caption=
精度-召回率曲线, figureFileSmall=6lD61WN/Udf/MR+Vx+sGrg==, figureFileBig=UtvkU0ax5LOMFVooO3v56A==, tableContent=null), ArticleFig(id=1249044047277532146, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.7, caption=
Visual comparison of our method with the state-of-the-art methods, figureFileSmall=kHVy4BjbYoZni2vKHl6dFQ==, figureFileBig=57fPEvkm4J1o1GMfFrUtSA==, tableContent=null), ArticleFig(id=1249044047462081529, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图7, caption=
本文方法与现有先进方法的直观对比, figureFileSmall=kHVy4BjbYoZni2vKHl6dFQ==, figureFileBig=57fPEvkm4J1o1GMfFrUtSA==, tableContent=null), ArticleFig(id=1249044049022362624, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.8, caption=
Comparison of details of prediction maps obtained by different edge feature extraction method, figureFileSmall=/Rk4H27UZDdYl/vwEAyhAg==, figureFileBig=TnNylwhufUu5hE70leHitg==, tableContent=null), ArticleFig(id=1249044049106247687, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图8, caption=
采用不同边缘特征提取方法得到的预测图细节对比, figureFileSmall=/Rk4H27UZDdYl/vwEAyhAg==, figureFileBig=TnNylwhufUu5hE70leHitg==, tableContent=null), ArticleFig(id=1249044049190133769, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Fig.9, caption=
Some failure cases of our method, figureFileSmall=klBTHQkna5CgSRztwKM0iQ==, figureFileBig=cuo1Tgp/W8Tw4CmPDG5BqA==, tableContent=null), ArticleFig(id=1249044049311768596, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=图9, caption=
失败案例, figureFileSmall=klBTHQkna5CgSRztwKM0iQ==, figureFileBig=cuo1Tgp/W8Tw4CmPDG5BqA==, tableContent=null), ArticleFig(id=1249044049429209116, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Tab.1, caption=
Quantitative evaluation
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 接收会议 | NJU2K数据集 | NLPR数据集 | STERE数据集 | SIP数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| DCF | CVPR 21 | 0.035 | 0.902 | 0.912 | 0.021 | 0.891 | 0.924 | 0.039 | 0.885 | 0.902 | 0.051 | 0.875 | 0.876 |
| CIRNet | TIP 22 | 0.035 | 0.927 | 0.925 | 0.023 | 0.924 | 0.933 | 0.038 | 0.914 | 0.917 | 0.052 | 0.896 | 0.888 |
| CM-LCG | TIP 22 | 0.043 | 0.915 | 0.913 | 0.029 | 0.906 | 0.922 | 0.043 | 0.906 | 0.910 | - | - | - |
| AILNet | ESWA 22 | 0.045 | 0.876 | 0.898 | 0.029 | 0.857 | 0.912 | 0.038 | 0.880 | 0.908 | 0.050 | 0.866 | 0.889 |
| SPSN | ECCV 22 | 0.032 | 0.920 | 0.918 | 0.023 | 0.910 | 0.923 | 0.035 | 0.900 | 0.907 | 0.042 | 0.899 | 0.892 |
| TMFNet | TETCI 22 | 0.041 | 0.882 | 0.910 | 0.027 | 0.867 | 0.921 | - | - | - | 0.057 | 0.853 | 0.874 |
| AFNet | Nuecom22 | 0.032 | 0.928 | 0.926 | 0.020 | 0.925 | 0.936 | 0.034 | 0.918 | 0.918 | 0.043 | 0.909 | 0.896 |
| JL-DCF | TPAMI 22 | 0.040 | 0.913 | 0.911 | 0.023 | 0.917 | 0.926 | 0.039 | 0.907 | 0.911 | 0.046 | 0.900 | 0.892 |
| EBFSP | TMM 22 | 0.038 | 0.895 | 0.907 | 0.028 | 0.887 | 0.909 | 0.041 | 0.873 | 0.900 | 0.052 | 0.863 | 0.877 |
| CAVER | TIP 23 | 0.031 | 0.925 | 0.921 | 0.020 | 0.921 | 0.929 | 0.033 | 0.912 | 0.913 | 0.042 | 0.902 | 0.893 |
| HINet | PR 23 | 0.039 | 0.914 | 0.915 | 0.026 | 0.906 | 0.922 | 0.049 | 0.883 | 0.892 | 0.066 | 0.855 | 0.856 |
| C2DFNet | TMM 23 | 0.039 | 0.909 | 0.908 | 0.022 | 0.917 | 0.928 | 0.038 | 0.897 | 0.902 | 0.053 | 0.877 | 0.872 |
| PICRNet | ACMM 23 | 0.029 | 0.931 | 0.927 | 0.019 | 0.928 | 0.935 | 0.031 | 0.920 | 0.921 | 0.053 | 0.883 | 0.872 |
| DGFNet | TMM 24 | 0.032 | 0.914 | 0.921 | 0.021 | 0.902 | 0.928 | 0.035 | 0.896 | 0.911 | 0.048 | 0.879 | 0.883 |
| FCFNet | TCSVT 24 | 0.034 | 0.923 | 0.918 | 0.024 | 0.911 | 0.924 | 0.038 | 0.906 | 0.906 | - | - | - |
| RD3D | TNNLS24 | 0.033 | 0.928 | 0.928 | 0.022 | 0.921 | 0.933 | 0.037 | 0.905 | 0.914 | 0.046 | 0.900 | 0.892 |
| CFADNet(本文) | - | 0.027 | 0.933 | 0.930 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 | 0.041 | 0.910 | 0.897 |
), ArticleFig(id=1249044049529872418, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=表1, caption=
定量评估
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | 接收会议 | NJU2K数据集 | NLPR数据集 | STERE数据集 | SIP数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| DCF | CVPR 21 | 0.035 | 0.902 | 0.912 | 0.021 | 0.891 | 0.924 | 0.039 | 0.885 | 0.902 | 0.051 | 0.875 | 0.876 |
| CIRNet | TIP 22 | 0.035 | 0.927 | 0.925 | 0.023 | 0.924 | 0.933 | 0.038 | 0.914 | 0.917 | 0.052 | 0.896 | 0.888 |
| CM-LCG | TIP 22 | 0.043 | 0.915 | 0.913 | 0.029 | 0.906 | 0.922 | 0.043 | 0.906 | 0.910 | - | - | - |
| AILNet | ESWA 22 | 0.045 | 0.876 | 0.898 | 0.029 | 0.857 | 0.912 | 0.038 | 0.880 | 0.908 | 0.050 | 0.866 | 0.889 |
| SPSN | ECCV 22 | 0.032 | 0.920 | 0.918 | 0.023 | 0.910 | 0.923 | 0.035 | 0.900 | 0.907 | 0.042 | 0.899 | 0.892 |
| TMFNet | TETCI 22 | 0.041 | 0.882 | 0.910 | 0.027 | 0.867 | 0.921 | - | - | - | 0.057 | 0.853 | 0.874 |
| AFNet | Nuecom22 | 0.032 | 0.928 | 0.926 | 0.020 | 0.925 | 0.936 | 0.034 | 0.918 | 0.918 | 0.043 | 0.909 | 0.896 |
| JL-DCF | TPAMI 22 | 0.040 | 0.913 | 0.911 | 0.023 | 0.917 | 0.926 | 0.039 | 0.907 | 0.911 | 0.046 | 0.900 | 0.892 |
| EBFSP | TMM 22 | 0.038 | 0.895 | 0.907 | 0.028 | 0.887 | 0.909 | 0.041 | 0.873 | 0.900 | 0.052 | 0.863 | 0.877 |
| CAVER | TIP 23 | 0.031 | 0.925 | 0.921 | 0.020 | 0.921 | 0.929 | 0.033 | 0.912 | 0.913 | 0.042 | 0.902 | 0.893 |
| HINet | PR 23 | 0.039 | 0.914 | 0.915 | 0.026 | 0.906 | 0.922 | 0.049 | 0.883 | 0.892 | 0.066 | 0.855 | 0.856 |
| C2DFNet | TMM 23 | 0.039 | 0.909 | 0.908 | 0.022 | 0.917 | 0.928 | 0.038 | 0.897 | 0.902 | 0.053 | 0.877 | 0.872 |
| PICRNet | ACMM 23 | 0.029 | 0.931 | 0.927 | 0.019 | 0.928 | 0.935 | 0.031 | 0.920 | 0.921 | 0.053 | 0.883 | 0.872 |
| DGFNet | TMM 24 | 0.032 | 0.914 | 0.921 | 0.021 | 0.902 | 0.928 | 0.035 | 0.896 | 0.911 | 0.048 | 0.879 | 0.883 |
| FCFNet | TCSVT 24 | 0.034 | 0.923 | 0.918 | 0.024 | 0.911 | 0.924 | 0.038 | 0.906 | 0.906 | - | - | - |
| RD3D | TNNLS24 | 0.033 | 0.928 | 0.928 | 0.022 | 0.921 | 0.933 | 0.037 | 0.905 | 0.914 | 0.046 | 0.900 | 0.892 |
| CFADNet(本文) | - | 0.027 | 0.933 | 0.930 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 | 0.041 | 0.910 | 0.897 |
), ArticleFig(id=1249044049617952811, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Tab.2, caption=
Quantitative comparison in terms of average precision and average recall with other methods
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 | SIP数据集 |
|---|
| Precavg | Recallavg | Precavg | Recallavg | Precavg | Recallavg | Precavg | Recallavg |
|---|
| DCF | 0.908 | 0.917 | 0.898 | 0.922 | 0.888 | 0.918 | 0.902 | 0.847 |
| SPSN | 0.918 | 0.924 | 0.901 | 0.924 | 0.893 | 0.924 | 0.901 | 0.894 |
| AFNet | 0.916 | 0.925 | 0.907 | 0.924 | 0.900 | 0.931 | 0.913 | 0.874 |
| CAVER | 0.924 | 0.929 | 0.917 | 0.924 | 0.904 | 0.930 | 0.922 | 0.876 |
| HINet | 0.909 | 0.908 | 0.896 | 0.909 | 0.868 | 0.892 | 0.885 | 0.808 |
| PICRNet | 0.900 | 0.894 | 0.911 | 0.921 | 0.869 | 0.873 | 0.887 | 0.864 |
| C2DFNet | 0.910 | 0.898 | 0.911 | 0.919 | 0.887 | 0.913 | 0.887 | 0.858 |
| RD3D | 0.917 | 0.925 | 0.904 | 0.923 | 0.884 | 0.926 | 0.907 | 0.872 |
| CFADNet(本文) | 0.927 | 0.937 | 0.926 | 0.938 | 0.909 | 0.946 | 0.922 | 0.882 |
), ArticleFig(id=1249044049727004720, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=表2, caption=
与其他方法的平均精度和平均召回率比较
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 | SIP数据集 |
|---|
| Precavg | Recallavg | Precavg | Recallavg | Precavg | Recallavg | Precavg | Recallavg |
|---|
| DCF | 0.908 | 0.917 | 0.898 | 0.922 | 0.888 | 0.918 | 0.902 | 0.847 |
| SPSN | 0.918 | 0.924 | 0.901 | 0.924 | 0.893 | 0.924 | 0.901 | 0.894 |
| AFNet | 0.916 | 0.925 | 0.907 | 0.924 | 0.900 | 0.931 | 0.913 | 0.874 |
| CAVER | 0.924 | 0.929 | 0.917 | 0.924 | 0.904 | 0.930 | 0.922 | 0.876 |
| HINet | 0.909 | 0.908 | 0.896 | 0.909 | 0.868 | 0.892 | 0.885 | 0.808 |
| PICRNet | 0.900 | 0.894 | 0.911 | 0.921 | 0.869 | 0.873 | 0.887 | 0.864 |
| C2DFNet | 0.910 | 0.898 | 0.911 | 0.919 | 0.887 | 0.913 | 0.887 | 0.858 |
| RD3D | 0.917 | 0.925 | 0.904 | 0.923 | 0.884 | 0.926 | 0.907 | 0.872 |
| CFADNet(本文) | 0.927 | 0.937 | 0.926 | 0.938 | 0.909 | 0.946 | 0.922 | 0.882 |
), ArticleFig(id=1249044049823473720, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Tab.3, caption=
Comparison of computational complexity and parameter size with other methods
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | FLOPs/G | 参数量/M |
|---|
| DCF | 55.48 | 107.29 |
| CIRNet | 156.34 | 82.08 |
| TMFNet | - | 266.7 |
| AFNet | 130.02 | 258.13 |
| HINet | 389.7 | 98.9 |
| C2DFNet | 22.047 | 47.52 |
| DGFNet | 74.89 | 42.14 |
| RD3D | 57.8 | 47.14 |
| CFADNet(本文) | 46.82 | 203.88 |
), ArticleFig(id=1249044049945108542, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=表3, caption=
与其他方法计算复杂度和参数量对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | FLOPs/G | 参数量/M |
|---|
| DCF | 55.48 | 107.29 |
| CIRNet | 156.34 | 82.08 |
| TMFNet | - | 266.7 |
| AFNet | 130.02 | 258.13 |
| HINet | 389.7 | 98.9 |
| C2DFNet | 22.047 | 47.52 |
| DGFNet | 74.89 | 42.14 |
| RD3D | 57.8 | 47.14 |
| CFADNet(本文) | 46.82 | 203.88 |
), ArticleFig(id=1249044050012217412, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Tab.4, caption=
Comparison experiment of CAFEM with other fusion methods
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| w/o CAFEM | 0.029 | 0.928 | 0.926 | 0.018 | 0.933 | 0.937 | 0.030 | 0.920 | 0.923 |
| CmPI | 0.030 | 0.929 | 0.925 | 0.018 | 0.931 | 0.938 | 0.032 | 0.915 | 0.919 |
| CAFEM | 0.027 | 0.933 | 0.930 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 |
), ArticleFig(id=1249044050083520587, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=表4, caption=
CAFEM与不同融合方法的对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| w/o CAFEM | 0.029 | 0.928 | 0.926 | 0.018 | 0.933 | 0.937 | 0.030 | 0.920 | 0.923 |
| CmPI | 0.030 | 0.929 | 0.925 | 0.018 | 0.931 | 0.938 | 0.032 | 0.915 | 0.919 |
| CAFEM | 0.027 | 0.933 | 0.930 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 |
), ArticleFig(id=1249044050171600978, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Tab.5, caption=
Ablation studies on the BFEM
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| w/o EE | 0.029 | 0.927 | 0.926 | 0.017 | 0.933 | 0.938 | 0.03 | 0.921 | 0.922 |
| BFEM | 0.027 | 0.933 | 0.93 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 |
), ArticleFig(id=1249044050272264280, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=表5, caption=
BFEM的消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| w/o EE | 0.029 | 0.927 | 0.926 | 0.017 | 0.933 | 0.938 | 0.03 | 0.921 | 0.922 |
| BFEM | 0.027 | 0.933 | 0.93 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 |
), ArticleFig(id=1249044050402287713, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=EN, label=Tab.6, caption=
Ablation studies on the loss function
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| FBCE | 0.034 | 0.910 | 0.921 | 0.020 | 0.905 | 0.911 | 0.036 | 0.903 | 0.910 |
| FBCE + FSSIM | 0.030 | 0.925 | 0.927 | 0.019 | 0.925 | 0.935 | 0.031 | 0.921 | 0.921 |
| F混合 | 0.032 | 0.917 | 0.924 | 0.021 | 0.918 | 0.928 | 0.033 | 0.912 | 0.917 |
| FBCE + FSSIM + FIoU | 0.027 | 0.933 | 0.930 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 |
), ArticleFig(id=1249044050515533930, tenantId=1146029695717560320, journalId=1249024232475115590, articleId=1249044017850294679, language=CN, label=表6, caption=
混合损失函数的消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方法 | NJU2K数据集 | NLPR数据集 | STERE数据集 |
|---|
| MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ | MAE ↓ | Fβ ↑ | Sα ↑ |
|---|
| FBCE | 0.034 | 0.910 | 0.921 | 0.020 | 0.905 | 0.911 | 0.036 | 0.903 | 0.910 |
| FBCE + FSSIM | 0.030 | 0.925 | 0.927 | 0.019 | 0.925 | 0.935 | 0.031 | 0.921 | 0.921 |
| F混合 | 0.032 | 0.917 | 0.924 | 0.021 | 0.918 | 0.928 | 0.033 | 0.912 | 0.917 |
| FBCE + FSSIM + FIoU | 0.027 | 0.933 | 0.930 | 0.017 | 0.934 | 0.939 | 0.028 | 0.923 | 0.925 |
)], attaches=null, journal=Journal(id=1249023527618129992, delFlag=0, nameCn=中国图象图形学报, nameEn=Journal of Image and Graphics, nameHistory1=null, nameHistory2=null, issn=1006-8961, eissn=null, cn=11-3758, coden=CODEN ZTTXFZ, periodic=0, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=uirXtX858YS3zEpFXZttJA==, journalPrice=null, startedYear=null, abbrevIsoEn=Journal of Image and Graphics, journalRemark=null, publicationField=null, createdTime=1775720014721, updatedTime=1775720337198, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=J, firstLetterEn=J, subjectCode=Engineering, subjectName=null, subjectCodeEn=Engineering, subjectNameEn=null, picCn=uirXtX858YS3zEpFXZttJA==, picEn=bud7qaxfvWHeFsbyBTAiKQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1249024880377786590, language=CN, name=中国图象图形学报, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1775720337242, updatedTime=1775720337242, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=e6369def-2842-41d8, submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-editor&redirect_uri=https%3A%2F%2Fcjigeditor.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=9ccec05b-6bd, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=1e8a31c8-5434-4f78, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1249024880449089759, language=EN, name=Journal of Image and Graphics, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1775720337259, updatedTime=1775720337259, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=e6369def-2842-41d8, submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-editor&redirect_uri=https%3A%2F%2Fcjigeditor.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=9ccec05b-6bd, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-cjig-author&redirect_uri=https%3A%2F%2Fcjig.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=1e8a31c8-5434-4f78, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1249024232475115590, websiteList=[Website(id=1249025782459334881, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1249024232475115590, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN, language=CN, createTime=1775720552315, createBy=18614031015, updateTime=1775720586268, updateBy=18614031015, name=中国图象图形学报-中文, tplId=1146099689490845704, title=中国图象图形学报, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1249026166254928133, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=articleTextType, value=kx, createTime=1775720643819, updateTime=1775720643819, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166221373698, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=banner, value=null, createTime=1775720643811, updateTime=1775720643811, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166271705352, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=grayFlag, value=0, createTime=1775720643823, updateTime=1775720643823, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166212985089, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/file/pic?fileId=TDRjKTHfgAnvFKZaDA70wA==, createTime=1775720643809, updateTime=1775720643809, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166288482570, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=minRunFlag, value=0, createTime=1775720643827, updateTime=1775720643827, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166246539524, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/file/pic, createTime=1775720643817, updateTime=1775720643817, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166280093961, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=silenceFlag, value=0, createTime=1775720643825, updateTime=1775720643825, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166233956611, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1775720643814, updateTime=1775720643814, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166259122438, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=themeColor, value=null, createTime=1775720643820, updateTime=1775720643820, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026166267511047, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782459334881, code=themeStyle, value=null, createTime=1775720643822, updateTime=1775720643822, creator=18614031015, updator=18614031015)]), Website(id=1249025782681633001, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1249024232475115590, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN, language=EN, createTime=1775720552368, createBy=18614031015, updateTime=1775720607118, updateBy=18614031015, name=中国图象图形学报-英文, tplId=1146101810881728533, title=Journal of Image and Graphics, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1249026195371786511, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=articleTextType, value=kx, createTime=1775720650761, updateTime=1775720650761, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195355009292, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=banner, value=null, createTime=1775720650757, updateTime=1775720650757, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195392758034, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=grayFlag, value=0, createTime=1775720650766, updateTime=1775720650766, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195342426379, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/file/pic?fileId=TDRjKTHfgAnvFKZaDA70wA==, createTime=1775720650754, updateTime=1775720650754, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195409535252, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=minRunFlag, value=0, createTime=1775720650770, updateTime=1775720650770, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195367592206, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/file/pic, createTime=1775720650760, updateTime=1775720650760, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195401146643, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=silenceFlag, value=0, createTime=1775720650768, updateTime=1775720650768, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195359203597, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1775720650758, updateTime=1775720650758, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195380175120, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=themeColor, value=null, createTime=1775720650763, updateTime=1775720650763, creator=18614031015, updator=18614031015), WebsiteProps(id=1249026195388563729, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1249025782681633001, code=themeStyle, value=null, createTime=1775720650765, updateTime=1775720650765, creator=18614031015, updator=18614031015)])], journalTitle=中国图象图形学报, weixinUrl=null, journalUrl=https://www.cjig.cn/, iacademicId=null, status=1, seqNo=null, journalTitleEn=Journal of Image and Graphics, journalPhotoCn=uirXtX858YS3zEpFXZttJA==, journalPhotoEn=bud7qaxfvWHeFsbyBTAiKQ==, journalFirstLetter=J, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/10.11834/jig.240653, detailUrlEn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/10.11834/jig.240653, pdfUrlCn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/CN/PDF/10.11834/jig.240653, pdfUrlEn=https://castjournals.cast.org.cn/joweb/zgtxtxxb/EN/PDF/10.11834/jig.240653, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)