Article(id=1203753459473428945, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1203753457208504777, articleNumber=null, orderNo=null, doi=10.12404/j.issn.1671-1815.2307782, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=research-article, receivedDate=1696608000000, receivedDateStr=2023-10-07, revisedDate=1729094400000, revisedDateStr=2024-10-17, acceptedDate=null, acceptedDateStr=null, onlineDate=1764926789395, onlineDateStr=2025-12-05, pubDate=1737129600000, pubDateStr=2025-01-18, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1764926789395, onlineIssueDateStr=2025-12-05, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1764926789395, creator=13701087609, updateTime=1764926789395, updator=13701087609, issue=Issue{id=1203753457208504777, tenantId=1146029695717560320, journalId=1146123166801305609, year='2025', volume='25', issue='2', pageStart='439', pageEnd='878', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=null, createTime=1764926788856, creator=13701087609, updateTime=1764928745558, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1203761664261858014, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1203753457208504777, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1203761664261858015, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1203753457208504777, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=649, endPage=656, ext={EN=ArticleExt(id=1203753460127740377, articleId=1203753459473428945, tenantId=1146029695717560320, 
journalId=1146123166801305609, language=EN, title=Chinese News Title Classification Based on Lightweight Improved ERNIE-RCNN, columnId=1156262729162810294, journalTitle=Science Technology and Engineering, columnName=Papers·Automation and Computational Technology, runingTitle=null, highlight=null, articleAbstract=
Aiming at the problems that large-scale pre-trained language models face when dealing with news headlines, such as a huge number of parameters, inefficient use of contextual semantic features, and the recurrent convolutional neural network’s neglect of the importance of initial input elements, a news headline classification method that combines ERNIE (enhanced representation through knowledge integration) improved with a mixture-of-experts (MoE) model and a recurrent convolutional neural network with an attention mechanism was proposed. Firstly, the text was encoded with the help of the MoE-improved ERNIE technology, and then the text was classified with attention RCNN (recurrent convolutional neural networks) on the basis of preserving the word order and characteristics of the text. In order to improve the classification ability, RCNN was improved by calculating the fused context weights of the input. In the process of calculating the weights of experts in MoE, Gumbel-Softmax was selected as a new gating function to improve the traditional Softmax function, so as to better control the smoothness. According to the experimental results, it is found that, compared with the traditional classification methods, the classification method proposed in this study shows significant advantages and greatly reduces the number of parameters. On this basis, the F1 value is increased by 0.51% compared with the traditional model. After the ablation experiment, the feasibility of this classification method in the classification task has been confirmed.
, correspAuthors=Zhi-xin ZHANG, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Li LI, Zhi-xin ZHANG, Xiao-long WANG), CN=ArticleExt(id=1203753462682071633, articleId=1203753459473428945, tenantId=1146029695717560320, journalId=1146123166801305609, language=CN, title=基于轻量化改进ERNIE-RCNN的中文新闻标题分类, columnId=1156262729783567290, journalTitle=科学技术与工程, columnName=论文·自动化技术、计算机技术, runingTitle=null, highlight=null, articleAbstract=
针对大型预训练语言模型在处理新闻标题时,面临参数规模庞大、无法高效利用上下文语意特征以及循环卷积神经网络对初始输入元素重要性忽视的问题,提出了一种融合混合专家模型(mixture-of-expert,MoE)的ERNIE与注意力机制的循环卷积神经网络(recurrent convolutional neural networks,RCNN)的新闻标题分类方法。首先,借助MoE改进ERNIE技术进行文本编码,随后利用注意力RCNN在保留文本词序和特征的基础上进行分类。为提高分类能力,通过计算输入的融合上下文权重对RCNN进行改进。在计算MoE中各个专家权重的过程中,选择Gumbel_Softmax作为新型的门控函数以改进传统的Softmax函数,从而更好地控制平滑程度。根据实验结果,发现相较于传统的分类方法,本文研究提出的分类方法展现出显著优势,极大地减少了参数数量。在此基础上,F1相较于传统模型提升了0.51%。经过消融实验的验证,该分类方法在分类任务上的可行性得到了证实。
, correspAuthors=张之欣, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=dSh2MWJjPlJ04Y5Q5Oi+eQ==, magXml=Fc+pKU7QYwBz2DtcPGij/g==, pdfUrl=null, pdf=zgteTkUTCn7CUqSVvTys+w==, pdfFileSize=3101034, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=TijwtFAnAg7Sy/oK3kPVtQ==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=5FiBR9r3LX+b4IXalt3/Ig==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=李莉, 张之欣, 王小龙)}, authors=[Author(id=1203787147070387075, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=haolily12@163.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1203787147338822547, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, authorId=1203787147070387075, language=EN, stringName=Li LI, firstName=Li, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China
2 Hebei Key Laboratory of Knowledge Computing for Energy & Power, Baoding 071003, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1203787147426902942, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, authorId=1203787147070387075, language=CN, stringName=李莉, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, 2, address=
1 华北电力大学控制与计算机工程学院, 保定 071003
2 河北省能源电力知识计算重点实验室, 保定 071003, bio={"content":"
李莉(1980—),女,汉族,重庆人,博士,副教授。研究方向:大数据分析、深度学习。E-mail:haolily12@163.com。
"}, bioImg=null, bioContent=
李莉(1980—),女,汉族,重庆人,博士,副教授。研究方向:大数据分析、深度学习。E-mail:haolily12@163.com。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1203787146780980076, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, xref=1, ext=[AuthorCompanyExt(id=1203787146785174381, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China), AuthorCompanyExt(id=1203787146793562990, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华北电力大学控制与计算机工程学院, 保定 071003)]), AuthorCompany(id=1203787146944557945, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, xref=2, ext=[AuthorCompanyExt(id=1203787146952946554, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146944557945, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 Hebei Key Laboratory of Knowledge Computing for Energy & Power, Baoding 071003, China), AuthorCompanyExt(id=1203787146957140859, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146944557945, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 河北省能源电力知识计算重点实验室, 保定 071003)])]), Author(id=1203787147544343469, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=2973916737@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1203787147678561206, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, authorId=1203787147544343469, language=EN, stringName=Zhi-xin ZHANG, firstName=Zhi-xin, middleName=null, lastName=ZHANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, *, address=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1203787147825361865, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, authorId=1203787147544343469, language=CN, stringName=张之欣, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, *, address=
1 华北电力大学控制与计算机工程学院, 保定 071003, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1203787146780980076, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, xref=1, ext=[AuthorCompanyExt(id=1203787146785174381, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China), AuthorCompanyExt(id=1203787146793562990, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华北电力大学控制与计算机工程学院, 保定 071003)])]), Author(id=1203787147984745428, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1203787148118963171, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, authorId=1203787147984745428, language=EN, stringName=Xiao-long WANG, firstName=Xiao-long, middleName=null, lastName=WANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1203787149377254387, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, authorId=1203787147984745428, language=CN, stringName=王小龙, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 华北电力大学控制与计算机工程学院, 保定 071003, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1203787146780980076, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, xref=1, ext=[AuthorCompanyExt(id=1203787146785174381, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China), AuthorCompanyExt(id=1203787146793562990, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华北电力大学控制与计算机工程学院, 保定 071003)])])], keywords=[Keyword(id=1203787149649883152, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, orderNo=1, keyword=MoE (mixture of experts)), Keyword(id=1203787149800878114, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, orderNo=2, keyword=ERNIE (enhanced representation through knowledge integration)), Keyword(id=1203787149893152816, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, orderNo=3, keyword=attention mechanism), Keyword(id=1203787149998010434, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, orderNo=4, keyword=RCNN (recurrent convolutional neural network)), Keyword(id=1203787150119645265, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, orderNo=5, keyword=text classification), Keyword(id=1203787150232891490, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, orderNo=1, keyword=混合专家系统), Keyword(id=1203787150442606700, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, orderNo=2, keyword=知识增强语义表示模型), Keyword(id=1203787150601990265, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, orderNo=3, keyword=注意力机制), Keyword(id=1203787150757179531, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, orderNo=4, keyword=循环卷积神经网络), Keyword(id=1203787150903980186, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, orderNo=5, keyword=文本分类)], refs=[Reference(id=1203787155534492199, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, 
pmcid=null, year=2023, volume=23, issue=33, pageStart=14264, pageEnd=14270, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=诸林云, 范菁, 曲金帅, journalName=科学技术与工程, refType=null, unstructuredReference=诸林云, 范菁, 曲金帅, 等. 基于BERT与多通道卷积神经网络的细粒度情感分类[J].
科学技术与工程,
2023,
23(33): 14264-14270., articleTitle=基于BERT与多通道卷积神经网络的细粒度情感分类, refAbstract=null), Reference(id=1203787155656127024, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2023, volume=23, issue=33, pageStart=14264, pageEnd=14270, url=null, language=null, rfNumber=[1], rfOrder=1, authorNames=Zhu Linyun, Fan Jing, Qu Jinshuai, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Zhu Linyun,
Fan Jing,
Qu Jinshuai, et al. Fine-grained sentiment classification based on BERT and multi-channel convolutional neural networks[J].
Science Technology and Engineering,
2023,
23(33): 14264-14270., articleTitle=Fine-grained sentiment classification based on BERT and multi-channel convolutional neural networks, refAbstract=null), Reference(id=1203787155760984638, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2021, volume=45, issue=11, pageStart=144, pageEnd=151, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=俞学豪, 赵子岩, 马应龙, journalName=电力系统自动化, refType=null, unstructuredReference=俞学豪, 赵子岩, 马应龙, 等. 基于BR和GBDT的电力信息通信客服系统多标签文本分类[J].
电力系统自动化,
2021,
45(11): 144-151., articleTitle=基于BR和GBDT的电力信息通信客服系统多标签文本分类, refAbstract=null), Reference(id=1203787155870036557, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2015, volume=45, issue=11, pageStart=144, pageEnd=151, url=null, language=null, rfNumber=[2], rfOrder=3, authorNames=Yu Xuehao, Zhao Ziyan, Ma Yinglong, journalName=Automation of Electric Power Systems, refType=null, unstructuredReference=
Yu Xuehao,
Zhao Ziyan,
Ma Yinglong, et al. Multi-label text classification of power information communication customer service system based on BR and GBDT[J].
Automation of Electric Power Systems,
2015,
45(11): 144-151., articleTitle=Multi-label text classification of power information communication customer service system based on BR and GBDT, refAbstract=null), Reference(id=1203787155991671388, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2023, volume=17, issue=12, pageStart=2840, pageEnd=2860, url=null, language=null, rfNumber=[3], rfOrder=4, authorNames=孟祥福, 霍红锦, 张霄雁, journalName=计算机科学与探索, refType=null, unstructuredReference=孟祥福, 霍红锦, 张霄雁, 等. 个性化新闻推荐方法研究综述[J].
计算机科学与探索,
2023,
17(12): 2840-2860., articleTitle=个性化新闻推荐方法研究综述, refAbstract=null), Reference(id=1203787156151054954, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2023, volume=17, issue=12, pageStart=2840, pageEnd=2860, url=null, language=null, rfNumber=[3], rfOrder=5, authorNames=Meng Xiangfu, Huo Hongjin, Zhang Xiaoyan, journalName=Exploration of Computer Science and Technology, refType=null, unstructuredReference=
Meng Xiangfu,
Huo Hongjin,
Zhang Xiaoyan, et al. Research review on personalized news recommendation methods[J].
Exploration of Computer Science and Technology,
2023,
17(12): 2840-2860., articleTitle=Research review on personalized news recommendation methods, refAbstract=null), Reference(id=1203787156281078390, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2023, volume=7, issue=4, pageStart=16, pageEnd=31, url=null, language=null, rfNumber=[4], rfOrder=6, authorNames=华玮, 吴思洋, 俞超, journalName=数据分析与知识发现, refType=null, unstructuredReference=华玮, 吴思洋, 俞超, 等. 面向网络舆情事件的多层次情感分歧度分析方法[J].
数据分析与知识发现,
2023,
7(4): 16-31., articleTitle=面向网络舆情事件的多层次情感分歧度分析方法, refAbstract=null), Reference(id=1203787156444656258, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2023, volume=7, issue=4, pageStart=16, pageEnd=31, url=null, language=null, rfNumber=[4], rfOrder=7, authorNames=Hua Wei, Wu Siyang, Yu Chao, journalName=Data Analysis and Knowledge Discovery, refType=null, unstructuredReference=
Hua Wei,
Wu Siyang,
Yu Chao, et al. Multi-level emotion divergence analysis method for network public opinion events[J].
Data Analysis and Knowledge Discovery,
2023,
7(4): 16-31., articleTitle=Multi-level emotion divergence analysis method for network public opinion events, refAbstract=null), Reference(id=1203787156612428435, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2021, volume=47, issue=8, pageStart=1, pageEnd=13, url=null, language=null, rfNumber=[5], rfOrder=8, authorNames=王军, 冯孙铖, 程勇, journalName=计算机工程, refType=null, unstructuredReference=王军, 冯孙铖, 程勇. 深度学习的轻量化神经网络结构研究综述[J].
计算机工程,
2021,
47(8): 1-13., articleTitle=深度学习的轻量化神经网络结构研究综述, refAbstract=null), Reference(id=1203787156755034781, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=201, issue=8, pageStart=1, pageEnd=13, url=null, language=null, rfNumber=[5], rfOrder=9, authorNames=Wang Jun, journalName=Computer Engineering, refType=null, unstructuredReference=
Wang Jun, Feng Suncheng, Cheng Yong. A review of lightweight neural network structures for deep learning[J].
Computer Engineering,
2021,
47(8): 1-13., articleTitle=A review of lightweight neural network structures for deep learning, refAbstract=null), Reference(id=1203787156880863912, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2014, volume=null, issue=null, pageStart=1746, pageEnd=1751, url=null, language=null, rfNumber=[6], rfOrder=10, authorNames=Kim Y, journalName=Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP), refType=null, unstructuredReference=
Kim Y. Convolutional neural networks for sentence classification[C]//
Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP). Doha: EMNLP,
2014: 1746-1751., articleTitle=Convolutional neural networks for sentence classification, refAbstract=null), Reference(id=1203787156977332914, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[7], rfOrder=11, authorNames=Liu P, Qiu X, Huang X, journalName=arXiv preprint arXiv: 1605.05101, 2016, refType=null, unstructuredReference=
Liu P,
Qiu X,
Huang X. Recurrent neural network for text classification with multi-task learning[J].
arXiv preprint arXiv: 1605.05101, 2016., articleTitle=Recurrent neural network for text classification with multi-task learning, refAbstract=null), Reference(id=1203787157082190530, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[8], rfOrder=12, authorNames=Lai S, Xu L, Liu K, journalName=AAAI Press, refType=null, unstructuredReference=
Lai S,
Xu L,
Liu K, et al. Recurrent convolutional neural networks for text classification[J].
AAAI Press,
2015.DOI:
10.1609/aaai.v29i1.9513., articleTitle=Recurrent convolutional neural networks for text classification, refAbstract=null), Reference(id=1203787157874913998, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[9], rfOrder=13, authorNames=Joulin A, Grave E, Bojanowski P, journalName=arXiv preprint arXiv: 1607.01759, 2016, refType=null, unstructuredReference=
Joulin A,
Grave E,
Bojanowski P, et al. Bag of tricks for efficient text classification[J].
arXiv preprint arXiv: 1607.01759, 2016., articleTitle=Bag of tricks for efficient text classification, refAbstract=null), Reference(id=1203787157975577301, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2017, volume=5, issue=null, pageStart=135, pageEnd=146, url=null, language=null, rfNumber=[10], rfOrder=14, authorNames=Bojanowski P, Grave E, Joulin A, journalName=Transactions of the Association for Computational Linguistics, refType=null, unstructuredReference=
Bojanowski P,
Grave E,
Joulin A, et al. Enriching word vectors with subword information[J].
Transactions of the Association for Computational Linguistics,
2017,
5: 135-146., articleTitle=Enriching word vectors with subword information, refAbstract=null), Reference(id=1203787158084629221, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=562, pageEnd=570, url=null, language=null, rfNumber=[11], rfOrder=15, authorNames=Johnson R, Zhang T, journalName=Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics (Volume 1:Long Papers), refType=null, unstructuredReference=
Johnson R,
Zhang T. Deep pyramid convolutional neural networks for text categorization[C]//
Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics (Volume 1:Long Papers). Vancouver: DPCNN,
2017: 562-570., articleTitle=Deep pyramid convolutional neural networks for text categorization, refAbstract=null), Reference(id=1203787158197875438, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2020, volume=56, issue=23, pageStart=12, pageEnd=22, url=null, language=null, rfNumber=[12], rfOrder=16, authorNames=余同瑞, 金冉, 韩晓臻, journalName=计算机工程与应用, refType=null, unstructuredReference=余同瑞, 金冉, 韩晓臻, 等. 自然语言处理预训练模型的研究综述[J].
计算机工程与应用,
2020,
56(23): 12-22., articleTitle=自然语言处理预训练模型的研究综述, refAbstract=null), Reference(id=1203787158306927352, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2019, volume=56, issue=23, pageStart=12, pageEnd=22, url=null, language=null, rfNumber=[12], rfOrder=17, authorNames=Yu Tongrui, Jin Ran, Han Xiaozhen, journalName=Computer Engineering and Applications, refType=null, unstructuredReference=
Yu Tongrui,
Jin Ran,
Han Xiaozhen, et al. A review of research on pre-training models for natural language processing[J].
Computer Engineering and Applications,
2019,
56(23): 12-22., articleTitle=A review of research on pre-training models for natural language processing, refAbstract=null), Reference(id=1203787158390813438, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[13], rfOrder=18, authorNames=Devlin J, Chang M W, Lee K, journalName=arXiv preprint arXiv: 1810.04805, 2018, refType=null, unstructuredReference=
Devlin J,
Chang M W,
Lee K, et al. Bert: pretraining of deep bidirectional transformers for language understanding[J].
arXiv preprint arXiv: 1810.04805, 2018., articleTitle=Bert: pretraining of deep bidirectional transformers for language understanding, refAbstract=null), Reference(id=1203787158504059655, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[14], rfOrder=19, authorNames=Sun Y, Wang S, Li Y, journalName=arXiv preprint arXiv: 1904.09223, 2019, refType=null, unstructuredReference=
Sun Y,
Wang S,
Li Y, et al. Ernie: enhanced representation through knowledge integration[J].
arXiv preprint arXiv: 1904.09223, 2019., articleTitle=Ernie: enhanced representation through knowledge integration, refAbstract=null), Reference(id=1203787158629888787, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2022, volume=22, issue=20, pageStart=8761, pageEnd=8770, url=null, language=null, rfNumber=[15], rfOrder=20, authorNames=杨秀璋, 郭明镇, 候红涛, journalName=科学技术与工程, refType=null, unstructuredReference=杨秀璋, 郭明镇, 候红涛, 等. 融合情感词典的改进BiLSTM-CNN+Attention情感分类算法[J].
科学技术与工程,
2022,
22(20): 8761-8770., articleTitle=融合情感词典的改进BiLSTM-CNN+Attention情感分类算法, refAbstract=null), Reference(id=1203787158755717921, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2019, volume=22, issue=20, pageStart=8671, pageEnd=8770, url=null, language=null, rfNumber=[15], rfOrder=21, authorNames=Yang Xiuzhang, Guo Mingzhen, Hou Hongtao, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Yang Xiuzhang,
Guo Mingzhen,
Hou Hongtao, et al. Improved BiLSTM-CNN+Attention emotion classification algorithm based on integrated emotion dictionary[J].
Science Technology and Engineering,
2019,
22(20): 8671-8770., articleTitle=Improved BiLSTM-CNN+Attention emotion classification algorithm based on integrated emotion dictionary, refAbstract=null), Reference(id=1203787158948655917, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2021, volume=16, issue=2, pageStart=202, pageEnd=209, url=null, language=null, rfNumber=[16], rfOrder=22, authorNames=翟学明, 魏巍, journalName=智能系统学报, refType=null, unstructuredReference=翟学明, 魏巍. 混合神经网络和条件随机场相结合的文本情感分析[J].
智能系统学报,
2021,
16(2): 202-209., articleTitle=混合神经网络和条件随机场相结合的文本情感分析, refAbstract=null), Reference(id=1203787159187731269, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=201, issue=2, pageStart=202, pageEnd=209, url=null, language=null, rfNumber=[16], rfOrder=23, authorNames=Zhai Xueming, Wei Wei, journalName=Journal of Intelligent Systems, refType=null, unstructuredReference=
Zhai Xueming,
Wei Wei. Text sentiment analysis by combining hybrid neural networks and conditional random fields[J].
Journal of Intelligent Systems,
2021,
16(2): 202-209., articleTitle=Text sentiment analysis by combining hybrid neural networks and conditional random fields, refAbstract=null), Reference(id=1203787159296783181, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2021, volume=35, issue=11, pageStart=70, pageEnd=79, url=null, language=null, rfNumber=[17], rfOrder=24, authorNames=陆晓蕾, 倪斌, journalName=中文信息学报, refType=null, unstructuredReference=陆晓蕾, 倪斌. 基于预训练语言模型的BERT-CNN多层级专利分类研究[J].
中文信息学报,
2021,
35(11): 70-79., articleTitle=基于预训练语言模型的BERT-CNN多层级专利分类研究, refAbstract=null), Reference(id=1203787159405835094, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2019, volume=35, issue=11, pageStart=70, pageEnd=79, url=null, language=null, rfNumber=[17], rfOrder=25, authorNames=Lu Xiaolei, Ni Bin, journalName=Journal of Chinese Information Technology, refType=null, unstructuredReference=
Lu Xiaolei,
Ni Bin. Research on BERT-CNN multi-level patent classification based on pre-trained language model[J].
Journal of Chinese Information Technology,
2019,
35(11): 70-79., articleTitle=Research on BERT-CNN multi-level patent classification based on pre-trained language model, refAbstract=null), Reference(id=1203787159556830050, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=1991, volume=3, issue=1, pageStart=79, pageEnd=87, url=null, language=null, rfNumber=[18], rfOrder=26, authorNames=Jacobs R A, Jordan M I, Nowlan S J, journalName=Neural Computation, refType=null, unstructuredReference=
Jacobs R A,
Jordan M I,
Nowlan S J, et al. Adaptive mixtures of local experts[J].
Neural Computation,
1991,
3(1): 79-87., articleTitle=Adaptive mixtures of local experts, refAbstract=null), Reference(id=1203787159670076270, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[19], rfOrder=27, authorNames=Shazeer N, Mirhoseini A, Maziarz K, journalName=arXiv preprint arXiv: 1701.06538, 2017, refType=null, unstructuredReference=
Shazeer N,
Mirhoseini A,
Maziarz K, et al. Outrageously large neural networks: the sparsely-gated mixture-of-experts layer[J].
arXiv preprint arXiv: 1701.06538, 2017., articleTitle=Outrageously large neural networks: the sparsely-gated mixture-of-experts layer, refAbstract=null), Reference(id=1203787159804294011, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[20], rfOrder=28, authorNames=Lepikhin D, Lee H J, Xu Y, journalName=arXiv preprint arXiv: 2006, refType=null, unstructuredReference=
Lepikhin D,
Lee H J,
Xu Y, et al. Gshard: scaling giant models with conditional computation and automatic sharding[J].
arXiv preprint arXiv: 2006.16668, 2020., articleTitle=Gshard: scaling giant models with conditional computation and automatic sharding, refAbstract=null), Reference(id=1203787159951094661, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2022, volume=23, issue=1, pageStart=5232, pageEnd=5270, url=null, language=null, rfNumber=[21], rfOrder=29, authorNames=Fedus W, Zoph B, Shazeer N, journalName=The Journal of Machine Learning Research, refType=null, unstructuredReference=
Fedus W,
Zoph B,
Shazeer N. Switch transformers: scaling to trillion parameter models with simple and efficient sparsity[J].
The Journal of Machine Learning Research,
2022,
23(1): 5232-5270., articleTitle=Switch transformers: scaling to trillion parameter models with simple and efficient sparsity, refAbstract=null), Reference(id=1203787160081118094, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[22], rfOrder=30, authorNames=Du N, Huang Y, Dai A M, journalName=arXiv preprint arXiv: 2112, refType=null, unstructuredReference=
Du N,
Huang Y,
Dai A M, et al. Glam: efficient scaling of language models with mixture-of-experts[J].
arXiv preprint arXiv: 2112.06905, 2021., articleTitle=Glam: efficient scaling of language models with mixture-of-experts, refAbstract=null), Reference(id=1203787160227918744, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2020, volume=33, issue=null, pageStart=1877, pageEnd=1901, url=null, language=null, rfNumber=[23], rfOrder=31, authorNames=Brown T, Mann B, Ryder N, journalName=Advances in Neural Information Processing Systems, refType=null, unstructuredReference=
Brown T,
Mann B,
Ryder N, et al. Language models are few-shot learners[J].
Advances in Neural Information Processing Systems,
2020,
33: 1877-1901., articleTitle=Language models are few-shot learners, refAbstract=null), Reference(id=1203787160408273823, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[24], rfOrder=32, authorNames=Xue F, Shi Z, Wei F, journalName=arXiv preprint arXiv: 2107, refType=null, unstructuredReference=
Xue F,
Shi Z,
Wei F, et al. Go wider instead of deeper[J].
arXiv preprint arXiv: 2107.11817, 2021., articleTitle=Go wider instead of deeper, refAbstract=null), Reference(id=1203787160584434599, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[25], rfOrder=33, authorNames=Zuo S, Zhang Q, Liang C, journalName=arXiv preprint arXiv: 2204, refType=null, unstructuredReference=
Zuo S,
Zhang Q,
Liang C, et al. Moebert: from bert to mixture-of-experts
via importance-guided adaptation[J].
arXiv preprint arXiv: 2204.07675, 2022., articleTitle=Moebert: from bert to mixture-of-experts
via importance-guided adaptation, refAbstract=null), Reference(id=1203787160701875122, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2015, volume=14, issue=7, pageStart=38, pageEnd=39, url=null, language=null, rfNumber=[26], rfOrder=34, authorNames=Hinton G, Vinyals O, Dean J, journalName=Computer Science, refType=null, unstructuredReference=
Hinton G,
Vinyals O,
Dean J. Distilling the knowledge in a neural network[J].
Computer Science,
2015,
14(7): 38-39., articleTitle=Distilling the knowledge in a neural network, refAbstract=null), Reference(id=1203787160819315644, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[27], rfOrder=35, authorNames=Jang E, Gu S, Poole B, journalName=arXiv preprint arXiv: 1611.01144, 2016, refType=null, unstructuredReference=
Jang E,
Gu S,
Poole B. Categorical reparameterization with gumbel-softmax[J].
arXiv preprint arXiv: 1611.01144, 2016., articleTitle=Categorical reparameterization with gumbel-softmax, refAbstract=null), Reference(id=1203787160974504902, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, doi=null, pmid=null, pmcid=null, year=2019, volume=29, issue=null, pageStart=1061, pageEnd=1073, url=null, language=null, rfNumber=[28], rfOrder=36, authorNames=Zhang P, Xue J, Lan C, journalName=IEEE Transactions on Image Processing, refType=null, unstructuredReference=
Zhang P,
Xue J,
Lan C, et al. EleAtt-RNN: adding attentiveness to neurons in recurrent neural networks[J].
IEEE Transactions on Image Processing,
2019,
29: 1061-1073., articleTitle=EleAtt-RNN: adding attentiveness to neurons in recurrent neural networks, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1203787146780980076, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, xref=1, ext=[AuthorCompanyExt(id=1203787146785174381, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 School of Control and Computer Engineering, North China Electric Power University, Baoding 071003,China), AuthorCompanyExt(id=1203787146793562990, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146780980076, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华北电力大学控制与计算机工程学院, 保定 071003)]), AuthorCompany(id=1203787146944557945, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, xref=2, ext=[AuthorCompanyExt(id=1203787146952946554, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146944557945, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 Hebei Key Laboratory of Knowledge Computing for Energy & Power, Baoding 071003, China), AuthorCompanyExt(id=1203787146957140859, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, companyId=1203787146944557945, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 河北省能源电力知识计算重点实验室, 保定 071003)])], figs=[ArticleFig(id=1203787151256301749, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Fig.1, caption=
The model framework of this paper, figureFileSmall=33YEGUqWMq3Thdpbf4v27A==, figureFileBig=78b1tdEretqAiXAgMdIYWQ==, tableContent=null), ArticleFig(id=1203787151386325190, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=图1, caption=
本文的模型框架, figureFileSmall=33YEGUqWMq3Thdpbf4v27A==, figureFileBig=78b1tdEretqAiXAgMdIYWQ==, tableContent=null), ArticleFig(id=1203787151575068894, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Fig.2, caption=
Improved encoder layer for ERNIE, figureFileSmall=cbTH6X5eHad3vo0qehleXw==, figureFileBig=21BVjSmVUTDaJ+2TKdetlQ==, tableContent=null), ArticleFig(id=1203787151663149290, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=图2, caption=
改进ERNIE的encoder层 G为门控单元
, figureFileSmall=cbTH6X5eHad3vo0qehleXw==, figureFileBig=21BVjSmVUTDaJ+2TKdetlQ==, tableContent=null), ArticleFig(id=1203787151747035381, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Fig.3, caption=
Sparsely-gated mixture-of-expert layer, figureFileSmall=IJlUhcifRUL4hlH0vZV5yA==, figureFileBig=qAy1NLy5T1z8+c7c3/LcSA==, tableContent=null), ArticleFig(id=1203787151877058825, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=图3, caption=
稀疏门控混合专家系统层 Ei为第i个词向量的加权,i=1,2,…,n
, figureFileSmall=IJlUhcifRUL4hlH0vZV5yA==, figureFileBig=qAy1NLy5T1z8+c7c3/LcSA==, tableContent=null), ArticleFig(id=1203787152007082259, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Fig.4, caption=
RCNN structure, figureFileSmall=3FI8T1emTmK4eHFbHSjYcg==, figureFileBig=SAP8E+Yep7/DMKCAl5ZlrA==, tableContent=null), ArticleFig(id=1203787152162271529, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=图4, caption=
RCNN结构, figureFileSmall=3FI8T1emTmK4eHFbHSjYcg==, figureFileBig=SAP8E+Yep7/DMKCAl5ZlrA==, tableContent=null), ArticleFig(id=1203787152262934838, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Fig.5, caption=
EleAtt-RNN structure, figureFileSmall=++aoV32ZtHFN0xop5qYfMA==, figureFileBig=5ny3xDIzatlshnaNNZZBOQ==, tableContent=null), ArticleFig(id=1203787152376181055, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=图5, caption=
EleAtt-RNN结构, figureFileSmall=++aoV32ZtHFN0xop5qYfMA==, figureFileBig=5ny3xDIzatlshnaNNZZBOQ==, tableContent=null), ArticleFig(id=1203787152518787406, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 1, caption=
Data sample
, figureFileSmall=null, figureFileBig=null, tableContent=
| 输入 | 类别 |
| 皇马剥开胜利有个不得不说问题 走了的人是否会被怀念 | 7 |
| 某知名女星边工作边犒劳员工 率12人齐赴戛纳玩 | 9 |
| 常州一小区现楼晃晃 10栋居民楼晃动半年多 | 1 |
| 多地学校探索多元化评价体系 学生全面发展受重视 | 3 |
| 顺义香悦四季95~115 m2 3居新房源在售享98折 | 1 |
), ArticleFig(id=1203787153693192540, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表1, caption=
数据示例
, figureFileSmall=null, figureFileBig=null, tableContent=
| 输入 | 类别 |
| 皇马剥开胜利有个不得不说问题 走了的人是否会被怀念 | 7 |
| 某知名女星边工作边犒劳员工 率12人齐赴戛纳玩 | 9 |
| 常州一小区现楼晃晃 10栋居民楼晃动半年多 | 1 |
| 多地学校探索多元化评价体系 学生全面发展受重视 | 3 |
| 顺义香悦四季95~115 m2 3居新房源在售享98折 | 1 |
), ArticleFig(id=1203787153789661540, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 2, caption=
Experimental configuration
, figureFileSmall=null, figureFileBig=null, tableContent=
| 环境 | 配置参数 |
| 处理器 | Intel(R) Core (TM) i7-7700K CPU @4.20 GHz |
| 显卡 | NVIDIA GEFORCE RTX 3080Ti |
| 内存 | 32 GB |
| 框架 | PyTorch 1.10 |
), ArticleFig(id=1203787153907102069, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表2, caption=
实验配置
, figureFileSmall=null, figureFileBig=null, tableContent=
| 环境 | 配置参数 |
| 处理器 | Intel(R) Core (TM) i7-7700K CPU @4.20 GHz |
| 显卡 | NVIDIA GEFORCE RTX 3080Ti |
| 内存 | 32 GB |
| 框架 | PyTorch 1.10 |
), ArticleFig(id=1203787154016153984, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 3, caption=
Comprehensive experimental results
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 精确率/% | 召回率/% | F1/% |
| TextCNN | 81.83 | 80.71 | 81.27 |
| BiGRU | 79.76 | 79.02 | 79.39 |
| RCNN | 83.77 | 82.15 | 82.95 |
| BERT | 90.68 | 90.55 | 90.61 |
| ERNIE | 91.04 | 90.99 | 91.01 |
| ERNIE+CNN | 92.32 | 92.28 | 92.29 |
| ERNIE+BiGRU | 92.56 | 92.51 | 92.53 |
| ERNIE+RCNN | 93.79 | 93.66 | 93.72 |
| 本文方法 | 94.26 | 94.21 | 94.23 |
), ArticleFig(id=1203787154234257805, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表3, caption=
综合实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 精确率/% | 召回率/% | F1/% |
| TextCNN | 81.83 | 80.71 | 81.27 |
| BiGRU | 79.76 | 79.02 | 79.39 |
| RCNN | 83.77 | 82.15 | 82.95 |
| BERT | 90.68 | 90.55 | 90.61 |
| ERNIE | 91.04 | 90.99 | 91.01 |
| ERNIE+CNN | 92.32 | 92.28 | 92.29 |
| ERNIE+BiGRU | 92.56 | 92.51 | 92.53 |
| ERNIE+RCNN | 93.79 | 93.66 | 93.72 |
| 本文方法 | 94.26 | 94.21 | 94.23 |
), ArticleFig(id=1203787154330726809, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 4, caption=
The experts compared the experimental results
, figureFileSmall=null, figureFileBig=null, tableContent=
| 专家数 | 精确率/% | 召回率/% | F1/% | 参数量/106 |
| 4 | 90.84 | 90.85 | 90.84 | 26.64 |
| 6 | 91.21 | 91.19 | 91.20 | 27.83 |
| 8 | 91.37 | 91.32 | 91.34 | 29.01 |
| 10 | 91.51 | 91.45 | 91.48 | 30.19 |
| 12 | 91.38 | 91.36 | 91.37 | 31.38 |
), ArticleFig(id=1203787154443973027, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表4, caption=
专家数对比实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 专家数 | 精确率/% | 召回率/% | F1/% | 参数量/106 |
| 4 | 90.84 | 90.85 | 90.84 | 26.64 |
| 6 | 91.21 | 91.19 | 91.20 | 27.83 |
| 8 | 91.37 | 91.32 | 91.34 | 29.01 |
| 10 | 91.51 | 91.45 | 91.48 | 30.19 |
| 12 | 91.38 | 91.36 | 91.37 | 31.38 |
), ArticleFig(id=1203787154578190776, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 5, caption=
Gating function comparison experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 门控函数 | 精确率/% | 召回率/% | F1/% |
| Softmax | 90.42 | 90.38 | 90.40 |
| Gumbel_Softmax | 91.51 | 91.49 | 91.48 |
), ArticleFig(id=1203787154762740168, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表5, caption=
门控函数对比实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 门控函数 | 精确率/% | 召回率/% | F1/% |
| Softmax | 90.42 | 90.38 | 90.40 |
| Gumbel_Softmax | 91.51 | 91.49 | 91.48 |
), ArticleFig(id=1203787154896957909, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 6, caption=
Classification error sample
, figureFileSmall=null, figureFileBig=null, tableContent=
| 输入 | 类别 | 预测 |
| 体育赛事与明星演唱会联动 为观众带来双重激情盛宴 | 7 | 9 |
| 广东高考满分作文17篇 一道语文题13万人吃鸭蛋 | 3 | 5 |
| 社会助力教育公平 偏远地区儿童获新知 | 4 | 3 |
| 糖价长期高位运行 果葡糖等替代品需求强劲 | 0 | 4 |
), ArticleFig(id=1203787155001815524, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表6, caption=
分类错误样本
, figureFileSmall=null, figureFileBig=null, tableContent=
| 输入 | 类别 | 预测 |
| 体育赛事与明星演唱会联动 为观众带来双重激情盛宴 | 7 | 9 |
| 广东高考满分作文17篇 一道语文题13万人吃鸭蛋 | 3 | 5 |
| 社会助力教育公平 偏远地区儿童获新知 | 4 | 3 |
| 糖价长期高位运行 果葡糖等替代品需求强劲 | 0 | 4 |
), ArticleFig(id=1203787155161199092, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=EN, label=Table 7, caption=
Ablation experiment
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 精确率/% | 召回率/% | F1/% | 参数量/106 |
| ERNIE-RCNN | 93.79 | 93.66 | 93.72 | 101.45 |
| ERNIE-Att-RCNN | 94.01 | 93.99 | 93.99 | 103.02 |
| 改进ERNIE-RCNN | 93.96 | 93.98 | 93.97 | 31.77 |
| 本文模型 | 94.26 | 94.21 | 94.23 | 33.34 |
), ArticleFig(id=1203787155261862403, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1203753459473428945, language=CN, label=表7, caption=
消融实验
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | 精确率/% | 召回率/% | F1/% | 参数量/106 |
| ERNIE-RCNN | 93.79 | 93.66 | 93.72 | 101.45 |
| ERNIE-Att-RCNN | 94.01 | 93.99 | 93.99 | 103.02 |
| 改进ERNIE-RCNN | 93.96 | 93.98 | 93.97 | 31.77 |
| 本文模型 | 94.26 | 94.21 | 94.23 | 33.34 |
)], attaches=null, journal=Journal(id=1146119176004939786, delFlag=0, nameCn=科学技术与工程, nameEn=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, issn=1671-1815, eissn=, cn=11-4688/T, coden=null, periodic=4, language=CN, oaType=是, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=UKU/O7GSka5polgCTkbIIw==, journalPrice=null, startedYear=null, abbrevIsoEn=Sci Technol Eng, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1754445529766, createdBy=null, updatedBy=13701087609, firstLetterCn=S, firstLetterEn=S, subjectCode=Natural Sciences, subjectName=自然科学, subjectCodeEn=Natural Sciences, subjectNameEn=null, picCn=UKU/O7GSka5polgCTkbIIw==, picEn=5hwlULoNwcbj3xUmVi9MAQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1159791870395564357, language=CN, name=科学技术与工程, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529793, updatedTime=1754445529793, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=http://www.stae.com.cn/jsygc/site/menus/20090429150146001, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1159791870441701702, language=EN, name=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, 
managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529804, updatedTime=1754445529804, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1146123166801305609, websiteList=[Website(id=1148243202391400884, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/CN, language=CN, createTime=1751692112777, createBy=18614031015, updateTime=1753520965431, updateBy=18614031015, name=科学技术与工程-中文站点, tplId=1146099689490845704, title=科学技术与工程, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148622798802673703, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=articleTextType, value=kx, createTime=1751782615614, updateTime=1751782615614, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798781702180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=banner, value=null, createTime=1751782615609, updateTime=1751782615609, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798769119267, tenantId=1146029695717560320, journalId=null, 
journalGroupId=null, siteId=1148243202391400884, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1751782615606, updateTime=1751782615606, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798794285094, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782615612, updateTime=1751782615612, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798790090789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782615611, updateTime=1751782615611, creator=18614031015, updator=18614031015)]), Website(id=1155914124811976731, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/EN, language=EN, createTime=1753521003206, createBy=18614031015, updateTime=1753521003206, updateBy=18614031015, name=科学技术与工程-英文站点, tplId=1146101810881728533, title=Science Technology and Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155914371227308235, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=articleTextType, value=kx, createTime=1753521061952, updateTime=1753521061952, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371210531016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=banner, value=null, 
createTime=1753521061947, updateTime=1753521061947, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371202142407, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1753521061945, updateTime=1753521061945, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371223113930, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753521061950, updateTime=1753521061950, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371218919625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753521061949, updateTime=1753521061949, creator=18614031015, updator=18614031015)])], journalTitle=科学技术与工程, weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Science Technology and Engineering, journalPhotoCn=UKU/O7GSka5polgCTkbIIw==, journalPhotoEn=5hwlULoNwcbj3xUmVi9MAQ==, journalFirstLetter=S, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/10.12404/j.issn.1671-1815.2307782, detailUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/10.12404/j.issn.1671-1815.2307782, 
pdfUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/PDF/10.12404/j.issn.1671-1815.2307782, pdfUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/PDF/10.12404/j.issn.1671-1815.2307782, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)