Article(id=1268884547455320084, tenantId=1146029695717560320, journalId=1268266580820377661, issueId=1268884383122494171, articleNumber=null, orderNo=null, doi=10.3969/j.issn.1001-4632.2026.02.20, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=null, receivedDate=1750694400000, receivedDateStr=2025-06-24, revisedDate=1773244800000, revisedDateStr=2026-03-12, acceptedDate=null, acceptedDateStr=null, onlineDate=1780455250847, onlineDateStr=2026-06-03, pubDate=1772294400000, pubDateStr=2026-03-01, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1780455250847, onlineIssueDateStr=2026-06-03, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1780455250847, creator=13701087609, updateTime=1780455250847, updator=13701087609, issue=Issue{id=1268884383122494171, tenantId=1146029695717560320, journalId=1268266580820377661, year='2026', volume='47', issue='2', pageStart='1', pageEnd='255', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1780455211667, creator=13701087609, updateTime=1780455310713, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1268884798719300557, tenantId=1146029695717560320, journalId=1268266580820377661, issueId=1268884383122494171, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1268884798723494862, tenantId=1146029695717560320, journalId=1268266580820377661, issueId=1268884383122494171, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=232, endPage=243, ext={EN=ArticleExt(id=1268884548587782166, articleId=1268884547455320084, tenantId=1146029695717560320, 
journalId=1268266580820377661, language=EN, title=Research on the Application of Intelligent Recognition Technology for Sensitive Railway Ticket Data Based on Data Knowledge Base, columnId=null, journalTitle=China Railway Science, columnName=null, runingTitle=null, highlight=null, articleAbstract=
To address the data security risks arising from the explosive growth of railway passenger transport data and to achieve intelligent identification and dynamic protection of sensitive information, an intelligent identification technology for sensitive data in railway passenger tickets based on a data knowledge base is proposed. Firstly, a three-level knowledge base of "laws and regulations-industry standards-enterprise norms" is constructed. Secondly, combined with historical railway passenger ticket data, a multi-level intelligent identification algorithm for sensitive data is designed, thereby efficiently and accurately identifying sensitive information in multi-modal data. On this basis, graph technology is introduced to construct a data asset and sensitive data lineage graph, and based on the topological relationship of data flow, the efficient propagation of sensitive information labels among related data nodes is achieved. The results show that, in structured data processing, the sensitive information identification efficiency of the proposed technology reaches about 217 000 messages per second, which is about twice that of the traditional solution. In unstructured data processing, through domain knowledge graph injection, the F1 value of sensitive entity recognition is increased to 91.24%, and the context misjudgment rate is reduced to 5.88%. The accuracy of text extraction and sensitive information recognition for multimedia images reaches 93.71%. This technology can significantly improve the accuracy and processing efficiency of sensitive data identification in railway passenger tickets.
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Xiaopei HAO, Zhiyuan YAN, Junfeng ZHANG, Wen LI, Xiangkun LIU, Ruijun SHI), CN=ArticleExt(id=1268884555785207859, articleId=1268884547455320084, tenantId=1146029695717560320, journalId=1268266580820377661, language=CN, title=基于数据知识库的铁路客票敏感数据智能识别技术应用研究, columnId=0, journalTitle=中国铁道科学, columnName=, runingTitle=null, highlight=null, articleAbstract=
为应对铁路客运数据规模激增衍生的数据安全风险,实现敏感信息智能识别与动态防护,提出基于数据知识库的铁路客票敏感数据智能识别技术。通过构建“法律法规—行业标准—企业规范”3级知识库,结合铁路客票历史数据,设计多层次敏感数据智能识别算法,实现对多模态数据中敏感信息的高效精准识别。在此基础上引入图技术,构建数据资产及敏感数据血缘关系图谱,依据数据间流转拓扑关系,完成敏感信息标签在相关数据节点间的高效传播。结果表明:所提技术在结构化数据处理方面,可实现约21.7万条·s⁻¹的敏感信息识别效率,约为传统方案的2倍;在非结构化数据处理方面,通过领域知识图谱注入,将敏感实体识别的F1值提升至91.24%,上下文误判率下降至5.88%;多媒体图片文本提取及敏感信息识别准确率达93.71%。该技术可显著提升铁路客票敏感数据识别的准确性与处理效率。
, correspAuthors=null, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=Mm8jy/mt1Gr3CZuuiCOQqA==, magXml=8CK1WmY/8UI6XoYiVUCVUQ==, pdfUrl=null, pdf=CfVXle2jW/rDpZkCjiUGHg==, pdfFileSize=1525818, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=HeNmGk6RQioXXP5abmNlLA==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=w4KFwFPGH0ZNkrngYt77yA==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=郝晓培, 阎志远, 张军锋, 李雯, 刘相坤, 石瑞君)}, authors=[Author(id=1268884556217221177, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=linuxstar@126.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1268884556309495868, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884556217221177, language=EN, stringName=Xiaopei HAO, firstName=Xiaopei, middleName=null, lastName=HAO, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1268884556552765501, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884556217221177, language=CN, stringName=郝晓培, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081, bio={"content":"
郝晓培(1990—),男,河南林州人,助理研究员。E-mail:linuxstar@126.com
"}, bioImg=null, bioContent=
郝晓培(1990—),男,河南林州人,助理研究员。E-mail:linuxstar@126.com
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])]), Author(id=1268884556624068671, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1268884556980584513, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884556624068671, language=EN, stringName=Zhiyuan YAN, firstName=Zhiyuan, middleName=null, lastName=YAN, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1268884557064470594, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884556624068671, language=CN, stringName=阎志远, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])]), Author(id=1268884557404209220, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1268884557488095302, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884557404209220, language=EN, stringName=Junfeng ZHANG, firstName=Junfeng, middleName=null, lastName=ZHANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1268884557815251015, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884557404209220, language=CN, stringName=张军锋, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])]), Author(id=1268884557907525705, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=1556860343@qq.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1268884559618801739, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884557907525705, language=EN, stringName=Wen LI, firstName=Wen, middleName=null, lastName=LI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1268884559711076428, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884557907525705, language=CN, stringName=李雯, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])]), Author(id=1268884559912403022, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, orderNo=4, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1268884560021454928, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884559912403022, language=EN, stringName=Xiangkun LIU, firstName=Xiangkun, middleName=null, lastName=LIU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1268884560331833425, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884559912403022, language=CN, stringName=刘相坤, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])]), Author(id=1268884560386359379, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, orderNo=5, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1268884560755458133, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884560386359379, language=EN, stringName=Ruijun SHI, firstName=Ruijun, middleName=null, lastName=SHI, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1268884560822566998, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, authorId=1268884560386359379, language=CN, stringName=石瑞君, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])])], keywords=[Keyword(id=1268884561200054359, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, orderNo=1, keyword=Sensitive data), Keyword(id=1268884561279746136, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, orderNo=2, keyword=Knowledge base), Keyword(id=1268884561590124633, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, orderNo=3, keyword=Railway ticket), Keyword(id=1268884561678205018, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, orderNo=4, keyword=Intelligent recognition), Keyword(id=1268884562022137947, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, orderNo=5, keyword=Label propagation), Keyword(id=1268884562424791132, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, orderNo=6, keyword=Lineage graph), Keyword(id=1268884564010238045, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, orderNo=1, keyword=敏感数据), Keyword(id=1268884564106707038, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, orderNo=2, keyword=知识库), Keyword(id=1268884564186398815, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, orderNo=3, keyword=铁路客票), Keyword(id=1268884564521943136, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, orderNo=4, keyword=智能识别), Keyword(id=1268884564584857697, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, orderNo=5, keyword=标签传播), Keyword(id=1268884564945567842, tenantId=1146029695717560320, 
journalId=1268266580820377661, articleId=1268884547455320084, language=CN, orderNo=6, keyword=血缘关系图谱)], refs=[Reference(id=1268884569920012421, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2021, volume=42, issue=5, pageStart=162, pageEnd=173, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=单杏花, 张志强, 宁斐, journalName=中国铁道科学, refType=null, unstructuredReference=单杏花,张志强,宁斐,
等.中国铁路电子客票关键技术应用与系统实现[J].
中国铁道科学,
2021,
42 (5):162-173., articleTitle=中国铁路电子客票关键技术应用与系统实现, refAbstract=null), Reference(id=1268884570008092806, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2021, volume=42, issue=5, pageStart=162, pageEnd=173, url=null, language=null, rfNumber=[1], rfOrder=1, authorNames=SHAN Xinghua, ZHANG Zhiqiang, NING Fei, journalName=China Railway Science, refType=null, unstructuredReference=
SHAN Xinghua,
ZHANG Zhiqiang,
NING Fei,
et al. Key Technology Application and System Implementation of China Railway Electronic Ticket [J].
China Railway Science,
2021,
42 (5): 162-173. in Chinese, articleTitle=Key Technology Application and System Implementation of China Railway Electronic Ticket, refAbstract=null), Reference(id=1268884570087784583, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2024, volume=47, issue=23, pageStart=105, pageEnd=112, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=符泽凡, 姚竟发, 滕桂法, journalName=现代电子技术, refType=null, unstructuredReference=符泽凡,姚竟发,滕桂法.基于BERT模型的网站敏感信息识别及其变体还原技术研究[J].
现代电子技术,
2024,
47(23):105-112., articleTitle=基于BERT模型的网站敏感信息识别及其变体还原技术研究, refAbstract=null), Reference(id=1268884570159087752, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2024, volume=47, issue=23, pageStart=105, pageEnd=112, url=null, language=null, rfNumber=[2], rfOrder=3, authorNames=FU Zefan, YAO Jingfa, TENG Guifa, journalName=Modern Electronics Technique, refType=null, unstructuredReference=
FU Zefan,
YAO Jingfa,
TENG Guifa. Research on Website Sensitive Information Identification and Variant Restoration Technology Based on BERT Model [J].
Modern Electronics Technique,
2024,
47 (23): 105-112. in Chinese, articleTitle=Research on Website Sensitive Information Identification and Variant Restoration Technology Based on BERT Model, refAbstract=null), Reference(id=1268884570259751049, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2016, volume=50, issue=9, pageStart=80, pageEnd=84, url=null, language=null, rfNumber=[3], rfOrder=4, authorNames=李扬, 潘泉, 杨涛, journalName=西安交通大学学报, refType=null, unstructuredReference=李扬,潘泉,杨涛.基于短文本情感分析的敏感信息识别[J].
西安交通大学学报,
2016,
50(9):80-84., articleTitle=基于短文本情感分析的敏感信息识别, refAbstract=null), Reference(id=1268884570343637130, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2016, volume=50, issue=9, pageStart=80, pageEnd=84, url=null, language=null, rfNumber=[3], rfOrder=5, authorNames=LI Yang, PAN Quan, YANG Tao, journalName=Journal of Xi’an Jiaotong University, refType=null, unstructuredReference=
LI Yang,
PAN Quan,
YANG Tao. Sensitive Information Recognition Based on Short Text Sentiment Analysis [J].
Journal of Xi’an Jiaotong University,
2016,
50 (9): 80-84. in Chinese, articleTitle=Sensitive Information Recognition Based on Short Text Sentiment Analysis, refAbstract=null), Reference(id=1268884570427523211, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2019, volume=12, issue=4/5, pageStart=1385, pageEnd=1398, url=null, language=null, rfNumber=[4], rfOrder=6, authorNames=LI W P, WU H Y, YANG J, journalName=Discrete and Continuous Dynamical Systems-S, refType=null, unstructuredReference=
LI W P,
WU H Y,
YANG J. Intelligent Recognition Algorithm for Social Network Sensitive Information Based on Classification Technology [J].
Discrete and Continuous Dynamical Systems-S,
2019, 12 (
4/5): 1385-1398., articleTitle=Intelligent Recognition Algorithm for Social Network Sensitive Information Based on Classification Technology, refAbstract=null), Reference(id=1268884570507214988, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2019, volume=7, issue=null, pageStart=21527, pageEnd=21538, url=null, language=null, rfNumber=[5], rfOrder=7, authorNames=XU G, WU X, YAO H, journalName=IEEE Access, refType=null, unstructuredReference=
XU G,
WU X,
YAO H,
et al. Research on Topic Recognition of Network Sensitive Information Based on SW-LDA Model [J].
IEEE Access,
2019,
7: 21527-21538., articleTitle=Research on Topic Recognition of Network Sensitive Information Based on SW-LDA Model, refAbstract=null), Reference(id=1268884570582712461, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2019, volume=7, issue=null, pageStart=96177, pageEnd=96190, url=null, language=null, rfNumber=[6], rfOrder=8, authorNames=XU G, YU Z, CHEN Z, journalName=IEEE Access, refType=null, unstructuredReference=
XU G,
YU Z,
CHEN Z,
et al. Sensitive Information Topics-Based Sentiment Analysis Method for Big Data [J].
IEEE Access,
2019,
7: 96177-96190., articleTitle=Sensitive Information Topics-Based Sentiment Analysis Method for Big Data, refAbstract=null), Reference(id=1268884570674987150, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2007, volume=null, issue=null, pageStart=255, pageEnd=261, url=null, language=null, rfNumber=[7], rfOrder=9, authorNames=KRASSER S, TANG Y, GOULD J, journalName=null, refType=null, unstructuredReference=
KRASSER S,
TANG Y,
GOULD J,
et al. Identifying Image Spam Based on Header and File Properties Using C4.5 Decision Trees and Support Vector Machine Learning [C]// 2007 IEEE SMC Information Assurance and Security Workshop. New York: IEEE,
2007: 255-261., articleTitle=Identifying Image Spam Based on Header and File Properties Using C4.5 Decision Trees and Support Vector Machine Learning, refAbstract=null), Reference(id=1268884570750484623, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=433, pageEnd=443, url=null, language=null, rfNumber=[8], rfOrder=10, authorNames=WANG W, WU Y, PALAIAHNAKOTE S, journalName=null, refType=null, unstructuredReference=
WANG W,
WU Y,
PALAIAHNAKOTE S,
et al. Cloud of Line Distribution for Arbitrary Text Detection in Scene/Video/License Plate Images [C]// Advances in Multimedia Information Processing-PCM 2017. Cham: Springer International Publishing,
2018: 433-443., articleTitle=Cloud of Line Distribution for Arbitrary Text Detection in Scene/Video/License Plate Images, refAbstract=null), Reference(id=1268884570817593488, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2017, volume=39, issue=11, pageStart=2298, pageEnd=2304, url=null, language=null, rfNumber=[9], rfOrder=11, authorNames=SHI B, BAI X, YAO C, journalName=IEEE Transactions on Pattern Analysis and Machine Intelligence, refType=null, unstructuredReference=
SHI B,
BAI X,
YAO C. An End-to-End Trainable Neural Network for Image-Based Sequence Recognition and Its Application to Scene Text Recognition [J].
IEEE Transactions on Pattern Analysis and Machine Intelligence,
2017,
39 (11): 2298-2304., articleTitle=An End-to-End Trainable Neural Network for Image-Based Sequence Recognition and Its Application to Scene Text Recognition, refAbstract=null), Reference(id=1268884570893090961, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=5, pageStart=28, pageEnd=30, url=null, language=null, rfNumber=[10], rfOrder=12, authorNames=汪庆, 陈杰, journalName=网络安全技术与应用, refType=null, unstructuredReference=汪庆,陈杰.深度包检测技术中的正则表达式匹配研究综述[J].
网络安全技术与应用,
2024(5):28-30., articleTitle=深度包检测技术中的正则表达式匹配研究综述, refAbstract=null), Reference(id=1268884570968588434, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=5, pageStart=28, pageEnd=30, url=null, language=null, rfNumber=[10], rfOrder=13, authorNames=WANG Qing, CHEN Jie, journalName=Network Security Technology & Application, refType=null, unstructuredReference=
WANG Qing,
CHEN Jie. A Review of Regular Expression Matching Research in Deep Packet Inspection Technology [J].
Network Security Technology & Application,
2024 (5): 28-30. in Chinese, articleTitle=A Review of Regular Expression Matching Research in Deep Packet Inspection Technology, refAbstract=null), Reference(id=1268884571044085907, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2022, volume=44, issue=2, pageStart=581, pageEnd=590, url=null, language=null, rfNumber=[11], rfOrder=14, authorNames=姜海洋, 李雪菲, 杨晔, journalName=电子与信息学报, refType=null, unstructuredReference=姜海洋,李雪菲,杨晔.基于距离比较的AC自动机并行匹配算法[J].
电子与信息学报,
2022,
44(2):581-590., articleTitle=基于距离比较的AC自动机并行匹配算法, refAbstract=null), Reference(id=1268884571111194772, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2022, volume=44, issue=2, pageStart=581, pageEnd=590, url=null, language=null, rfNumber=[11], rfOrder=15, authorNames=JIANG Haiyang, LI Xuefei, YANG Ye, journalName=Journal of Electronics & Information Technology, refType=null, unstructuredReference=
JIANG Haiyang,
LI Xuefei,
YANG Ye,
et al. Distance Comparison Based Parallel Pattern Matching [J].
Journal of Electronics & Information Technology,
2022,
44 (2): 581-590. in Chinese, articleTitle=Distance Comparison Based Parallel Pattern Matching, refAbstract=null), Reference(id=1268884571195080853, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2025, volume=53, issue=7, pageStart=155, pageEnd=164, url=null, language=null, rfNumber=[12], rfOrder=16, authorNames=杨虹, 孟晓凯, 俞华, journalName=电力系统保护与控制, refType=null, unstructuredReference=杨虹,孟晓凯,俞华,
等.基于BERT模型的主设备缺陷诊断方法研究[J].
电力系统保护与控制,
2025,
53 (7):155-164., articleTitle=基于BERT模型的主设备缺陷诊断方法研究, refAbstract=null), Reference(id=1268884571283161238, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2025, volume=53, issue=7, pageStart=155, pageEnd=164, url=null, language=null, rfNumber=[12], rfOrder=17, authorNames=YANG Hong, MENG Xiaokai, YU Hua, journalName=Power System Protection and Control, refType=null, unstructuredReference=
YANG Hong,
MENG Xiaokai,
YU Hua,
et al. Research on Primary Equipment Defect Diagnosis Method Based on the BERT Model [J].
Power System Protection and Control,
2025,
53 (7): 155-164. in Chinese, articleTitle=Research on Primary Equipment Defect Diagnosis Method Based on the BERT Model, refAbstract=null), Reference(id=1268884572939911319, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2020, volume=42, issue=11, pageStart=1433, pageEnd=1448, url=null, language=null, rfNumber=[13], rfOrder=18, authorNames=白志程, 李擎, 陈鹏, journalName=工程科学学报, refType=null, unstructuredReference=白志程,李擎,陈鹏,
等.自然场景文本检测技术研究综述[J].
工程科学学报,
2020,
42(11):1433-1448., articleTitle=自然场景文本检测技术研究综述, refAbstract=null), Reference(id=1268884573040574616, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2020, volume=42, issue=11, pageStart=1433, pageEnd=1448, url=null, language=null, rfNumber=[13], rfOrder=19, authorNames=BAI Zhicheng, LI Qing, CHEN Peng, journalName=Chinese Journal of Engineering, refType=null, unstructuredReference=
BAI Zhicheng,
LI Qing,
CHEN Peng,
et al. Text Detection in Natural Scenes: a Literature Review [J].
Chinese Journal of Engineering,
2020,
42 (11): 1433-1448. in Chinese, articleTitle=Text Detection in Natural Scenes: a Literature Review, refAbstract=null), Reference(id=1268884573116072089, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=498, pageEnd=517, url=null, language=null, rfNumber=[14], rfOrder=20, authorNames=KIM G, HONG T, YIM M, journalName=null, refType=null, unstructuredReference=
KIM G,
HONG T, YIM M,
et al. OCR-Free Document Understanding Transformer [C]// Computer Vision-ECCV 2022. Cham: Springer Nature Switzerland,
2022: 498-517., articleTitle=OCR-Free Document Understanding Transformer, refAbstract=null), Reference(id=1268884573204152474, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[15], rfOrder=21, authorNames=RADFORD A, KIM J W, HALLACY C, journalName=ArXiv e-Prints, refType=null, unstructuredReference=
RADFORD A,
KIM J W,
HALLACY C,
et al. Learning Transferable Visual Models from Natural Language Supervision [J].
ArXiv e-Prints,
2021: arXiv:2103.00020 [cs. CV]., articleTitle=Learning Transferable Visual Models from Natural Language Supervision, refAbstract=null), Reference(id=1268884573279649947, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2012, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[16], rfOrder=22, authorNames=ISLAM N S, RAHMAN M W, JOSE J, journalName=null, refType=null, unstructuredReference=
ISLAM N S,
RAHMAN M W,
JOSE J,
et al. High Performance RDMA-Based Design of HDFS over InfiniBand [C]// SC’12: Proceedings of the International Conference on High Performance Computing, Networking, Storage and Analysis. New York: IEEE,
2012., articleTitle=High Performance RDMA-Based Design of HDFS over InfiniBand, refAbstract=null), Reference(id=1268884573355147420, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=135, pageEnd=146, url=null, language=null, rfNumber=[17], rfOrder=23, authorNames=MONDAL S, MUKHERJEE N, journalName=null, refType=null, unstructuredReference=
MONDAL S,
MUKHERJEE N. Efficient NoSQL Graph Database for Storage and Access of Health Data [C]// Computer Communication, Networking and IoT. Singapore: Springer,
2021: 135-146., articleTitle=Efficient NoSQL Graph Database for Storage and Access of Health Data, refAbstract=null), Reference(id=1268884573418061981, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2024, volume=41, issue=1, pageStart=76, pageEnd=82, url=null, language=null, rfNumber=[18], rfOrder=24, authorNames=潘晓华, 金泳, 高扬华, journalName=计算机应用研究, refType=null, unstructuredReference=潘晓华,金泳,高扬华,
等.面向复杂数据审计需求的数据血缘构建方法[J].
计算机应用研究,
2024,
41(1):76-82., articleTitle=面向复杂数据审计需求的数据血缘构建方法, refAbstract=null), Reference(id=1268884573480976542, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2024, volume=41, issue=1, pageStart=76, pageEnd=82, url=null, language=null, rfNumber=[18], rfOrder=25, authorNames=PAN Xiaohua, JIN Yong, GAO Yanghua, journalName=Application Research of Computers, refType=null, unstructuredReference=
PAN Xiaohua,
JIN Yong,
GAO Yanghua,
et al. Data Lineage Construction Method for Complex Data Audit Requirements [J].
Application Research of Computers,
2024,
41 (1): 76-82. in Chinese, articleTitle=Data Lineage Construction Method for Complex Data Audit Requirements, refAbstract=null), Reference(id=1268884573569056927, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, doi=null, pmid=null, pmcid=null, year=2025, volume=71, issue=2, pageStart=3930, pageEnd=3940, url=null, language=null, rfNumber=[19], rfOrder=26, authorNames=XIE Y R, journalName=IEEE Transactions on Consumer Electronics, refType=null, unstructuredReference=
XIE Y R. Application of CRNN and OpenGL in Intelligent Landscape Design Systems Utilizing Internet of Things, Explainable Artificial Intelligence, and Drone Technology [J].
IEEE Transactions on Consumer Electronics,
2025,
71 (2): 3930-3940., articleTitle=Application of CRNN and OpenGL in Intelligent Landscape Design Systems Utilizing Internet of Things, Explainable Artificial Intelligence, and Drone Technology, refAbstract=null)], funds=null, companyList=[AuthorCompany(id=1268884556133335093, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, xref=1., ext=[AuthorCompanyExt(id=1268884556145918006, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.Institute of Computing Technology, China Academy of Railway Sciences Corporation Limited, Beijing100081, China), AuthorCompanyExt(id=1268884556154306615, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, companyId=1268884556133335093, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1.中国铁道科学研究院集团有限公司 电子计算技术研究所,北京100081)])], figs=[ArticleFig(id=1268884565075591267, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=Mga69QWPI/uRfiw8yUThRA==, figureFileBig=HeNmGk6RQioXXP5abmNlLA==, tableContent=null), ArticleFig(id=1268884565398552676, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图1, caption=
铁路客运敏感信息识别体系框架, figureFileSmall=Mga69QWPI/uRfiw8yUThRA==, figureFileBig=HeNmGk6RQioXXP5abmNlLA==, tableContent=null), ArticleFig(id=1268884565553741925, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=ncbWDPtWJbaZaL8CVpFhhw==, figureFileBig=wSwF/4B0HSQ0OIMXUsfaQw==, tableContent=null), ArticleFig(id=1268884565784428646, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图2, caption=
铁路敏感信息知识库构建技术框架, figureFileSmall=ncbWDPtWJbaZaL8CVpFhhw==, figureFileBig=wSwF/4B0HSQ0OIMXUsfaQw==, tableContent=null), ArticleFig(id=1268884565859926119, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=l3gpRKNCLKMyTt06ayLU2w==, figureFileBig=+yQQWzZBCodjyyZqStcYtg==, tableContent=null), ArticleFig(id=1268884565922840680, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图3, caption=
铁路敏感信息知识库示例, figureFileSmall=l3gpRKNCLKMyTt06ayLU2w==, figureFileBig=+yQQWzZBCodjyyZqStcYtg==, tableContent=null), ArticleFig(id=1268884565989949545, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=qr3L2BW+nboElAMdSTh4+g==, figureFileBig=M6vruPIis7hQv5K6X3RD/g==, tableContent=null), ArticleFig(id=1268884566078029930, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图4, caption=
多模态敏感信息混合识别引擎数据处理链路, figureFileSmall=qr3L2BW+nboElAMdSTh4+g==, figureFileBig=M6vruPIis7hQv5K6X3RD/g==, tableContent=null), ArticleFig(id=1268884566145138795, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=TizC6hhHOXCE5fp1CFiMNQ==, figureFileBig=AYMRaTMEsjQ5NX9pnXSwSg==, tableContent=null), ArticleFig(id=1268884566224830572, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图5, caption=
融合的识别机制框架, figureFileSmall=TizC6hhHOXCE5fp1CFiMNQ==, figureFileBig=AYMRaTMEsjQ5NX9pnXSwSg==, tableContent=null), ArticleFig(id=1268884566291939437, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=8wBT/5WsEkgzN2opagISnw==, figureFileBig=3K5r1FHmGm0U96TycXpnaQ==, tableContent=null), ArticleFig(id=1268884566359048302, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图6, caption=
非结构化数据敏感信息识别模型架构, figureFileSmall=8wBT/5WsEkgzN2opagISnw==, figureFileBig=3K5r1FHmGm0U96TycXpnaQ==, tableContent=null), ArticleFig(id=1268884566463905903, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=H+HZpf6PEmCLIE28OnL2VA==, figureFileBig=F9iwX+h/cfXVUffRTnNVnw==, tableContent=null), ArticleFig(id=1268884566551986288, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图7, caption=
多媒体图像数据敏感信息识别框架, figureFileSmall=H+HZpf6PEmCLIE28OnL2VA==, figureFileBig=F9iwX+h/cfXVUffRTnNVnw==, tableContent=null), ArticleFig(id=1268884566644260977, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=+uFd3k1LtI0bFGgs8dOqcQ==, figureFileBig=gaDPcW+2QOVDbM3AZSVjjQ==, tableContent=null), ArticleFig(id=1268884566732341362, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图8, caption=
铁路客运系统数据流转关系(单位:条), figureFileSmall=+uFd3k1LtI0bFGgs8dOqcQ==, figureFileBig=gaDPcW+2QOVDbM3AZSVjjQ==, tableContent=null), ArticleFig(id=1268884568401674355, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=wIdaWiPZoeVulbwTZe5V/A==, figureFileBig=+QJ94a6gSod7Ig4f4SO4RA==, tableContent=null), ArticleFig(id=1268884568514920564, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图9, caption=
数据血缘关系图谱, figureFileSmall=wIdaWiPZoeVulbwTZe5V/A==, figureFileBig=+QJ94a6gSod7Ig4f4SO4RA==, tableContent=null), ArticleFig(id=1268884568598806645, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=v3IrCW5JlkSgkjwqJZDjYw==, figureFileBig=EFhAmd5tRLlhnAz9HlRLRg==, tableContent=null), ArticleFig(id=1268884568665915510, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=图10, caption=
场景3试验流程, figureFileSmall=v3IrCW5JlkSgkjwqJZDjYw==, figureFileBig=EFhAmd5tRLlhnAz9HlRLRg==, tableContent=null), ArticleFig(id=1268884568749801591, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 名称 | 依据 | 特征描述 | 典型示例 | 敏感程度 |
|---|
| 身份证号 | 《个人信息保护法》第4条 | 唯一绑定自然人身份,泄露可导致诈骗、身份冒用 | 110105******123X | 1.0 |
| 手机号 | 《网络安全法》第41条 | 结合其他信息可定位个人,易引发骚扰电话、钓鱼攻击 | 138****1111 | 0.9 |
| 出行记录 | 《数据安全法》第3条 | 反映个人行为轨迹,泄露可能威胁人身安全 | 20250423高铁G101次北京→上海 | 1.0 |
| 支付信息 | 《网络安全法》第21条 | 直接关联资金安全,泄露可能导致财产损失 | 银行卡号6217****1234 | 1.0 |
| 联系地址 | 《个人信息保护法》第6条 | 住址泄露易引发人身安全风险 | 北京市海淀区**路 | 0.8 |
| 未成年人信息 | 《个人信息保护法》第29条 | 不满14周岁人群信息受特殊保护,泄露危害更严重 | 儿童出生日期、监护人联系方式 | 1.0 |
| 违禁词库 | 法律法规/社会文化 | 暴恐违禁、文本色情、政治敏感、低俗辱骂等 | | 1.0 |
), ArticleFig(id=1268884568829493368, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表1, caption=
敏感信息实体(部分)
, figureFileSmall=null, figureFileBig=null, tableContent=
| 名称 | 依据 | 特征描述 | 典型示例 | 敏感程度 |
|---|
| 身份证号 | 《个人信息保护法》第4条 | 唯一绑定自然人身份,泄露可导致诈骗、身份冒用 | 110105******123X | 1.0 |
| 手机号 | 《网络安全法》第41条 | 结合其他信息可定位个人,易引发骚扰电话、钓鱼攻击 | 138****1111 | 0.9 |
| 出行记录 | 《数据安全法》第3条 | 反映个人行为轨迹,泄露可能威胁人身安全 | 20250423高铁G101次北京→上海 | 1.0 |
| 支付信息 | 《网络安全法》第21条 | 直接关联资金安全,泄露可能导致财产损失 | 银行卡号6217****1234 | 1.0 |
| 联系地址 | 《个人信息保护法》第6条 | 住址泄露易引发人身安全风险 | 北京市海淀区**路 | 0.8 |
| 未成年人信息 | 《个人信息保护法》第29条 | 不满14周岁人群信息受特殊保护,泄露危害更严重 | 儿童出生日期、监护人联系方式 | 1.0 |
| 违禁词库 | 法律法规/社会文化 | 暴恐违禁、文本色情、政治敏感、低俗辱骂等 | | 1.0 |
), ArticleFig(id=1268884568913379449, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 字段类型 | 正则表达式 |
|---|
| 身份证号 | /^[1-6]\d{5}(18|19|20)\d{2}(0[1-9]|1[0-2])(0[1-9]|[12]\d|3[01])\d{3}[\dXx]$/ |
| 手机号 | ^(?:(?:\+|00)86)?1(?:3\d|4[5-79]|5[0-35-9]|6[5-7]|7[0-8]|8\d|9[189])\d{8}$ |
| 电子邮箱 | ^[a-zA-Z0-9.!#$%&'*+/=?^_`{|}~-]+@[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?(?:\.[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)*\.[a-zA-Z]{2,}$ |
), ArticleFig(id=1268884568976294010, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表2, caption=
典型敏感信息字段及正则表达式
, figureFileSmall=null, figureFileBig=null, tableContent=
| 字段类型 | 正则表达式 |
|---|
| 身份证号 | /^[1-6]\d{5}(18|19|20)\d{2}(0[1-9]|1[0-2])(0[1-9]|[12]\d|3[01])\d{3}[\dXx]$/ |
| 手机号 | ^(?:(?:\+|00)86)?1(?:3\d|4[5-79]|5[0-35-9]|6[5-7]|7[0-8]|8\d|9[189])\d{8}$ |
| 电子邮箱 | ^[a-zA-Z0-9.!#$%&'*+/=?^_`{|}~-]+@[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?(?:\.[a-zA-Z0-9](?:[a-zA-Z0-9-]{0,61}[a-zA-Z0-9])?)*\.[a-zA-Z]{2,}$ |
), ArticleFig(id=1268884569064374395, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| Transformer层数 | 特征抽象重点 |
|---|
| 1—4 | 局部短语关联:“G3次”与“上海→北京西”; “身份证”与两个证件号的对应关系; “学生票”“儿童票”“成人票价”的近邻关联。 |
| 5—8 | 跨句逻辑关联:“购买了2张…但按成人票价出”的矛盾关系; “联系电话”与“199XXXX8765”的绑定; “以前可以正常购买”与当前异常的对比。 |
| 9—12 | 整体意图:“咨询学生票购票异常原因,并提供身份信息和联系方式”; 核心实体:身份证号、手机号、车次、时间、上下车站等关键信息的全局定位。 |
), ArticleFig(id=1268884569148260476, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表3, caption=
意图识别结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| Transformer层数 | 特征抽象重点 |
|---|
| 1—4 | 局部短语关联:“G3次”与“上海→北京西”; “身份证”与两个证件号的对应关系; “学生票”“儿童票”“成人票价”的近邻关联。 |
| 5—8 | 跨句逻辑关联:“购买了2张…但按成人票价出”的矛盾关系; “联系电话”与“199XXXX8765”的绑定; “以前可以正常购买”与当前异常的对比。 |
| 9—12 | 整体意图:“咨询学生票购票异常原因,并提供身份信息和联系方式”; 核心实体:身份证号、手机号、车次、时间、上下车站等关键信息的全局定位。 |
), ArticleFig(id=1268884569223757949, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 方案名称 | 动态规则扩展耗时/ms | 百万级数据处理耗时/s |
|---|
| 正则表达式 | | 18.0 |
| 传统AC自动机 | 202 | 10.2 |
| 改进型AC自动机 | 165 | 8.7 |
| 双阶段识别算法 | 127 | 4.6 |
), ArticleFig(id=1268884569337004158, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表4, caption=
结构化数据敏感信息识别模型验证结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 方案名称 | 动态规则扩展耗时/ms | 百万级数据处理耗时/s |
|---|
| 正则表达式 | | 18.0 |
| 传统AC自动机 | 202 | 10.2 |
| 改进型AC自动机 | 165 | 8.7 |
| 双阶段识别算法 | 127 | 4.6 |
), ArticleFig(id=1268884569437667455, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型名称 | 敏感实体F1值/% | 敏感信息上下文误判率/% |
|---|
| 原始BERT-base | 81.22 | 13.22 |
| BERT+规则后处理 | 84.27 | 10.21 |
| 通用BERT | 87.92 | 6.73 |
| 知识增强型BERT | 91.24 | 5.88 |
), ArticleFig(id=1268884569500582016, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表5, caption=
非结构化数据敏感信息识别模型验证结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型名称 | 敏感实体F1值/% | 敏感信息上下文误判率/% |
|---|
| 原始BERT-base | 81.22 | 13.22 |
| BERT+规则后处理 | 84.27 | 10.21 |
| 通用BERT | 87.92 | 6.73 |
| 知识增强型BERT | 91.24 | 5.88 |
), ArticleFig(id=1268884569580273793, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型名称 | F1值 |
|---|
| 原始BERT-base | 76.45 |
| BERT+规则后处理 | 80.12 |
| 通用BERT | 84.05 |
| 知识增强型BERT | 88.66 |
), ArticleFig(id=1268884569659965570, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表6, caption=
鲁棒性测试集上模型F1值对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型名称 | F1值 |
|---|
| 原始BERT-base | 76.45 |
| BERT+规则后处理 | 80.12 |
| 通用BERT | 84.05 |
| 知识增强型BERT | 88.66 |
), ArticleFig(id=1268884569731268739, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型名称 | 字符准确率/% | 字段完整率/% | 模糊图像性能衰减/% | 推理平均耗时/ms |
|---|
| CRNN | 80.94 | 62.41 | -21.71 | 91 |
| SATRN | 87.13 | 64.63 | -16.24 | 172 |
| OCR-Transformer | 93.71 | 91.12 | -8.32 | 128 |
), ArticleFig(id=1268884569819349124, tenantId=1146029695717560320, journalId=1268266580820377661, articleId=1268884547455320084, language=CN, label=表7, caption=
模型验证结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型名称 | 字符准确率/% | 字段完整率/% | 模糊图像性能衰减/% | 推理平均耗时/ms |
|---|
| CRNN | 80.94 | 62.41 | -21.71 | 91 |
| SATRN | 87.13 | 64.63 | -16.24 | 172 |
| OCR-Transformer | 93.71 | 91.12 | -8.32 | 128 |
)], attaches=null, journal=Journal(id=1268263582425694265, delFlag=0, nameCn=中国铁道科学, nameEn=China Railway Science, nameHistory1=null, nameHistory2=null, issn=1001-4632, eissn=null, cn=11-2480/U, coden=null, periodic=1, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=SSf6OdgUxD8PAfXgcRZgdw==, journalPrice=null, startedYear=null, abbrevIsoEn=China Railway Science, journalRemark=null, publicationField=null, createdTime=1780307201251, updatedTime=1780308512476, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=C, firstLetterEn=C, subjectCode=Engineering, subjectName=null, subjectCodeEn=Engineering, subjectNameEn=null, picCn=SSf6OdgUxD8PAfXgcRZgdw==, picEn=hwTX4BvIZYX9jqu505HCNA==, jcr=null, cjcr=null, exts=[JournalExt(id=1268269082185991091, language=CN, name=中国铁道科学, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1780308512493, updatedTime=1780308512493, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://zgtk.chinajournal.net.cn/EditorE3N/index.aspx?t=1, submissionEditorUrl=https://zgtk.chinajournal.net.cn/EditorE3N/index.aspx?t=3, submissionReviewUrl=https://zgtk.chinajournal.net.cn/EditorE3N/index.aspx?t=2, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1268269082236322740, language=EN, name=China Railway Science, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, 
officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1780308512505, updatedTime=1780308512505, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://zgtk.chinajournal.net.cn/EditorE3N/index.aspx?t=1, submissionEditorUrl=https://zgtk.chinajournal.net.cn/EditorE3N/index.aspx?t=3, submissionReviewUrl=https://zgtk.chinajournal.net.cn/EditorE3N/index.aspx?t=2, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1268266580820377661, websiteList=[Website(id=1268603530098148336, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1268266580820377661, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtdkx/CN, language=CN, createTime=1780388251090, createBy=18614031015, updateTime=1780388320535, updateBy=18614031015, name=中国铁道科学-中文, tplId=1146099689490845704, title=中国铁道科学, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1268603928955486234, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=articleTextType, value=kx, createTime=1780388346184, updateTime=1780388346184, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928934514711, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=banner, value=null, createTime=1780388346179, updateTime=1780388346179, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928972263453, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, 
code=grayFlag, value=0, createTime=1780388346188, updateTime=1780388346188, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928926126102, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtdkx/CN/file/pic?fileId=x1EkISp0xx03nZZYvnfO1Q==, createTime=1780388346177, updateTime=1780388346177, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928984846367, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=minRunFlag, value=0, createTime=1780388346191, updateTime=1780388346191, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928947097625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtdkx/CN/file/pic, createTime=1780388346182, updateTime=1780388346182, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928976457758, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=silenceFlag, value=0, createTime=1780388346189, updateTime=1780388346189, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928938709016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1780388346180, updateTime=1780388346180, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928959680539, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=themeColor, value=null, createTime=1780388346185, updateTime=1780388346185, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603928963874844, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530098148336, code=themeStyle, 
value=null, createTime=1780388346186, updateTime=1780388346186, creator=18614031015, updator=18614031015)]), Website(id=1268603530697933815, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1268266580820377661, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/zgtdkx/EN, language=EN, createTime=1780388251232, createBy=18614031015, updateTime=1780388316834, updateBy=18614031015, name=中国铁道科学-英文, tplId=1146101810881728533, title=China Railway Science, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1268603954360385576, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=articleTextType, value=kx, createTime=1780388352241, updateTime=1780388352241, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954339414053, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=banner, value=null, createTime=1780388352236, updateTime=1780388352236, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954381357099, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=grayFlag, value=0, createTime=1780388352246, updateTime=1780388352246, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954331025444, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=logo, value=https://castjournals.cast.org.cn/joweb/zgtdkx/EN/file/pic?fileId=x1EkISp0xx03nZZYvnfO1Q==, createTime=1780388352234, updateTime=1780388352234, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954398134317, tenantId=1146029695717560320, journalId=null, journalGroupId=null, 
siteId=1268603530697933815, code=minRunFlag, value=0, createTime=1780388352250, updateTime=1780388352250, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954356191271, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/zgtdkx/EN/file/pic, createTime=1780388352240, updateTime=1780388352240, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954389745708, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=silenceFlag, value=0, createTime=1780388352248, updateTime=1780388352248, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954347802662, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1780388352238, updateTime=1780388352238, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954368774185, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=themeColor, value=null, createTime=1780388352243, updateTime=1780388352243, creator=18614031015, updator=18614031015), WebsiteProps(id=1268603954377162794, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1268603530697933815, code=themeStyle, value=null, createTime=1780388352245, updateTime=1780388352245, creator=18614031015, updator=18614031015)])], journalTitle=中国铁道科学, weixinUrl=null, journalUrl=https://zgtk.publish.founderss.cn/, iacademicId=null, status=1, seqNo=null, journalTitleEn=China Railway Science, journalPhotoCn=SSf6OdgUxD8PAfXgcRZgdw==, journalPhotoEn=hwTX4BvIZYX9jqu505HCNA==, journalFirstLetter=C, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, 
casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/zgtdkx/CN/10.3969/j.issn.1001-4632.2026.02.20, detailUrlEn=https://castjournals.cast.org.cn/joweb/zgtdkx/EN/10.3969/j.issn.1001-4632.2026.02.20, pdfUrlCn=https://castjournals.cast.org.cn/joweb/zgtdkx/CN/PDF/10.3969/j.issn.1001-4632.2026.02.20, pdfUrlEn=https://castjournals.cast.org.cn/joweb/zgtdkx/EN/PDF/10.3969/j.issn.1001-4632.2026.02.20, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)