Article(id=1228279672316817439, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1228279664221815452, articleNumber=null, orderNo=null, doi=10.12404/j.issn.1671-1815.2409674, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=research-article, receivedDate=1735401600000, receivedDateStr=2024-12-29, revisedDate=1747584000000, revisedDateStr=2025-05-19, acceptedDate=null, acceptedDateStr=null, onlineDate=1770774294213, onlineDateStr=2026-02-11, pubDate=1754582400000, pubDateStr=2025-08-08, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1770774294213, onlineIssueDateStr=2026-02-11, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1770774294213, creator=13701087609, updateTime=1770774294213, updator=13701087609, issue=Issue{id=1228279664221815452, tenantId=1146029695717560320, journalId=1146123166801305609, year='2025', volume='25', issue='22', pageStart='9211', pageEnd='9648', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=1, specialIssue=null, createTime=1770774292283, creator=13701087609, updateTime=1770777611996, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1228293588207992892, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1228279664221815452, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1228293588207992893, tenantId=1146029695717560320, journalId=1146123166801305609, issueId=1228279664221815452, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=9427, endPage=9435, ext={EN=ArticleExt(id=1228279676297212133, articleId=1228279672316817439, tenantId=1146029695717560320, journalId=1146123166801305609, language=EN, title=Spoof Speech Detection with Channel-temporal Attention and Depthwise Separable Convolutions, columnId=1228279665928897192, journalTitle=Science Technology and Engineering, columnName=Papers·Automation and Computational Technology, runingTitle=null, highlight=null, articleAbstract=
The growing sophistication of deepfake speech poses significant security threats to ASV(automatic speaker verification) systems. Current anti-spoofing models based on CNNs(convolutional neural networks) are constrained by inadequate global feature extraction and limited generalization capability against unseen spoofing attacks. To address these challenges, a novel network architecture integrating CT-DSCNet(channel-temporal attention mechanisms with depthwise separable convolutions) was proposed. Building upon the RawNet2 framework, the developed model incorporates dual-domain attention modules to enhance discriminative feature representation while suppressing irrelevant acoustic artifacts. Furthermore, depthwise separable convolutional residual blocks were strategically implemented to optimize computational efficiency and real-time processing capabilities. Comprehensive evaluations were conducted across three benchmark datasets: ASVspoof2019 LA, ASVspoof2021 DF, and FMFCC-A. Experimental results demonstrate state-of-the-art performance with EER(equal error rate) of 1.53% on ASVspoof2019 LA, representing a 70.58% relative improvement over baseline systems. Notably, the proposed architecture exhibits superior cross-dataset generalization, achieving a 25.35% lower EER on the FMFCC-A evaluation set compared with conventional approaches. These findings validate the effectiveness of the hybrid attention-convolution design in advancing spoofing detection robustness and domain adaptability.
, correspAuthors=Hua-peng WANG, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Jia-qi FENG, Hua-peng WANG, Tian-ci LIU), CN=ArticleExt(id=1228279680579596836, articleId=1228279672316817439, tenantId=1146029695717560320, journalId=1146123166801305609, language=CN, title=融合通道-时间注意力和深度可分离卷积的欺骗语音检测, columnId=1228279666075697835, journalTitle=科学技术与工程, columnName=论文·自动化技术、计算机技术, runingTitle=null, highlight=null, articleAbstract=
自动说话人验证系统在应对日益逼真的深度伪造语音时,面临显著的欺骗攻击威胁。现有基于卷积神经网络的反欺骗模型在捕捉全局特征与应对未知类型语音伪造的泛化性能方面存在不足。为提升反欺骗检测效果,提出了一种融合通道-时间注意力机制与深度可分离卷积的网络模型CT-DSCNet。该模型在RawNet2基础上引入通道-时间注意力模块,增强对重要语音特征的关注,减少无关区域的干扰;同时采用深度可分离卷积残差块,优化计算效率与模型实时性。实验在ASVspoof2019、ASVspoof2021和FMFCC-A数据集上进行,结果显示CT-DSCNet在ASVspoof2019 LA测试集上的等错误率(equal error rate,EER)达到1.53%,较基线模型降低70.58%。在泛化能力方面相较其他模型也表现出色,在FMFCC-A评估集上的EER,较改进前模型相比提高了25.35%。实验验证了该方法在提升伪造语音检测性能和跨数据集适应性方面的有效性。
, correspAuthors=王华朋, authorNote=null, correspAuthorsNote=
, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=iYgLqVOKpjgouuRbMptRaQ==, magXml=2CORVIugeXj8pw+B7CjmeA==, pdfUrl=null, pdf=HqLbYQDJiUC7A46HpHXNNQ==, pdfFileSize=5941079, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=6AldmGDA75yvdy3BIRsjFA==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=PhemLeLFEBRdby+QZ+CW3w==, mapNumber=null, authorCompany=null, fund=null, authors=
, authorsList=冯嘉琪, 王华朋, 刘天赐)}, authors=[Author(id=1228369848326095702, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=18240668287@163.com, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1228369849722798937, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, authorId=1228369848326095702, language=EN, stringName=Jia-qi FENG, firstName=Jia-qi, middleName=null, lastName=FENG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1228369849836045149, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, authorId=1228369848326095702, language=CN, stringName=冯嘉琪, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854, bio={"content":"
冯嘉琪(2001—),女,汉族,河南新乡人,硕士研究生。研究方向:深度学习、语音检验。E-mail:18240668287@163.com。
"}, bioImg=null, bioContent=
冯嘉琪(2001—),女,汉族,河南新乡人,硕士研究生。研究方向:深度学习、语音检验。E-mail:18240668287@163.com。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1228369848238015313, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, xref=null, ext=[AuthorCompanyExt(id=1228369848242209618, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China), AuthorCompanyExt(id=1228369848250598227, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854)])]), Author(id=1228369849940902753, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=huapeng.wang@hotmail.com, emailSecond=null, emailThird=null, correspondingAuthor=1, authorType=1, ext={EN=AuthorExt(id=1228369850028983142, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, authorId=1228369849940902753, language=EN, stringName=Hua-peng WANG, firstName=Hua-peng, middleName=null, lastName=WANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1228369850146423656, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, authorId=1228369849940902753, language=CN, stringName=王华朋, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
*, address=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1228369848238015313, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, xref=null, ext=[AuthorCompanyExt(id=1228369848242209618, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China), AuthorCompanyExt(id=1228369848250598227, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854)])]), Author(id=1228369850251281262, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1228369850364527474, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, authorId=1228369850251281262, language=EN, stringName=Tian-ci LIU, firstName=Tian-ci, middleName=null, lastName=LIU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1228369850498745206, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, authorId=1228369850251281262, language=CN, stringName=刘天赐, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1228369848238015313, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, xref=null, ext=[AuthorCompanyExt(id=1228369848242209618, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China), AuthorCompanyExt(id=1228369848250598227, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854)])])], keywords=[Keyword(id=1228369850708460416, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, orderNo=1, keyword=deepfake speech), Keyword(id=1228369850783957892, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, orderNo=2, keyword=attention mechanism), Keyword(id=1228369850880426891, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, orderNo=3, keyword=depthwise separable convolution), Keyword(id=1228369850955924369, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, orderNo=4, keyword=speech anti-spoofing), Keyword(id=1228369851127890836, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, orderNo=1, keyword=深度伪造语音), Keyword(id=1228369851224359831, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, orderNo=2, keyword=注意力机制), Keyword(id=1228369851295663002, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, orderNo=3, keyword=深度可分离卷积), Keyword(id=1228369851375354783, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, orderNo=4, keyword=语音反欺骗)], refs=[Reference(id=1228369855850676305, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=5329, pageEnd=5333, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=Snyder D, Garcia-Romero D, Sell G, journalName=IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP), refType=null, unstructuredReference=
Snyder D,
Garcia-Romero D,
Sell G, et al. X-vectors: robust DNN embeddings for speaker recognition[C]//
IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP). Calgary: IEEE,
2018: 5329-5333., articleTitle=X-vectors: robust DNN embeddings for speaker recognition, refAbstract=null), Reference(id=1228369855934562390, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=2037, pageEnd=2041, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=Wu Z, Kinnunen T, Evans N, ASVspoof, journalName=Interspeech 2015, refType=null, unstructuredReference=
Wu Z,
Kinnunen T,
Evans N, et al. ASVspoof 2015: the first automatic speaker verification spoofing and countermeasures challenge[C]//
Interspeech 2015. Singapore: ISCA,
2015: 2037-2041., articleTitle=the first automatic speaker verification spoofing and countermeasures challenge, refAbstract=null), Reference(id=1228369856068780128, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2021, volume=3, issue=2, pageStart=252, pageEnd=265, url=null, language=null, rfNumber=[3], rfOrder=2, authorNames=Nautsch A, Wang X, Evans N, journalName=IEEE Transactions on Biometrics, Behavior, and Identity Science, refType=null, unstructuredReference=
Nautsch A,
Wang X,
Evans N, et al. ASVspoof 2019: spoofing counter measures for the detection of synthesized, converted and replayed speech[J].
IEEE Transactions on Biometrics, Behavior, and Identity Science,
2021,
3(2): 252-265., articleTitle=ASVspoof 2019: spoofing counter measures for the detection of synthesized, converted and replayed speech, refAbstract=null), Reference(id=1228369856161054823, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=2, pageEnd=6, url=null, language=null, rfNumber=[4], rfOrder=3, authorNames=Kinnunen T, Sahidullah M D, Delgado H, TheASVspoof, journalName=Interspeech 2017, refType=null, unstructuredReference=
Kinnunen T,
Sahidullah M D,
Delgado H, et al.
TheASVspoof 2017 challenge: assessing the limits of replay spoofing attack detection[C]//
Interspeech 2017. Singapore: ISCA,
2017: 2-6., articleTitle=assessing the limits of replay spoofing attack detection, refAbstract=null), Reference(id=1228369856236552300, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=47, pageEnd=54, url=null, language=null, rfNumber=[5], rfOrder=4, authorNames=Yamagishi J, Wang X, Todisco M, journalName=Edition of the Automatic Speaker Verification and Spoofing Countermeasures Challenge, refType=null, unstructuredReference=
Yamagishi J,
Wang X,
Todisco M, et al. ASVspoof 2021: accelerating progress in spoofed and deepfake speech detection[C]//
Edition of the Automatic Speaker Verification and Spoofing Countermeasures Challenge. Singapore: ISCA,
2021: 47-54., articleTitle=ASVspoof 2021: accelerating progress in spoofed and deepfake speech detection, refAbstract=null), Reference(id=1228369856333021300, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2020, volume=35, issue=5, pageStart=807, pageEnd=823, url=null, language=null, rfNumber=[6], rfOrder=5, authorNames=张雄伟, 李嘉康, 孙蒙, journalName=数据采集与处理, refType=null, unstructuredReference=张雄伟, 李嘉康, 孙蒙, 等. 语音欺骗检测方法的研究现状及展望[J].
数据采集与处理,
2020,
35(5): 807-823., articleTitle=语音欺骗检测方法的研究现状及展望, refAbstract=null), Reference(id=1228369856463044735, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2020, volume=35, issue=5, pageStart=807, pageEnd=823, url=null, language=null, rfNumber=[6], rfOrder=6, authorNames=Zhang Xiongwei, Li Jiakang, Sun Meng, journalName=Journal of Data Acquisition and Processing, refType=null, unstructuredReference=
Zhang Xiongwei,
Li Jiakang,
Sun Meng, et al. Speech anti-spoofing: the state of the art and prospects[J].
Journal of Data Acquisition and Processing,
2020,
35(5): 807-823., articleTitle=Speech anti-spoofing: the state of the art and prospects, refAbstract=null), Reference(id=1228369856559513733, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2017, volume=45, issue=null, pageStart=516, pageEnd=535, url=null, language=null, rfNumber=[7], rfOrder=7, authorNames=Todisco M, Delgado H, Evans N, journalName=Computer Speech & Language, refType=null, unstructuredReference=
Todisco M,
Delgado H,
Evans N. Constant Q cepstral coefficients: a spoofing countermeasure for automatic speaker verification[J].
Computer Speech & Language,
2017,
45: 516-535., articleTitle=Constant Q cepstral coefficients: a spoofing countermeasure for automatic speaker verification, refAbstract=null), Reference(id=1228369856672759951, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=29, issue=null, pageStart=1462, pageEnd=1466, url=null, language=null, rfNumber=[8], rfOrder=8, authorNames=Cui S, Huang B, Huang J, journalName=IEEE Signal Processing Letters, refType=null, unstructuredReference=
Cui S,
Huang B,
Huang J, et al. Synthetic speech detection based on local autoregression and variance statistics[J].
IEEE Signal Processing Letters,
2022,
29: 1462-1466., articleTitle=Synthetic speech detection based on local autoregression and variance statistics, refAbstract=null), Reference(id=1228369856781811860, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=2062, pageEnd=2066, url=null, language=null, rfNumber=[9], rfOrder=9, authorNames=Patel T B, Patil H A, journalName=Interspeech 2015, refType=null, unstructuredReference=
Patel T B,
Patil H A. Combining evidences from mel cepstral, cochlear filter cepstral and instantaneous frequency features for detection of natural vs. spoofed speech[C]//
Interspeech 2015. Singapore: ISCA,
2015: 2062-2066., articleTitle=Combining evidences from mel cepstral, cochlear filter cepstral and instantaneous frequency features for detection of natural vs. spoofed speech, refAbstract=null), Reference(id=1228369856949584028, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2020, volume=2020, issue=null, pageStart=1101, pageEnd=1105, url=null, language=null, rfNumber=[10], rfOrder=10, authorNames=Wu Z, Das R K, Yang J, journalName=Interspeech, refType=null, unstructuredReference=
Wu Z,
Das R K,
Yang J, et al. Light convolutional neural network with feature genuinization for detection of synthetic speech attacks[J].
Interspeech,
2020,
2020: 1101-1105., articleTitle=Light convolutional neural network with feature genuinization for detection of synthetic speech attacks, refAbstract=null), Reference(id=1228369857067024549, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=6367, pageEnd=6371, url=null, language=null, rfNumber=[11], rfOrder=11, authorNames=Jung J W, Heo H S, Tak H, journalName=ICASSP 2022—2022 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP), refType=null, unstructuredReference=
Jung J W,
Heo H S,
Tak H, et al. AASIST: audio anti-spoofing using integrated spectro-temporal graph attention networks[C]//
ICASSP 2022—2022 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP). Singapore: ICASSP,
2022: 6367-6371., articleTitle=AASIST: audio anti-spoofing using integrated spectro-temporal graph attention networks, refAbstract=null), Reference(id=1228369857289322676, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=6377, pageEnd=6381, url=null, language=null, rfNumber=[12], rfOrder=12, authorNames=Lei Z, Yan H, Liu C, journalName=ICASSP 2022—2022 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP), refType=null, unstructuredReference=
Lei Z,
Yan H,
Liu C, et al. Two-path GMM-ResNet and GMM-SENet for ASV spoofing detection[C]//
ICASSP 2022—2022 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP). Singapore: ICASSP,
2022: 6377-6381., articleTitle=Two-path GMM-ResNet and GMM-SENet for ASV spoofing detection, refAbstract=null), Reference(id=1228369858597945532, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2023, volume=11, issue=null, pageStart=140443, pageEnd=140450, url=null, language=null, rfNumber=[13], rfOrder=13, authorNames=Hu C, Zhou R, Yuan Q, journalName=IEEE Access, refType=null, unstructuredReference=
Hu C,
Zhou R,
Yuan Q. Synthetic speech spoofing detection based on online hard example mining[J].
IEEE Access,
2023,
11: 140443-140450., articleTitle=Synthetic speech spoofing detection based on online hard example mining, refAbstract=null), Reference(id=1228369858732163268, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=1, pageEnd=8, url=null, language=null, rfNumber=[14], rfOrder=14, authorNames=Tak H, Jung J W, Patino J, journalName=Edition of the Automatic Speaker Verification and Spoofing Countermeasures Challenge, refType=null, unstructuredReference=
Tak H,
Jung J W,
Patino J, et al. End-to-end spectro-temporal graph attention networks for speaker verification anti-spoofing and speech deepfake detection[C]//
Edition of the Automatic Speaker Verification and Spoofing Countermeasures Challenge. Singapore: ISCA,
2021: 1-8., articleTitle=End-to-end spectro-temporal graph attention networks for speaker verification anti-spoofing and speech deepfake detection, refAbstract=null), Reference(id=1228369858832826572, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=2356, pageEnd=2360, url=null, language=null, rfNumber=[15], rfOrder=15, authorNames=Tak H, Jung J W, Patino J, journalName=Interspeech, refType=null, unstructuredReference=
Tak H,
Jung J W,
Patino J, et al. Graph attention networks for anti-spoofing[C]//
Interspeech: International Conference on Speech Communication and Technology. Brno: ISCA,
2021: 2356-2360., articleTitle=Graph attention networks for anti-spoofing, refAbstract=null), Reference(id=1228369858950267095, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=22, issue=18, pageStart=7937, pageEnd=7944, url=null, language=null, rfNumber=[16], rfOrder=16, authorNames=杨海涛, 王华朋, 楚宪腾, journalName=科学技术与工程, refType=null, unstructuredReference=杨海涛, 王华朋, 楚宪腾, 等. 基于卷积循环神经网络的语音逻辑攻击检测[J].
科学技术与工程,
2022,
22(18): 7937-7944., articleTitle=基于卷积循环神经网络的语音逻辑攻击检测, refAbstract=null), Reference(id=1228369859055124702, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=22, issue=18, pageStart=7937, pageEnd=7944, url=null, language=null, rfNumber=[16], rfOrder=17, authorNames=Yang Haitao, Wang Huapeng, Chu Xianteng, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Yang Haitao,
Wang Huapeng,
Chu Xianteng, et al. Speech logic attack detection based on CNN-RNN-DNN network[J].
Science Technology and Engineering,
2022,
22(18): 7937-7944., articleTitle=Speech logic attack detection based on CNN-RNN-DNN network, refAbstract=null), Reference(id=1228369859155788010, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=6369, pageEnd=6373, url=null, language=null, rfNumber=[17], rfOrder=18, authorNames=Tak H, Patino J, Todisco M, journalName=ICASSP 2021—2021 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP), refType=null, unstructuredReference=
Tak H,
Patino J,
Todisco M, et al. End-to-end anti-spoofing with RawNet2[C]//
ICASSP 2021—2021 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP). Singapore: ICASSP,
2021: 6369-6373., articleTitle=End-to-end anti-spoofing with RawNet2, refAbstract=null), Reference(id=1228369859239674098, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=4381, pageEnd=4385, url=null, language=null, rfNumber=[18], rfOrder=19, authorNames=Zhang L, Li Y, Zhao H, journalName=Interspeech 2022, refType=null, unstructuredReference=
Zhang L,
Li Y,
Zhao H, et al. Backend ensemble for speaker verification and spoofing countermeasure[C]//
Interspeech 2022. Singapore: ISCA,
2022: 4381-4385., articleTitle=Backend ensemble for speaker verification and spoofing countermeasure, refAbstract=null), Reference(id=1228369859382280443, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2023, volume=null, issue=null, pageStart=1, pageEnd=5, url=null, language=null, rfNumber=[19], rfOrder=20, authorNames=Liu X, Liu M, Wang L, journalName=ICASSP 2023—2023 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP), refType=null, unstructuredReference=
Liu X,
Liu M,
Wang L, et al. Leveraging positional-related local-global dependency for synthetic speech detection[C]//
ICASSP 2023—2023 IEEE International Conference on Acoustics, Speech and Signal Processing(ICASSP). Rhodes Island: IEEE,
2023: 1-5., articleTitle=Leveraging positional-related local-global dependency for synthetic speech detection, refAbstract=null), Reference(id=1228369859478749446, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=null, pageStart=306, pageEnd=310, url=null, language=null, rfNumber=[20], rfOrder=21, authorNames=Ta B T, Nguyen T L, Dang D S, journalName=IEEE Ninth International Conference on Communications and Electronics(ICCE), refType=null, unstructuredReference=
Ta B T,
Nguyen T L,
Dang D S, et al. A multi-task conformer for spoofing aware speaker verification[C]//
IEEE Ninth International Conference on Communications and Electronics(ICCE). Nha Trang: ICCE,
2022: 306-310., articleTitle=A multi-task conformer for spoofing aware speaker verification, refAbstract=null), Reference(id=1228369859571024141, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=27, pageStart=11763, pageEnd=11773, url=null, language=null, rfNumber=[21], rfOrder=22, authorNames=万玫汐, 王华朋, 闫道申, journalName=科学技术与工程, refType=null, unstructuredReference=万玫汐, 王华朋, 闫道申, 等. 基于改进ECAPA-TDNN的法庭自动说话人识别[J].
科学技术与工程,
2024,
24(27): 11763-11773., articleTitle=基于改进ECAPA-TDNN的法庭自动说话人识别, refAbstract=null), Reference(id=1228369859705241881, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=27, pageStart=11763, pageEnd=11773, url=null, language=null, rfNumber=[21], rfOrder=23, authorNames=Wan Meixi, Wang Huapeng, Yan Daoshen, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Wan Meixi,
Wang Huapeng,
Yan Daoshen, et al. Forensic automatic speaker recognition based on enhanced ECAPA-TDNN[J].
Science Technology and Engineering,
2024,
24(27): 11763-11773., articleTitle=Forensic automatic speaker recognition based on enhanced ECAPA-TDNN, refAbstract=null), Reference(id=1228369859793322272, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=null, volume=null, issue=null, pageStart=1704.04861, pageEnd=null, url=null, language=null, rfNumber=[22], rfOrder=24, authorNames=Howard A, Zhu M, Chen B, journalName=arXiv: 2017, refType=null, unstructuredReference=
Howard A,
Zhu M,
Chen B, et al. MobileNets: efficient convolutional neural networks for mobile vision applications[J].
arXiv: 2017, 1704.04861., articleTitle=MobileNets: efficient convolutional neural networks for mobile vision applications, refAbstract=null), Reference(id=1228369859902374184, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1800, pageEnd=1807, url=null, language=null, rfNumber=[23], rfOrder=25, authorNames=Chollet F, journalName=IEEE Conference on Computer Vision and Pattern Recognition(CVPR), refType=null, unstructuredReference=
Chollet F. Xception: deep learning with depthwise separable convolutions[C]//
IEEE Conference on Computer Vision and Pattern Recognition(CVPR). Honolulu: IEEE Computer Society,
2017: 1800-1807., articleTitle=Xception: deep learning with depthwise separable convolutions, refAbstract=null), Reference(id=1228369860024009010, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2020, volume=64, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[24], rfOrder=26, authorNames=Wang X, Yamagishi J, Todisco M, journalName=Computer Speech & Language, refType=null, unstructuredReference=
Wang X,
Yamagishi J,
Todisco M, et al. ASVspoof 2019: a large-scale public database of synthesized, converted and replayed speech[J].
Computer Speech & Language,
2020,
64.DOI:
10.48550/arXiv. 1911.01601., articleTitle=ASVspoof 2019: a large-scale public database of synthesized, converted and replayed speech, refAbstract=null), Reference(id=1228369860116283707, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2110, volume=null, issue=null, pageStart=09441, pageEnd=null, url=null, language=null, rfNumber=[25], rfOrder=27, authorNames=Zhang Z, Gu Y, Yi X, journalName=arXiv: 2021, refType=null, unstructuredReference=
Zhang Z,
Gu Y,
Yi X, et al. FMFCC-A: a challenging mandarin dataset for synthetic speech detection[J].
arXiv: 2021,
2110.09441., articleTitle=FMFCC-A: a challenging mandarin dataset for synthetic speech detection, refAbstract=null), Reference(id=1228369860250501450, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2017, volume=45, issue=null, pageStart=516, pageEnd=535, url=null, language=null, rfNumber=[26], rfOrder=28, authorNames=Todisco M, Delgado H, Evans N, journalName=Computer Speech & Language, refType=null, unstructuredReference=
Todisco M,
Delgado H,
Evans N. Constant Q cepstral coefficients: a spoofing countermeasure for automatic speaker verification[J].
Computer Speech & Language,
2017,
45: 516-535., articleTitle=Constant Q cepstral coefficients: a spoofing countermeasure for automatic speaker verification, refAbstract=null), Reference(id=1228369860380524884, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2015, volume=null, issue=null, pageStart=2087, pageEnd=2091, url=null, language=null, rfNumber=[27], rfOrder=29, authorNames=Sahidullah M, Kinnunen T, Hanilçi C, journalName=Interspeech, refType=null, unstructuredReference=
Sahidullah M,
Kinnunen T,
Hanilçi C. A comparison of features for synthetic speech detection[C]//
Interspeech: International Conference on Speech Communication and Technology. Singapore: ISCA,
2015: 2087-2091., articleTitle=A comparison of features for synthetic speech detection, refAbstract=null), Reference(id=1228369860485382493, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2021, volume=null, issue=null, pageStart=4259, pageEnd=4263, url=null, language=null, rfNumber=[28], rfOrder=30, authorNames=Wang X, Yamagishi J, journalName=Interspeech, refType=null, unstructuredReference=
Wang X,
Yamagishi J. A comparative study on recent neural spoofing countermeasures for synthetic speech detection[C]//
Interspeech: International Conference on Speech Communication and Technology. Singapore: ISCA,
2021: 4259-4263., articleTitle=A comparative study on recent neural spoofing countermeasures for synthetic speech detection, refAbstract=null), Reference(id=1228369860619600231, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=7, pageStart=2804, pageEnd=2812, url=null, language=null, rfNumber=[29], rfOrder=31, authorNames=李俊屿, 卜凡亮, 谭林, journalName=科学技术与工程, refType=null, unstructuredReference=李俊屿, 卜凡亮, 谭林, 等. 基于多模态共享网络的自监督语音-人脸跨模态关联学习方法[J].
科学技术与工程,
2024,
24(7): 2804-2812., articleTitle=基于多模态共享网络的自监督语音-人脸跨模态关联学习方法, refAbstract=null), Reference(id=1228369860737040756, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, doi=null, pmid=null, pmcid=null, year=2024, volume=24, issue=7, pageStart=2804, pageEnd=2812, url=null, language=null, rfNumber=[29], rfOrder=32, authorNames=Li Junyu, Bu Fanliang, Tan Lin, journalName=Science Technology and Engineering, refType=null, unstructuredReference=
Li Junyu,
Bu Fanliang,
Tan Lin, et al. Self-supervised voice-face cross-modal association learning method
via multi-modal shared network[J].
Science Technology and Engineering,
2024,
24(7): 2804-2812., articleTitle=Self-supervised voice-face cross-modal association learning method
via multi-modal shared network, refAbstract=null)], funds=[Fund(id=1228369855242502184, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, awardId=2017YFC0821000, language=CN, fundingSource=国家重点研发计划(2017YFC0821000), fundOrder=null, country=null), Fund(id=1228369855347359790, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, awardId=司法鉴定科学研究院, language=CN, fundingSource=司法部司法鉴定重点实验室(司法鉴定科学研究院), fundOrder=null, country=null), Fund(id=1228369855460606004, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, awardId=KF202117, language=CN, fundingSource=司法部司法鉴定重点实验室(KF202117), fundOrder=null, country=null), Fund(id=1228369855573852222, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, awardId=2024YCZD05, language=CN, fundingSource=中国刑事警察学院研究生创新能力提升项目(2024YCZD05), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1228369848238015313, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, xref=null, ext=[AuthorCompanyExt(id=1228369848242209618, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=College of Public Security Information Technology and Intelligence, Criminal Investigation Police University of China, Shenyang 110854, China), AuthorCompanyExt(id=1228369848250598227, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, companyId=1228369848238015313, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=中国刑事警察学院公安信息技术与情报学院, 沈阳 110854)])], figs=[ArticleFig(id=1228369851589264296, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Fig.1, caption=
RawNet2 network architecture, figureFileSmall=oQBcYy1wW5/uFEyuaD57jA==, figureFileBig=HblCuMuK9oA4mbSQUEmLVg==, tableContent=null), ArticleFig(id=1228369851719287724, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=图1, caption=
RawNet2网络结构图, figureFileSmall=oQBcYy1wW5/uFEyuaD57jA==, figureFileBig=HblCuMuK9oA4mbSQUEmLVg==, tableContent=null), ArticleFig(id=1228369851840922547, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Fig.2, caption=
Schematic of depthwise separable convolution, figureFileSmall=pNTgHtQPCLNnT6dVbYquaw==, figureFileBig=1QCFPRh4QWcbG9aeF4Ut4g==, tableContent=null), ArticleFig(id=1228369851937391544, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=图2, caption=
深度可分离卷积示意图, figureFileSmall=pNTgHtQPCLNnT6dVbYquaw==, figureFileBig=1QCFPRh4QWcbG9aeF4Ut4g==, tableContent=null), ArticleFig(id=1228369852046443452, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Fig.3, caption=
General structure chart, figureFileSmall=+W0K+oiIju8UvJ9pcTnd6w==, figureFileBig=SGoaTC3zqdu3SvfsyDPWCg==, tableContent=null), ArticleFig(id=1228369852138718143, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=图3, caption=
总体结构图, figureFileSmall=+W0K+oiIju8UvJ9pcTnd6w==, figureFileBig=SGoaTC3zqdu3SvfsyDPWCg==, tableContent=null), ArticleFig(id=1228369852218409921, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Fig.4, caption=
Depthwise separable cconvolutional residual block, figureFileSmall=Dm1PgKzFy3zqtvnHtwPLfg==, figureFileBig=XhWqMpnzX5A7LfRhb9MC4w==, tableContent=null), ArticleFig(id=1228369852293907399, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=图4, caption=
深度可分离卷积残差块, figureFileSmall=Dm1PgKzFy3zqtvnHtwPLfg==, figureFileBig=XhWqMpnzX5A7LfRhb9MC4w==, tableContent=null), ArticleFig(id=1228369852386182094, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Fig.5, caption=
Residual block number and weighted method ablation experiment, figureFileSmall=rJr0NkkDq7w00TXnbyrMCg==, figureFileBig=qR/7tplBgCf4HiJUinzn9A==, tableContent=null), ArticleFig(id=1228369852495234006, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=图5, caption=
残差块数量和加权方法消融实验, figureFileSmall=rJr0NkkDq7w00TXnbyrMCg==, figureFileBig=qR/7tplBgCf4HiJUinzn9A==, tableContent=null), ArticleFig(id=1228369852570731481, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Table 1, caption=
CT-DSCNet network structure
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模块名称 | 内容 | 输出参数 |
| SinConv | 一维卷积+ BN+SeLU | (8,1 28, 64 472) |
| 通道-时间注意力 | 通道注意力块+ 时间注意力块+ 动态权重 | (8, 512, 16 118) |
| GRU | GRU(1 024) | (8, 16 118, 1 024) |
| 全连接层 | 1 024 | (8, 16 118, 512) |
| 全局池化 | — | (8,512) |
| 输出 | — | (8, 2) |
), ArticleFig(id=1228369852675589089, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=表1, caption=
CT-DSCNet网络结构
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模块名称 | 内容 | 输出参数 |
| SinConv | 一维卷积+ BN+SeLU | (8,1 28, 64 472) |
| 通道-时间注意力 | 通道注意力块+ 时间注意力块+ 动态权重 | (8, 512, 16 118) |
| GRU | GRU(1 024) | (8, 16 118, 1 024) |
| 全连接层 | 1 024 | (8, 16 118, 512) |
| 全局池化 | — | (8,512) |
| 输出 | — | (8, 2) |
), ArticleFig(id=1228369852780446692, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Table 2, caption=
Details of ASVspoof2019 LA dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 数据集 | 说话人数量 | 真实语音 | 合成语音 | 伪造种类 |
| 训练集 | 20 | 2 580 | 22 800 | A01-A06 |
| 开发集 | 20 | 2 548 | 22 296 | A01-A06 |
| 测试集 | 48 | 7 355 | 63 382 | A07-A19 |
), ArticleFig(id=1228369854172955626, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=表2, caption=
ASVspoof2019LA数据集详情
, figureFileSmall=null, figureFileBig=null, tableContent=
| 数据集 | 说话人数量 | 真实语音 | 合成语音 | 伪造种类 |
| 训练集 | 20 | 2 580 | 22 800 | A01-A06 |
| 开发集 | 20 | 2 548 | 22 296 | A01-A06 |
| 测试集 | 48 | 7 355 | 63 382 | A07-A19 |
), ArticleFig(id=1228369854340727793, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Table 3, caption=
Details of different evaluation dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 数据集 | 真实语音 | 合成语音 | 伪造种类 |
| ASVspoof2019LA测试集 | 7 355 | 63 382 | 13(A07-A19) |
| ASVspoof2021DF测试集 | 18 452 | 163 114 | >100(未知攻击) |
| FMFCC-A测试集 | 3 000 | 17 000 | 13(TTS系统) |
), ArticleFig(id=1228369854428808182, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=表3, caption=
不同测试集详情
, figureFileSmall=null, figureFileBig=null, tableContent=
| 数据集 | 真实语音 | 合成语音 | 伪造种类 |
| ASVspoof2019LA测试集 | 7 355 | 63 382 | 13(A07-A19) |
| ASVspoof2021DF测试集 | 18 452 | 163 114 | >100(未知攻击) |
| FMFCC-A测试集 | 3 000 | 17 000 | 13(TTS系统) |
), ArticleFig(id=1228369854533665789, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Table 4, caption=
Results of ablation experiments on the ASVspoof2019LA dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | EER/% | min tDCF |
| CA | TA | DSConv |
| — | — | — | 4.86 | 0.119 5 |
| √ | — | — | 3.67 | 0.098 8 |
| — | √ | — | 2.52 | 0.078 4 |
| √ | √ | — | 1.98 | 0.057 6 |
| √ | √ | √ | 1.43 | 0.043 2 |
), ArticleFig(id=1228369854646910980, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=表4, caption=
ASVspoof2019LA数据集消融实验结果
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | EER/% | min tDCF |
| CA | TA | DSConv |
| — | — | — | 4.86 | 0.119 5 |
| √ | — | — | 3.67 | 0.098 8 |
| — | √ | — | 2.52 | 0.078 4 |
| √ | √ | — | 1.98 | 0.057 6 |
| √ | √ | √ | 1.43 | 0.043 2 |
), ArticleFig(id=1228369854722408457, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Table 5, caption=
EER for ablation experiments on the FMFCC-A evaluation dataset
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | EER/% |
| RawNet2[16] | 26.63 |
| RawNet2# | 30.19 |
| RawNet2#+CA | 25.28 |
| RawNet2#+TA | 22.30 |
| RawNet2#+CA+TA | 20.59 |
| RawNet2#+CA+TA+DSC(CT-DSCNet) | 19.88 |
), ArticleFig(id=1228369854823071761, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=表5, caption=
在FMFCC-A评估集上消融实验的EER
, figureFileSmall=null, figureFileBig=null, tableContent=
| 模型 | EER/% |
| RawNet2[16] | 26.63 |
| RawNet2# | 30.19 |
| RawNet2#+CA | 25.28 |
| RawNet2#+TA | 22.30 |
| RawNet2#+CA+TA | 20.59 |
| RawNet2#+CA+TA+DSC(CT-DSCNet) | 19.88 |
), ArticleFig(id=1228369854911152150, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=EN, label=Table 6, caption=
Comparison of the CT-DSCNet with other models EER
, figureFileSmall=null, figureFileBig=null, tableContent=
| 系统 | ASVspoof2019LA | ASVspoof2021LA | ASVspoof2021DF |
| CQCC-GMM[27] | 9.57 | 15.62 | 25.56 |
| LFCC-GMM[28] | 8.09 | 19.30 | 25.25 |
| LFCC-LCNN[27] | — | 9.26 | 28.48 |
| RawNet2[16] | 4.86 | 9.50 | 22.38 |
| AASIST[11] | 1.04 | 6.24 | 20.29 |
| Rawformer[18] | 1.05 | 4.98 | — |
| CT-DSCNet | 1.43 | 3.86 | 18.01 |
), ArticleFig(id=1228369854990843930, tenantId=1146029695717560320, journalId=1146123166801305609, articleId=1228279672316817439, language=CN, label=表6, caption=
CT-DSCNet与其他模型EER的比较
, figureFileSmall=null, figureFileBig=null, tableContent=
| 系统 | ASVspoof2019LA | ASVspoof2021LA | ASVspoof2021DF |
| CQCC-GMM[27] | 9.57 | 15.62 | 25.56 |
| LFCC-GMM[28] | 8.09 | 19.30 | 25.25 |
| LFCC-LCNN[27] | — | 9.26 | 28.48 |
| RawNet2[16] | 4.86 | 9.50 | 22.38 |
| AASIST[11] | 1.04 | 6.24 | 20.29 |
| Rawformer[18] | 1.05 | 4.98 | — |
| CT-DSCNet | 1.43 | 3.86 | 18.01 |
)], attaches=null, journal=Journal(id=1146119176004939786, delFlag=0, nameCn=科学技术与工程, nameEn=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, issn=1671-1815, eissn=, cn=11-4688/T, coden=null, periodic=4, language=CN, oaType=是, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=UKU/O7GSka5polgCTkbIIw==, journalPrice=null, startedYear=null, abbrevIsoEn=Sci Technol Eng, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1754445529766, createdBy=null, updatedBy=13701087609, firstLetterCn=S, firstLetterEn=S, subjectCode=Natural Sciences, subjectName=自然科学, subjectCodeEn=Natural Sciences, subjectNameEn=null, picCn=UKU/O7GSka5polgCTkbIIw==, picEn=5hwlULoNwcbj3xUmVi9MAQ==, jcr=null, cjcr=null, exts=[JournalExt(id=1159791870395564357, language=CN, name=科学技术与工程, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529793, updatedTime=1754445529793, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=http://www.stae.com.cn/jsygc/site/menus/20090429150146001, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1159791870441701702, language=EN, name=Science Technology and Engineering, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=http://www.stae.com.cn/jsygc/home, createdTime=1754445529804, updatedTime=1754445529804, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=http://www.stae.com.cn/jsygc/author/login, submissionEditorUrl=http://www.stae.com.cn/jsygc/editor/login, submissionReviewUrl=http://www.stae.com.cn/jsygc/reviewer/login, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1146123166801305609, websiteList=[Website(id=1148243202391400884, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/CN, language=CN, createTime=1751692112777, createBy=18614031015, updateTime=1753520965431, updateBy=18614031015, name=科学技术与工程-中文站点, tplId=1146099689490845704, title=科学技术与工程, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148622798802673703, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=articleTextType, value=kx, createTime=1751782615614, updateTime=1751782615614, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798781702180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=banner, value=null, createTime=1751782615609, updateTime=1751782615609, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798769119267, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1751782615606, updateTime=1751782615606, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798794285094, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782615612, updateTime=1751782615612, creator=18614031015, updator=18614031015), WebsiteProps(id=1148622798790090789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202391400884, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782615611, updateTime=1751782615611, creator=18614031015, updator=18614031015)]), Website(id=1155914124811976731, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146123166801305609, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/kxjsygc/EN, language=EN, createTime=1753521003206, createBy=18614031015, updateTime=1753521003206, updateBy=18614031015, name=科学技术与工程-英文站点, tplId=1146101810881728533, title=Science Technology and Engineering, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155914371227308235, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=articleTextType, value=kx, createTime=1753521061952, updateTime=1753521061952, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371210531016, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=banner, value=null, createTime=1753521061947, updateTime=1753521061947, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371202142407, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=j86gbwi+p0Idkyl5SzIlmQ==, createTime=1753521061945, updateTime=1753521061945, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371223113930, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753521061950, updateTime=1753521061950, creator=18614031015, updator=18614031015), WebsiteProps(id=1155914371218919625, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155914124811976731, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753521061949, updateTime=1753521061949, creator=18614031015, updator=18614031015)])], journalTitle=科学技术与工程, weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Science Technology and Engineering, journalPhotoCn=UKU/O7GSka5polgCTkbIIw==, journalPhotoEn=5hwlULoNwcbj3xUmVi9MAQ==, journalFirstLetter=S, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/10.12404/j.issn.1671-1815.2409674, detailUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/10.12404/j.issn.1671-1815.2409674, pdfUrlCn=https://castjournals.cast.org.cn/joweb/kxjsygc/CN/PDF/10.12404/j.issn.1671-1815.2409674, pdfUrlEn=https://castjournals.cast.org.cn/joweb/kxjsygc/EN/PDF/10.12404/j.issn.1671-1815.2409674, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)