Article(id=1220368076957208837, tenantId=1146029695717560320, journalId=1146119989267898375, issueId=1220368072699986922, articleNumber=null, orderNo=null, doi=10.7654/j.issn.2097-1974.20250601, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=research-article, receivedDate=1751644800000, receivedDateStr=2025-07-05, revisedDate=1757865600000, revisedDateStr=2025-09-15, acceptedDate=null, acceptedDateStr=null, onlineDate=1768888022889, onlineDateStr=2026-01-20, pubDate=1766592000000, pubDateStr=2025-12-25, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1768888022889, onlineIssueDateStr=2026-01-20, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1768888022889, creator=13701087609, updateTime=1768888022889, updator=13701087609, issue=Issue{id=1220368072699986922, tenantId=1146029695717560320, journalId=1146119989267898375, year='2025', volume='48', issue='6', pageStart='1', pageEnd='106', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=null, createTime=1768888021873, creator=13701087609, updateTime=1768888582821, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1220370425566118679, tenantId=1146029695717560320, journalId=1146119989267898375, issueId=1220368072699986922, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1220370425570312984, tenantId=1146029695717560320, journalId=1146119989267898375, issueId=1220368072699986922, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=1, endPage=9, ext={EN=ArticleExt(id=1220368077271781639, articleId=1220368076957208837, tenantId=1146029695717560320, 
journalId=1146119989267898375, language=EN, title=Attitude Control of High-speed Vehicles Based on Improved TD3 Reinforcement Learning, columnId=1154057568293999177, journalTitle=Missiles and Space Vehicles, columnName=Launch Vehicle and Missile, runingTitle=null, highlight=null, articleAbstract=
To address the challenges of strong nonlinearity, high uncertainty, and rapidly time-varying parameters during the reentry phase of high-speed vehicles, this study proposes an end-to-end intelligent attitude control method based on an improved Twin Delayed Deep Deterministic Policy Gradient (TD3) algorithm, aligned with the demands of intelligent spacecraft development. To overcome the training instability and convergence difficulties of TD3-based attitude control learning, two key innovations are introduced. First, a hybrid reward mechanism combining continuous tracking error penalties and sparse task-completion rewards is designed within the Markov Decision Process framework to synergistically guide agent convergence. Second, prior knowledge constraints derived from modern control theory are incorporated into the training process, and a behavior cloning-based optimization strategy for the Actor network is proposed to balance expert experience imitation and cumulative reward maximization. Simulation results show that the proposed method can accurately track the three-channel attitude commands under 14 combinations of parameter deviations.
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Weili WANG, Wanwei HUANG, Xiaodong LIU, Kunfeng LU, Chenhui JIA), CN=ArticleExt(id=1220368079935164706, articleId=1220368076957208837, tenantId=1146029695717560320, journalId=1146119989267898375, language=CN, title=基于改进型TD3强化学习的高速飞行器姿态控制, columnId=1154057568814092874, journalTitle=导弹与航天运载技术(中英文), columnName=运载器及导弹总体技术, runingTitle=null, highlight=null, articleAbstract=
针对高速飞行器再入段面临的强非线性、高不确定性以及参数快时变等挑战,结合航天器智能化发展需求,提出了一种改进型的双延迟深度确定性策略梯度(Twin Delayed Deep Deterministic Policy Gradient,TD3)端到端智能姿态控制方法。为解决TD3算法在姿态控制学习过程中存在训练不稳定、收敛困难的问题,在其马尔可夫决策过程中,设计了混合奖励机制,融合连续跟踪误差惩罚和稀疏任务完成奖励,协同引导智能体收敛;在其训练过程中,引入基于现代控制理论的先验知识约束,提出了基于行为克隆的Actor网络优化更新策略,以平衡专家经验模仿与累计回报最大化目标。仿真结果表明,在14种参数偏差组合的工况下,所提方法能够精确跟踪三通道姿态指令。
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=zoeMds9kydM2qRBy+JBlJg==, magXml=8NJkGaWluWSOikQRUTjrug==, pdfUrl=null, pdf=csrVoAizV5M55Qiwx/B8Qw==, pdfFileSize=2452360, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=Z5yNutYvEhj9ORCqs04PPA==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=yAguE0gbogfC37Kvv+T9rQ==, mapNumber=null, authorCompany=null, fund=null, authors=
王伟丽(1997—),女,博士研究生,主要研究方向为飞行器智能控制、自适应控制等。
黄万伟(1970—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
刘晓东(1987—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
路坤锋(1983—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
贾晨辉(1985—),男,博士,高级工程师,主要研究方向为飞行器制导与控制、智能控制等。
, authorsList=王伟丽, 黄万伟, 刘晓东, 路坤锋, 贾晨辉)}, authors=[Author(id=1220376972228739344, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1220376972300042514, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, authorId=1220376972228739344, language=EN, stringName=Weili WANG, firstName=Weili, middleName=null, lastName=WANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1220376972354568467, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, authorId=1220376972228739344, language=CN, stringName=王伟丽, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854, bio={"content":"
王伟丽(1997—),女,博士研究生,主要研究方向为飞行器智能控制、自适应控制等。
"}, bioImg=null, bioContent=
王伟丽(1997—),女,博士研究生,主要研究方向为飞行器智能控制、自适应控制等。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1220376972165824780, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, xref=null, ext=[AuthorCompanyExt(id=1220376972174213389, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854), AuthorCompanyExt(id=1220376972178407694, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854)])]), Author(id=1220376972417483029, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1220376972476203287, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, authorId=1220376972417483029, language=EN, stringName=Wanwei HUANG, firstName=Wanwei, middleName=null, lastName=HUANG, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1220376972530729240, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, 
authorId=1220376972417483029, language=CN, stringName=黄万伟, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854, bio={"content":"
黄万伟(1970—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
"}, bioImg=null, bioContent=
黄万伟(1970—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1220376972165824780, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, xref=null, ext=[AuthorCompanyExt(id=1220376972174213389, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854), AuthorCompanyExt(id=1220376972178407694, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854)])]), Author(id=1220376972597838106, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1220376972664946972, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, authorId=1220376972597838106, language=EN, stringName=Xiaodong LIU, firstName=Xiaodong, middleName=null, lastName=LIU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1220376972732055837, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, 
authorId=1220376972597838106, language=CN, stringName=刘晓东, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854, bio={"content":"
刘晓东(1987—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
"}, bioImg=null, bioContent=
刘晓东(1987—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1220376972165824780, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, xref=null, ext=[AuthorCompanyExt(id=1220376972174213389, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854), AuthorCompanyExt(id=1220376972178407694, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854)])]), Author(id=1220376972786581791, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1220376972862079265, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, authorId=1220376972786581791, language=EN, stringName=Kunfeng LU, firstName=Kunfeng, middleName=null, lastName=LU, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1220376972924993826, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, 
authorId=1220376972786581791, language=CN, stringName=路坤锋, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854, bio={"content":"
路坤锋(1983—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
"}, bioImg=null, bioContent=
路坤锋(1983—),男,博士,研究员,主要研究方向为飞行器制导与控制、智能控制、自适应控制等。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1220376972165824780, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, xref=null, ext=[AuthorCompanyExt(id=1220376972174213389, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854), AuthorCompanyExt(id=1220376972178407694, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854)])]), Author(id=1220376974195867940, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, orderNo=4, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1220376974317502758, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, authorId=1220376974195867940, language=EN, stringName=Chenhui JIA, firstName=Chenhui, middleName=null, lastName=JIA, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1220376974472692007, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, 
authorId=1220376974195867940, language=CN, stringName=贾晨辉, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=null, address=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854, bio={"content":"
贾晨辉(1985—),男,博士,高级工程师,主要研究方向为飞行器制导与控制、智能控制等。
"}, bioImg=null, bioContent=
贾晨辉(1985—),男,博士,高级工程师,主要研究方向为飞行器制导与控制、智能控制等。
, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1220376972165824780, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, xref=null, ext=[AuthorCompanyExt(id=1220376972174213389, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854), AuthorCompanyExt(id=1220376972178407694, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854)])])], keywords=[Keyword(id=1220376974623686952, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, orderNo=1, keyword=high-speed vehicles), Keyword(id=1220376974699184425, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, orderNo=2, keyword=attitude control), Keyword(id=1220376974757904682, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, orderNo=3, keyword=deep reinforcement learning), Keyword(id=1220376974833402155, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, orderNo=4, keyword=behavior cloning), Keyword(id=1220376974917288236, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, orderNo=5, keyword=strongly adaptive control), Keyword(id=1220376974976008493, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, orderNo=1, 
keyword=高速飞行器), Keyword(id=1220376975038923054, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, orderNo=2, keyword=姿态控制), Keyword(id=1220376975114420527, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, orderNo=3, keyword=深度强化学习), Keyword(id=1220376975210889520, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, orderNo=4, keyword=行为克隆), Keyword(id=1220376975269609777, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, orderNo=5, keyword=强适应控制)], refs=[Reference(id=1220376977333207373, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2023, volume=6, issue=3, pageStart=39, pageEnd=51, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=刘双喜, 刘世俊, 李勇, journalName=空天防御, refType=null, unstructuredReference=刘双喜, 刘世俊, 李勇, 等. 国外高超声速飞行器及防御体系发展现状[J].
空天防御,
2023,
6(3): 39-51., articleTitle=国外高超声速飞行器及防御体系发展现状, refAbstract=null), Reference(id=1220376977391927630, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2023, volume=6, issue=3, pageStart=39, pageEnd=51, url=null, language=null, rfNumber=[1], rfOrder=1, authorNames=LIU Shuangxi, LIU Shijun, LI Yong, journalName=Air and Space Defense, refType=null, unstructuredReference=
LIU Shuangxi,
LIU Shijun,
LI Yong, et al. Current developments in foreign hypersonic vehicles and defense systems[J].
Air and Space Defense,
2023,
6(3): 39-51., articleTitle=null, refAbstract=null), Reference(id=1220376978679578959, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=1, pageStart=64, pageEnd=70, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=樊轶, 秦昌茂, 董添, journalName=导弹与航天运载技术(中英文), refType=null, unstructuredReference=樊轶, 秦昌茂, 董添, 等. 基于MIMO-ESO的高速飞行器自抗扰控制[J].
导弹与航天运载技术(中英文),
2024(1): 64-70., articleTitle=基于MIMO-ESO的高速飞行器自抗扰控制, refAbstract=null), Reference(id=1220376978767659344, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2024, volume=null, issue=1, pageStart=64, pageEnd=70, url=null, language=null, rfNumber=[2], rfOrder=3, authorNames=FAN Yi, QIN Changmao, DONG Tian, journalName=Missiles and Space Vehicles, refType=null, unstructuredReference=
FAN Yi,
QIN Changmao,
DONG Tian, et al. ADRC attitude controller design for hypersonic vehicle based on MIMO-ESO[J].
Missiles and Space Vehicles,
2024(1): 64-70., articleTitle=null, refAbstract=null), Reference(id=1220376978834768209, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2021, volume=42, issue=11, pageStart=8, pageEnd=17, url=null, language=null, rfNumber=[3], rfOrder=4, authorNames=包为民, journalName=航空学报, refType=null, unstructuredReference=包为民. 航天智能控制技术让运载火箭“会学习”[J].
航空学报,
2021,
42(11): 8-17., articleTitle=航天智能控制技术让运载火箭“会学习”, refAbstract=null), Reference(id=1220376978910265682, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2021, volume=42, issue=11, pageStart=8, pageEnd=17, url=null, language=null, rfNumber=[3], rfOrder=5, authorNames=BAO Weimin, journalName=Acta Aeronautica et Astronautica Sinica, refType=null, unstructuredReference=
BAO Weimin. Space intelligent control technology enables launch vehicle to “self-learning”[J].
Acta Aeronautica et Astronautica Sinica,
2021,
42(11): 8-17., articleTitle=null, refAbstract=null), Reference(id=1220376978977374547, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2022, volume=9, issue=9, pageStart=1561, pageEnd=1573, url=null, language=null, rfNumber=[4], rfOrder=6, authorNames=ZHANG Z Y, MO Z B, CHEN Y T, journalName=IEEE-CAA Journal of Automatica Sinica, refType=null, unstructuredReference=
ZHANG Z Y,
MO Z B,
CHEN Y T, et al. Reinforcement learning behavioral control for nonlinear autonomous system[J].
IEEE-CAA Journal of Automatica Sinica,
2022,
9(9): 1561-1573., articleTitle=Reinforcement learning behavioral control for nonlinear autonomous system, refAbstract=null), Reference(id=1220376979044483412, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=null, issue=22, pageStart=8187, pageEnd=8199, url=null, language=null, rfNumber=[5], rfOrder=7, authorNames=LUO B, SUN J Y, TANG R, journalName=IEEE Transactions on Automation Science and Engineering, refType=null, unstructuredReference=
LUO B,
SUN J Y,
TANG R, et al. Reinforcement learning-based 3D trajectory tracking control of hypersonic gliding vehicles with time-varying uncertainties[J].
IEEE Transactions on Automation Science and Engineering,
2025(22): 8187-8199., articleTitle=Reinforcement learning-based 3D trajectory tracking control of hypersonic gliding vehicles with time-varying uncertainties, refAbstract=null), Reference(id=1220376979107397973, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=96, pageStart=105537, pageEnd=null, url=null, language=null, rfNumber=[6], rfOrder=8, authorNames=LIU C, DONG C Y, ZHOU Z J, journalName=Aerospace Science and Technology, refType=null, unstructuredReference=
LIU C,
DONG C Y,
ZHOU Z J, et al. Barrier Lyapunov function based reinforcement learning control for air-breathing hypersonic vehicle with variable geometry inlet[J].
Aerospace Science and Technology,
2020(96): 105537., articleTitle=Barrier Lyapunov function based reinforcement learning control for air-breathing hypersonic vehicle with variable geometry inlet, refAbstract=null), Reference(id=1220376979174506838, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=8, issue=2, pageStart=201, pageEnd=209, url=null, language=null, rfNumber=[7], rfOrder=9, authorNames=LU K F, WANG W L, LIU X D, journalName=Advances in Astronautics, refType=null, unstructuredReference=
LU K F,
WANG W L,
LIU X D, et al. Research progress and prospect of high-speed vehicle control technology based on reinforcement learning[J].
Advances in Astronautics,
2025,
8(2): 201-209., articleTitle=Research progress and prospect of high-speed vehicle control technology based on reinforcement learning, refAbstract=null), Reference(id=1220376979233227095, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2022, volume=null, issue=198, pageStart=606, pageEnd=616, url=null, language=null, rfNumber=[8], rfOrder=10, authorNames=WANG G, AN H, WANG Y, journalName=Acta Astronautica, refType=null, unstructuredReference=
WANG G,
AN H,
WANG Y, et al. Intelligent control of air-breathing hypersonic vehicles subject to path and angle-of-attack constraints[J].
Acta Astronautica,
2022(198): 606-616., articleTitle=Intelligent control of air-breathing hypersonic vehicles subject to path and angle-of-attack constraints, refAbstract=null), Reference(id=1220376979317113176, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2024, volume=31, issue=4, pageStart=577, pageEnd=582, url=null, language=null, rfNumber=[9], rfOrder=11, authorNames=GAO Q, LI X, JI Y, journalName=Control Engineering of China, refType=null, unstructuredReference=
GAO Q,
LI X,
JI Y, et al. Research on active disturbance rejection control of hypersonic vehicle based on Q-learning[J].
Control Engineering of China,
2024,
31(4): 577-582., articleTitle=Research on active disturbance rejection control of hypersonic vehicle based on Q-learning, refAbstract=null), Reference(id=1220376979380027737, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2024, volume=36, issue=8, pageStart=4071, pageEnd=4081, url=null, language=null, rfNumber=[10], rfOrder=12, authorNames=LI X, JI Y H, SONG Y, journalName=Neural Computing and Applications, refType=null, unstructuredReference=
LI X,
JI Y H,
SONG Y, et al. Modified deep deterministic policy gradient based on active disturbance rejection control for hypersonic vehicles[J].
Neural Computing and Applications,
2024,
36(8): 4071-4081., articleTitle=Modified deep deterministic policy gradient based on active disturbance rejection control for hypersonic vehicles, refAbstract=null), Reference(id=1220376979451330906, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2024, volume=45, issue=7, pageStart=1100, pageEnd=1110, url=null, language=null, rfNumber=[11], rfOrder=13, authorNames=路坤锋, 贾晨辉, 黄旭, journalName=宇航学报, refType=null, unstructuredReference=路坤锋, 贾晨辉, 黄旭, 等. 面向变构型飞行器的强化学习位置姿态一体化控制方法[J].
宇航学报,
2024,
45(7): 1100-1110., articleTitle=面向变构型飞行器的强化学习位置姿态一体化控制方法, refAbstract=null), Reference(id=1220376979514245467, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2024, volume=45, issue=7, pageStart=1100, pageEnd=1110, url=null, language=null, rfNumber=[11], rfOrder=14, authorNames=LU Kunfeng, JIA Chenhui, HUANG Xu, journalName=Journal of Astronautics, refType=null, unstructuredReference=
LU Kunfeng,
JIA Chenhui,
HUANG Xu, et al. Reinforcement learning-based integrated position and attitude control method towards morphing flight vehicles[J].
Journal of Astronautics,
2024,
45(7): 1100-1110., articleTitle=null, refAbstract=null), Reference(id=1220376979589742940, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=46, issue=8, pageStart=298, pageEnd=313, url=null, language=null, rfNumber=[12], rfOrder=15, authorNames=姜凌峰, 李新凯, 张海, journalName=航空学报, refType=null, unstructuredReference=姜凌峰, 李新凯, 张海, 等. 基于改进TD3算法的无人机动态环境无地图导航[J].
航空学报,
2025,
46(8): 298-313., articleTitle=基于改进TD3算法的无人机动态环境无地图导航, refAbstract=null), Reference(id=1220376979652657501, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=46, issue=8, pageStart=298, pageEnd=313, url=null, language=null, rfNumber=[12], rfOrder=16, authorNames=JIANG Lingfeng, LI Xinkai, ZHANG Hai, journalName=Acta Aeronautica et Astronautica Sinica, refType=null, unstructuredReference=
JIANG Lingfeng,
LI Xinkai,
ZHANG Hai, et al. Mapless navigation of UAVs in dynamic environments based on an improved TD3 algorithm[J].
Acta Aeronautica et Astronautica Sinica,
2025,
46(8): 298-313., articleTitle=null, refAbstract=null), Reference(id=1220376979707183454, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=34, issue=2, pageStart=61, pageEnd=73, url=null, language=null, rfNumber=[13], rfOrder=17, authorNames=彭博, 王晓波, 魏祥麟, journalName=计算机系统应用, refType=null, unstructuredReference=彭博, 王晓波, 魏祥麟, 等. 基于SPER-TD3的无人机编队三维航迹规划[J].
计算机系统应用,
2025,
34(2): 61-73., articleTitle=基于SPER-TD3的无人机编队三维航迹规划, refAbstract=null), Reference(id=1220376979765903711, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=34, issue=2, pageStart=61, pageEnd=73, url=null, language=null, rfNumber=[13], rfOrder=18, authorNames=PENG Bo, WANG Xiaobo, WEI Xianglin, journalName=Computer Systems & Applications, refType=null, unstructuredReference=
PENG Bo,
WANG Xiaobo,
WEI Xianglin, et al. 3D trajectory planning for unmanned aerial vehicle formation based on SPER-TD3[J].
Computer Systems & Applications,
2025,
34(2): 61-73., articleTitle=null, refAbstract=null), Reference(id=1220376979824623968, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=42, issue=4, pageStart=1003, pageEnd=1010, url=null, language=null, rfNumber=[14], rfOrder=19, authorNames=闫雷鸣, 刘健, 朱永昕, journalName=计算机应用研究, refType=null, unstructuredReference=闫雷鸣, 刘健, 朱永昕. DPC-DQRL: 动态行为克隆约束的离线-在线双Q值强化学习[J].
计算机应用研究,
2025,
42(4): 1003-1010., articleTitle=DPC-DQRL: 动态行为克隆约束的离线-在线双Q值强化学习, refAbstract=null), Reference(id=1220376979887538529, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2025, volume=42, issue=4, pageStart=1003, pageEnd=1010, url=null, language=null, rfNumber=[14], rfOrder=20, authorNames=YAN Leiming, LIU Jian, ZHU Yongxin, journalName=Application Research of Computers, refType=null, unstructuredReference=
YAN Leiming,
LIU Jian,
ZHU Yongxin. DPC-DQRL: offline to online double Q value reinforcement learning with dynamic behavior cloning constraints[J].
Application Research of Computers,
2025,
42(4): 1003-1010., articleTitle=null, refAbstract=null), Reference(id=1220376979954647394, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2015, volume=36, issue=8, pageStart=916, pageEnd=922, url=null, language=null, rfNumber=[15], rfOrder=21, authorNames=刘晓东, 黄万伟, 禹春梅, journalName=宇航学报, refType=null, unstructuredReference=刘晓东, 黄万伟, 禹春梅. 含扩张状态观测器的高超声速飞行器动态面姿态控制[J].
宇航学报,
2015,
36(8): 916-922., articleTitle=含扩张状态观测器的高超声速飞行器动态面姿态控制, refAbstract=null), Reference(id=1220376980021756259, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2015, volume=36, issue=8, pageStart=916, pageEnd=922, url=null, language=null, rfNumber=[15], rfOrder=22, authorNames=LIU Xiaodong, HUANG Wanwei, YU Chunmei, journalName=Journal of Astronautics, refType=null, unstructuredReference=
LIU Xiaodong,
HUANG Wanwei,
YU Chunmei. Dynamic surface attitude control for hypersonic vehicle containing extended state observer[J].
Journal of Astronautics,
2015,
36(8): 916-922., articleTitle=null, refAbstract=null), Reference(id=1220376980088865124, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2023, volume=44, issue=8, pageStart=1113, pageEnd=1126, url=null, language=null, rfNumber=[16], rfOrder=23, authorNames=黄旭, 柳嘉润, 张远, journalName=宇航学报, refType=null, unstructuredReference=黄旭, 柳嘉润, 张远, 等. 知识与数据混合驱动的高速飞行控制方法综述[J].
宇航学报,
2023,
44(8): 1113-1126., articleTitle=知识与数据混合驱动的高速飞行控制方法综述, refAbstract=null), Reference(id=1220376980155973989, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2023, volume=44, issue=8, pageStart=1113, pageEnd=1126, url=null, language=null, rfNumber=[16], rfOrder=24, authorNames=HUANG Xu, LIU Jiarun, ZHANG Yuan, journalName=Journal of Astronautics, refType=null, unstructuredReference=
HUANG Xu,
LIU Jiarun,
ZHANG Yuan, et al. Review on knowledge-based and data-driver cooperating control methods of high-speed vehicle[J].
Journal of Astronautics,
2023,
44(8): 1113-1126., articleTitle=null, refAbstract=null), Reference(id=1220376980214694246, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=66, pageStart=164, pageEnd=175, url=null, language=null, rfNumber=[17], rfOrder=25, authorNames=LIU X, HUANG W, DU L, journalName=ISA Transactions, refType=null, unstructuredReference=
LIU X,
HUANG W,
DU L. An integrated guidance and control approach in three-dimensional space for hypersonic missile constrained by impact angles[J].
ISA Transactions,
2017(66): 164-175., articleTitle=An integrated guidance and control approach in three-dimensional space for hypersonic missile constrained by impact angles, refAbstract=null)], funds=[Fund(id=1220376977190601036, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, awardId=U24B20159, language=CN, fundingSource=国家自然科学基金(U24B20159), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1220376972165824780, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, xref=null, ext=[AuthorCompanyExt(id=1220376972174213389, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=National Key Laboratory of Science and Technology on Aerospace Intelligent Control, Beijing AerospaceAutomatic Control Institute, Beijing, 100854), AuthorCompanyExt(id=1220376972178407694, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, companyId=1220376972165824780, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=北京航天自动控制研究所,宇航智能控制技术全国重点实验室,北京,100854)])], figs=[ArticleFig(id=1220376975433187634, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.1, caption=
Typical unpowered high-speed vehicle, figureFileSmall=rb3v+lObYXMR8Yo4pmSgmQ==, figureFileBig=VekLGfCfNZqNaGndzZAoaQ==, tableContent=null), ArticleFig(id=1220376975508685107, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图1, caption=
典型的无动力高速飞行器, figureFileSmall=rb3v+lObYXMR8Yo4pmSgmQ==, figureFileBig=VekLGfCfNZqNaGndzZAoaQ==, tableContent=null), ArticleFig(id=1220376975592571188, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.2, caption=
Online deployment of neural network model, figureFileSmall=P0ZyBkwZs9seTISyF0fKIA==, figureFileBig=2/KIidyeOQp5DpHvDMB14w==, tableContent=null), ArticleFig(id=1220376975663874357, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图2, caption=
神经网络模型的在线部署, figureFileSmall=P0ZyBkwZs9seTISyF0fKIA==, figureFileBig=2/KIidyeOQp5DpHvDMB14w==, tableContent=null), ArticleFig(id=1220376975726788918, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.3, caption=
Typical parameters of standard trajectories, figureFileSmall=geQ6cFh08dKvMW/Tp5IxLQ==, figureFileBig=uwOyyywQomyFnnjMmcU0EQ==, tableContent=null), ArticleFig(id=1220376975781314871, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图3, caption=
标准轨迹的典型参数, figureFileSmall=geQ6cFh08dKvMW/Tp5IxLQ==, figureFileBig=uwOyyywQomyFnnjMmcU0EQ==, tableContent=null), ArticleFig(id=1220376975840035128, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.4, caption=
Reward progression during training, figureFileSmall=QWRn34i3EGroLjq9m8WXGw==, figureFileBig=gIAEhwYna4DZ5Mo34oPIcA==, tableContent=null), ArticleFig(id=1220376975894561081, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图4, caption=
训练过程中的奖励值, figureFileSmall=QWRn34i3EGroLjq9m8WXGw==, figureFileBig=gIAEhwYna4DZ5Mo34oPIcA==, tableContent=null), ArticleFig(id=1220376975944892730, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.5, caption=
Attitude angle tracking effect, figureFileSmall=/dTNg7/rII8/hwnPvhG4CQ==, figureFileBig=WlkYokS99cEXAdVAzcjQAw==, tableContent=null), ArticleFig(id=1220376976024584507, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图5, caption=
姿态角跟踪效果, figureFileSmall=/dTNg7/rII8/hwnPvhG4CQ==, figureFileBig=WlkYokS99cEXAdVAzcjQAw==, tableContent=null), ArticleFig(id=1220376976074916156, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.6, caption=
Attitude angle tracking error, figureFileSmall=D4H94agU1Cq21w2pVMunRQ==, figureFileBig=o8qimmT9Vg60eqGmWLsp6g==, tableContent=null), ArticleFig(id=1220376976146219325, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图6, caption=
姿态角跟踪误差, figureFileSmall=D4H94agU1Cq21w2pVMunRQ==, figureFileBig=o8qimmT9Vg60eqGmWLsp6g==, tableContent=null), ArticleFig(id=1220376976225911102, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Fig.7, caption=
Three-axis rudder deflection of the KG-TD3 method, figureFileSmall=JHkOozLrZIqjsyrk1oj9Ew==, figureFileBig=SnCP8uWitNY26z+fUcJmgA==, tableContent=null), ArticleFig(id=1220376976276242751, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=图7, caption=
基于KG-TD3方法的三轴舵偏, figureFileSmall=JHkOozLrZIqjsyrk1oj9Ew==, figureFileBig=SnCP8uWitNY26z+fUcJmgA==, tableContent=null), ArticleFig(id=1220376976339157312, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 1: | 随机初始化策略网络和价值网络、 |
| 2: | 初始化目标策略网络参数和目标价值网络、 |
| 3: | 初始化经验回放缓冲区 |
| 4: | for episode = 1 todo |
| 5: | 初始化噪声用于噪声探索 |
| 6: | 策略网络接收初始观察状态 |
| 7: | fortodo |
| 8: | 根据当前策略和探索噪声选择动作 |
| 9: | 执行动作,获取奖励,观测新状态 |
| 10: | 经验存储:在中存储 |
| 11: | 经验回放:从中随机取出个 |
| 12: | |
| 13: | 两个目标价值网络预测:() |
| 14: | |
| 15: | 两个价值网络预测: |
| 16: | 最小化损失函数: 更新价值网络 |
| 17: | if mod then |
| 18: | |
| 19: | 最小化损失函数,更新策略网络 |
|
| 20: | 软更新目标策略网络 |
| 21: | 软更新目标价值网络 |
| 22: | end if |
| 23: | end for |
| 24: | end for |
), ArticleFig(id=1220376976439820609, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=, caption=, figureFileSmall=null, figureFileBig=null, tableContent=
| 1: | 随机初始化策略网络和价值网络、 |
| 2: | 初始化目标策略网络参数和目标价值网络、 |
| 3: | 初始化经验回放缓冲区 |
| 4: | for episode = 1 todo |
| 5: | 初始化噪声用于噪声探索 |
| 6: | 策略网络接收初始观察状态 |
| 7: | fortodo |
| 8: | 根据当前策略和探索噪声选择动作 |
| 9: | 执行动作,获取奖励,观测新状态 |
| 10: | 经验存储:在中存储 |
| 11: | 经验回放:从中随机取出个 |
| 12: | |
| 13: | 两个目标价值网络预测:() |
| 14: | |
| 15: | 两个价值网络预测: |
| 16: | 最小化损失函数: 更新价值网络 |
| 17: | if mod then |
| 18: | |
| 19: | 最小化损失函数,更新策略网络 |
|
| 20: | 软更新目标策略网络 |
| 21: | 软更新目标价值网络 |
| 22: | end if |
| 23: | end for |
| 24: | end for |
), ArticleFig(id=1220376976523706690, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Tab.1, caption=
Aircraft body parameters
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 数值 |
|---|
| /kg | 1 000 |
| /m | 0.7 |
| /(kg·m-2) | 3 000 |
| /m2 | 0.45 |
| /(kg·m-2) | 200 |
| /(kg·m-2) | 2 800 |
), ArticleFig(id=1220376976590815555, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=表1, caption=
飞行器机体参数
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 数值 |
|---|
| /kg | 1 000 |
| /m | 0.7 |
| /(kg·m-2) | 3 000 |
| /m2 | 0.45 |
| /(kg·m-2) | 200 |
| /(kg·m-2) | 2 800 |
), ArticleFig(id=1220376976645341508, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Tab.2, caption=
Network structure of the KG-TD3 algorithm
, figureFileSmall=null, figureFileBig=null, tableContent=
| 网络名称 | 层类型 | 神经元个数 | 激活函数 |
|---|
| Actor | 输入层 | 6 | None |
| 全连接层 | 128 | Relu |
| 输出层 | 3 | Tanh |
| Critic | 输入层 | 9 | None |
| 全连接层 | 512 | Relu |
| 全连接层 | 256 | Relu |
| 输出层 | 1 | Linear |
), ArticleFig(id=1220376976725033285, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=表2, caption=
KG-TD3算法的网络结构
, figureFileSmall=null, figureFileBig=null, tableContent=
| 网络名称 | 层类型 | 神经元个数 | 激活函数 |
|---|
| Actor | 输入层 | 6 | None |
| 全连接层 | 128 | Relu |
| 输出层 | 3 | Tanh |
| Critic | 输入层 | 9 | None |
| 全连接层 | 512 | Relu |
| 全连接层 | 256 | Relu |
| 输出层 | 1 | Linear |
), ArticleFig(id=1220376976775364934, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Tab.3, caption=
KG-TD3 algorithm training process hyper-parameters
, figureFileSmall=null, figureFileBig=null, tableContent=
| 超参数 | 数值 |
|---|
| 探索噪声 | |
| 目标策略平滑噪声 | |
| 延迟更新策略 | 2 |
| 目标网络更新率 | 0.005 |
| 批量大小 | 128 |
| Actor学习率 | |
| Critic学习率 | |
| 行为克隆权重 | 0.1 |
), ArticleFig(id=1220376976834085191, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=表3, caption=
KG-TD3算法训练过程超参数
, figureFileSmall=null, figureFileBig=null, tableContent=
| 超参数 | 数值 |
|---|
| 探索噪声 | |
| 目标策略平滑噪声 | |
| 延迟更新策略 | 2 |
| 目标网络更新率 | 0.005 |
| 批量大小 | 128 |
| Actor学习率 | |
| Critic学习率 | |
| 行为克隆权重 | 0.1 |
), ArticleFig(id=1220376976892805448, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Tab.4, caption=
Margins of error for parameters
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 偏差范围 |
|---|
| /(°) | 1 |
| /(°) | 3 |
| 10% |
| 20% |
| 15% |
| 20% |
| 20% |
| /(°) | 1 |
| 10% |
| 10% |
| 15% |
| 15% |
| 20% |
| 20% |
), ArticleFig(id=1220376976951525705, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=表4, caption=
参数偏差范围
, figureFileSmall=null, figureFileBig=null, tableContent=
| 参数 | 偏差范围 |
|---|
| /(°) | 1 |
| /(°) | 3 |
| 10% |
| 20% |
| 15% |
| 20% |
| 20% |
| /(°) | 1 |
| 10% |
| 10% |
| 15% |
| 15% |
| 20% |
| 20% |
), ArticleFig(id=1220376977010245962, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=EN, label=Tab.5, caption=
Comparison of attitude angle tracking errors
, figureFileSmall=null, figureFileBig=null, tableContent=
| 最大误差 | TD3 | KG-TD3 |
|---|
| MAX_/(°) | 2.403 | 0.420 |
| MAX_/(°) | 0.836 | 0.528 |
| MAX_/(°) | 34.563 | 0.725 |
), ArticleFig(id=1220376977073160523, tenantId=1146029695717560320, journalId=1146119989267898375, articleId=1220368076957208837, language=CN, label=表5, caption=
姿态角跟踪误差对比
, figureFileSmall=null, figureFileBig=null, tableContent=
| 最大误差 | TD3 | KG-TD3 |
|---|
| MAX_/(°) | 2.403 | 0.420 |
| MAX_/(°) | 0.836 | 0.528 |
| MAX_/(°) | 34.563 | 0.725 |
)], attaches=null, journal=Journal(id=1146118917132496903, delFlag=0, nameCn=导弹与航天运载技术(中英文), nameEn=Missiles and Space Vehicles, nameHistory1=null, nameHistory2=null, issn=2097-1974, eissn=, cn=10-1807/V, coden=null, periodic=1, language=CN, oaType=否, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=DdfacUcWE1ibGHaCsbhL8w==, journalPrice=null, startedYear=null, abbrevIsoEn=Miss Space Veh, journalRemark=null, publicationField=null, createdTime=null, updatedTime=1753780023753, createdBy=null, updatedBy=13701087609, firstLetterCn=M, firstLetterEn=M, subjectCode=Engineering, subjectName=工程, subjectCodeEn=Engineering, subjectNameEn=null, picCn=DdfacUcWE1ibGHaCsbhL8w==, picEn=jBog3LY3UHfAAYfYEqIBHg==, jcr=null, cjcr=null, exts=[JournalExt(id=1157000535829205111, language=CN, name=导弹与航天运载技术(中英文), nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1753780023772, updatedTime=1753780023772, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=null, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-ddht-author&redirect_uri=https%3A%2F%2Fddht.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=fefa73ea-30bb-4b68, 
submissionEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-ddht-author&redirect_uri=https%3A%2F%2Fddht.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=fefa73ea-30bb-4b68, submissionReviewUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-ddht-author&redirect_uri=https%3A%2F%2Fddht.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=fefa73ea-30bb-4b68, submissionCeEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-ddht-author&redirect_uri=https%3A%2F%2Fddht.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=fefa73ea-30bb-4b68, submissionAeEditorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-ddht-author&redirect_uri=https%3A%2F%2Fddht.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=fefa73ea-30bb-4b68, option={"copyright":""}), JournalExt(id=1157000535871148152, language=EN, name=Missiles and Space Vehicles, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=null, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1753780023782, updatedTime=1753780023782, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=null, submissionAuthorUrl=https://journal.ids.fzyun.cn/auth/realms/journal/protocol/openid-connect/auth?client_id=journal-ddht-author&redirect_uri=https%3A%2F%2Fddht.portal.founderss.cn%2Foauth%2Fcallback&response_type=code&scope=phone+openid+email+profile&state=fefa73ea-30bb-4b68, submissionEditorUrl=, submissionReviewUrl=, submissionCeEditorUrl=, submissionAeEditorUrl=, 
option={"copyright":""})], databaseList=null, tenantJournalId=1146119989267898375, websiteList=[Website(id=1148243202378817956, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146119989267898375, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/ddyht/CN, language=CN, createTime=1751692112774, createBy=18614031015, updateTime=1753519037132, updateBy=18614031015, name=导弹与航天运载技术-中文站点, tplId=1146099689490845704, title=导弹与航天运载技术(中英文), delFlag=0, indexPage=/home, props=[WebsiteProps(id=1148620442723704855, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202378817956, code=articleTextType, value=kx, createTime=1751782053881, updateTime=1751782053881, creator=18614031015, updator=18614031015), WebsiteProps(id=1148620442694344724, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202378817956, code=banner, value=null, createTime=1751782053874, updateTime=1751782053874, creator=18614031015, updator=18614031015), WebsiteProps(id=1148620442677567507, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202378817956, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=gfUyzanfTuxQ2yc+L/MeWA==, createTime=1751782053870, updateTime=1751782053870, creator=18614031015, updator=18614031015), WebsiteProps(id=1148620442711121942, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1148243202378817956, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1751782053878, updateTime=1751782053878, creator=18614031015, updator=18614031015), WebsiteProps(id=1148620442706927637, tenantId=1146029695717560320, journalId=null, 
journalGroupId=null, siteId=1148243202378817956, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1751782053877, updateTime=1751782053877, creator=18614031015, updator=18614031015)]), Website(id=1155906039850618895, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1146119989267898375, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/ddyht/EN, language=EN, createTime=1753519075604, createBy=18614031015, updateTime=1753519075604, updateBy=18614031015, name=导弹与航天运载技术-英文站点, tplId=1146101810881728533, title=Missiles and Space Vehicles, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1155907112585777347, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155906039850618895, code=articleTextType, value=kx, createTime=1753519331356, updateTime=1753519331356, creator=18614031015, updator=18614031015), WebsiteProps(id=1155907112556417216, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155906039850618895, code=banner, value=null, createTime=1753519331349, updateTime=1753519331349, creator=18614031015, updator=18614031015), WebsiteProps(id=1155907112552222911, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155906039850618895, code=logo, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic?fileId=gfUyzanfTuxQ2yc+L/MeWA==, createTime=1753519331348, updateTime=1753519331348, creator=18614031015, updator=18614031015), WebsiteProps(id=1155907112577388738, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155906039850618895, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/kjdb/CN/file/pic, createTime=1753519331354, 
updateTime=1753519331354, creator=18614031015, updator=18614031015), WebsiteProps(id=1155907112564805825, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1155906039850618895, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1753519331351, updateTime=1753519331351, creator=18614031015, updator=18614031015)])], journalTitle=导弹与航天运载技术(中英文), weixinUrl=null, journalUrl=null, iacademicId=null, status=0, seqNo=null, journalTitleEn=Missiles and Space Vehicles, journalPhotoCn=DdfacUcWE1ibGHaCsbhL8w==, journalPhotoEn=jBog3LY3UHfAAYfYEqIBHg==, journalFirstLetter=M, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=null, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/ddyht/CN/10.7654/j.issn.2097-1974.20250601, detailUrlEn=https://castjournals.cast.org.cn/joweb/ddyht/EN/10.7654/j.issn.2097-1974.20250601, pdfUrlCn=https://castjournals.cast.org.cn/joweb/ddyht/CN/PDF/10.7654/j.issn.2097-1974.20250601, pdfUrlEn=https://castjournals.cast.org.cn/joweb/ddyht/EN/PDF/10.7654/j.issn.2097-1974.20250601, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)